{"train/loss": 4.3369, "train/learning_rate": 9.574468085106382e-07, "train/epoch": 1.0, "train/global_step": 594, "_runtime": 6944, "_timestamp": 1646137871, "_step": 596, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 67.0, 918.0, 32.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.59164047241211, -13.245392799377441, -7.899145126342773, -2.552898406982422, 2.7933502197265625, 8.139598846435547, 13.485843658447266, 18.83209228515625, 24.178340911865234, 29.52458953857422, 34.87083435058594, 40.21708297729492, 45.563331604003906, 50.90958023071289, 56.25582504272461, 61.602073669433594, 66.94831848144531, 72.29456329345703, 77.64081573486328, 82.987060546875, 88.33331298828125, 93.67955780029297, 99.02580261230469, 104.37205505371094, 109.71830749511719, 115.0645523071289, 120.41080474853516, 125.75704956054688, 131.10330200195312, 136.44955444335938, 141.79579162597656, 147.1420440673828, 152.48828125, 157.83453369140625, 163.18077087402344, 168.5270233154297, 173.87327575683594, 179.21951293945312, 184.56576538085938, 189.91201782226562, 195.25827026367188, 200.60452270507812, 205.9507598876953, 211.29701232910156, 216.6432647705078, 221.989501953125, 227.33575439453125, 232.6820068359375, 238.0282440185547, 243.37449645996094, 248.72073364257812, 254.06698608398438, 259.4132385253906, 264.7594909667969, 270.105712890625, 275.45196533203125, 280.7982177734375, 286.14447021484375, 291.49072265625, 296.83697509765625, 302.1831970214844, 307.5294494628906, 312.8757019042969, 318.2219543457031, 323.5682067871094]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 5.0, 5.0, 10.0, 13.0, 15.0, 20.0, 21.0, 21.0, 34.0, 28.0, 40.0, 38.0, 47.0, 43.0, 55.0, 39.0, 62.0, 57.0, 49.0, 51.0, 52.0, 53.0, 40.0, 29.0, 31.0, 24.0, 25.0, 24.0, 19.0, 10.0, 10.0, 9.0, 5.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.58059310913086, -23.754621505737305, -22.92864990234375, -22.102678298950195, -21.27670669555664, -20.450735092163086, -19.62476348876953, -18.798791885375977, -17.972820281982422, -17.146848678588867, -16.320877075195312, -15.494905471801758, -14.668933868408203, -13.842962265014648, -13.016990661621094, -12.191019058227539, -11.3650484085083, -10.539076805114746, -9.713105201721191, -8.887133598327637, -8.061161994934082, -7.2351908683776855, -6.409219264984131, -5.583247661590576, -4.7572760581970215, -3.931304454803467, -3.105332851409912, -2.2793614864349365, -1.4533898830413818, -0.6274185180664062, 0.19855308532714844, 1.0245246887207031, 1.8504962921142578, 2.6764678955078125, 3.502439498901367, 4.328411102294922, 5.154382705688477, 5.980353832244873, 6.806325435638428, 7.632297039031982, 8.458269119262695, 9.28424072265625, 10.110212326049805, 10.93618392944336, 11.762155532836914, 12.588127136230469, 13.414098739624023, 14.240070343017578, 15.066040992736816, 15.892012596130371, 16.71798324584961, 17.543954849243164, 18.36992645263672, 19.195898056030273, 20.021869659423828, 20.847841262817383, 21.673812866210938, 22.499784469604492, 23.325756072998047, 24.1517276763916, 24.977699279785156, 25.80367088317871, 26.629642486572266, 27.45561408996582, 28.281585693359375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 6.0, 6.0, 3.0, 6.0, 12.0, 16.0, 12.0, 18.0, 16.0, 26.0, 23.0, 22.0, 32.0, 33.0, 36.0, 32.0, 35.0, 44.0, 39.0, 48.0, 44.0, 33.0, 48.0, 42.0, 41.0, 36.0, 33.0, 34.0, 33.0, 37.0, 25.0, 25.0, 21.0, 26.0, 8.0, 10.0, 11.0, 12.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0830078125, -1.0488433837890625, -1.014678955078125, -0.9805145263671875, -0.94635009765625, -0.9121856689453125, -0.878021240234375, -0.8438568115234375, -0.8096923828125, -0.7755279541015625, -0.741363525390625, -0.7071990966796875, -0.67303466796875, -0.6388702392578125, -0.604705810546875, -0.5705413818359375, -0.536376953125, -0.5022125244140625, -0.468048095703125, -0.4338836669921875, -0.39971923828125, -0.3655548095703125, -0.331390380859375, -0.2972259521484375, -0.2630615234375, -0.2288970947265625, -0.194732666015625, -0.1605682373046875, -0.12640380859375, -0.0922393798828125, -0.058074951171875, -0.0239105224609375, 0.01025390625, 0.0444183349609375, 0.078582763671875, 0.1127471923828125, 0.14691162109375, 0.1810760498046875, 0.215240478515625, 0.2494049072265625, 0.2835693359375, 0.3177337646484375, 0.351898193359375, 0.3860626220703125, 0.42022705078125, 0.4543914794921875, 0.488555908203125, 0.5227203369140625, 0.556884765625, 0.5910491943359375, 0.625213623046875, 0.6593780517578125, 0.69354248046875, 0.7277069091796875, 0.761871337890625, 0.7960357666015625, 0.8302001953125, 0.8643646240234375, 0.898529052734375, 0.9326934814453125, 0.96685791015625, 1.0010223388671875, 1.035186767578125, 1.0693511962890625, 1.103515625]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 3.0, 9.0, 13.0, 19.0, 24.0, 30.0, 39.0, 58.0, 73.0, 108.0, 176.0, 240.0, 336.0, 519.0, 853.0, 1507.0, 2550.0, 5584.0, 14655.0, 54536.0, 337513.0, 2318331.0, 1256090.0, 151546.0, 30755.0, 9536.0, 4005.0, 2002.0, 1127.0, 651.0, 439.0, 283.0, 214.0, 145.0, 87.0, 61.0, 36.0, 31.0, 21.0, 21.0, 11.0, 9.0, 8.0, 5.0, 5.0, 4.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.21484375, -3.106964111328125, -2.99908447265625, -2.891204833984375, -2.7833251953125, -2.675445556640625, -2.56756591796875, -2.459686279296875, -2.351806640625, -2.243927001953125, -2.13604736328125, -2.028167724609375, -1.9202880859375, -1.812408447265625, -1.70452880859375, -1.596649169921875, -1.48876953125, -1.380889892578125, -1.27301025390625, -1.165130615234375, -1.0572509765625, -0.949371337890625, -0.84149169921875, -0.733612060546875, -0.625732421875, -0.517852783203125, -0.40997314453125, -0.302093505859375, -0.1942138671875, -0.086334228515625, 0.02154541015625, 0.129425048828125, 0.2373046875, 0.345184326171875, 0.45306396484375, 0.560943603515625, 0.6688232421875, 0.776702880859375, 0.88458251953125, 0.992462158203125, 1.100341796875, 1.208221435546875, 1.31610107421875, 1.423980712890625, 1.5318603515625, 1.639739990234375, 1.74761962890625, 1.855499267578125, 1.96337890625, 2.071258544921875, 2.17913818359375, 2.287017822265625, 2.3948974609375, 2.502777099609375, 2.61065673828125, 2.718536376953125, 2.826416015625, 2.934295654296875, 3.04217529296875, 3.150054931640625, 3.2579345703125, 3.365814208984375, 3.47369384765625, 3.581573486328125, 3.689453125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 3.0, 9.0, 20.0, 27.0, 62.0, 105.0, 171.0, 293.0, 511.0, 856.0, 824.0, 513.0, 281.0, 163.0, 77.0, 71.0, 25.0, 24.0, 17.0, 9.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7890625, -8.56292724609375, -8.3367919921875, -8.11065673828125, -7.884521484375, -7.65838623046875, -7.4322509765625, -7.20611572265625, -6.97998046875, -6.75384521484375, -6.5277099609375, -6.30157470703125, -6.075439453125, -5.84930419921875, -5.6231689453125, -5.39703369140625, -5.1708984375, -4.94476318359375, -4.7186279296875, -4.49249267578125, -4.266357421875, -4.04022216796875, -3.8140869140625, -3.58795166015625, -3.36181640625, -3.13568115234375, -2.9095458984375, -2.68341064453125, -2.457275390625, -2.23114013671875, -2.0050048828125, -1.77886962890625, -1.552734375, -1.32659912109375, -1.1004638671875, -0.87432861328125, -0.648193359375, -0.42205810546875, -0.1959228515625, 0.03021240234375, 0.25634765625, 0.48248291015625, 0.7086181640625, 0.93475341796875, 1.160888671875, 1.38702392578125, 1.6131591796875, 1.83929443359375, 2.0654296875, 2.29156494140625, 2.5177001953125, 2.74383544921875, 2.969970703125, 3.19610595703125, 3.4222412109375, 3.64837646484375, 3.87451171875, 4.10064697265625, 4.3267822265625, 4.55291748046875, 4.779052734375, 5.00518798828125, 5.2313232421875, 5.45745849609375, 5.68359375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 19.0, 26.0, 54.0, 92.0, 232.0, 469.0, 1130.0, 4021.0, 263401.0, 3910513.0, 11003.0, 1959.0, 660.0, 330.0, 155.0, 86.0, 37.0, 40.0, 10.0, 6.0, 5.0, 3.0, 6.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.8125, -26.029052734375, -25.24560546875, -24.462158203125, -23.6787109375, -22.895263671875, -22.11181640625, -21.328369140625, -20.544921875, -19.761474609375, -18.97802734375, -18.194580078125, -17.4111328125, -16.627685546875, -15.84423828125, -15.060791015625, -14.27734375, -13.493896484375, -12.71044921875, -11.927001953125, -11.1435546875, -10.360107421875, -9.57666015625, -8.793212890625, -8.009765625, -7.226318359375, -6.44287109375, -5.659423828125, -4.8759765625, -4.092529296875, -3.30908203125, -2.525634765625, -1.7421875, -0.958740234375, -0.17529296875, 0.608154296875, 1.3916015625, 2.175048828125, 2.95849609375, 3.741943359375, 4.525390625, 5.308837890625, 6.09228515625, 6.875732421875, 7.6591796875, 8.442626953125, 9.22607421875, 10.009521484375, 10.79296875, 11.576416015625, 12.35986328125, 13.143310546875, 13.9267578125, 14.710205078125, 15.49365234375, 16.277099609375, 17.060546875, 17.843994140625, 18.62744140625, 19.410888671875, 20.1943359375, 20.977783203125, 21.76123046875, 22.544677734375, 23.328125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 389.0, 615.0, 9.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-239.70358276367188, -235.50018310546875, -231.2967987060547, -227.09339904785156, -222.8900146484375, -218.68661499023438, -214.4832305908203, -210.2798309326172, -206.07644653320312, -201.873046875, -197.66966247558594, -193.4662628173828, -189.26287841796875, -185.05947875976562, -180.85609436035156, -176.65269470214844, -172.4492950439453, -168.2458953857422, -164.04251098632812, -159.839111328125, -155.63572692871094, -151.4323272705078, -147.22894287109375, -143.02554321289062, -138.8221435546875, -134.61874389648438, -130.4153594970703, -126.21196746826172, -122.00857543945312, -117.80517578125, -113.6017837524414, -109.39839172363281, -105.19499969482422, -100.99160766601562, -96.78821563720703, -92.58482360839844, -88.38142395019531, -84.17803955078125, -79.97463989257812, -75.77124786376953, -71.56785583496094, -67.36446380615234, -63.16107177734375, -58.95767593383789, -54.7542839050293, -50.5508918762207, -46.347496032714844, -42.14410400390625, -37.940711975097656, -33.73731994628906, -29.533926010131836, -25.33053207397461, -21.127140045166016, -16.923748016357422, -12.720354080200195, -8.516960144042969, -4.313568115234375, -0.11017513275146484, 4.093217849731445, 8.296610832214355, 12.500003814697266, 16.70339584350586, 20.906789779663086, 25.110183715820312, 29.313575744628906]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 1.0, 6.0, 4.0, 5.0, 15.0, 17.0, 21.0, 25.0, 15.0, 27.0, 37.0, 45.0, 28.0, 52.0, 43.0, 49.0, 41.0, 52.0, 51.0, 62.0, 49.0, 46.0, 48.0, 36.0, 46.0, 18.0, 28.0, 27.0, 30.0, 16.0, 14.0, 12.0, 7.0, 8.0, 8.0, 6.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.197795867919922, -20.582115173339844, -19.966432571411133, -19.350751876831055, -18.735069274902344, -18.119388580322266, -17.503707885742188, -16.888025283813477, -16.2723445892334, -15.656662940979004, -15.04098129272461, -14.425300598144531, -13.809618949890137, -13.193937301635742, -12.578255653381348, -11.962574005126953, -11.346892356872559, -10.731210708618164, -10.11552906036377, -9.499847412109375, -8.884166717529297, -8.268485069274902, -7.652803421020508, -7.0371222496032715, -6.421440601348877, -5.805758953094482, -5.190077781677246, -4.574396133422852, -3.958714723587036, -3.3430333137512207, -2.727351665496826, -2.11167049407959, -1.4959888458251953, -0.8803073763847351, -0.2646259069442749, 0.3510556221008301, 0.9667370319366455, 1.582418441772461, 2.1981000900268555, 2.813781261444092, 3.4294629096984863, 4.045144557952881, 4.660825729370117, 5.276507377624512, 5.892189025878906, 6.507870197296143, 7.123551845550537, 7.739233016967773, 8.354914665222168, 8.970596313476562, 9.586277961730957, 10.201959609985352, 10.81764030456543, 11.433321952819824, 12.049003601074219, 12.664684295654297, 13.280366897583008, 13.896048545837402, 14.511730194091797, 15.127410888671875, 15.74309253692627, 16.358774185180664, 16.974456787109375, 17.590137481689453, 18.20581817626953]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 5.0, 12.0, 18.0, 11.0, 21.0, 19.0, 25.0, 19.0, 20.0, 26.0, 22.0, 34.0, 35.0, 29.0, 43.0, 34.0, 54.0, 41.0, 48.0, 46.0, 39.0, 41.0, 38.0, 43.0, 31.0, 29.0, 30.0, 23.0, 24.0, 16.0, 30.0, 18.0, 18.0, 9.0, 5.0, 7.0, 11.0, 5.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.990234375, -0.9550628662109375, -0.919891357421875, -0.8847198486328125, -0.84954833984375, -0.8143768310546875, -0.779205322265625, -0.7440338134765625, -0.7088623046875, -0.6736907958984375, -0.638519287109375, -0.6033477783203125, -0.56817626953125, -0.5330047607421875, -0.497833251953125, -0.4626617431640625, -0.427490234375, -0.3923187255859375, -0.357147216796875, -0.3219757080078125, -0.28680419921875, -0.2516326904296875, -0.216461181640625, -0.1812896728515625, -0.1461181640625, -0.1109466552734375, -0.075775146484375, -0.0406036376953125, -0.00543212890625, 0.0297393798828125, 0.064910888671875, 0.1000823974609375, 0.13525390625, 0.1704254150390625, 0.205596923828125, 0.2407684326171875, 0.27593994140625, 0.3111114501953125, 0.346282958984375, 0.3814544677734375, 0.4166259765625, 0.4517974853515625, 0.486968994140625, 0.5221405029296875, 0.55731201171875, 0.5924835205078125, 0.627655029296875, 0.6628265380859375, 0.697998046875, 0.7331695556640625, 0.768341064453125, 0.8035125732421875, 0.83868408203125, 0.8738555908203125, 0.909027099609375, 0.9441986083984375, 0.9793701171875, 1.0145416259765625, 1.049713134765625, 1.0848846435546875, 1.12005615234375, 1.1552276611328125, 1.190399169921875, 1.2255706787109375, 1.2607421875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 5.0, 4.0, 11.0, 25.0, 23.0, 32.0, 66.0, 73.0, 119.0, 187.0, 279.0, 361.0, 549.0, 815.0, 1171.0, 1817.0, 2620.0, 3770.0, 5787.0, 8687.0, 13711.0, 21180.0, 34597.0, 55046.0, 89843.0, 151260.0, 224994.0, 166624.0, 99576.0, 60592.0, 37402.0, 23540.0, 15026.0, 9661.0, 6371.0, 4206.0, 2705.0, 1905.0, 1306.0, 876.0, 557.0, 402.0, 268.0, 153.0, 121.0, 84.0, 41.0, 41.0, 22.0, 15.0, 15.0, 6.0, 2.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11016845703125, -0.1064462661743164, -0.10272407531738281, -0.09900188446044922, -0.09527969360351562, -0.09155750274658203, -0.08783531188964844, -0.08411312103271484, -0.08039093017578125, -0.07666873931884766, -0.07294654846191406, -0.06922435760498047, -0.06550216674804688, -0.06177997589111328, -0.05805778503417969, -0.054335594177246094, -0.0506134033203125, -0.046891212463378906, -0.04316902160644531, -0.03944683074951172, -0.035724639892578125, -0.03200244903564453, -0.028280258178710938, -0.024558067321777344, -0.02083587646484375, -0.017113685607910156, -0.013391494750976562, -0.009669303894042969, -0.005947113037109375, -0.0022249221801757812, 0.0014972686767578125, 0.005219459533691406, 0.008941650390625, 0.012663841247558594, 0.016386032104492188, 0.02010822296142578, 0.023830413818359375, 0.02755260467529297, 0.03127479553222656, 0.034996986389160156, 0.03871917724609375, 0.042441368103027344, 0.04616355895996094, 0.04988574981689453, 0.053607940673828125, 0.05733013153076172, 0.06105232238769531, 0.0647745132446289, 0.0684967041015625, 0.0722188949584961, 0.07594108581542969, 0.07966327667236328, 0.08338546752929688, 0.08710765838623047, 0.09082984924316406, 0.09455204010009766, 0.09827423095703125, 0.10199642181396484, 0.10571861267089844, 0.10944080352783203, 0.11316299438476562, 0.11688518524169922, 0.12060737609863281, 0.1243295669555664, 0.1280517578125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0, 3.0, 5.0, 3.0, 8.0, 10.0, 8.0, 13.0, 18.0, 15.0, 10.0, 25.0, 20.0, 29.0, 24.0, 20.0, 38.0, 43.0, 34.0, 40.0, 42.0, 52.0, 1060.0, 53.0, 37.0, 44.0, 32.0, 41.0, 39.0, 35.0, 33.0, 29.0, 28.0, 31.0, 22.0, 12.0, 18.0, 12.0, 13.0, 8.0, 8.0, 8.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68212890625, -0.6590194702148438, -0.6359100341796875, -0.6128005981445312, -0.589691162109375, -0.5665817260742188, -0.5434722900390625, -0.5203628540039062, -0.49725341796875, -0.47414398193359375, -0.4510345458984375, -0.42792510986328125, -0.404815673828125, -0.38170623779296875, -0.3585968017578125, -0.33548736572265625, -0.3123779296875, -0.28926849365234375, -0.2661590576171875, -0.24304962158203125, -0.219940185546875, -0.19683074951171875, -0.1737213134765625, -0.15061187744140625, -0.12750244140625, -0.10439300537109375, -0.0812835693359375, -0.05817413330078125, -0.035064697265625, -0.01195526123046875, 0.0111541748046875, 0.03426361083984375, 0.057373046875, 0.08048248291015625, 0.1035919189453125, 0.12670135498046875, 0.149810791015625, 0.17292022705078125, 0.1960296630859375, 0.21913909912109375, 0.24224853515625, 0.26535797119140625, 0.2884674072265625, 0.31157684326171875, 0.334686279296875, 0.35779571533203125, 0.3809051513671875, 0.40401458740234375, 0.4271240234375, 0.45023345947265625, 0.4733428955078125, 0.49645233154296875, 0.519561767578125, 0.5426712036132812, 0.5657806396484375, 0.5888900756835938, 0.61199951171875, 0.6351089477539062, 0.6582183837890625, 0.6813278198242188, 0.704437255859375, 0.7275466918945312, 0.7506561279296875, 0.7737655639648438, 0.796875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 11.0, 17.0, 12.0, 22.0, 36.0, 45.0, 73.0, 115.0, 163.0, 255.0, 349.0, 528.0, 807.0, 1231.0, 1787.0, 2796.0, 4221.0, 6372.0, 10405.0, 16721.0, 27761.0, 46524.0, 80060.0, 140423.0, 1261154.0, 205011.0, 117839.0, 67991.0, 40187.0, 23975.0, 14617.0, 9283.0, 5714.0, 3692.0, 2301.0, 1507.0, 1019.0, 671.0, 433.0, 314.0, 205.0, 129.0, 104.0, 58.0, 53.0, 38.0, 32.0, 17.0, 16.0, 8.0, 5.0, 8.0, 6.0, 1.0, 4.0, 0.0, 2.0], "bins": [-0.10205078125, -0.098846435546875, -0.09564208984375, -0.092437744140625, -0.0892333984375, -0.086029052734375, -0.08282470703125, -0.079620361328125, -0.076416015625, -0.073211669921875, -0.07000732421875, -0.066802978515625, -0.0635986328125, -0.060394287109375, -0.05718994140625, -0.053985595703125, -0.05078125, -0.047576904296875, -0.04437255859375, -0.041168212890625, -0.0379638671875, -0.034759521484375, -0.03155517578125, -0.028350830078125, -0.025146484375, -0.021942138671875, -0.01873779296875, -0.015533447265625, -0.0123291015625, -0.009124755859375, -0.00592041015625, -0.002716064453125, 0.00048828125, 0.003692626953125, 0.00689697265625, 0.010101318359375, 0.0133056640625, 0.016510009765625, 0.01971435546875, 0.022918701171875, 0.026123046875, 0.029327392578125, 0.03253173828125, 0.035736083984375, 0.0389404296875, 0.042144775390625, 0.04534912109375, 0.048553466796875, 0.0517578125, 0.054962158203125, 0.05816650390625, 0.061370849609375, 0.0645751953125, 0.067779541015625, 0.07098388671875, 0.074188232421875, 0.077392578125, 0.080596923828125, 0.08380126953125, 0.087005615234375, 0.0902099609375, 0.093414306640625, 0.09661865234375, 0.099822998046875, 0.10302734375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 6.0, 2.0, 7.0, 10.0, 18.0, 16.0, 19.0, 12.0, 25.0, 34.0, 37.0, 35.0, 60.0, 68.0, 62.0, 66.0, 77.0, 57.0, 54.0, 51.0, 53.0, 38.0, 21.0, 20.0, 24.0, 14.0, 15.0, 17.0, 18.0, 9.0, 11.0, 6.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005459785461425781, -0.0005276501178741455, -0.0005093216896057129, -0.0004909932613372803, -0.00047266483306884766, -0.00045433640480041504, -0.0004360079765319824, -0.0004176795482635498, -0.0003993511199951172, -0.00038102269172668457, -0.00036269426345825195, -0.00034436583518981934, -0.0003260374069213867, -0.0003077089786529541, -0.0002893805503845215, -0.00027105212211608887, -0.00025272369384765625, -0.00023439526557922363, -0.00021606683731079102, -0.0001977384090423584, -0.00017940998077392578, -0.00016108155250549316, -0.00014275312423706055, -0.00012442469596862793, -0.00010609626770019531, -8.77678394317627e-05, -6.943941116333008e-05, -5.111098289489746e-05, -3.2782554626464844e-05, -1.4454126358032227e-05, 3.874301910400391e-06, 2.2202730178833008e-05, 4.0531158447265625e-05, 5.885958671569824e-05, 7.718801498413086e-05, 9.551644325256348e-05, 0.0001138448715209961, 0.0001321732997894287, 0.00015050172805786133, 0.00016883015632629395, 0.00018715858459472656, 0.00020548701286315918, 0.0002238154411315918, 0.00024214386940002441, 0.00026047229766845703, 0.00027880072593688965, 0.00029712915420532227, 0.0003154575824737549, 0.0003337860107421875, 0.0003521144390106201, 0.00037044286727905273, 0.00038877129554748535, 0.00040709972381591797, 0.0004254281520843506, 0.0004437565803527832, 0.0004620850086212158, 0.00048041343688964844, 0.0004987418651580811, 0.0005170702934265137, 0.0005353987216949463, 0.0005537271499633789, 0.0005720555782318115, 0.0005903840065002441, 0.0006087124347686768, 0.0006270408630371094]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 7.0, 15.0, 11.0, 15.0, 20.0, 26.0, 23.0, 36.0, 40.0, 63.0, 96.0, 82.0, 123.0, 162.0, 262.0, 389.0, 724.0, 155899.0, 888204.0, 841.0, 387.0, 310.0, 190.0, 133.0, 112.0, 75.0, 65.0, 64.0, 47.0, 33.0, 20.0, 11.0, 11.0, 10.0, 8.0, 6.0, 6.0, 6.0, 6.0, 4.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.012969970703125, -0.012589335441589355, -0.012208700180053711, -0.011828064918518066, -0.011447429656982422, -0.011066794395446777, -0.010686159133911133, -0.010305523872375488, -0.009924888610839844, -0.0095442533493042, -0.009163618087768555, -0.00878298282623291, -0.008402347564697266, -0.008021712303161621, -0.0076410770416259766, -0.007260441780090332, -0.0068798065185546875, -0.006499171257019043, -0.0061185359954833984, -0.005737900733947754, -0.005357265472412109, -0.004976630210876465, -0.00459599494934082, -0.004215359687805176, -0.0038347244262695312, -0.0034540891647338867, -0.003073453903198242, -0.0026928186416625977, -0.002312183380126953, -0.0019315481185913086, -0.001550912857055664, -0.0011702775955200195, -0.000789642333984375, -0.00040900707244873047, -2.8371810913085938e-05, 0.0003522634506225586, 0.0007328987121582031, 0.0011135339736938477, 0.0014941692352294922, 0.0018748044967651367, 0.0022554397583007812, 0.0026360750198364258, 0.0030167102813720703, 0.003397345542907715, 0.0037779808044433594, 0.004158616065979004, 0.0045392513275146484, 0.004919886589050293, 0.0053005218505859375, 0.005681157112121582, 0.0060617923736572266, 0.006442427635192871, 0.006823062896728516, 0.00720369815826416, 0.007584333419799805, 0.00796496868133545, 0.008345603942871094, 0.008726239204406738, 0.009106874465942383, 0.009487509727478027, 0.009868144989013672, 0.010248780250549316, 0.010629415512084961, 0.011010050773620605, 0.01139068603515625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 24.0, 906.0, 85.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010611843317747116, -0.0009833176154643297, -0.0009054508409462869, -0.000827584124635905, -0.0007497173501178622, -0.0006718506338074803, -0.0005939839174970984, -0.0005161171429790556, -0.00043825042666867375, -0.0003603836812544614, -0.00028251693584024906, -0.00020465021952986717, -0.00012678347411565483, -4.891672870144248e-05, 2.894998760893941e-05, 0.00010681676212698221, 0.0001846834784373641, 0.00026255022385157645, 0.0003404169692657888, 0.0004182836855761707, 0.0004961504600942135, 0.0005740171764045954, 0.0006518838927149773, 0.0007297506672330201, 0.000807617383543402, 0.0008854840998537838, 0.0009633508743718266, 0.0010412175906822085, 0.0011190843069925904, 0.0011969511397182941, 0.001274817856028676, 0.001352684572339058, 0.0014305512886494398, 0.0015084180049598217, 0.0015862847212702036, 0.0016641514375805855, 0.0017420182703062892, 0.001819884986616671, 0.001897751702927053, 0.0019756185356527567, 0.0020534852519631386, 0.0021313519682735205, 0.0022092186845839024, 0.0022870854008942842, 0.002364952117204666, 0.0024428190663456917, 0.00252068554982543, 0.0025985524989664555, 0.0026764189824461937, 0.0027542856987565756, 0.0028321524150669575, 0.0029100191313773394, 0.0029878858476877213, 0.003065752796828747, 0.003143619280308485, 0.0032214862294495106, 0.0032993529457598925, 0.0033772196620702744, 0.0034550863783806562, 0.003532953094691038, 0.00361081981100142, 0.003688686527311802, 0.0037665534764528275, 0.0038444201927632093, 0.003922286909073591]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 6.0, 6.0, 3.0, 7.0, 9.0, 14.0, 15.0, 16.0, 18.0, 22.0, 24.0, 20.0, 24.0, 32.0, 29.0, 36.0, 30.0, 31.0, 44.0, 46.0, 46.0, 44.0, 36.0, 38.0, 50.0, 42.0, 42.0, 36.0, 28.0, 32.0, 32.0, 25.0, 12.0, 21.0, 16.0, 12.0, 16.0, 5.0, 9.0, 14.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0003165006637573242, -0.0003069555386900902, -0.00029741041362285614, -0.0002878652885556221, -0.00027832016348838806, -0.000268775038421154, -0.00025922991335392, -0.00024968478828668594, -0.0002401396632194519, -0.00023059453815221786, -0.00022104941308498383, -0.00021150428801774979, -0.00020195916295051575, -0.0001924140378832817, -0.00018286891281604767, -0.00017332378774881363, -0.0001637786626815796, -0.00015423353761434555, -0.0001446884125471115, -0.00013514328747987747, -0.00012559816241264343, -0.0001160530373454094, -0.00010650791227817535, -9.696278721094131e-05, -8.741766214370728e-05, -7.787253707647324e-05, -6.83274120092392e-05, -5.878228694200516e-05, -4.923716187477112e-05, -3.969203680753708e-05, -3.014691174030304e-05, -2.0601786673069e-05, -1.1056661605834961e-05, -1.5115365386009216e-06, 8.033588528633118e-06, 1.7578713595867157e-05, 2.7123838663101196e-05, 3.6668963730335236e-05, 4.6214088797569275e-05, 5.5759213864803314e-05, 6.530433893203735e-05, 7.484946399927139e-05, 8.439458906650543e-05, 9.393971413373947e-05, 0.00010348483920097351, 0.00011302996426820755, 0.0001225750893354416, 0.00013212021440267563, 0.00014166533946990967, 0.0001512104645371437, 0.00016075558960437775, 0.00017030071467161179, 0.00017984583973884583, 0.00018939096480607986, 0.0001989360898733139, 0.00020848121494054794, 0.00021802634000778198, 0.00022757146507501602, 0.00023711659014225006, 0.0002466617152094841, 0.00025620684027671814, 0.0002657519653439522, 0.0002752970904111862, 0.00028484221547842026, 0.0002943873405456543]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 5.0, 12.0, 18.0, 11.0, 21.0, 19.0, 25.0, 19.0, 20.0, 26.0, 22.0, 34.0, 35.0, 29.0, 43.0, 34.0, 54.0, 41.0, 48.0, 46.0, 39.0, 41.0, 38.0, 42.0, 32.0, 29.0, 30.0, 23.0, 24.0, 16.0, 30.0, 18.0, 18.0, 9.0, 5.0, 7.0, 11.0, 5.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.990234375, -0.9550628662109375, -0.919891357421875, -0.8847198486328125, -0.84954833984375, -0.8143768310546875, -0.779205322265625, -0.7440338134765625, -0.7088623046875, -0.6736907958984375, -0.638519287109375, -0.6033477783203125, -0.56817626953125, -0.5330047607421875, -0.497833251953125, -0.4626617431640625, -0.427490234375, -0.3923187255859375, -0.357147216796875, -0.3219757080078125, -0.28680419921875, -0.2516326904296875, -0.216461181640625, -0.1812896728515625, -0.1461181640625, -0.1109466552734375, -0.075775146484375, -0.0406036376953125, -0.00543212890625, 0.0297393798828125, 0.064910888671875, 0.1000823974609375, 0.13525390625, 0.1704254150390625, 0.205596923828125, 0.2407684326171875, 0.27593994140625, 0.3111114501953125, 0.346282958984375, 0.3814544677734375, 0.4166259765625, 0.4517974853515625, 0.486968994140625, 0.5221405029296875, 0.55731201171875, 0.5924835205078125, 0.627655029296875, 0.6628265380859375, 0.697998046875, 0.7331695556640625, 0.768341064453125, 0.8035125732421875, 0.83868408203125, 0.8738555908203125, 0.909027099609375, 0.9441986083984375, 0.9793701171875, 1.0145416259765625, 1.049713134765625, 1.0848846435546875, 1.12005615234375, 1.1552276611328125, 1.190399169921875, 1.2255706787109375, 1.2607421875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 9.0, 10.0, 19.0, 14.0, 31.0, 51.0, 70.0, 83.0, 116.0, 180.0, 277.0, 426.0, 566.0, 881.0, 1334.0, 2011.0, 3078.0, 4811.0, 8300.0, 16312.0, 41142.0, 161867.0, 479381.0, 228686.0, 54414.0, 19284.0, 9637.0, 5511.0, 3408.0, 2148.0, 1486.0, 938.0, 643.0, 432.0, 286.0, 211.0, 169.0, 91.0, 78.0, 37.0, 39.0, 23.0, 15.0, 14.0, 13.0, 3.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.259765625, -3.153289794921875, -3.04681396484375, -2.940338134765625, -2.8338623046875, -2.727386474609375, -2.62091064453125, -2.514434814453125, -2.407958984375, -2.301483154296875, -2.19500732421875, -2.088531494140625, -1.9820556640625, -1.875579833984375, -1.76910400390625, -1.662628173828125, -1.55615234375, -1.449676513671875, -1.34320068359375, -1.236724853515625, -1.1302490234375, -1.023773193359375, -0.91729736328125, -0.810821533203125, -0.704345703125, -0.597869873046875, -0.49139404296875, -0.384918212890625, -0.2784423828125, -0.171966552734375, -0.06549072265625, 0.040985107421875, 0.1474609375, 0.253936767578125, 0.36041259765625, 0.466888427734375, 0.5733642578125, 0.679840087890625, 0.78631591796875, 0.892791748046875, 0.999267578125, 1.105743408203125, 1.21221923828125, 1.318695068359375, 1.4251708984375, 1.531646728515625, 1.63812255859375, 1.744598388671875, 1.85107421875, 1.957550048828125, 2.06402587890625, 2.170501708984375, 2.2769775390625, 2.383453369140625, 2.48992919921875, 2.596405029296875, 2.702880859375, 2.809356689453125, 2.91583251953125, 3.022308349609375, 3.1287841796875, 3.235260009765625, 3.34173583984375, 3.448211669921875, 3.5546875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 5.0, 3.0, 1.0, 5.0, 6.0, 7.0, 11.0, 9.0, 15.0, 12.0, 20.0, 21.0, 28.0, 19.0, 26.0, 34.0, 52.0, 49.0, 41.0, 71.0, 132.0, 253.0, 1348.0, 266.0, 128.0, 71.0, 61.0, 47.0, 49.0, 37.0, 36.0, 38.0, 32.0, 14.0, 20.0, 13.0, 20.0, 9.0, 12.0, 8.0, 7.0, 5.0, 2.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.765625, -3.655975341796875, -3.54632568359375, -3.436676025390625, -3.3270263671875, -3.217376708984375, -3.10772705078125, -2.998077392578125, -2.888427734375, -2.778778076171875, -2.66912841796875, -2.559478759765625, -2.4498291015625, -2.340179443359375, -2.23052978515625, -2.120880126953125, -2.01123046875, -1.901580810546875, -1.79193115234375, -1.682281494140625, -1.5726318359375, -1.462982177734375, -1.35333251953125, -1.243682861328125, -1.134033203125, -1.024383544921875, -0.91473388671875, -0.805084228515625, -0.6954345703125, -0.585784912109375, -0.47613525390625, -0.366485595703125, -0.2568359375, -0.147186279296875, -0.03753662109375, 0.072113037109375, 0.1817626953125, 0.291412353515625, 0.40106201171875, 0.510711669921875, 0.620361328125, 0.730010986328125, 0.83966064453125, 0.949310302734375, 1.0589599609375, 1.168609619140625, 1.27825927734375, 1.387908935546875, 1.49755859375, 1.607208251953125, 1.71685791015625, 1.826507568359375, 1.9361572265625, 2.045806884765625, 2.15545654296875, 2.265106201171875, 2.374755859375, 2.484405517578125, 2.59405517578125, 2.703704833984375, 2.8133544921875, 2.923004150390625, 3.03265380859375, 3.142303466796875, 3.251953125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 7.0, 5.0, 7.0, 14.0, 10.0, 11.0, 13.0, 22.0, 24.0, 29.0, 31.0, 54.0, 57.0, 91.0, 155.0, 297.0, 903.0, 8688.0, 3022259.0, 110387.0, 1630.0, 424.0, 207.0, 110.0, 62.0, 41.0, 31.0, 26.0, 22.0, 17.0, 13.0, 15.0, 8.0, 10.0, 3.0, 3.0, 6.0, 7.0, 1.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.140625, -12.68310546875, -12.2255859375, -11.76806640625, -11.310546875, -10.85302734375, -10.3955078125, -9.93798828125, -9.48046875, -9.02294921875, -8.5654296875, -8.10791015625, -7.650390625, -7.19287109375, -6.7353515625, -6.27783203125, -5.8203125, -5.36279296875, -4.9052734375, -4.44775390625, -3.990234375, -3.53271484375, -3.0751953125, -2.61767578125, -2.16015625, -1.70263671875, -1.2451171875, -0.78759765625, -0.330078125, 0.12744140625, 0.5849609375, 1.04248046875, 1.5, 1.95751953125, 2.4150390625, 2.87255859375, 3.330078125, 3.78759765625, 4.2451171875, 4.70263671875, 5.16015625, 5.61767578125, 6.0751953125, 6.53271484375, 6.990234375, 7.44775390625, 7.9052734375, 8.36279296875, 8.8203125, 9.27783203125, 9.7353515625, 10.19287109375, 10.650390625, 11.10791015625, 11.5654296875, 12.02294921875, 12.48046875, 12.93798828125, 13.3955078125, 13.85302734375, 14.310546875, 14.76806640625, 15.2255859375, 15.68310546875, 16.140625]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1005.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.59013366699219, -43.11700439453125, -38.64387512207031, -34.17074203491211, -29.697612762451172, -25.224483489990234, -20.751352310180664, -16.278221130371094, -11.805091857910156, -7.331961631774902, -2.8588314056396484, 1.6142988204956055, 6.087429046630859, 10.560558319091797, 15.033689498901367, 19.506820678710938, 23.979949951171875, 28.453079223632812, 32.92620849609375, 37.39934158325195, 41.87247085571289, 46.34560012817383, 50.81873321533203, 55.29186248779297, 59.764991760253906, 64.23812103271484, 68.71125030517578, 73.18437957763672, 77.65751647949219, 82.13064575195312, 86.60377502441406, 91.076904296875, 95.550048828125, 100.02317810058594, 104.49630737304688, 108.96943664550781, 113.44256591796875, 117.91569519042969, 122.38883209228516, 126.8619613647461, 131.3350830078125, 135.80821228027344, 140.28134155273438, 144.7544708251953, 149.22760009765625, 153.7007293701172, 158.17385864257812, 162.64700317382812, 167.12013244628906, 171.59326171875, 176.06639099121094, 180.53952026367188, 185.0126495361328, 189.48577880859375, 193.9589080810547, 198.43203735351562, 202.90518188476562, 207.37831115722656, 211.8514404296875, 216.32456970214844, 220.79769897460938, 225.2708282470703, 229.74395751953125, 234.21710205078125, 238.69021606445312]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 2.0, 7.0, 8.0, 13.0, 8.0, 21.0, 7.0, 13.0, 10.0, 12.0, 20.0, 34.0, 26.0, 35.0, 38.0, 41.0, 37.0, 44.0, 41.0, 44.0, 38.0, 41.0, 34.0, 52.0, 29.0, 30.0, 43.0, 37.0, 23.0, 31.0, 19.0, 19.0, 18.0, 22.0, 13.0, 12.0, 17.0, 7.0, 9.0, 6.0, 7.0, 7.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.096226692199707, -9.73198127746582, -9.367735862731934, -9.003490447998047, -8.63924503326416, -8.274999618530273, -7.910754203796387, -7.5465087890625, -7.182263374328613, -6.818017959594727, -6.45377254486084, -6.089527130126953, -5.725281715393066, -5.36103630065918, -4.996790885925293, -4.632545471191406, -4.2683000564575195, -3.904054641723633, -3.539809226989746, -3.1755638122558594, -2.8113183975219727, -2.447072982788086, -2.082827568054199, -1.7185821533203125, -1.3543367385864258, -0.9900913238525391, -0.6258459091186523, -0.2616004943847656, 0.1026449203491211, 0.4668903350830078, 0.8311357498168945, 1.1953811645507812, 1.5596275329589844, 1.923872947692871, 2.288118362426758, 2.6523637771606445, 3.0166091918945312, 3.380854606628418, 3.7451000213623047, 4.109345436096191, 4.473590850830078, 4.837836265563965, 5.202081680297852, 5.566327095031738, 5.930572509765625, 6.294817924499512, 6.659063339233398, 7.023308753967285, 7.387554168701172, 7.751799583435059, 8.116044998168945, 8.480290412902832, 8.844535827636719, 9.208781242370605, 9.573026657104492, 9.937272071838379, 10.301517486572266, 10.665762901306152, 11.030008316040039, 11.394253730773926, 11.758499145507812, 12.1227445602417, 12.486989974975586, 12.851235389709473, 13.21548080444336]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 7.0, 3.0, 2.0, 17.0, 13.0, 8.0, 11.0, 24.0, 17.0, 25.0, 15.0, 16.0, 34.0, 26.0, 30.0, 42.0, 36.0, 34.0, 38.0, 49.0, 57.0, 41.0, 44.0, 40.0, 46.0, 23.0, 42.0, 36.0, 45.0, 28.0, 19.0, 24.0, 20.0, 21.0, 19.0, 11.0, 8.0, 16.0, 8.0, 5.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1640625, -1.1253204345703125, -1.086578369140625, -1.0478363037109375, -1.00909423828125, -0.9703521728515625, -0.931610107421875, -0.8928680419921875, -0.8541259765625, -0.8153839111328125, -0.776641845703125, -0.7378997802734375, -0.69915771484375, -0.6604156494140625, -0.621673583984375, -0.5829315185546875, -0.544189453125, -0.5054473876953125, -0.466705322265625, -0.4279632568359375, -0.38922119140625, -0.3504791259765625, -0.311737060546875, -0.2729949951171875, -0.2342529296875, -0.1955108642578125, -0.156768798828125, -0.1180267333984375, -0.07928466796875, -0.0405426025390625, -0.001800537109375, 0.0369415283203125, 0.07568359375, 0.1144256591796875, 0.153167724609375, 0.1919097900390625, 0.23065185546875, 0.2693939208984375, 0.308135986328125, 0.3468780517578125, 0.3856201171875, 0.4243621826171875, 0.463104248046875, 0.5018463134765625, 0.54058837890625, 0.5793304443359375, 0.618072509765625, 0.6568145751953125, 0.695556640625, 0.7342987060546875, 0.773040771484375, 0.8117828369140625, 0.85052490234375, 0.8892669677734375, 0.928009033203125, 0.9667510986328125, 1.0054931640625, 1.0442352294921875, 1.082977294921875, 1.1217193603515625, 1.16046142578125, 1.1992034912109375, 1.237945556640625, 1.2766876220703125, 1.3154296875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 7.0, 12.0, 15.0, 22.0, 22.0, 19.0, 35.0, 56.0, 82.0, 117.0, 138.0, 212.0, 324.0, 521.0, 1008.0, 2043.0, 5840.0, 23026.0, 139137.0, 1701901.0, 2105413.0, 175187.0, 27508.0, 6718.0, 2284.0, 1018.0, 529.0, 338.0, 204.0, 154.0, 104.0, 98.0, 51.0, 37.0, 39.0, 19.0, 14.0, 8.0, 6.0, 5.0, 3.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.71484375, -4.5677490234375, -4.420654296875, -4.2735595703125, -4.12646484375, -3.9793701171875, -3.832275390625, -3.6851806640625, -3.5380859375, -3.3909912109375, -3.243896484375, -3.0968017578125, -2.94970703125, -2.8026123046875, -2.655517578125, -2.5084228515625, -2.361328125, -2.2142333984375, -2.067138671875, -1.9200439453125, -1.77294921875, -1.6258544921875, -1.478759765625, -1.3316650390625, -1.1845703125, -1.0374755859375, -0.890380859375, -0.7432861328125, -0.59619140625, -0.4490966796875, -0.302001953125, -0.1549072265625, -0.0078125, 0.1392822265625, 0.286376953125, 0.4334716796875, 0.58056640625, 0.7276611328125, 0.874755859375, 1.0218505859375, 1.1689453125, 1.3160400390625, 1.463134765625, 1.6102294921875, 1.75732421875, 1.9044189453125, 2.051513671875, 2.1986083984375, 2.345703125, 2.4927978515625, 2.639892578125, 2.7869873046875, 2.93408203125, 3.0811767578125, 3.228271484375, 3.3753662109375, 3.5224609375, 3.6695556640625, 3.816650390625, 3.9637451171875, 4.11083984375, 4.2579345703125, 4.405029296875, 4.5521240234375, 4.69921875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 10.0, 9.0, 15.0, 19.0, 41.0, 63.0, 98.0, 130.0, 231.0, 321.0, 479.0, 573.0, 606.0, 473.0, 313.0, 236.0, 159.0, 124.0, 60.0, 38.0, 34.0, 19.0, 10.0, 5.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4375, -6.26763916015625, -6.0977783203125, -5.92791748046875, -5.758056640625, -5.58819580078125, -5.4183349609375, -5.24847412109375, -5.07861328125, -4.90875244140625, -4.7388916015625, -4.56903076171875, -4.399169921875, -4.22930908203125, -4.0594482421875, -3.88958740234375, -3.7197265625, -3.54986572265625, -3.3800048828125, -3.21014404296875, -3.040283203125, -2.87042236328125, -2.7005615234375, -2.53070068359375, -2.36083984375, -2.19097900390625, -2.0211181640625, -1.85125732421875, -1.681396484375, -1.51153564453125, -1.3416748046875, -1.17181396484375, -1.001953125, -0.83209228515625, -0.6622314453125, -0.49237060546875, -0.322509765625, -0.15264892578125, 0.0172119140625, 0.18707275390625, 0.35693359375, 0.52679443359375, 0.6966552734375, 0.86651611328125, 1.036376953125, 1.20623779296875, 1.3760986328125, 1.54595947265625, 1.7158203125, 1.88568115234375, 2.0555419921875, 2.22540283203125, 2.395263671875, 2.56512451171875, 2.7349853515625, 2.90484619140625, 3.07470703125, 3.24456787109375, 3.4144287109375, 3.58428955078125, 3.754150390625, 3.92401123046875, 4.0938720703125, 4.26373291015625, 4.43359375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 9.0, 15.0, 18.0, 31.0, 67.0, 136.0, 301.0, 946.0, 5874.0, 1240925.0, 2935294.0, 9157.0, 1042.0, 279.0, 114.0, 46.0, 19.0, 11.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.53125, -12.88916015625, -12.2470703125, -11.60498046875, -10.962890625, -10.32080078125, -9.6787109375, -9.03662109375, -8.39453125, -7.75244140625, -7.1103515625, -6.46826171875, -5.826171875, -5.18408203125, -4.5419921875, -3.89990234375, -3.2578125, -2.61572265625, -1.9736328125, -1.33154296875, -0.689453125, -0.04736328125, 0.5947265625, 1.23681640625, 1.87890625, 2.52099609375, 3.1630859375, 3.80517578125, 4.447265625, 5.08935546875, 5.7314453125, 6.37353515625, 7.015625, 7.65771484375, 8.2998046875, 8.94189453125, 9.583984375, 10.22607421875, 10.8681640625, 11.51025390625, 12.15234375, 12.79443359375, 13.4365234375, 14.07861328125, 14.720703125, 15.36279296875, 16.0048828125, 16.64697265625, 17.2890625, 17.93115234375, 18.5732421875, 19.21533203125, 19.857421875, 20.49951171875, 21.1416015625, 21.78369140625, 22.42578125, 23.06787109375, 23.7099609375, 24.35205078125, 24.994140625, 25.63623046875, 26.2783203125, 26.92041015625, 27.5625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 180.0, 771.0, 63.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.1727180480957, -56.4937744140625, -52.81482696533203, -49.13588333129883, -45.456939697265625, -41.777992248535156, -38.09904861450195, -34.42010498046875, -30.741159439086914, -27.062213897705078, -23.383270263671875, -19.70432472229004, -16.025379180908203, -12.346435546875, -8.667490005493164, -4.988546371459961, -1.309600830078125, 2.3693439960479736, 6.048288822174072, 9.72723388671875, 13.40617847442627, 17.08512306213379, 20.764068603515625, 24.443012237548828, 28.121957778930664, 31.8009033203125, 35.4798469543457, 39.158790588378906, 42.837738037109375, 46.51668167114258, 50.19562530517578, 53.87457275390625, 57.55352020263672, 61.23246383666992, 64.91140747070312, 68.5903549194336, 72.26930236816406, 75.9482421875, 79.62718963623047, 83.30613708496094, 86.98507690429688, 90.66402435302734, 94.34296417236328, 98.02191162109375, 101.70085906982422, 105.37979888916016, 109.05874633789062, 112.73768615722656, 116.41664123535156, 120.09558868408203, 123.77452850341797, 127.45347595214844, 131.13241577148438, 134.81137084960938, 138.4903106689453, 142.16925048828125, 145.8481903076172, 149.52713012695312, 153.20608520507812, 156.88502502441406, 160.56396484375, 164.242919921875, 167.92185974121094, 171.60079956054688, 175.27975463867188]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 3.0, 15.0, 9.0, 17.0, 22.0, 21.0, 16.0, 27.0, 25.0, 22.0, 38.0, 23.0, 29.0, 44.0, 47.0, 33.0, 34.0, 41.0, 51.0, 54.0, 53.0, 42.0, 35.0, 36.0, 34.0, 29.0, 20.0, 33.0, 23.0, 20.0, 15.0, 20.0, 11.0, 13.0, 7.0, 8.0, 9.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.660313606262207, -15.168632507324219, -14.67695140838623, -14.185270309448242, -13.69359016418457, -13.201908111572266, -12.710227966308594, -12.218546867370605, -11.726865768432617, -11.235184669494629, -10.74350357055664, -10.251822471618652, -9.760141372680664, -9.268461227416992, -8.776780128479004, -8.285099029541016, -7.793417930603027, -7.301736831665039, -6.810055732727051, -6.318375110626221, -5.826694011688232, -5.335012912750244, -4.843332290649414, -4.351651191711426, -3.8599700927734375, -3.368288993835449, -2.87660813331604, -2.384927272796631, -1.8932461738586426, -1.4015650749206543, -0.9098842144012451, -0.41820335388183594, 0.07347679138183594, 0.5651577711105347, 1.0568387508392334, 1.5485197305679321, 2.040200710296631, 2.531881809234619, 3.0235626697540283, 3.5152435302734375, 4.006924629211426, 4.498605728149414, 4.990286827087402, 5.481967449188232, 5.973648548126221, 6.465329647064209, 6.957010269165039, 7.448691368103027, 7.940372467041016, 8.432053565979004, 8.923734664916992, 9.41541576385498, 9.907096862792969, 10.39877700805664, 10.890458106994629, 11.382139205932617, 11.873820304870605, 12.365501403808594, 12.857182502746582, 13.34886360168457, 13.840543746948242, 14.332225799560547, 14.823905944824219, 15.315587043762207, 15.807268142700195]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 5.0, 8.0, 7.0, 17.0, 15.0, 12.0, 21.0, 32.0, 24.0, 27.0, 30.0, 30.0, 40.0, 46.0, 49.0, 51.0, 45.0, 42.0, 45.0, 39.0, 53.0, 45.0, 41.0, 36.0, 30.0, 37.0, 26.0, 36.0, 25.0, 21.0, 15.0, 10.0, 9.0, 9.0, 8.0, 6.0, 4.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2802734375, -1.2374420166015625, -1.194610595703125, -1.1517791748046875, -1.10894775390625, -1.0661163330078125, -1.023284912109375, -0.9804534912109375, -0.9376220703125, -0.8947906494140625, -0.851959228515625, -0.8091278076171875, -0.76629638671875, -0.7234649658203125, -0.680633544921875, -0.6378021240234375, -0.594970703125, -0.5521392822265625, -0.509307861328125, -0.4664764404296875, -0.42364501953125, -0.3808135986328125, -0.337982177734375, -0.2951507568359375, -0.2523193359375, -0.2094879150390625, -0.166656494140625, -0.1238250732421875, -0.08099365234375, -0.0381622314453125, 0.004669189453125, 0.0475006103515625, 0.09033203125, 0.1331634521484375, 0.175994873046875, 0.2188262939453125, 0.26165771484375, 0.3044891357421875, 0.347320556640625, 0.3901519775390625, 0.4329833984375, 0.4758148193359375, 0.518646240234375, 0.5614776611328125, 0.60430908203125, 0.6471405029296875, 0.689971923828125, 0.7328033447265625, 0.775634765625, 0.8184661865234375, 0.861297607421875, 0.9041290283203125, 0.94696044921875, 0.9897918701171875, 1.032623291015625, 1.0754547119140625, 1.1182861328125, 1.1611175537109375, 1.203948974609375, 1.2467803955078125, 1.28961181640625, 1.3324432373046875, 1.375274658203125, 1.4181060791015625, 1.4609375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 12.0, 13.0, 18.0, 28.0, 34.0, 62.0, 89.0, 140.0, 238.0, 313.0, 527.0, 838.0, 1315.0, 2079.0, 3288.0, 5386.0, 8524.0, 14280.0, 24163.0, 40672.0, 71941.0, 128851.0, 228163.0, 222296.0, 125603.0, 70078.0, 39775.0, 23256.0, 13817.0, 8576.0, 5358.0, 3241.0, 2067.0, 1247.0, 807.0, 531.0, 297.0, 228.0, 134.0, 87.0, 54.0, 50.0, 28.0, 18.0, 13.0, 3.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.169921875, -0.16492080688476562, -0.15991973876953125, -0.15491867065429688, -0.1499176025390625, -0.14491653442382812, -0.13991546630859375, -0.13491439819335938, -0.129913330078125, -0.12491226196289062, -0.11991119384765625, -0.11491012573242188, -0.1099090576171875, -0.10490798950195312, -0.09990692138671875, -0.09490585327148438, -0.08990478515625, -0.08490371704101562, -0.07990264892578125, -0.07490158081054688, -0.0699005126953125, -0.06489944458007812, -0.05989837646484375, -0.054897308349609375, -0.049896240234375, -0.044895172119140625, -0.03989410400390625, -0.034893035888671875, -0.0298919677734375, -0.024890899658203125, -0.01988983154296875, -0.014888763427734375, -0.0098876953125, -0.004886627197265625, 0.00011444091796875, 0.005115509033203125, 0.0101165771484375, 0.015117645263671875, 0.02011871337890625, 0.025119781494140625, 0.030120849609375, 0.035121917724609375, 0.04012298583984375, 0.045124053955078125, 0.0501251220703125, 0.055126190185546875, 0.06012725830078125, 0.06512832641601562, 0.07012939453125, 0.07513046264648438, 0.08013153076171875, 0.08513259887695312, 0.0901336669921875, 0.09513473510742188, 0.10013580322265625, 0.10513687133789062, 0.110137939453125, 0.11513900756835938, 0.12014007568359375, 0.12514114379882812, 0.1301422119140625, 0.13514328002929688, 0.14014434814453125, 0.14514541625976562, 0.150146484375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 3.0, 3.0, 10.0, 5.0, 4.0, 14.0, 7.0, 13.0, 12.0, 15.0, 14.0, 19.0, 20.0, 20.0, 23.0, 33.0, 27.0, 31.0, 29.0, 36.0, 34.0, 31.0, 37.0, 36.0, 1059.0, 33.0, 31.0, 41.0, 41.0, 49.0, 33.0, 39.0, 37.0, 24.0, 19.0, 17.0, 23.0, 13.0, 16.0, 12.0, 12.0, 6.0, 6.0, 11.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 4.0, 1.0], "bins": [-0.72412109375, -0.702301025390625, -0.68048095703125, -0.658660888671875, -0.6368408203125, -0.615020751953125, -0.59320068359375, -0.571380615234375, -0.549560546875, -0.527740478515625, -0.50592041015625, -0.484100341796875, -0.4622802734375, -0.440460205078125, -0.41864013671875, -0.396820068359375, -0.375, -0.353179931640625, -0.33135986328125, -0.309539794921875, -0.2877197265625, -0.265899658203125, -0.24407958984375, -0.222259521484375, -0.200439453125, -0.178619384765625, -0.15679931640625, -0.134979248046875, -0.1131591796875, -0.091339111328125, -0.06951904296875, -0.047698974609375, -0.02587890625, -0.004058837890625, 0.01776123046875, 0.039581298828125, 0.0614013671875, 0.083221435546875, 0.10504150390625, 0.126861572265625, 0.148681640625, 0.170501708984375, 0.19232177734375, 0.214141845703125, 0.2359619140625, 0.257781982421875, 0.27960205078125, 0.301422119140625, 0.3232421875, 0.345062255859375, 0.36688232421875, 0.388702392578125, 0.4105224609375, 0.432342529296875, 0.45416259765625, 0.475982666015625, 0.497802734375, 0.519622802734375, 0.54144287109375, 0.563262939453125, 0.5850830078125, 0.606903076171875, 0.62872314453125, 0.650543212890625, 0.67236328125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 5.0, 9.0, 10.0, 29.0, 33.0, 52.0, 67.0, 92.0, 144.0, 206.0, 269.0, 399.0, 568.0, 754.0, 1131.0, 1726.0, 2407.0, 3613.0, 5323.0, 8177.0, 12404.0, 19155.0, 30545.0, 48243.0, 79312.0, 133233.0, 1246298.0, 195477.0, 116978.0, 70407.0, 42587.0, 26645.0, 17198.0, 10899.0, 7248.0, 4936.0, 3352.0, 2243.0, 1508.0, 1030.0, 737.0, 490.0, 380.0, 256.0, 155.0, 122.0, 93.0, 62.0, 43.0, 27.0, 19.0, 16.0, 11.0, 8.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.09942626953125, -0.0962057113647461, -0.09298515319824219, -0.08976459503173828, -0.08654403686523438, -0.08332347869873047, -0.08010292053222656, -0.07688236236572266, -0.07366180419921875, -0.07044124603271484, -0.06722068786621094, -0.06400012969970703, -0.060779571533203125, -0.05755901336669922, -0.05433845520019531, -0.051117897033691406, -0.0478973388671875, -0.044676780700683594, -0.04145622253417969, -0.03823566436767578, -0.035015106201171875, -0.03179454803466797, -0.028573989868164062, -0.025353431701660156, -0.02213287353515625, -0.018912315368652344, -0.015691757202148438, -0.012471199035644531, -0.009250640869140625, -0.006030082702636719, -0.0028095245361328125, 0.00041103363037109375, 0.003631591796875, 0.006852149963378906, 0.010072708129882812, 0.013293266296386719, 0.016513824462890625, 0.01973438262939453, 0.022954940795898438, 0.026175498962402344, 0.02939605712890625, 0.032616615295410156, 0.03583717346191406, 0.03905773162841797, 0.042278289794921875, 0.04549884796142578, 0.04871940612792969, 0.051939964294433594, 0.0551605224609375, 0.058381080627441406, 0.06160163879394531, 0.06482219696044922, 0.06804275512695312, 0.07126331329345703, 0.07448387145996094, 0.07770442962646484, 0.08092498779296875, 0.08414554595947266, 0.08736610412597656, 0.09058666229248047, 0.09380722045898438, 0.09702777862548828, 0.10024833679199219, 0.1034688949584961, 0.106689453125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 0.0, 4.0, 6.0, 7.0, 9.0, 6.0, 13.0, 8.0, 5.0, 19.0, 21.0, 27.0, 40.0, 46.0, 48.0, 55.0, 57.0, 79.0, 77.0, 55.0, 63.0, 60.0, 57.0, 33.0, 35.0, 21.0, 34.0, 26.0, 19.0, 12.0, 10.0, 6.0, 15.0, 5.0, 3.0, 4.0, 5.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0004394054412841797, -0.00042537227272987366, -0.0004113391041755676, -0.0003973059356212616, -0.00038327276706695557, -0.00036923959851264954, -0.0003552064299583435, -0.0003411732614040375, -0.00032714009284973145, -0.0003131069242954254, -0.0002990737557411194, -0.00028504058718681335, -0.0002710074186325073, -0.0002569742500782013, -0.00024294108152389526, -0.00022890791296958923, -0.0002148747444152832, -0.00020084157586097717, -0.00018680840730667114, -0.0001727752387523651, -0.00015874207019805908, -0.00014470890164375305, -0.00013067573308944702, -0.00011664256453514099, -0.00010260939598083496, -8.857622742652893e-05, -7.45430588722229e-05, -6.050989031791687e-05, -4.647672176361084e-05, -3.244355320930481e-05, -1.841038465499878e-05, -4.377216100692749e-06, 9.655952453613281e-06, 2.368912100791931e-05, 3.772228956222534e-05, 5.175545811653137e-05, 6.57886266708374e-05, 7.982179522514343e-05, 9.385496377944946e-05, 0.00010788813233375549, 0.00012192130088806152, 0.00013595446944236755, 0.00014998763799667358, 0.00016402080655097961, 0.00017805397510528564, 0.00019208714365959167, 0.0002061203122138977, 0.00022015348076820374, 0.00023418664932250977, 0.0002482198178768158, 0.0002622529864311218, 0.00027628615498542786, 0.0002903193235397339, 0.0003043524920940399, 0.00031838566064834595, 0.000332418829202652, 0.000346451997756958, 0.00036048516631126404, 0.00037451833486557007, 0.0003885515034198761, 0.00040258467197418213, 0.00041661784052848816, 0.0004306510090827942, 0.0004446841776371002, 0.00045871734619140625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 6.0, 4.0, 2.0, 10.0, 6.0, 12.0, 16.0, 18.0, 16.0, 17.0, 32.0, 27.0, 57.0, 58.0, 56.0, 87.0, 152.0, 230.0, 328.0, 652.0, 2894.0, 1023302.0, 18590.0, 799.0, 369.0, 206.0, 136.0, 118.0, 87.0, 63.0, 34.0, 33.0, 23.0, 22.0, 16.0, 16.0, 12.0, 12.0, 11.0, 12.0, 4.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.0113372802734375, -0.011010169982910156, -0.010683059692382812, -0.010355949401855469, -0.010028839111328125, -0.009701728820800781, -0.009374618530273438, -0.009047508239746094, -0.00872039794921875, -0.008393287658691406, -0.008066177368164062, -0.007739067077636719, -0.007411956787109375, -0.007084846496582031, -0.0067577362060546875, -0.006430625915527344, -0.006103515625, -0.005776405334472656, -0.0054492950439453125, -0.005122184753417969, -0.004795074462890625, -0.004467964172363281, -0.0041408538818359375, -0.0038137435913085938, -0.00348663330078125, -0.0031595230102539062, -0.0028324127197265625, -0.0025053024291992188, -0.002178192138671875, -0.0018510818481445312, -0.0015239715576171875, -0.0011968612670898438, -0.0008697509765625, -0.0005426406860351562, -0.0002155303955078125, 0.00011157989501953125, 0.000438690185546875, 0.0007658004760742188, 0.0010929107666015625, 0.0014200210571289062, 0.00174713134765625, 0.0020742416381835938, 0.0024013519287109375, 0.0027284622192382812, 0.003055572509765625, 0.0033826828002929688, 0.0037097930908203125, 0.004036903381347656, 0.004364013671875, 0.004691123962402344, 0.0050182342529296875, 0.005345344543457031, 0.005672454833984375, 0.005999565124511719, 0.0063266754150390625, 0.006653785705566406, 0.00698089599609375, 0.007308006286621094, 0.0076351165771484375, 0.007962226867675781, 0.008289337158203125, 0.008616447448730469, 0.008943557739257812, 0.009270668029785156, 0.0095977783203125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 218.0, 790.0, 7.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006028346251696348, -0.005922951735556126, -0.00581755768507719, -0.005712163168936968, -0.005606768652796745, -0.005501374136656523, -0.0053959800861775875, -0.005290585570037365, -0.005185191053897142, -0.00507979653775692, -0.004974402487277985, -0.004869007971137762, -0.0047636134549975395, -0.004658218938857317, -0.004552824888378382, -0.004447430372238159, -0.004342035856097937, -0.004236641339957714, -0.004131247289478779, -0.004025852773338556, -0.003920458257198334, -0.003815063973888755, -0.0037096694577485323, -0.0036042751744389534, -0.0034988808911293745, -0.0033934866078197956, -0.003288092091679573, -0.003182697808369994, -0.0030773032922297716, -0.0029719090089201927, -0.00286651449277997, -0.0027611202094703913, -0.002655725460499525, -0.002550331177189946, -0.0024449366610497236, -0.0023395423777401447, -0.002234147861599922, -0.0021287535782903433, -0.0020233590621501207, -0.0019179647788405418, -0.001812570495530963, -0.0017071760958060622, -0.0016017816960811615, -0.0014963872963562608, -0.00139099289663136, -0.0012855986133217812, -0.0011802040971815586, -0.0010748098138719797, -0.0009694152977317572, -0.0008640208980068564, -0.0007586264982819557, -0.000653232098557055, -0.0005478376988321543, -0.00044244335731491446, -0.00033704895759001374, -0.00023165455786511302, -0.0001262601581402123, -2.086576569126919e-05, 8.452862675767392e-05, 0.0001899230119306594, 0.00029531741165556014, 0.0004007117822766304, 0.0005061061820015311, 0.0006115005817264318, 0.0007168949814513326]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 3.0, 7.0, 8.0, 10.0, 12.0, 17.0, 17.0, 21.0, 16.0, 28.0, 21.0, 20.0, 35.0, 33.0, 34.0, 34.0, 38.0, 45.0, 34.0, 39.0, 39.0, 43.0, 33.0, 30.0, 38.0, 33.0, 42.0, 32.0, 29.0, 30.0, 27.0, 24.0, 16.0, 18.0, 13.0, 11.0, 13.0, 11.0, 8.0, 10.0, 7.0, 6.0, 2.0, 6.0, 3.0, 2.0, 2.0, 1.0, 5.0], "bins": [-0.00024271011352539062, -0.0002358676865696907, -0.00022902525961399078, -0.00022218283265829086, -0.00021534040570259094, -0.00020849797874689102, -0.0002016555517911911, -0.00019481312483549118, -0.00018797069787979126, -0.00018112827092409134, -0.00017428584396839142, -0.0001674434170126915, -0.00016060099005699158, -0.00015375856310129166, -0.00014691613614559174, -0.00014007370918989182, -0.0001332312822341919, -0.00012638885527849197, -0.00011954642832279205, -0.00011270400136709213, -0.00010586157441139221, -9.901914745569229e-05, -9.217672049999237e-05, -8.533429354429245e-05, -7.849186658859253e-05, -7.164943963289261e-05, -6.480701267719269e-05, -5.796458572149277e-05, -5.112215876579285e-05, -4.4279731810092926e-05, -3.7437304854393005e-05, -3.0594877898693085e-05, -2.3752450942993164e-05, -1.6910023987293243e-05, -1.0067597031593323e-05, -3.225170075893402e-06, 3.6172568798065186e-06, 1.045968383550644e-05, 1.730211079120636e-05, 2.414453774690628e-05, 3.09869647026062e-05, 3.782939165830612e-05, 4.467181861400604e-05, 5.151424556970596e-05, 5.8356672525405884e-05, 6.51990994811058e-05, 7.204152643680573e-05, 7.888395339250565e-05, 8.572638034820557e-05, 9.256880730390549e-05, 9.941123425960541e-05, 0.00010625366121530533, 0.00011309608817100525, 0.00011993851512670517, 0.0001267809420824051, 0.000133623369038105, 0.00014046579599380493, 0.00014730822294950485, 0.00015415064990520477, 0.0001609930768609047, 0.00016783550381660461, 0.00017467793077230453, 0.00018152035772800446, 0.00018836278468370438, 0.0001952052116394043]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 5.0, 8.0, 7.0, 17.0, 15.0, 12.0, 21.0, 32.0, 24.0, 27.0, 30.0, 30.0, 40.0, 46.0, 49.0, 51.0, 45.0, 42.0, 45.0, 39.0, 53.0, 45.0, 41.0, 36.0, 30.0, 37.0, 26.0, 36.0, 25.0, 21.0, 15.0, 10.0, 9.0, 9.0, 8.0, 6.0, 4.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2802734375, -1.2374420166015625, -1.194610595703125, -1.1517791748046875, -1.10894775390625, -1.0661163330078125, -1.023284912109375, -0.9804534912109375, -0.9376220703125, -0.8947906494140625, -0.851959228515625, -0.8091278076171875, -0.76629638671875, -0.7234649658203125, -0.680633544921875, -0.6378021240234375, -0.594970703125, -0.5521392822265625, -0.509307861328125, -0.4664764404296875, -0.42364501953125, -0.3808135986328125, -0.337982177734375, -0.2951507568359375, -0.2523193359375, -0.2094879150390625, -0.166656494140625, -0.1238250732421875, -0.08099365234375, -0.0381622314453125, 0.004669189453125, 0.0475006103515625, 0.09033203125, 0.1331634521484375, 0.175994873046875, 0.2188262939453125, 0.26165771484375, 0.3044891357421875, 0.347320556640625, 0.3901519775390625, 0.4329833984375, 0.4758148193359375, 0.518646240234375, 0.5614776611328125, 0.60430908203125, 0.6471405029296875, 0.689971923828125, 0.7328033447265625, 0.775634765625, 0.8184661865234375, 0.861297607421875, 0.9041290283203125, 0.94696044921875, 0.9897918701171875, 1.032623291015625, 1.0754547119140625, 1.1182861328125, 1.1611175537109375, 1.203948974609375, 1.2467803955078125, 1.28961181640625, 1.3324432373046875, 1.375274658203125, 1.4181060791015625, 1.4609375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 10.0, 12.0, 16.0, 21.0, 46.0, 42.0, 77.0, 100.0, 153.0, 300.0, 443.0, 751.0, 1418.0, 3032.0, 7683.0, 22073.0, 66514.0, 193782.0, 362484.0, 248662.0, 92745.0, 30138.0, 10160.0, 3894.0, 1759.0, 898.0, 499.0, 316.0, 183.0, 101.0, 80.0, 58.0, 36.0, 24.0, 17.0, 15.0, 6.0, 7.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5546875, -1.5004119873046875, -1.446136474609375, -1.3918609619140625, -1.33758544921875, -1.2833099365234375, -1.229034423828125, -1.1747589111328125, -1.1204833984375, -1.0662078857421875, -1.011932373046875, -0.9576568603515625, -0.90338134765625, -0.8491058349609375, -0.794830322265625, -0.7405548095703125, -0.686279296875, -0.6320037841796875, -0.577728271484375, -0.5234527587890625, -0.46917724609375, -0.4149017333984375, -0.360626220703125, -0.3063507080078125, -0.2520751953125, -0.1977996826171875, -0.143524169921875, -0.0892486572265625, -0.03497314453125, 0.0193023681640625, 0.073577880859375, 0.1278533935546875, 0.18212890625, 0.2364044189453125, 0.290679931640625, 0.3449554443359375, 0.39923095703125, 0.4535064697265625, 0.507781982421875, 0.5620574951171875, 0.6163330078125, 0.6706085205078125, 0.724884033203125, 0.7791595458984375, 0.83343505859375, 0.8877105712890625, 0.941986083984375, 0.9962615966796875, 1.050537109375, 1.1048126220703125, 1.159088134765625, 1.2133636474609375, 1.26763916015625, 1.3219146728515625, 1.376190185546875, 1.4304656982421875, 1.4847412109375, 1.5390167236328125, 1.593292236328125, 1.6475677490234375, 1.70184326171875, 1.7561187744140625, 1.810394287109375, 1.8646697998046875, 1.9189453125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 7.0, 5.0, 5.0, 5.0, 6.0, 19.0, 7.0, 16.0, 20.0, 31.0, 32.0, 30.0, 35.0, 46.0, 43.0, 54.0, 64.0, 104.0, 179.0, 1342.0, 310.0, 175.0, 103.0, 65.0, 40.0, 41.0, 39.0, 42.0, 26.0, 29.0, 23.0, 17.0, 18.0, 12.0, 8.0, 12.0, 7.0, 7.0, 6.0, 10.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44921875, -4.30999755859375, -4.1707763671875, -4.03155517578125, -3.892333984375, -3.75311279296875, -3.6138916015625, -3.47467041015625, -3.33544921875, -3.19622802734375, -3.0570068359375, -2.91778564453125, -2.778564453125, -2.63934326171875, -2.5001220703125, -2.36090087890625, -2.2216796875, -2.08245849609375, -1.9432373046875, -1.80401611328125, -1.664794921875, -1.52557373046875, -1.3863525390625, -1.24713134765625, -1.10791015625, -0.96868896484375, -0.8294677734375, -0.69024658203125, -0.551025390625, -0.41180419921875, -0.2725830078125, -0.13336181640625, 0.005859375, 0.14508056640625, 0.2843017578125, 0.42352294921875, 0.562744140625, 0.70196533203125, 0.8411865234375, 0.98040771484375, 1.11962890625, 1.25885009765625, 1.3980712890625, 1.53729248046875, 1.676513671875, 1.81573486328125, 1.9549560546875, 2.09417724609375, 2.2333984375, 2.37261962890625, 2.5118408203125, 2.65106201171875, 2.790283203125, 2.92950439453125, 3.0687255859375, 3.20794677734375, 3.34716796875, 3.48638916015625, 3.6256103515625, 3.76483154296875, 3.904052734375, 4.04327392578125, 4.1824951171875, 4.32171630859375, 4.4609375]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 6.0, 9.0, 12.0, 4.0, 8.0, 10.0, 13.0, 15.0, 22.0, 29.0, 36.0, 38.0, 71.0, 90.0, 137.0, 247.0, 480.0, 1223.0, 8411.0, 1323228.0, 1798725.0, 10412.0, 1294.0, 442.0, 215.0, 141.0, 101.0, 71.0, 40.0, 47.0, 31.0, 25.0, 16.0, 16.0, 10.0, 3.0, 7.0, 3.0, 12.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3515625, -9.0501708984375, -8.748779296875, -8.4473876953125, -8.14599609375, -7.8446044921875, -7.543212890625, -7.2418212890625, -6.9404296875, -6.6390380859375, -6.337646484375, -6.0362548828125, -5.73486328125, -5.4334716796875, -5.132080078125, -4.8306884765625, -4.529296875, -4.2279052734375, -3.926513671875, -3.6251220703125, -3.32373046875, -3.0223388671875, -2.720947265625, -2.4195556640625, -2.1181640625, -1.8167724609375, -1.515380859375, -1.2139892578125, -0.91259765625, -0.6112060546875, -0.309814453125, -0.0084228515625, 0.29296875, 0.5943603515625, 0.895751953125, 1.1971435546875, 1.49853515625, 1.7999267578125, 2.101318359375, 2.4027099609375, 2.7041015625, 3.0054931640625, 3.306884765625, 3.6082763671875, 3.90966796875, 4.2110595703125, 4.512451171875, 4.8138427734375, 5.115234375, 5.4166259765625, 5.718017578125, 6.0194091796875, 6.32080078125, 6.6221923828125, 6.923583984375, 7.2249755859375, 7.5263671875, 7.8277587890625, 8.129150390625, 8.4305419921875, 8.73193359375, 9.0333251953125, 9.334716796875, 9.6361083984375, 9.9375]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 47.0, 280.0, 493.0, 166.0, 19.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.51102066040039, -24.72133445739746, -23.93164825439453, -23.141963958740234, -22.352277755737305, -21.562591552734375, -20.772905349731445, -19.983219146728516, -19.19353485107422, -18.40384864807129, -17.61416244506836, -16.824478149414062, -16.034791946411133, -15.245105743408203, -14.455419540405273, -13.66573429107666, -12.87604808807373, -12.0863618850708, -11.296676635742188, -10.506990432739258, -9.717305183410645, -8.927618980407715, -8.137933731079102, -7.348247528076172, -6.5585618019104, -5.768876075744629, -4.979190349578857, -4.189504623413086, -3.3998186588287354, -2.610132932662964, -1.8204469680786133, -1.0307612419128418, -0.2410755157470703, 0.548610270023346, 1.3382960557937622, 2.1279819011688232, 2.9176676273345947, 3.707353353500366, 4.497039318084717, 5.286725044250488, 6.07641077041626, 6.866096496582031, 7.655782222747803, 8.445467948913574, 9.235154151916504, 10.024839401245117, 10.814525604248047, 11.604211807250977, 12.39389705657959, 13.18358325958252, 13.973268508911133, 14.762954711914062, 15.552639961242676, 16.34232521057129, 17.13201141357422, 17.92169761657715, 18.711383819580078, 19.501070022583008, 20.290756225585938, 21.080440521240234, 21.870126724243164, 22.659812927246094, 23.449499130249023, 24.239185333251953, 25.02886962890625]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 6.0, 5.0, 6.0, 6.0, 6.0, 10.0, 12.0, 9.0, 12.0, 20.0, 10.0, 27.0, 32.0, 17.0, 16.0, 35.0, 28.0, 24.0, 24.0, 43.0, 33.0, 40.0, 51.0, 49.0, 29.0, 20.0, 31.0, 46.0, 29.0, 26.0, 40.0, 34.0, 23.0, 22.0, 31.0, 17.0, 20.0, 10.0, 18.0, 18.0, 10.0, 14.0, 10.0, 6.0, 11.0, 6.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0], "bins": [-12.911194801330566, -12.52262020111084, -12.134044647216797, -11.74547004699707, -11.356895446777344, -10.9683198928833, -10.579745292663574, -10.191169738769531, -9.802595138549805, -9.414020538330078, -9.025444984436035, -8.636870384216309, -8.248294830322266, -7.859720230102539, -7.4711456298828125, -7.082570552825928, -6.693995475769043, -6.305420398712158, -5.916845321655273, -5.528270721435547, -5.139695644378662, -4.751120567321777, -4.362545967102051, -3.973970890045166, -3.5853958129882812, -3.1968207359313965, -2.808245897293091, -2.419671058654785, -2.0310959815979004, -1.6425210237503052, -1.25394606590271, -0.8653712272644043, -0.4767951965332031, -0.08822023868560791, 0.3003547191619873, 0.6889296770095825, 1.0775046348571777, 1.466079592704773, 1.8546545505523682, 2.243229389190674, 2.6318044662475586, 3.0203795433044434, 3.408954381942749, 3.7975292205810547, 4.1861042976379395, 4.574679374694824, 4.963253974914551, 5.3518290519714355, 5.74040412902832, 6.128979206085205, 6.51755428314209, 6.906128883361816, 7.294703960418701, 7.683279037475586, 8.071853637695312, 8.460428237915039, 8.849003791809082, 9.237578392028809, 9.626153945922852, 10.014728546142578, 10.403303146362305, 10.791878700256348, 11.180453300476074, 11.569028854370117, 11.957603454589844]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 5.0, 12.0, 7.0, 17.0, 24.0, 14.0, 23.0, 30.0, 34.0, 29.0, 37.0, 31.0, 56.0, 48.0, 43.0, 45.0, 50.0, 42.0, 41.0, 55.0, 36.0, 42.0, 37.0, 42.0, 36.0, 21.0, 22.0, 22.0, 20.0, 19.0, 13.0, 12.0, 13.0, 6.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3544921875, -1.3092193603515625, -1.263946533203125, -1.2186737060546875, -1.17340087890625, -1.1281280517578125, -1.082855224609375, -1.0375823974609375, -0.9923095703125, -0.9470367431640625, -0.901763916015625, -0.8564910888671875, -0.81121826171875, -0.7659454345703125, -0.720672607421875, -0.6753997802734375, -0.630126953125, -0.5848541259765625, -0.539581298828125, -0.4943084716796875, -0.44903564453125, -0.4037628173828125, -0.358489990234375, -0.3132171630859375, -0.2679443359375, -0.2226715087890625, -0.177398681640625, -0.1321258544921875, -0.08685302734375, -0.0415802001953125, 0.003692626953125, 0.0489654541015625, 0.09423828125, 0.1395111083984375, 0.184783935546875, 0.2300567626953125, 0.27532958984375, 0.3206024169921875, 0.365875244140625, 0.4111480712890625, 0.4564208984375, 0.5016937255859375, 0.546966552734375, 0.5922393798828125, 0.63751220703125, 0.6827850341796875, 0.728057861328125, 0.7733306884765625, 0.818603515625, 0.8638763427734375, 0.909149169921875, 0.9544219970703125, 0.99969482421875, 1.0449676513671875, 1.090240478515625, 1.1355133056640625, 1.1807861328125, 1.2260589599609375, 1.271331787109375, 1.3166046142578125, 1.36187744140625, 1.4071502685546875, 1.452423095703125, 1.4976959228515625, 1.54296875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 8.0, 12.0, 8.0, 14.0, 11.0, 21.0, 30.0, 38.0, 34.0, 55.0, 86.0, 122.0, 197.0, 449.0, 1221.0, 4672.0, 30195.0, 358525.0, 3049782.0, 690835.0, 48172.0, 6919.0, 1616.0, 489.0, 258.0, 150.0, 89.0, 67.0, 50.0, 40.0, 27.0, 20.0, 15.0, 17.0, 13.0, 6.0, 8.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4765625, -4.32537841796875, -4.1741943359375, -4.02301025390625, -3.871826171875, -3.72064208984375, -3.5694580078125, -3.41827392578125, -3.26708984375, -3.11590576171875, -2.9647216796875, -2.81353759765625, -2.662353515625, -2.51116943359375, -2.3599853515625, -2.20880126953125, -2.0576171875, -1.90643310546875, -1.7552490234375, -1.60406494140625, -1.452880859375, -1.30169677734375, -1.1505126953125, -0.99932861328125, -0.84814453125, -0.69696044921875, -0.5457763671875, -0.39459228515625, -0.243408203125, -0.09222412109375, 0.0589599609375, 0.21014404296875, 0.361328125, 0.51251220703125, 0.6636962890625, 0.81488037109375, 0.966064453125, 1.11724853515625, 1.2684326171875, 1.41961669921875, 1.57080078125, 1.72198486328125, 1.8731689453125, 2.02435302734375, 2.175537109375, 2.32672119140625, 2.4779052734375, 2.62908935546875, 2.7802734375, 2.93145751953125, 3.0826416015625, 3.23382568359375, 3.385009765625, 3.53619384765625, 3.6873779296875, 3.83856201171875, 3.98974609375, 4.14093017578125, 4.2921142578125, 4.44329833984375, 4.594482421875, 4.74566650390625, 4.8968505859375, 5.04803466796875, 5.19921875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 13.0, 14.0, 19.0, 25.0, 34.0, 56.0, 76.0, 97.0, 155.0, 234.0, 327.0, 391.0, 432.0, 515.0, 419.0, 355.0, 243.0, 205.0, 132.0, 93.0, 63.0, 56.0, 41.0, 26.0, 9.0, 10.0, 10.0, 5.0, 6.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.359375, -5.222808837890625, -5.08624267578125, -4.949676513671875, -4.8131103515625, -4.676544189453125, -4.53997802734375, -4.403411865234375, -4.266845703125, -4.130279541015625, -3.99371337890625, -3.857147216796875, -3.7205810546875, -3.584014892578125, -3.44744873046875, -3.310882568359375, -3.17431640625, -3.037750244140625, -2.90118408203125, -2.764617919921875, -2.6280517578125, -2.491485595703125, -2.35491943359375, -2.218353271484375, -2.081787109375, -1.945220947265625, -1.80865478515625, -1.672088623046875, -1.5355224609375, -1.398956298828125, -1.26239013671875, -1.125823974609375, -0.9892578125, -0.852691650390625, -0.71612548828125, -0.579559326171875, -0.4429931640625, -0.306427001953125, -0.16986083984375, -0.033294677734375, 0.103271484375, 0.239837646484375, 0.37640380859375, 0.512969970703125, 0.6495361328125, 0.786102294921875, 0.92266845703125, 1.059234619140625, 1.19580078125, 1.332366943359375, 1.46893310546875, 1.605499267578125, 1.7420654296875, 1.878631591796875, 2.01519775390625, 2.151763916015625, 2.288330078125, 2.424896240234375, 2.56146240234375, 2.698028564453125, 2.8345947265625, 2.971160888671875, 3.10772705078125, 3.244293212890625, 3.380859375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 4.0, 7.0, 5.0, 16.0, 29.0, 40.0, 79.0, 143.0, 278.0, 586.0, 1598.0, 8209.0, 123993.0, 2873267.0, 1137180.0, 42722.0, 4276.0, 1012.0, 401.0, 188.0, 97.0, 61.0, 32.0, 19.0, 15.0, 12.0, 11.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.828125, -8.5218505859375, -8.215576171875, -7.9093017578125, -7.60302734375, -7.2967529296875, -6.990478515625, -6.6842041015625, -6.3779296875, -6.0716552734375, -5.765380859375, -5.4591064453125, -5.15283203125, -4.8465576171875, -4.540283203125, -4.2340087890625, -3.927734375, -3.6214599609375, -3.315185546875, -3.0089111328125, -2.70263671875, -2.3963623046875, -2.090087890625, -1.7838134765625, -1.4775390625, -1.1712646484375, -0.864990234375, -0.5587158203125, -0.25244140625, 0.0538330078125, 0.360107421875, 0.6663818359375, 0.97265625, 1.2789306640625, 1.585205078125, 1.8914794921875, 2.19775390625, 2.5040283203125, 2.810302734375, 3.1165771484375, 3.4228515625, 3.7291259765625, 4.035400390625, 4.3416748046875, 4.64794921875, 4.9542236328125, 5.260498046875, 5.5667724609375, 5.873046875, 6.1793212890625, 6.485595703125, 6.7918701171875, 7.09814453125, 7.4044189453125, 7.710693359375, 8.0169677734375, 8.3232421875, 8.6295166015625, 8.935791015625, 9.2420654296875, 9.54833984375, 9.8546142578125, 10.160888671875, 10.4671630859375, 10.7734375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 25.0, 62.0, 109.0, 213.0, 224.0, 189.0, 110.0, 57.0, 18.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.527366638183594, -36.52328872680664, -35.51920700073242, -34.51512908935547, -33.511051177978516, -32.5069694519043, -31.502891540527344, -30.498811721801758, -29.494731903076172, -28.490652084350586, -27.486574172973633, -26.482494354248047, -25.47841453552246, -24.474334716796875, -23.470256805419922, -22.466176986694336, -21.462099075317383, -20.458019256591797, -19.453941345214844, -18.449861526489258, -17.445781707763672, -16.44170379638672, -15.437623977661133, -14.433544158935547, -13.429465293884277, -12.425386428833008, -11.421306610107422, -10.417227745056152, -9.413148880004883, -8.409069061279297, -7.404990196228027, -6.4009108543396, -5.396829605102539, -4.392750263214111, -3.3886711597442627, -2.384592056274414, -1.3805127143859863, -0.3764333724975586, 0.6276454925537109, 1.6317248344421387, 2.6358041763305664, 3.639883518218994, 4.643962860107422, 5.648041725158691, 6.652121067047119, 7.656200408935547, 8.660279273986816, 9.664358139038086, 10.668437957763672, 11.672516822814941, 12.676596641540527, 13.680675506591797, 14.684755325317383, 15.688834190368652, 16.692913055419922, 17.696992874145508, 18.701072692871094, 19.70515251159668, 20.709230422973633, 21.71331024169922, 22.717390060424805, 23.72146987915039, 24.725547790527344, 25.72962760925293, 26.733705520629883]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 7.0, 7.0, 10.0, 15.0, 12.0, 15.0, 12.0, 26.0, 20.0, 27.0, 29.0, 35.0, 37.0, 31.0, 31.0, 47.0, 35.0, 39.0, 46.0, 43.0, 38.0, 41.0, 46.0, 44.0, 42.0, 33.0, 24.0, 38.0, 35.0, 33.0, 14.0, 17.0, 12.0, 18.0, 7.0, 9.0, 7.0, 8.0, 2.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.223062515258789, -11.807843208312988, -11.392623901367188, -10.97740364074707, -10.56218433380127, -10.146965026855469, -9.731745719909668, -9.316526412963867, -8.901307106018066, -8.486087799072266, -8.070868492126465, -7.655648708343506, -7.240429401397705, -6.825209617614746, -6.409990310668945, -5.9947710037231445, -5.5795512199401855, -5.164331912994385, -4.749112129211426, -4.333892822265625, -3.918673515319824, -3.5034539699554443, -3.0882344245910645, -2.6730151176452637, -2.257795572280884, -1.8425761461257935, -1.4273567199707031, -1.0121371746063232, -0.5969177484512329, -0.18169832229614258, 0.2335212230682373, 0.6487405300140381, 1.063960075378418, 1.4791795015335083, 1.8943989276885986, 2.3096184730529785, 2.7248377799987793, 3.140057325363159, 3.555276870727539, 3.97049617767334, 4.385715484619141, 4.800934791564941, 5.2161545753479, 5.631373882293701, 6.046593189239502, 6.461812973022461, 6.877032279968262, 7.2922515869140625, 7.7074713706970215, 8.12269115447998, 8.537910461425781, 8.953129768371582, 9.368349075317383, 9.783568382263184, 10.198787689208984, 10.614007949829102, 11.029227256774902, 11.444446563720703, 11.859665870666504, 12.274885177612305, 12.690105438232422, 13.105324745178223, 13.520544052124023, 13.935763359069824, 14.350982666015625]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 6.0, 6.0, 5.0, 13.0, 18.0, 19.0, 17.0, 22.0, 18.0, 33.0, 30.0, 28.0, 39.0, 43.0, 35.0, 38.0, 37.0, 53.0, 51.0, 39.0, 56.0, 41.0, 37.0, 47.0, 36.0, 27.0, 25.0, 34.0, 20.0, 22.0, 20.0, 18.0, 8.0, 7.0, 12.0, 14.0, 8.0, 9.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3330078125, -1.2894134521484375, -1.245819091796875, -1.2022247314453125, -1.15863037109375, -1.1150360107421875, -1.071441650390625, -1.0278472900390625, -0.9842529296875, -0.9406585693359375, -0.897064208984375, -0.8534698486328125, -0.80987548828125, -0.7662811279296875, -0.722686767578125, -0.6790924072265625, -0.635498046875, -0.5919036865234375, -0.548309326171875, -0.5047149658203125, -0.46112060546875, -0.4175262451171875, -0.373931884765625, -0.3303375244140625, -0.2867431640625, -0.2431488037109375, -0.199554443359375, -0.1559600830078125, -0.11236572265625, -0.0687713623046875, -0.025177001953125, 0.0184173583984375, 0.06201171875, 0.1056060791015625, 0.149200439453125, 0.1927947998046875, 0.23638916015625, 0.2799835205078125, 0.323577880859375, 0.3671722412109375, 0.4107666015625, 0.4543609619140625, 0.497955322265625, 0.5415496826171875, 0.58514404296875, 0.6287384033203125, 0.672332763671875, 0.7159271240234375, 0.759521484375, 0.8031158447265625, 0.846710205078125, 0.8903045654296875, 0.93389892578125, 0.9774932861328125, 1.021087646484375, 1.0646820068359375, 1.1082763671875, 1.1518707275390625, 1.195465087890625, 1.2390594482421875, 1.28265380859375, 1.3262481689453125, 1.369842529296875, 1.4134368896484375, 1.45703125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 9.0, 6.0, 14.0, 13.0, 23.0, 41.0, 56.0, 85.0, 141.0, 193.0, 366.0, 502.0, 950.0, 1415.0, 2287.0, 3907.0, 6326.0, 10934.0, 19152.0, 35089.0, 65272.0, 129089.0, 248485.0, 248533.0, 128879.0, 65203.0, 34969.0, 19155.0, 11118.0, 6515.0, 3814.0, 2215.0, 1393.0, 877.0, 514.0, 383.0, 221.0, 138.0, 99.0, 59.0, 36.0, 29.0, 24.0, 10.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.182373046875, -0.17667388916015625, -0.1709747314453125, -0.16527557373046875, -0.159576416015625, -0.15387725830078125, -0.1481781005859375, -0.14247894287109375, -0.13677978515625, -0.13108062744140625, -0.1253814697265625, -0.11968231201171875, -0.113983154296875, -0.10828399658203125, -0.1025848388671875, -0.09688568115234375, -0.0911865234375, -0.08548736572265625, -0.0797882080078125, -0.07408905029296875, -0.068389892578125, -0.06269073486328125, -0.0569915771484375, -0.05129241943359375, -0.04559326171875, -0.03989410400390625, -0.0341949462890625, -0.02849578857421875, -0.022796630859375, -0.01709747314453125, -0.0113983154296875, -0.00569915771484375, 0.0, 0.00569915771484375, 0.0113983154296875, 0.01709747314453125, 0.022796630859375, 0.02849578857421875, 0.0341949462890625, 0.03989410400390625, 0.04559326171875, 0.05129241943359375, 0.0569915771484375, 0.06269073486328125, 0.068389892578125, 0.07408905029296875, 0.0797882080078125, 0.08548736572265625, 0.0911865234375, 0.09688568115234375, 0.1025848388671875, 0.10828399658203125, 0.113983154296875, 0.11968231201171875, 0.1253814697265625, 0.13108062744140625, 0.13677978515625, 0.14247894287109375, 0.1481781005859375, 0.15387725830078125, 0.159576416015625, 0.16527557373046875, 0.1709747314453125, 0.17667388916015625, 0.182373046875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 2.0, 5.0, 5.0, 5.0, 5.0, 4.0, 7.0, 6.0, 9.0, 12.0, 11.0, 21.0, 15.0, 15.0, 20.0, 20.0, 24.0, 24.0, 33.0, 36.0, 20.0, 45.0, 25.0, 32.0, 34.0, 33.0, 38.0, 1067.0, 32.0, 33.0, 33.0, 37.0, 30.0, 26.0, 22.0, 29.0, 25.0, 22.0, 20.0, 20.0, 28.0, 16.0, 11.0, 15.0, 14.0, 8.0, 12.0, 7.0, 5.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.69287109375, -0.6699142456054688, -0.6469573974609375, -0.6240005493164062, -0.601043701171875, -0.5780868530273438, -0.5551300048828125, -0.5321731567382812, -0.50921630859375, -0.48625946044921875, -0.4633026123046875, -0.44034576416015625, -0.417388916015625, -0.39443206787109375, -0.3714752197265625, -0.34851837158203125, -0.3255615234375, -0.30260467529296875, -0.2796478271484375, -0.25669097900390625, -0.233734130859375, -0.21077728271484375, -0.1878204345703125, -0.16486358642578125, -0.14190673828125, -0.11894989013671875, -0.0959930419921875, -0.07303619384765625, -0.050079345703125, -0.02712249755859375, -0.0041656494140625, 0.01879119873046875, 0.041748046875, 0.06470489501953125, 0.0876617431640625, 0.11061859130859375, 0.133575439453125, 0.15653228759765625, 0.1794891357421875, 0.20244598388671875, 0.22540283203125, 0.24835968017578125, 0.2713165283203125, 0.29427337646484375, 0.317230224609375, 0.34018707275390625, 0.3631439208984375, 0.38610076904296875, 0.4090576171875, 0.43201446533203125, 0.4549713134765625, 0.47792816162109375, 0.500885009765625, 0.5238418579101562, 0.5467987060546875, 0.5697555541992188, 0.59271240234375, 0.6156692504882812, 0.6386260986328125, 0.6615829467773438, 0.684539794921875, 0.7074966430664062, 0.7304534912109375, 0.7534103393554688, 0.7763671875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 12.0, 5.0, 24.0, 23.0, 37.0, 70.0, 108.0, 171.0, 261.0, 423.0, 604.0, 1117.0, 1773.0, 2849.0, 4900.0, 8457.0, 15187.0, 27707.0, 50495.0, 93891.0, 179794.0, 1318894.0, 181355.0, 94524.0, 50428.0, 27588.0, 15127.0, 8732.0, 5096.0, 2927.0, 1770.0, 1045.0, 656.0, 429.0, 239.0, 137.0, 99.0, 60.0, 41.0, 26.0, 14.0, 10.0, 11.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1348876953125, -0.13031578063964844, -0.12574386596679688, -0.12117195129394531, -0.11660003662109375, -0.11202812194824219, -0.10745620727539062, -0.10288429260253906, -0.0983123779296875, -0.09374046325683594, -0.08916854858398438, -0.08459663391113281, -0.08002471923828125, -0.07545280456542969, -0.07088088989257812, -0.06630897521972656, -0.061737060546875, -0.05716514587402344, -0.052593231201171875, -0.04802131652832031, -0.04344940185546875, -0.03887748718261719, -0.034305572509765625, -0.029733657836914062, -0.0251617431640625, -0.020589828491210938, -0.016017913818359375, -0.011445999145507812, -0.00687408447265625, -0.0023021697998046875, 0.002269744873046875, 0.0068416595458984375, 0.01141357421875, 0.015985488891601562, 0.020557403564453125, 0.025129318237304688, 0.02970123291015625, 0.03427314758300781, 0.038845062255859375, 0.04341697692871094, 0.0479888916015625, 0.05256080627441406, 0.057132720947265625, 0.06170463562011719, 0.06627655029296875, 0.07084846496582031, 0.07542037963867188, 0.07999229431152344, 0.084564208984375, 0.08913612365722656, 0.09370803833007812, 0.09827995300292969, 0.10285186767578125, 0.10742378234863281, 0.11199569702148438, 0.11656761169433594, 0.1211395263671875, 0.12571144104003906, 0.13028335571289062, 0.1348552703857422, 0.13942718505859375, 0.1439990997314453, 0.14857101440429688, 0.15314292907714844, 0.15771484375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 4.0, 5.0, 5.0, 5.0, 11.0, 19.0, 20.0, 23.0, 31.0, 45.0, 55.0, 62.0, 68.0, 78.0, 84.0, 75.0, 78.0, 56.0, 53.0, 50.0, 38.0, 41.0, 18.0, 15.0, 9.0, 10.0, 11.0, 3.0, 8.0, 5.0, 1.0, 1.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005235671997070312, -0.0005041211843490601, -0.00048467516899108887, -0.0004652291536331177, -0.0004457831382751465, -0.0004263371229171753, -0.0004068911075592041, -0.0003874450922012329, -0.0003679990768432617, -0.00034855306148529053, -0.00032910704612731934, -0.00030966103076934814, -0.00029021501541137695, -0.00027076900005340576, -0.00025132298469543457, -0.00023187696933746338, -0.0002124309539794922, -0.000192984938621521, -0.0001735389232635498, -0.0001540929079055786, -0.00013464689254760742, -0.00011520087718963623, -9.575486183166504e-05, -7.630884647369385e-05, -5.6862831115722656e-05, -3.7416815757751465e-05, -1.7970800399780273e-05, 1.475214958190918e-06, 2.092123031616211e-05, 4.03672456741333e-05, 5.981326103210449e-05, 7.925927639007568e-05, 9.870529174804688e-05, 0.00011815130710601807, 0.00013759732246398926, 0.00015704333782196045, 0.00017648935317993164, 0.00019593536853790283, 0.00021538138389587402, 0.00023482739925384521, 0.0002542734146118164, 0.0002737194299697876, 0.0002931654453277588, 0.00031261146068573, 0.00033205747604370117, 0.00035150349140167236, 0.00037094950675964355, 0.00039039552211761475, 0.00040984153747558594, 0.00042928755283355713, 0.0004487335681915283, 0.0004681795835494995, 0.0004876255989074707, 0.0005070716142654419, 0.0005265176296234131, 0.0005459636449813843, 0.0005654096603393555, 0.0005848556756973267, 0.0006043016910552979, 0.000623747706413269, 0.0006431937217712402, 0.0006626397371292114, 0.0006820857524871826, 0.0007015317678451538, 0.000720977783203125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 8.0, 11.0, 8.0, 17.0, 20.0, 18.0, 44.0, 50.0, 79.0, 103.0, 161.0, 281.0, 591.0, 4343.0, 1039524.0, 2126.0, 429.0, 260.0, 152.0, 88.0, 63.0, 55.0, 38.0, 16.0, 16.0, 14.0, 6.0, 5.0, 5.0, 4.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0174407958984375, -0.016986966133117676, -0.01653313636779785, -0.016079306602478027, -0.015625476837158203, -0.015171647071838379, -0.014717817306518555, -0.01426398754119873, -0.013810157775878906, -0.013356328010559082, -0.012902498245239258, -0.012448668479919434, -0.01199483871459961, -0.011541008949279785, -0.011087179183959961, -0.010633349418640137, -0.010179519653320312, -0.009725689888000488, -0.009271860122680664, -0.00881803035736084, -0.008364200592041016, -0.007910370826721191, -0.007456541061401367, -0.007002711296081543, -0.006548881530761719, -0.0060950517654418945, -0.00564122200012207, -0.005187392234802246, -0.004733562469482422, -0.004279732704162598, -0.0038259029388427734, -0.0033720731735229492, -0.002918243408203125, -0.0024644136428833008, -0.0020105838775634766, -0.0015567541122436523, -0.0011029243469238281, -0.0006490945816040039, -0.0001952648162841797, 0.00025856494903564453, 0.0007123947143554688, 0.001166224479675293, 0.0016200542449951172, 0.0020738840103149414, 0.0025277137756347656, 0.00298154354095459, 0.003435373306274414, 0.0038892030715942383, 0.0043430328369140625, 0.004796862602233887, 0.005250692367553711, 0.005704522132873535, 0.006158351898193359, 0.006612181663513184, 0.007066011428833008, 0.007519841194152832, 0.007973670959472656, 0.00842750072479248, 0.008881330490112305, 0.009335160255432129, 0.009788990020751953, 0.010242819786071777, 0.010696649551391602, 0.011150479316711426, 0.01160430908203125]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 23.0, 938.0, 57.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005855758674442768, -0.005739997606724501, -0.005624236539006233, -0.0055084750056266785, -0.005392713937908411, -0.005276952870190144, -0.005161191802471876, -0.005045430269092321, -0.004929669201374054, -0.0048139081336557865, -0.004698147065937519, -0.004582385532557964, -0.004466624464839697, -0.0043508633971214294, -0.004235102329403162, -0.004119340796023607, -0.00400357972830534, -0.0038878186605870724, -0.0037720573600381613, -0.003656296292319894, -0.0035405349917709827, -0.0034247739240527153, -0.003309012623503804, -0.0031932515557855368, -0.0030774904880672693, -0.002961729420349002, -0.002845968119800091, -0.0027302070520818233, -0.0026144457515329123, -0.002498684683814645, -0.0023829233832657337, -0.0022671623155474663, -0.002151401014998555, -0.0020356399472802877, -0.0019198786467313766, -0.0018041174625977874, -0.0016883562784641981, -0.0015725952107459307, -0.0014568339101970196, -0.0013410728424787521, -0.001225311541929841, -0.0011095503577962518, -0.0009937891736626625, -0.0008780279895290732, -0.000762266805395484, -0.0006465056794695556, -0.0005307444953359663, -0.0004149833112023771, -0.0002992221852764487, -0.00018346100114285946, -6.769983156118542e-05, 4.806133802048862e-05, 0.0001638225221540779, 0.0002795836771838367, 0.00039534486131742597, 0.0005111060454510152, 0.0006268672295846045, 0.0007426284137181938, 0.000858389597851783, 0.0009741507237777114, 0.0010899119079113007, 0.00120567309204489, 0.0013214342761784792, 0.0014371954603120685, 0.0015529566444456577]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 9.0, 13.0, 17.0, 13.0, 15.0, 14.0, 23.0, 31.0, 21.0, 38.0, 26.0, 26.0, 36.0, 56.0, 55.0, 52.0, 46.0, 47.0, 54.0, 52.0, 44.0, 25.0, 44.0, 34.0, 32.0, 28.0, 21.0, 19.0, 18.0, 13.0, 15.0, 11.0, 12.0, 9.0, 2.0, 9.0, 4.0, 7.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002983212471008301, -0.00028892606496810913, -0.0002795308828353882, -0.00027013570070266724, -0.0002607405185699463, -0.00025134533643722534, -0.0002419501543045044, -0.00023255497217178345, -0.0002231597900390625, -0.00021376460790634155, -0.0002043694257736206, -0.00019497424364089966, -0.0001855790615081787, -0.00017618387937545776, -0.00016678869724273682, -0.00015739351511001587, -0.00014799833297729492, -0.00013860315084457397, -0.00012920796871185303, -0.00011981278657913208, -0.00011041760444641113, -0.00010102242231369019, -9.162724018096924e-05, -8.223205804824829e-05, -7.283687591552734e-05, -6.34416937828064e-05, -5.404651165008545e-05, -4.46513295173645e-05, -3.5256147384643555e-05, -2.5860965251922607e-05, -1.646578311920166e-05, -7.070600986480713e-06, 2.3245811462402344e-06, 1.1719763278961182e-05, 2.111494541168213e-05, 3.0510127544403076e-05, 3.9905309677124023e-05, 4.930049180984497e-05, 5.869567394256592e-05, 6.809085607528687e-05, 7.748603820800781e-05, 8.688122034072876e-05, 9.627640247344971e-05, 0.00010567158460617065, 0.0001150667667388916, 0.00012446194887161255, 0.0001338571310043335, 0.00014325231313705444, 0.0001526474952697754, 0.00016204267740249634, 0.00017143785953521729, 0.00018083304166793823, 0.00019022822380065918, 0.00019962340593338013, 0.00020901858806610107, 0.00021841377019882202, 0.00022780895233154297, 0.00023720413446426392, 0.00024659931659698486, 0.0002559944987297058, 0.00026538968086242676, 0.0002747848629951477, 0.00028418004512786865, 0.0002935752272605896, 0.00030297040939331055]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 6.0, 6.0, 5.0, 13.0, 18.0, 19.0, 17.0, 22.0, 18.0, 33.0, 30.0, 28.0, 39.0, 43.0, 35.0, 38.0, 37.0, 53.0, 51.0, 39.0, 56.0, 41.0, 37.0, 48.0, 35.0, 27.0, 25.0, 34.0, 20.0, 22.0, 20.0, 18.0, 8.0, 7.0, 12.0, 14.0, 8.0, 9.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3330078125, -1.2894134521484375, -1.245819091796875, -1.2022247314453125, -1.15863037109375, -1.1150360107421875, -1.071441650390625, -1.0278472900390625, -0.9842529296875, -0.9406585693359375, -0.897064208984375, -0.8534698486328125, -0.80987548828125, -0.7662811279296875, -0.722686767578125, -0.6790924072265625, -0.635498046875, -0.5919036865234375, -0.548309326171875, -0.5047149658203125, -0.46112060546875, -0.4175262451171875, -0.373931884765625, -0.3303375244140625, -0.2867431640625, -0.2431488037109375, -0.199554443359375, -0.1559600830078125, -0.11236572265625, -0.0687713623046875, -0.025177001953125, 0.0184173583984375, 0.06201171875, 0.1056060791015625, 0.149200439453125, 0.1927947998046875, 0.23638916015625, 0.2799835205078125, 0.323577880859375, 0.3671722412109375, 0.4107666015625, 0.4543609619140625, 0.497955322265625, 0.5415496826171875, 0.58514404296875, 0.6287384033203125, 0.672332763671875, 0.7159271240234375, 0.759521484375, 0.8031158447265625, 0.846710205078125, 0.8903045654296875, 0.93389892578125, 0.9774932861328125, 1.021087646484375, 1.0646820068359375, 1.1082763671875, 1.1518707275390625, 1.195465087890625, 1.2390594482421875, 1.28265380859375, 1.3262481689453125, 1.369842529296875, 1.4134368896484375, 1.45703125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 7.0, 13.0, 15.0, 17.0, 31.0, 39.0, 69.0, 99.0, 128.0, 163.0, 259.0, 388.0, 622.0, 1147.0, 1974.0, 3485.0, 6780.0, 13542.0, 29863.0, 74622.0, 199490.0, 385026.0, 198367.0, 74057.0, 29613.0, 13525.0, 6661.0, 3666.0, 1895.0, 1104.0, 690.0, 389.0, 259.0, 174.0, 112.0, 77.0, 59.0, 38.0, 36.0, 19.0, 16.0, 7.0, 5.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5927734375, -1.546600341796875, -1.50042724609375, -1.454254150390625, -1.4080810546875, -1.361907958984375, -1.31573486328125, -1.269561767578125, -1.223388671875, -1.177215576171875, -1.13104248046875, -1.084869384765625, -1.0386962890625, -0.992523193359375, -0.94635009765625, -0.900177001953125, -0.85400390625, -0.807830810546875, -0.76165771484375, -0.715484619140625, -0.6693115234375, -0.623138427734375, -0.57696533203125, -0.530792236328125, -0.484619140625, -0.438446044921875, -0.39227294921875, -0.346099853515625, -0.2999267578125, -0.253753662109375, -0.20758056640625, -0.161407470703125, -0.115234375, -0.069061279296875, -0.02288818359375, 0.023284912109375, 0.0694580078125, 0.115631103515625, 0.16180419921875, 0.207977294921875, 0.254150390625, 0.300323486328125, 0.34649658203125, 0.392669677734375, 0.4388427734375, 0.485015869140625, 0.53118896484375, 0.577362060546875, 0.62353515625, 0.669708251953125, 0.71588134765625, 0.762054443359375, 0.8082275390625, 0.854400634765625, 0.90057373046875, 0.946746826171875, 0.992919921875, 1.039093017578125, 1.08526611328125, 1.131439208984375, 1.1776123046875, 1.223785400390625, 1.26995849609375, 1.316131591796875, 1.3623046875]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 5.0, 6.0, 9.0, 5.0, 15.0, 10.0, 17.0, 11.0, 15.0, 25.0, 32.0, 28.0, 37.0, 47.0, 38.0, 39.0, 44.0, 68.0, 103.0, 237.0, 1527.0, 234.0, 84.0, 55.0, 47.0, 35.0, 31.0, 32.0, 33.0, 30.0, 29.0, 26.0, 22.0, 23.0, 9.0, 9.0, 7.0, 8.0, 6.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.94140625, -4.7935791015625, -4.645751953125, -4.4979248046875, -4.35009765625, -4.2022705078125, -4.054443359375, -3.9066162109375, -3.7587890625, -3.6109619140625, -3.463134765625, -3.3153076171875, -3.16748046875, -3.0196533203125, -2.871826171875, -2.7239990234375, -2.576171875, -2.4283447265625, -2.280517578125, -2.1326904296875, -1.98486328125, -1.8370361328125, -1.689208984375, -1.5413818359375, -1.3935546875, -1.2457275390625, -1.097900390625, -0.9500732421875, -0.80224609375, -0.6544189453125, -0.506591796875, -0.3587646484375, -0.2109375, -0.0631103515625, 0.084716796875, 0.2325439453125, 0.38037109375, 0.5281982421875, 0.676025390625, 0.8238525390625, 0.9716796875, 1.1195068359375, 1.267333984375, 1.4151611328125, 1.56298828125, 1.7108154296875, 1.858642578125, 2.0064697265625, 2.154296875, 2.3021240234375, 2.449951171875, 2.5977783203125, 2.74560546875, 2.8934326171875, 3.041259765625, 3.1890869140625, 3.3369140625, 3.4847412109375, 3.632568359375, 3.7803955078125, 3.92822265625, 4.0760498046875, 4.223876953125, 4.3717041015625, 4.51953125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 7.0, 6.0, 3.0, 11.0, 10.0, 6.0, 16.0, 28.0, 30.0, 44.0, 30.0, 68.0, 61.0, 91.0, 164.0, 258.0, 629.0, 1960.0, 20424.0, 1930017.0, 1172163.0, 16590.0, 1699.0, 496.0, 274.0, 155.0, 106.0, 89.0, 59.0, 41.0, 38.0, 23.0, 23.0, 17.0, 16.0, 14.0, 8.0, 7.0, 8.0, 5.0, 3.0, 6.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3125, -8.060302734375, -7.80810546875, -7.555908203125, -7.3037109375, -7.051513671875, -6.79931640625, -6.547119140625, -6.294921875, -6.042724609375, -5.79052734375, -5.538330078125, -5.2861328125, -5.033935546875, -4.78173828125, -4.529541015625, -4.27734375, -4.025146484375, -3.77294921875, -3.520751953125, -3.2685546875, -3.016357421875, -2.76416015625, -2.511962890625, -2.259765625, -2.007568359375, -1.75537109375, -1.503173828125, -1.2509765625, -0.998779296875, -0.74658203125, -0.494384765625, -0.2421875, 0.010009765625, 0.26220703125, 0.514404296875, 0.7666015625, 1.018798828125, 1.27099609375, 1.523193359375, 1.775390625, 2.027587890625, 2.27978515625, 2.531982421875, 2.7841796875, 3.036376953125, 3.28857421875, 3.540771484375, 3.79296875, 4.045166015625, 4.29736328125, 4.549560546875, 4.8017578125, 5.053955078125, 5.30615234375, 5.558349609375, 5.810546875, 6.062744140625, 6.31494140625, 6.567138671875, 6.8193359375, 7.071533203125, 7.32373046875, 7.575927734375, 7.828125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 11.0, 69.0, 236.0, 379.0, 250.0, 62.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.540201187133789, -11.824516296386719, -11.108830451965332, -10.393145561218262, -9.677459716796875, -8.961774826049805, -8.246089935302734, -7.530404567718506, -6.814719200134277, -6.099033832550049, -5.38334846496582, -4.66766357421875, -3.9519782066345215, -3.236292839050293, -2.5206079483032227, -1.8049225807189941, -1.0892372131347656, -0.37355196475982666, 0.3421332836151123, 1.0578184127807617, 1.7735037803649902, 2.4891891479492188, 3.204874038696289, 3.9205594062805176, 4.636244773864746, 5.351930141448975, 6.067615509033203, 6.783300399780273, 7.498985767364502, 8.21467113494873, 8.9303560256958, 9.646041870117188, 10.36172866821289, 11.077413558959961, 11.793099403381348, 12.508784294128418, 13.224470138549805, 13.940155029296875, 14.655839920043945, 15.371524810791016, 16.08721160888672, 16.80289649963379, 17.51858139038086, 18.234268188476562, 18.949953079223633, 19.665637969970703, 20.381322860717773, 21.097007751464844, 21.812692642211914, 22.528377532958984, 23.244062423706055, 23.959747314453125, 24.675434112548828, 25.3911190032959, 26.10680389404297, 26.82248878479004, 27.53817367553711, 28.25385856628418, 28.96954345703125, 29.685230255126953, 30.400915145874023, 31.116600036621094, 31.832284927368164, 32.547969818115234, 33.26365661621094]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 8.0, 4.0, 6.0, 8.0, 11.0, 18.0, 7.0, 15.0, 21.0, 24.0, 37.0, 26.0, 25.0, 33.0, 34.0, 39.0, 35.0, 42.0, 47.0, 30.0, 50.0, 38.0, 43.0, 46.0, 39.0, 37.0, 37.0, 27.0, 22.0, 25.0, 23.0, 27.0, 12.0, 23.0, 10.0, 14.0, 15.0, 13.0, 6.0, 12.0, 5.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-16.035961151123047, -15.573179244995117, -15.110397338867188, -14.647616386413574, -14.184834480285645, -13.722052574157715, -13.259271621704102, -12.796489715576172, -12.333707809448242, -11.870925903320312, -11.408143997192383, -10.94536304473877, -10.48258113861084, -10.01979923248291, -9.557018280029297, -9.094236373901367, -8.631454467773438, -8.168672561645508, -7.705891132354736, -7.243109703063965, -6.780327796936035, -6.3175458908081055, -5.854764461517334, -5.3919830322265625, -4.929201126098633, -4.466419219970703, -4.003637790679932, -3.540856122970581, -3.0780744552612305, -2.61529278755188, -2.1525111198425293, -1.6897294521331787, -1.2269477844238281, -0.7641661167144775, -0.30138444900512695, 0.16139721870422363, 0.6241788864135742, 1.0869605541229248, 1.5497422218322754, 2.012523889541626, 2.4753055572509766, 2.938087224960327, 3.4008688926696777, 3.8636505603790283, 4.326432228088379, 4.789214134216309, 5.25199556350708, 5.714776992797852, 6.177558898925781, 6.640340805053711, 7.103122234344482, 7.565903663635254, 8.028685569763184, 8.491467475891113, 8.954248428344727, 9.417030334472656, 9.879812240600586, 10.342594146728516, 10.805376052856445, 11.268157005310059, 11.730938911437988, 12.193720817565918, 12.656501770019531, 13.119283676147461, 13.58206558227539]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 4.0, 4.0, 6.0, 11.0, 11.0, 9.0, 12.0, 19.0, 20.0, 19.0, 23.0, 32.0, 27.0, 23.0, 35.0, 40.0, 36.0, 32.0, 44.0, 56.0, 38.0, 57.0, 45.0, 43.0, 49.0, 39.0, 28.0, 32.0, 34.0, 24.0, 24.0, 28.0, 19.0, 13.0, 14.0, 14.0, 9.0, 13.0, 7.0, 8.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4287109375, -1.382354736328125, -1.33599853515625, -1.289642333984375, -1.2432861328125, -1.196929931640625, -1.15057373046875, -1.104217529296875, -1.057861328125, -1.011505126953125, -0.96514892578125, -0.918792724609375, -0.8724365234375, -0.826080322265625, -0.77972412109375, -0.733367919921875, -0.68701171875, -0.640655517578125, -0.59429931640625, -0.547943115234375, -0.5015869140625, -0.455230712890625, -0.40887451171875, -0.362518310546875, -0.316162109375, -0.269805908203125, -0.22344970703125, -0.177093505859375, -0.1307373046875, -0.084381103515625, -0.03802490234375, 0.008331298828125, 0.0546875, 0.101043701171875, 0.14739990234375, 0.193756103515625, 0.2401123046875, 0.286468505859375, 0.33282470703125, 0.379180908203125, 0.425537109375, 0.471893310546875, 0.51824951171875, 0.564605712890625, 0.6109619140625, 0.657318115234375, 0.70367431640625, 0.750030517578125, 0.79638671875, 0.842742919921875, 0.88909912109375, 0.935455322265625, 0.9818115234375, 1.028167724609375, 1.07452392578125, 1.120880126953125, 1.167236328125, 1.213592529296875, 1.25994873046875, 1.306304931640625, 1.3526611328125, 1.399017333984375, 1.44537353515625, 1.491729736328125, 1.5380859375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 11.0, 8.0, 12.0, 13.0, 12.0, 15.0, 14.0, 16.0, 21.0, 28.0, 30.0, 31.0, 37.0, 82.0, 156.0, 480.0, 1818.0, 12125.0, 193414.0, 3238021.0, 713958.0, 29248.0, 3424.0, 693.0, 212.0, 93.0, 60.0, 42.0, 26.0, 25.0, 28.0, 25.0, 18.0, 22.0, 14.0, 7.0, 11.0, 7.0, 5.0, 4.0, 2.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1796875, -5.984619140625, -5.78955078125, -5.594482421875, -5.3994140625, -5.204345703125, -5.00927734375, -4.814208984375, -4.619140625, -4.424072265625, -4.22900390625, -4.033935546875, -3.8388671875, -3.643798828125, -3.44873046875, -3.253662109375, -3.05859375, -2.863525390625, -2.66845703125, -2.473388671875, -2.2783203125, -2.083251953125, -1.88818359375, -1.693115234375, -1.498046875, -1.302978515625, -1.10791015625, -0.912841796875, -0.7177734375, -0.522705078125, -0.32763671875, -0.132568359375, 0.0625, 0.257568359375, 0.45263671875, 0.647705078125, 0.8427734375, 1.037841796875, 1.23291015625, 1.427978515625, 1.623046875, 1.818115234375, 2.01318359375, 2.208251953125, 2.4033203125, 2.598388671875, 2.79345703125, 2.988525390625, 3.18359375, 3.378662109375, 3.57373046875, 3.768798828125, 3.9638671875, 4.158935546875, 4.35400390625, 4.549072265625, 4.744140625, 4.939208984375, 5.13427734375, 5.329345703125, 5.5244140625, 5.719482421875, 5.91455078125, 6.109619140625, 6.3046875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 3.0, 2.0, 7.0, 6.0, 14.0, 20.0, 18.0, 30.0, 39.0, 53.0, 79.0, 117.0, 145.0, 238.0, 275.0, 403.0, 505.0, 459.0, 437.0, 332.0, 257.0, 188.0, 108.0, 95.0, 69.0, 40.0, 26.0, 32.0, 20.0, 18.0, 8.0, 9.0, 6.0, 10.0, 1.0, 3.0, 6.0, 0.0, 0.0, 1.0], "bins": [-5.4375, -5.305511474609375, -5.17352294921875, -5.041534423828125, -4.9095458984375, -4.777557373046875, -4.64556884765625, -4.513580322265625, -4.381591796875, -4.249603271484375, -4.11761474609375, -3.985626220703125, -3.8536376953125, -3.721649169921875, -3.58966064453125, -3.457672119140625, -3.32568359375, -3.193695068359375, -3.06170654296875, -2.929718017578125, -2.7977294921875, -2.665740966796875, -2.53375244140625, -2.401763916015625, -2.269775390625, -2.137786865234375, -2.00579833984375, -1.873809814453125, -1.7418212890625, -1.609832763671875, -1.47784423828125, -1.345855712890625, -1.2138671875, -1.081878662109375, -0.94989013671875, -0.817901611328125, -0.6859130859375, -0.553924560546875, -0.42193603515625, -0.289947509765625, -0.157958984375, -0.025970458984375, 0.10601806640625, 0.238006591796875, 0.3699951171875, 0.501983642578125, 0.63397216796875, 0.765960693359375, 0.89794921875, 1.029937744140625, 1.16192626953125, 1.293914794921875, 1.4259033203125, 1.557891845703125, 1.68988037109375, 1.821868896484375, 1.953857421875, 2.085845947265625, 2.21783447265625, 2.349822998046875, 2.4818115234375, 2.613800048828125, 2.74578857421875, 2.877777099609375, 3.009765625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 8.0, 8.0, 17.0, 15.0, 32.0, 33.0, 44.0, 65.0, 88.0, 160.0, 226.0, 389.0, 903.0, 2610.0, 11670.0, 106132.0, 1723480.0, 2188735.0, 140675.0, 14057.0, 2878.0, 989.0, 408.0, 223.0, 118.0, 89.0, 68.0, 51.0, 27.0, 27.0, 13.0, 11.0, 10.0, 5.0, 3.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2890625, -6.027587890625, -5.76611328125, -5.504638671875, -5.2431640625, -4.981689453125, -4.72021484375, -4.458740234375, -4.197265625, -3.935791015625, -3.67431640625, -3.412841796875, -3.1513671875, -2.889892578125, -2.62841796875, -2.366943359375, -2.10546875, -1.843994140625, -1.58251953125, -1.321044921875, -1.0595703125, -0.798095703125, -0.53662109375, -0.275146484375, -0.013671875, 0.247802734375, 0.50927734375, 0.770751953125, 1.0322265625, 1.293701171875, 1.55517578125, 1.816650390625, 2.078125, 2.339599609375, 2.60107421875, 2.862548828125, 3.1240234375, 3.385498046875, 3.64697265625, 3.908447265625, 4.169921875, 4.431396484375, 4.69287109375, 4.954345703125, 5.2158203125, 5.477294921875, 5.73876953125, 6.000244140625, 6.26171875, 6.523193359375, 6.78466796875, 7.046142578125, 7.3076171875, 7.569091796875, 7.83056640625, 8.092041015625, 8.353515625, 8.614990234375, 8.87646484375, 9.137939453125, 9.3994140625, 9.660888671875, 9.92236328125, 10.183837890625, 10.4453125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 19.0, 25.0, 40.0, 74.0, 74.0, 101.0, 111.0, 142.0, 113.0, 101.0, 77.0, 53.0, 35.0, 19.0, 9.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.354969024658203, -28.734386444091797, -28.113805770874023, -27.493223190307617, -26.87264060974121, -26.252059936523438, -25.63147735595703, -25.010894775390625, -24.39031219482422, -23.769729614257812, -23.14914894104004, -22.528566360473633, -21.907983779907227, -21.287403106689453, -20.666820526123047, -20.04623794555664, -19.425657272338867, -18.80507469177246, -18.184494018554688, -17.56391143798828, -16.943328857421875, -16.32274627685547, -15.702165603637695, -15.081583023071289, -14.4610013961792, -13.84041976928711, -13.219837188720703, -12.599255561828613, -11.978673934936523, -11.358091354370117, -10.737509727478027, -10.116928100585938, -9.496347427368164, -8.875765800476074, -8.255183219909668, -7.634601593017578, -7.01401948928833, -6.393437385559082, -5.772855758666992, -5.152273654937744, -4.531691551208496, -3.911109447479248, -3.290527582168579, -2.66994571685791, -2.049363613128662, -1.428781509399414, -0.8081996440887451, -0.18761777877807617, 0.4329643249511719, 1.0535463094711304, 1.6741282939910889, 2.294710159301758, 2.915292263031006, 3.535874366760254, 4.156455993652344, 4.777038097381592, 5.39762020111084, 6.018202304840088, 6.638784408569336, 7.259366035461426, 7.879948139190674, 8.500530242919922, 9.121111869812012, 9.741693496704102, 10.362276077270508]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 4.0, 4.0, 2.0, 3.0, 10.0, 14.0, 12.0, 13.0, 16.0, 15.0, 26.0, 15.0, 24.0, 25.0, 27.0, 22.0, 28.0, 29.0, 34.0, 34.0, 41.0, 42.0, 38.0, 40.0, 40.0, 39.0, 42.0, 40.0, 36.0, 35.0, 29.0, 24.0, 18.0, 24.0, 13.0, 18.0, 23.0, 24.0, 13.0, 13.0, 8.0, 11.0, 9.0, 8.0, 6.0, 4.0, 4.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-12.049810409545898, -11.677988052368164, -11.30616569519043, -10.934343338012695, -10.562520980834961, -10.19069766998291, -9.818875312805176, -9.447052955627441, -9.075230598449707, -8.703408241271973, -8.331585884094238, -7.959763050079346, -7.587940692901611, -7.216118335723877, -6.844295501708984, -6.47247314453125, -6.100650787353516, -5.728828430175781, -5.357006072998047, -4.985183238983154, -4.61336088180542, -4.2415385246276855, -3.869715929031372, -3.4978933334350586, -3.126070976257324, -2.75424861907959, -2.3824260234832764, -2.010603427886963, -1.6387810707092285, -1.2669585943222046, -0.8951361179351807, -0.5233135223388672, -0.1514911651611328, 0.2203313112258911, 0.592153787612915, 0.963976263999939, 1.335798740386963, 1.7076212167739868, 2.0794436931610107, 2.451266288757324, 2.8230886459350586, 3.194911003112793, 3.5667335987091064, 3.93855619430542, 4.310378551483154, 4.682200908660889, 5.054023742675781, 5.425846099853516, 5.79766845703125, 6.169490814208984, 6.541313171386719, 6.913136005401611, 7.284958362579346, 7.65678071975708, 8.028603553771973, 8.400425910949707, 8.772248268127441, 9.144070625305176, 9.51589298248291, 9.887715339660645, 10.259538650512695, 10.63136100769043, 11.003183364868164, 11.375005722045898, 11.746828079223633]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 6.0, 5.0, 8.0, 12.0, 9.0, 18.0, 17.0, 13.0, 22.0, 13.0, 15.0, 20.0, 29.0, 27.0, 30.0, 29.0, 40.0, 55.0, 46.0, 49.0, 35.0, 38.0, 42.0, 41.0, 45.0, 32.0, 34.0, 44.0, 29.0, 19.0, 33.0, 20.0, 20.0, 12.0, 15.0, 22.0, 14.0, 6.0, 8.0, 9.0, 5.0, 9.0, 0.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2734375, -1.2295379638671875, -1.185638427734375, -1.1417388916015625, -1.09783935546875, -1.0539398193359375, -1.010040283203125, -0.9661407470703125, -0.9222412109375, -0.8783416748046875, -0.834442138671875, -0.7905426025390625, -0.74664306640625, -0.7027435302734375, -0.658843994140625, -0.6149444580078125, -0.571044921875, -0.5271453857421875, -0.483245849609375, -0.4393463134765625, -0.39544677734375, -0.3515472412109375, -0.307647705078125, -0.2637481689453125, -0.2198486328125, -0.1759490966796875, -0.132049560546875, -0.0881500244140625, -0.04425048828125, -0.0003509521484375, 0.043548583984375, 0.0874481201171875, 0.13134765625, 0.1752471923828125, 0.219146728515625, 0.2630462646484375, 0.30694580078125, 0.3508453369140625, 0.394744873046875, 0.4386444091796875, 0.4825439453125, 0.5264434814453125, 0.570343017578125, 0.6142425537109375, 0.65814208984375, 0.7020416259765625, 0.745941162109375, 0.7898406982421875, 0.833740234375, 0.8776397705078125, 0.921539306640625, 0.9654388427734375, 1.00933837890625, 1.0532379150390625, 1.097137451171875, 1.1410369873046875, 1.1849365234375, 1.2288360595703125, 1.272735595703125, 1.3166351318359375, 1.36053466796875, 1.4044342041015625, 1.448333740234375, 1.4922332763671875, 1.5361328125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 5.0, 6.0, 16.0, 15.0, 24.0, 41.0, 37.0, 56.0, 80.0, 115.0, 184.0, 225.0, 329.0, 469.0, 693.0, 1090.0, 1443.0, 2195.0, 3370.0, 5029.0, 7819.0, 12330.0, 19972.0, 32768.0, 56516.0, 99313.0, 175462.0, 242434.0, 161135.0, 91178.0, 51909.0, 30280.0, 18697.0, 11440.0, 7393.0, 4728.0, 3123.0, 2133.0, 1360.0, 965.0, 664.0, 477.0, 308.0, 214.0, 147.0, 111.0, 71.0, 73.0, 27.0, 26.0, 19.0, 14.0, 10.0, 11.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.166259765625, -0.1607952117919922, -0.15533065795898438, -0.14986610412597656, -0.14440155029296875, -0.13893699645996094, -0.13347244262695312, -0.1280078887939453, -0.1225433349609375, -0.11707878112792969, -0.11161422729492188, -0.10614967346191406, -0.10068511962890625, -0.09522056579589844, -0.08975601196289062, -0.08429145812988281, -0.078826904296875, -0.07336235046386719, -0.06789779663085938, -0.06243324279785156, -0.05696868896484375, -0.05150413513183594, -0.046039581298828125, -0.04057502746582031, -0.0351104736328125, -0.029645919799804688, -0.024181365966796875, -0.018716812133789062, -0.01325225830078125, -0.0077877044677734375, -0.002323150634765625, 0.0031414031982421875, 0.00860595703125, 0.014070510864257812, 0.019535064697265625, 0.024999618530273438, 0.03046417236328125, 0.03592872619628906, 0.041393280029296875, 0.04685783386230469, 0.0523223876953125, 0.05778694152832031, 0.06325149536132812, 0.06871604919433594, 0.07418060302734375, 0.07964515686035156, 0.08510971069335938, 0.09057426452636719, 0.096038818359375, 0.10150337219238281, 0.10696792602539062, 0.11243247985839844, 0.11789703369140625, 0.12336158752441406, 0.12882614135742188, 0.1342906951904297, 0.1397552490234375, 0.1452198028564453, 0.15068435668945312, 0.15614891052246094, 0.16161346435546875, 0.16707801818847656, 0.17254257202148438, 0.1780071258544922, 0.1834716796875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 9.0, 3.0, 5.0, 8.0, 6.0, 7.0, 12.0, 8.0, 17.0, 12.0, 20.0, 19.0, 21.0, 29.0, 28.0, 18.0, 24.0, 36.0, 30.0, 54.0, 41.0, 48.0, 38.0, 1064.0, 39.0, 36.0, 35.0, 31.0, 37.0, 32.0, 25.0, 30.0, 40.0, 26.0, 22.0, 14.0, 13.0, 13.0, 21.0, 17.0, 7.0, 7.0, 7.0, 5.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86083984375, -0.8330841064453125, -0.805328369140625, -0.7775726318359375, -0.74981689453125, -0.7220611572265625, -0.694305419921875, -0.6665496826171875, -0.6387939453125, -0.6110382080078125, -0.583282470703125, -0.5555267333984375, -0.52777099609375, -0.5000152587890625, -0.472259521484375, -0.4445037841796875, -0.416748046875, -0.3889923095703125, -0.361236572265625, -0.3334808349609375, -0.30572509765625, -0.2779693603515625, -0.250213623046875, -0.2224578857421875, -0.1947021484375, -0.1669464111328125, -0.139190673828125, -0.1114349365234375, -0.08367919921875, -0.0559234619140625, -0.028167724609375, -0.0004119873046875, 0.02734375, 0.0550994873046875, 0.082855224609375, 0.1106109619140625, 0.13836669921875, 0.1661224365234375, 0.193878173828125, 0.2216339111328125, 0.2493896484375, 0.2771453857421875, 0.304901123046875, 0.3326568603515625, 0.36041259765625, 0.3881683349609375, 0.415924072265625, 0.4436798095703125, 0.471435546875, 0.4991912841796875, 0.526947021484375, 0.5547027587890625, 0.58245849609375, 0.6102142333984375, 0.637969970703125, 0.6657257080078125, 0.6934814453125, 0.7212371826171875, 0.748992919921875, 0.7767486572265625, 0.80450439453125, 0.8322601318359375, 0.860015869140625, 0.8877716064453125, 0.91552734375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 7.0, 4.0, 7.0, 18.0, 22.0, 27.0, 49.0, 83.0, 110.0, 153.0, 240.0, 393.0, 585.0, 915.0, 1418.0, 2117.0, 3363.0, 5253.0, 8449.0, 14075.0, 22840.0, 38911.0, 67453.0, 122172.0, 230333.0, 1262001.0, 134550.0, 73876.0, 42468.0, 25419.0, 14965.0, 9328.0, 5536.0, 3633.0, 2210.0, 1426.0, 915.0, 610.0, 409.0, 255.0, 166.0, 133.0, 63.0, 61.0, 45.0, 31.0, 15.0, 11.0, 6.0, 6.0, 1.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1375732421875, -0.13299942016601562, -0.12842559814453125, -0.12385177612304688, -0.1192779541015625, -0.11470413208007812, -0.11013031005859375, -0.10555648803710938, -0.100982666015625, -0.09640884399414062, -0.09183502197265625, -0.08726119995117188, -0.0826873779296875, -0.07811355590820312, -0.07353973388671875, -0.06896591186523438, -0.06439208984375, -0.059818267822265625, -0.05524444580078125, -0.050670623779296875, -0.0460968017578125, -0.041522979736328125, -0.03694915771484375, -0.032375335693359375, -0.027801513671875, -0.023227691650390625, -0.01865386962890625, -0.014080047607421875, -0.0095062255859375, -0.004932403564453125, -0.00035858154296875, 0.004215240478515625, 0.0087890625, 0.013362884521484375, 0.01793670654296875, 0.022510528564453125, 0.0270843505859375, 0.031658172607421875, 0.03623199462890625, 0.040805816650390625, 0.045379638671875, 0.049953460693359375, 0.05452728271484375, 0.059101104736328125, 0.0636749267578125, 0.06824874877929688, 0.07282257080078125, 0.07739639282226562, 0.08197021484375, 0.08654403686523438, 0.09111785888671875, 0.09569168090820312, 0.1002655029296875, 0.10483932495117188, 0.10941314697265625, 0.11398696899414062, 0.118560791015625, 0.12313461303710938, 0.12770843505859375, 0.13228225708007812, 0.1368560791015625, 0.14142990112304688, 0.14600372314453125, 0.15057754516601562, 0.1551513671875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 6.0, 3.0, 5.0, 5.0, 1.0, 4.0, 13.0, 12.0, 13.0, 19.0, 34.0, 40.0, 56.0, 56.0, 64.0, 64.0, 61.0, 87.0, 87.0, 75.0, 62.0, 42.0, 46.0, 32.0, 21.0, 19.0, 19.0, 9.0, 10.0, 8.0, 11.0, 6.0, 3.0, 4.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007195472717285156, -0.0006979405879974365, -0.0006763339042663574, -0.0006547272205352783, -0.0006331205368041992, -0.0006115138530731201, -0.000589907169342041, -0.0005683004856109619, -0.0005466938018798828, -0.0005250871181488037, -0.0005034804344177246, -0.0004818737506866455, -0.0004602670669555664, -0.0004386603832244873, -0.0004170536994934082, -0.0003954470157623291, -0.00037384033203125, -0.0003522336483001709, -0.0003306269645690918, -0.0003090202808380127, -0.0002874135971069336, -0.0002658069133758545, -0.0002442002296447754, -0.0002225935459136963, -0.0002009868621826172, -0.00017938017845153809, -0.00015777349472045898, -0.00013616681098937988, -0.00011456012725830078, -9.295344352722168e-05, -7.134675979614258e-05, -4.9740076065063477e-05, -2.8133392333984375e-05, -6.5267086029052734e-06, 1.5079975128173828e-05, 3.668665885925293e-05, 5.829334259033203e-05, 7.990002632141113e-05, 0.00010150671005249023, 0.00012311339378356934, 0.00014472007751464844, 0.00016632676124572754, 0.00018793344497680664, 0.00020954012870788574, 0.00023114681243896484, 0.00025275349617004395, 0.00027436017990112305, 0.00029596686363220215, 0.00031757354736328125, 0.00033918023109436035, 0.00036078691482543945, 0.00038239359855651855, 0.00040400028228759766, 0.00042560696601867676, 0.00044721364974975586, 0.00046882033348083496, 0.0004904270172119141, 0.0005120337009429932, 0.0005336403846740723, 0.0005552470684051514, 0.0005768537521362305, 0.0005984604358673096, 0.0006200671195983887, 0.0006416738033294678, 0.0006632804870605469]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 4.0, 3.0, 10.0, 6.0, 6.0, 9.0, 15.0, 15.0, 27.0, 31.0, 52.0, 53.0, 95.0, 113.0, 174.0, 353.0, 665.0, 6337.0, 1028132.0, 10690.0, 712.0, 327.0, 220.0, 160.0, 102.0, 58.0, 51.0, 28.0, 24.0, 24.0, 15.0, 11.0, 4.0, 9.0, 7.0, 6.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01235198974609375, -0.011919260025024414, -0.011486530303955078, -0.011053800582885742, -0.010621070861816406, -0.01018834114074707, -0.009755611419677734, -0.009322881698608398, -0.008890151977539062, -0.008457422256469727, -0.00802469253540039, -0.007591962814331055, -0.007159233093261719, -0.006726503372192383, -0.006293773651123047, -0.005861043930053711, -0.005428314208984375, -0.004995584487915039, -0.004562854766845703, -0.004130125045776367, -0.0036973953247070312, -0.0032646656036376953, -0.0028319358825683594, -0.0023992061614990234, -0.0019664764404296875, -0.0015337467193603516, -0.0011010169982910156, -0.0006682872772216797, -0.00023555755615234375, 0.0001971721649169922, 0.0006299018859863281, 0.001062631607055664, 0.001495361328125, 0.001928091049194336, 0.002360820770263672, 0.002793550491333008, 0.0032262802124023438, 0.0036590099334716797, 0.004091739654541016, 0.0045244693756103516, 0.0049571990966796875, 0.0053899288177490234, 0.005822658538818359, 0.006255388259887695, 0.006688117980957031, 0.007120847702026367, 0.007553577423095703, 0.007986307144165039, 0.008419036865234375, 0.008851766586303711, 0.009284496307373047, 0.009717226028442383, 0.010149955749511719, 0.010582685470581055, 0.01101541519165039, 0.011448144912719727, 0.011880874633789062, 0.012313604354858398, 0.012746334075927734, 0.01317906379699707, 0.013611793518066406, 0.014044523239135742, 0.014477252960205078, 0.014909982681274414, 0.01534271240234375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 59.0, 825.0, 133.0], "bins": [-0.007198513485491276, -0.007083520758897066, -0.0069685280323028564, -0.006853535771369934, -0.006738543044775724, -0.006623550318181515, -0.006508557591587305, -0.006393564864993095, -0.006278572138398886, -0.006163579411804676, -0.006048586685210466, -0.005933593958616257, -0.005818601697683334, -0.005703608971089125, -0.005588616244494915, -0.005473623517900705, -0.005358631256967783, -0.005243638530373573, -0.005128645803779364, -0.005013653077185154, -0.004898660816252232, -0.004783668089658022, -0.004668675363063812, -0.004553682636469603, -0.004438689909875393, -0.004323697183281183, -0.004208704456686974, -0.004093712195754051, -0.0039787194691598415, -0.003863726742565632, -0.003748734015971422, -0.0036337412893772125, -0.0035187487956136465, -0.003403756069019437, -0.003288763575255871, -0.003173770848661661, -0.0030587781220674515, -0.0029437856283038855, -0.002828792901709676, -0.0027138004079461098, -0.0025988076813519, -0.0024838149547576904, -0.0023688224609941244, -0.0022538297343999147, -0.002138837007805705, -0.002023844514042139, -0.0019088517874479294, -0.0017938591772690415, -0.0016788664506748319, -0.001563873840495944, -0.0014488811139017344, -0.0013338885037228465, -0.0012188958935439587, -0.001103903166949749, -0.0009889105567708611, -0.0008739179465919733, -0.0007589252199977636, -0.0006439325516112149, -0.000528939941432327, -0.0004139472730457783, -0.00029895463376306, -0.00018396199448034167, -6.896932609379292e-05, 4.602328408509493e-05, 0.00016101592336781323]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 4.0, 5.0, 8.0, 8.0, 11.0, 13.0, 20.0, 19.0, 26.0, 15.0, 30.0, 18.0, 35.0, 33.0, 33.0, 49.0, 42.0, 40.0, 31.0, 39.0, 42.0, 47.0, 36.0, 45.0, 30.0, 32.0, 27.0, 26.0, 24.0, 23.0, 15.0, 24.0, 28.0, 17.0, 13.0, 14.0, 10.0, 8.0, 14.0, 4.0, 7.0, 10.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0002689361572265625, -0.0002603195607662201, -0.0002517029643058777, -0.00024308636784553528, -0.00023446977138519287, -0.00022585317492485046, -0.00021723657846450806, -0.00020861998200416565, -0.00020000338554382324, -0.00019138678908348083, -0.00018277019262313843, -0.00017415359616279602, -0.0001655369997024536, -0.0001569204032421112, -0.0001483038067817688, -0.0001396872103214264, -0.00013107061386108398, -0.00012245401740074158, -0.00011383742094039917, -0.00010522082448005676, -9.660422801971436e-05, -8.798763155937195e-05, -7.937103509902954e-05, -7.075443863868713e-05, -6.213784217834473e-05, -5.352124571800232e-05, -4.490464925765991e-05, -3.6288052797317505e-05, -2.7671456336975098e-05, -1.905485987663269e-05, -1.0438263416290283e-05, -1.821666955947876e-06, 6.794929504394531e-06, 1.541152596473694e-05, 2.4028122425079346e-05, 3.264471888542175e-05, 4.126131534576416e-05, 4.987791180610657e-05, 5.8494508266448975e-05, 6.711110472679138e-05, 7.572770118713379e-05, 8.43442976474762e-05, 9.29608941078186e-05, 0.00010157749056816101, 0.00011019408702850342, 0.00011881068348884583, 0.00012742727994918823, 0.00013604387640953064, 0.00014466047286987305, 0.00015327706933021545, 0.00016189366579055786, 0.00017051026225090027, 0.00017912685871124268, 0.00018774345517158508, 0.0001963600516319275, 0.0002049766480922699, 0.0002135932445526123, 0.0002222098410129547, 0.00023082643747329712, 0.00023944303393363953, 0.00024805963039398193, 0.00025667622685432434, 0.00026529282331466675, 0.00027390941977500916, 0.00028252601623535156]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 6.0, 5.0, 8.0, 12.0, 9.0, 18.0, 17.0, 13.0, 22.0, 13.0, 15.0, 20.0, 29.0, 27.0, 30.0, 29.0, 40.0, 55.0, 46.0, 49.0, 35.0, 38.0, 42.0, 41.0, 45.0, 32.0, 34.0, 44.0, 29.0, 19.0, 33.0, 20.0, 20.0, 12.0, 15.0, 22.0, 14.0, 6.0, 8.0, 9.0, 5.0, 9.0, 0.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2734375, -1.2295379638671875, -1.185638427734375, -1.1417388916015625, -1.09783935546875, -1.0539398193359375, -1.010040283203125, -0.9661407470703125, -0.9222412109375, -0.8783416748046875, -0.834442138671875, -0.7905426025390625, -0.74664306640625, -0.7027435302734375, -0.658843994140625, -0.6149444580078125, -0.571044921875, -0.5271453857421875, -0.483245849609375, -0.4393463134765625, -0.39544677734375, -0.3515472412109375, -0.307647705078125, -0.2637481689453125, -0.2198486328125, -0.1759490966796875, -0.132049560546875, -0.0881500244140625, -0.04425048828125, -0.0003509521484375, 0.043548583984375, 0.0874481201171875, 0.13134765625, 0.1752471923828125, 0.219146728515625, 0.2630462646484375, 0.30694580078125, 0.3508453369140625, 0.394744873046875, 0.4386444091796875, 0.4825439453125, 0.5264434814453125, 0.570343017578125, 0.6142425537109375, 0.65814208984375, 0.7020416259765625, 0.745941162109375, 0.7898406982421875, 0.833740234375, 0.8776397705078125, 0.921539306640625, 0.9654388427734375, 1.00933837890625, 1.0532379150390625, 1.097137451171875, 1.1410369873046875, 1.1849365234375, 1.2288360595703125, 1.272735595703125, 1.3166351318359375, 1.36053466796875, 1.4044342041015625, 1.448333740234375, 1.4922332763671875, 1.5361328125]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 1.0, 5.0, 8.0, 8.0, 8.0, 15.0, 27.0, 30.0, 39.0, 48.0, 60.0, 105.0, 132.0, 195.0, 258.0, 371.0, 612.0, 1136.0, 2231.0, 5395.0, 14458.0, 47683.0, 193239.0, 480379.0, 220517.0, 54144.0, 15921.0, 5957.0, 2447.0, 1144.0, 640.0, 398.0, 279.0, 167.0, 126.0, 89.0, 80.0, 57.0, 39.0, 26.0, 21.0, 15.0, 11.0, 16.0, 8.0, 1.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-1.7939453125, -1.7332305908203125, -1.672515869140625, -1.6118011474609375, -1.55108642578125, -1.4903717041015625, -1.429656982421875, -1.3689422607421875, -1.3082275390625, -1.2475128173828125, -1.186798095703125, -1.1260833740234375, -1.06536865234375, -1.0046539306640625, -0.943939208984375, -0.8832244873046875, -0.822509765625, -0.7617950439453125, -0.701080322265625, -0.6403656005859375, -0.57965087890625, -0.5189361572265625, -0.458221435546875, -0.3975067138671875, -0.3367919921875, -0.2760772705078125, -0.215362548828125, -0.1546478271484375, -0.09393310546875, -0.0332183837890625, 0.027496337890625, 0.0882110595703125, 0.14892578125, 0.2096405029296875, 0.270355224609375, 0.3310699462890625, 0.39178466796875, 0.4524993896484375, 0.513214111328125, 0.5739288330078125, 0.6346435546875, 0.6953582763671875, 0.756072998046875, 0.8167877197265625, 0.87750244140625, 0.9382171630859375, 0.998931884765625, 1.0596466064453125, 1.120361328125, 1.1810760498046875, 1.241790771484375, 1.3025054931640625, 1.36322021484375, 1.4239349365234375, 1.484649658203125, 1.5453643798828125, 1.6060791015625, 1.6667938232421875, 1.727508544921875, 1.7882232666015625, 1.84893798828125, 1.9096527099609375, 1.970367431640625, 2.0310821533203125, 2.091796875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 4.0, 9.0, 7.0, 5.0, 5.0, 13.0, 10.0, 14.0, 9.0, 12.0, 19.0, 20.0, 27.0, 22.0, 28.0, 36.0, 27.0, 40.0, 49.0, 50.0, 74.0, 120.0, 330.0, 1438.0, 159.0, 77.0, 70.0, 49.0, 39.0, 30.0, 28.0, 33.0, 20.0, 23.0, 22.0, 18.0, 13.0, 16.0, 12.0, 15.0, 12.0, 11.0, 11.0, 3.0, 6.0, 0.0, 2.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0], "bins": [-4.78515625, -4.6451416015625, -4.505126953125, -4.3651123046875, -4.22509765625, -4.0850830078125, -3.945068359375, -3.8050537109375, -3.6650390625, -3.5250244140625, -3.385009765625, -3.2449951171875, -3.10498046875, -2.9649658203125, -2.824951171875, -2.6849365234375, -2.544921875, -2.4049072265625, -2.264892578125, -2.1248779296875, -1.98486328125, -1.8448486328125, -1.704833984375, -1.5648193359375, -1.4248046875, -1.2847900390625, -1.144775390625, -1.0047607421875, -0.86474609375, -0.7247314453125, -0.584716796875, -0.4447021484375, -0.3046875, -0.1646728515625, -0.024658203125, 0.1153564453125, 0.25537109375, 0.3953857421875, 0.535400390625, 0.6754150390625, 0.8154296875, 0.9554443359375, 1.095458984375, 1.2354736328125, 1.37548828125, 1.5155029296875, 1.655517578125, 1.7955322265625, 1.935546875, 2.0755615234375, 2.215576171875, 2.3555908203125, 2.49560546875, 2.6356201171875, 2.775634765625, 2.9156494140625, 3.0556640625, 3.1956787109375, 3.335693359375, 3.4757080078125, 3.61572265625, 3.7557373046875, 3.895751953125, 4.0357666015625, 4.17578125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 6.0, 7.0, 7.0, 12.0, 17.0, 19.0, 26.0, 31.0, 31.0, 51.0, 51.0, 77.0, 119.0, 194.0, 380.0, 934.0, 4317.0, 98276.0, 2980788.0, 55237.0, 3370.0, 782.0, 329.0, 173.0, 125.0, 78.0, 52.0, 46.0, 32.0, 29.0, 20.0, 18.0, 12.0, 16.0, 14.0, 5.0, 8.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.8515625, -8.5699462890625, -8.288330078125, -8.0067138671875, -7.72509765625, -7.4434814453125, -7.161865234375, -6.8802490234375, -6.5986328125, -6.3170166015625, -6.035400390625, -5.7537841796875, -5.47216796875, -5.1905517578125, -4.908935546875, -4.6273193359375, -4.345703125, -4.0640869140625, -3.782470703125, -3.5008544921875, -3.21923828125, -2.9376220703125, -2.656005859375, -2.3743896484375, -2.0927734375, -1.8111572265625, -1.529541015625, -1.2479248046875, -0.96630859375, -0.6846923828125, -0.403076171875, -0.1214599609375, 0.16015625, 0.4417724609375, 0.723388671875, 1.0050048828125, 1.28662109375, 1.5682373046875, 1.849853515625, 2.1314697265625, 2.4130859375, 2.6947021484375, 2.976318359375, 3.2579345703125, 3.53955078125, 3.8211669921875, 4.102783203125, 4.3843994140625, 4.666015625, 4.9476318359375, 5.229248046875, 5.5108642578125, 5.79248046875, 6.0740966796875, 6.355712890625, 6.6373291015625, 6.9189453125, 7.2005615234375, 7.482177734375, 7.7637939453125, 8.04541015625, 8.3270263671875, 8.608642578125, 8.8902587890625, 9.171875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [3.0, 5.0, 31.0, 211.0, 485.0, 233.0, 45.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.144052982330322, -3.2300913333892822, -2.316129684448242, -1.4021680355072021, -0.4882063865661621, 0.42575502395629883, 1.339716911315918, 2.253678798675537, 3.167640209197998, 4.081602096557617, 4.995563507080078, 5.909524917602539, 6.823486804962158, 7.737448215484619, 8.651410102844238, 9.565372467041016, 10.479333877563477, 11.393295288085938, 12.307256698608398, 13.221219062805176, 14.135180473327637, 15.049141883850098, 15.963104248046875, 16.877065658569336, 17.791027069091797, 18.704988479614258, 19.61894989013672, 20.53291130065918, 21.44687271118164, 22.360836029052734, 23.274797439575195, 24.188758850097656, 25.102718353271484, 26.016679763793945, 26.930641174316406, 27.844602584838867, 28.758563995361328, 29.672527313232422, 30.586488723754883, 31.500450134277344, 32.41441345214844, 33.32837677001953, 34.24233627319336, 35.15629959106445, 36.07025909423828, 36.984222412109375, 37.8981819152832, 38.8121452331543, 39.726104736328125, 40.64006805419922, 41.55402755737305, 42.46799087524414, 43.38195037841797, 44.29591369628906, 45.20987319946289, 46.123836517333984, 47.03779602050781, 47.951759338378906, 48.865718841552734, 49.77968215942383, 50.693641662597656, 51.60760498046875, 52.52156448364258, 53.43552780151367, 54.349491119384766]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 7.0, 10.0, 13.0, 4.0, 9.0, 10.0, 16.0, 15.0, 18.0, 16.0, 23.0, 23.0, 23.0, 21.0, 20.0, 31.0, 32.0, 27.0, 35.0, 39.0, 31.0, 34.0, 41.0, 44.0, 34.0, 28.0, 30.0, 31.0, 39.0, 35.0, 31.0, 26.0, 25.0, 30.0, 20.0, 16.0, 23.0, 11.0, 8.0, 14.0, 11.0, 10.0, 11.0, 3.0, 8.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0], "bins": [-14.873390197753906, -14.422867774963379, -13.972346305847168, -13.52182388305664, -13.071301460266113, -12.620779037475586, -12.170257568359375, -11.719735145568848, -11.26921272277832, -10.818690299987793, -10.368168830871582, -9.917646408081055, -9.467123985290527, -9.0166015625, -8.566080093383789, -8.115557670593262, -7.665035724639893, -7.214513778686523, -6.763991355895996, -6.313469409942627, -5.8629469871521, -5.4124250411987305, -4.961902618408203, -4.511380672454834, -4.060858726501465, -3.6103365421295166, -3.1598143577575684, -2.709292411804199, -2.258769989013672, -1.8082480430603027, -1.3577258586883545, -0.9072036743164062, -0.4566812515258789, -0.006159096956253052, 0.4443630576133728, 0.8948851823806763, 1.3454073667526245, 1.7959294319152832, 2.2464516162872314, 2.6969738006591797, 3.147495985031128, 3.598018169403076, 4.048540115356445, 4.499062538146973, 4.949584484100342, 5.400106430053711, 5.850628852844238, 6.301151275634766, 6.751673221588135, 7.202195167541504, 7.652717590332031, 8.103240013122559, 8.55376148223877, 9.004283905029297, 9.454806327819824, 9.905328750610352, 10.355850219726562, 10.80637264251709, 11.2568941116333, 11.707416534423828, 12.157938957214355, 12.608461380004883, 13.058982849121094, 13.509505271911621, 13.960027694702148]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 6.0, 2.0, 5.0, 14.0, 9.0, 9.0, 14.0, 16.0, 18.0, 10.0, 14.0, 15.0, 27.0, 21.0, 21.0, 32.0, 38.0, 34.0, 34.0, 33.0, 50.0, 51.0, 45.0, 42.0, 35.0, 43.0, 31.0, 37.0, 42.0, 30.0, 32.0, 31.0, 22.0, 26.0, 18.0, 15.0, 14.0, 9.0, 12.0, 12.0, 7.0, 7.0, 6.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.33203125, -1.28704833984375, -1.2420654296875, -1.19708251953125, -1.152099609375, -1.10711669921875, -1.0621337890625, -1.01715087890625, -0.97216796875, -0.92718505859375, -0.8822021484375, -0.83721923828125, -0.792236328125, -0.74725341796875, -0.7022705078125, -0.65728759765625, -0.6123046875, -0.56732177734375, -0.5223388671875, -0.47735595703125, -0.432373046875, -0.38739013671875, -0.3424072265625, -0.29742431640625, -0.25244140625, -0.20745849609375, -0.1624755859375, -0.11749267578125, -0.072509765625, -0.02752685546875, 0.0174560546875, 0.06243896484375, 0.107421875, 0.15240478515625, 0.1973876953125, 0.24237060546875, 0.287353515625, 0.33233642578125, 0.3773193359375, 0.42230224609375, 0.46728515625, 0.51226806640625, 0.5572509765625, 0.60223388671875, 0.647216796875, 0.69219970703125, 0.7371826171875, 0.78216552734375, 0.8271484375, 0.87213134765625, 0.9171142578125, 0.96209716796875, 1.007080078125, 1.05206298828125, 1.0970458984375, 1.14202880859375, 1.18701171875, 1.23199462890625, 1.2769775390625, 1.32196044921875, 1.366943359375, 1.41192626953125, 1.4569091796875, 1.50189208984375, 1.546875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 7.0, 2.0, 7.0, 10.0, 14.0, 12.0, 17.0, 15.0, 29.0, 30.0, 47.0, 75.0, 117.0, 209.0, 514.0, 1385.0, 4384.0, 16195.0, 75600.0, 517653.0, 2254480.0, 1125309.0, 157741.0, 29269.0, 7370.0, 2261.0, 783.0, 311.0, 137.0, 91.0, 56.0, 32.0, 21.0, 17.0, 19.0, 15.0, 16.0, 14.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.060546875, -2.95391845703125, -2.8472900390625, -2.74066162109375, -2.634033203125, -2.52740478515625, -2.4207763671875, -2.31414794921875, -2.20751953125, -2.10089111328125, -1.9942626953125, -1.88763427734375, -1.781005859375, -1.67437744140625, -1.5677490234375, -1.46112060546875, -1.3544921875, -1.24786376953125, -1.1412353515625, -1.03460693359375, -0.927978515625, -0.82135009765625, -0.7147216796875, -0.60809326171875, -0.50146484375, -0.39483642578125, -0.2882080078125, -0.18157958984375, -0.074951171875, 0.03167724609375, 0.1383056640625, 0.24493408203125, 0.3515625, 0.45819091796875, 0.5648193359375, 0.67144775390625, 0.778076171875, 0.88470458984375, 0.9913330078125, 1.09796142578125, 1.20458984375, 1.31121826171875, 1.4178466796875, 1.52447509765625, 1.631103515625, 1.73773193359375, 1.8443603515625, 1.95098876953125, 2.0576171875, 2.16424560546875, 2.2708740234375, 2.37750244140625, 2.484130859375, 2.59075927734375, 2.6973876953125, 2.80401611328125, 2.91064453125, 3.01727294921875, 3.1239013671875, 3.23052978515625, 3.337158203125, 3.44378662109375, 3.5504150390625, 3.65704345703125, 3.763671875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 4.0, 2.0, 7.0, 5.0, 8.0, 14.0, 15.0, 26.0, 35.0, 37.0, 53.0, 79.0, 99.0, 118.0, 154.0, 233.0, 263.0, 359.0, 431.0, 412.0, 353.0, 340.0, 244.0, 189.0, 137.0, 107.0, 82.0, 53.0, 61.0, 35.0, 27.0, 32.0, 25.0, 10.0, 7.0, 7.0, 5.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.548828125, -3.43157958984375, -3.3143310546875, -3.19708251953125, -3.079833984375, -2.96258544921875, -2.8453369140625, -2.72808837890625, -2.61083984375, -2.49359130859375, -2.3763427734375, -2.25909423828125, -2.141845703125, -2.02459716796875, -1.9073486328125, -1.79010009765625, -1.6728515625, -1.55560302734375, -1.4383544921875, -1.32110595703125, -1.203857421875, -1.08660888671875, -0.9693603515625, -0.85211181640625, -0.73486328125, -0.61761474609375, -0.5003662109375, -0.38311767578125, -0.265869140625, -0.14862060546875, -0.0313720703125, 0.08587646484375, 0.203125, 0.32037353515625, 0.4376220703125, 0.55487060546875, 0.672119140625, 0.78936767578125, 0.9066162109375, 1.02386474609375, 1.14111328125, 1.25836181640625, 1.3756103515625, 1.49285888671875, 1.610107421875, 1.72735595703125, 1.8446044921875, 1.96185302734375, 2.0791015625, 2.19635009765625, 2.3135986328125, 2.43084716796875, 2.548095703125, 2.66534423828125, 2.7825927734375, 2.89984130859375, 3.01708984375, 3.13433837890625, 3.2515869140625, 3.36883544921875, 3.486083984375, 3.60333251953125, 3.7205810546875, 3.83782958984375, 3.955078125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 8.0, 11.0, 31.0, 33.0, 72.0, 168.0, 389.0, 1566.0, 16975.0, 768467.0, 3313250.0, 88018.0, 4119.0, 726.0, 237.0, 111.0, 44.0, 27.0, 13.0, 11.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0], "bins": [-18.515625, -18.11517333984375, -17.7147216796875, -17.31427001953125, -16.913818359375, -16.51336669921875, -16.1129150390625, -15.71246337890625, -15.31201171875, -14.91156005859375, -14.5111083984375, -14.11065673828125, -13.710205078125, -13.30975341796875, -12.9093017578125, -12.50885009765625, -12.1083984375, -11.70794677734375, -11.3074951171875, -10.90704345703125, -10.506591796875, -10.10614013671875, -9.7056884765625, -9.30523681640625, -8.90478515625, -8.50433349609375, -8.1038818359375, -7.70343017578125, -7.302978515625, -6.90252685546875, -6.5020751953125, -6.10162353515625, -5.701171875, -5.30072021484375, -4.9002685546875, -4.49981689453125, -4.099365234375, -3.69891357421875, -3.2984619140625, -2.89801025390625, -2.49755859375, -2.09710693359375, -1.6966552734375, -1.29620361328125, -0.895751953125, -0.49530029296875, -0.0948486328125, 0.30560302734375, 0.7060546875, 1.10650634765625, 1.5069580078125, 1.90740966796875, 2.307861328125, 2.70831298828125, 3.1087646484375, 3.50921630859375, 3.90966796875, 4.31011962890625, 4.7105712890625, 5.11102294921875, 5.511474609375, 5.91192626953125, 6.3123779296875, 6.71282958984375, 7.11328125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 20.0, 38.0, 61.0, 93.0, 159.0, 182.0, 176.0, 122.0, 77.0, 49.0, 19.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.47494888305664, -39.52104949951172, -38.56714630126953, -37.61324691772461, -36.65934371948242, -35.7054443359375, -34.75154113769531, -33.79764175415039, -32.84374237060547, -31.889841079711914, -30.93593978881836, -29.982040405273438, -29.028139114379883, -28.074237823486328, -27.120336532592773, -26.16643524169922, -25.212533950805664, -24.25863265991211, -23.304731369018555, -22.350830078125, -21.396930694580078, -20.443029403686523, -19.48912811279297, -18.535226821899414, -17.58132553100586, -16.627424240112305, -15.673523902893066, -14.719622611999512, -13.765722274780273, -12.811820983886719, -11.857919692993164, -10.90401840209961, -9.950117111206055, -8.9962158203125, -8.042315483093262, -7.088414192199707, -6.1345133781433105, -5.180612564086914, -4.226711273193359, -3.272810459136963, -2.3189096450805664, -1.3650087118148804, -0.41110777854919434, 0.5427932739257812, 1.4966940879821777, 2.450594902038574, 3.404496192932129, 4.358397006988525, 5.312297821044922, 6.266198635101318, 7.220099449157715, 8.17400074005127, 9.127901077270508, 10.081802368164062, 11.035703659057617, 11.989604949951172, 12.94350528717041, 13.897406578063965, 14.851306915283203, 15.805208206176758, 16.759109497070312, 17.713008880615234, 18.666912078857422, 19.620811462402344, 20.5747127532959]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 10.0, 5.0, 8.0, 5.0, 5.0, 14.0, 13.0, 13.0, 12.0, 25.0, 21.0, 18.0, 20.0, 21.0, 31.0, 25.0, 30.0, 31.0, 35.0, 45.0, 29.0, 37.0, 41.0, 43.0, 43.0, 39.0, 32.0, 31.0, 35.0, 27.0, 27.0, 27.0, 32.0, 32.0, 23.0, 21.0, 18.0, 19.0, 16.0, 7.0, 9.0, 8.0, 3.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0], "bins": [-12.98921012878418, -12.58332633972168, -12.177443504333496, -11.771559715270996, -11.365676879882812, -10.959793090820312, -10.553909301757812, -10.148026466369629, -9.742143630981445, -9.336259841918945, -8.930377006530762, -8.524493217468262, -8.118610382080078, -7.712726593017578, -7.306843280792236, -6.9009599685668945, -6.4950761795043945, -6.089192867279053, -5.683309555053711, -5.277425765991211, -4.871542930603027, -4.465659141540527, -4.0597758293151855, -3.6538925170898438, -3.248009204864502, -2.84212589263916, -2.4362425804138184, -2.0303590297698975, -1.6244757175445557, -1.2185924053192139, -0.812708854675293, -0.40682554244995117, -0.000942230224609375, 0.4049411416053772, 0.8108245134353638, 1.2167079448699951, 1.622591257095337, 2.0284745693206787, 2.4343581199645996, 2.8402414321899414, 3.246124744415283, 3.652008056640625, 4.057891368865967, 4.463774681091309, 4.869658470153809, 5.275541305541992, 5.681425094604492, 6.087308406829834, 6.493191719055176, 6.899075031280518, 7.304958343505859, 7.710842132568359, 8.116724967956543, 8.522608757019043, 8.928491592407227, 9.334375381469727, 9.740259170532227, 10.146142959594727, 10.55202579498291, 10.95790958404541, 11.363792419433594, 11.769676208496094, 12.175559997558594, 12.581442832946777, 12.987325668334961]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 10.0, 2.0, 4.0, 12.0, 12.0, 14.0, 12.0, 19.0, 19.0, 19.0, 23.0, 14.0, 32.0, 29.0, 40.0, 39.0, 25.0, 49.0, 41.0, 51.0, 36.0, 38.0, 36.0, 37.0, 36.0, 44.0, 33.0, 37.0, 33.0, 42.0, 22.0, 23.0, 17.0, 18.0, 11.0, 12.0, 10.0, 9.0, 10.0, 9.0, 3.0, 4.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5322265625, -1.4853363037109375, -1.438446044921875, -1.3915557861328125, -1.34466552734375, -1.2977752685546875, -1.250885009765625, -1.2039947509765625, -1.1571044921875, -1.1102142333984375, -1.063323974609375, -1.0164337158203125, -0.96954345703125, -0.9226531982421875, -0.875762939453125, -0.8288726806640625, -0.781982421875, -0.7350921630859375, -0.688201904296875, -0.6413116455078125, -0.59442138671875, -0.5475311279296875, -0.500640869140625, -0.4537506103515625, -0.4068603515625, -0.3599700927734375, -0.313079833984375, -0.2661895751953125, -0.21929931640625, -0.1724090576171875, -0.125518798828125, -0.0786285400390625, -0.03173828125, 0.0151519775390625, 0.062042236328125, 0.1089324951171875, 0.15582275390625, 0.2027130126953125, 0.249603271484375, 0.2964935302734375, 0.3433837890625, 0.3902740478515625, 0.437164306640625, 0.4840545654296875, 0.53094482421875, 0.5778350830078125, 0.624725341796875, 0.6716156005859375, 0.718505859375, 0.7653961181640625, 0.812286376953125, 0.8591766357421875, 0.90606689453125, 0.9529571533203125, 0.999847412109375, 1.0467376708984375, 1.0936279296875, 1.1405181884765625, 1.187408447265625, 1.2342987060546875, 1.28118896484375, 1.3280792236328125, 1.374969482421875, 1.4218597412109375, 1.46875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 8.0, 9.0, 12.0, 16.0, 14.0, 19.0, 25.0, 47.0, 72.0, 100.0, 134.0, 248.0, 275.0, 431.0, 527.0, 849.0, 1217.0, 1769.0, 2623.0, 3923.0, 5699.0, 8573.0, 13125.0, 20907.0, 33252.0, 55572.0, 96692.0, 173062.0, 234694.0, 161654.0, 91091.0, 52600.0, 31396.0, 19741.0, 12683.0, 8287.0, 5569.0, 3606.0, 2439.0, 1754.0, 1159.0, 809.0, 556.0, 366.0, 266.0, 220.0, 146.0, 95.0, 71.0, 42.0, 42.0, 18.0, 19.0, 13.0, 10.0, 11.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.1795654296875, -0.17385482788085938, -0.16814422607421875, -0.16243362426757812, -0.1567230224609375, -0.15101242065429688, -0.14530181884765625, -0.13959121704101562, -0.133880615234375, -0.12817001342773438, -0.12245941162109375, -0.11674880981445312, -0.1110382080078125, -0.10532760620117188, -0.09961700439453125, -0.09390640258789062, -0.08819580078125, -0.08248519897460938, -0.07677459716796875, -0.07106399536132812, -0.0653533935546875, -0.059642791748046875, -0.05393218994140625, -0.048221588134765625, -0.042510986328125, -0.036800384521484375, -0.03108978271484375, -0.025379180908203125, -0.0196685791015625, -0.013957977294921875, -0.00824737548828125, -0.002536773681640625, 0.003173828125, 0.008884429931640625, 0.01459503173828125, 0.020305633544921875, 0.0260162353515625, 0.031726837158203125, 0.03743743896484375, 0.043148040771484375, 0.048858642578125, 0.054569244384765625, 0.06027984619140625, 0.06599044799804688, 0.0717010498046875, 0.07741165161132812, 0.08312225341796875, 0.08883285522460938, 0.09454345703125, 0.10025405883789062, 0.10596466064453125, 0.11167526245117188, 0.1173858642578125, 0.12309646606445312, 0.12880706787109375, 0.13451766967773438, 0.140228271484375, 0.14593887329101562, 0.15164947509765625, 0.15736007690429688, 0.1630706787109375, 0.16878128051757812, 0.17449188232421875, 0.18020248413085938, 0.1859130859375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 4.0, 3.0, 6.0, 6.0, 12.0, 10.0, 13.0, 15.0, 15.0, 16.0, 28.0, 18.0, 31.0, 33.0, 37.0, 38.0, 33.0, 39.0, 36.0, 33.0, 48.0, 1057.0, 42.0, 34.0, 35.0, 32.0, 29.0, 35.0, 31.0, 21.0, 23.0, 28.0, 32.0, 19.0, 21.0, 19.0, 15.0, 9.0, 12.0, 6.0, 7.0, 8.0, 9.0, 8.0, 3.0, 1.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.89599609375, -0.8679733276367188, -0.8399505615234375, -0.8119277954101562, -0.783905029296875, -0.7558822631835938, -0.7278594970703125, -0.6998367309570312, -0.67181396484375, -0.6437911987304688, -0.6157684326171875, -0.5877456665039062, -0.559722900390625, -0.5317001342773438, -0.5036773681640625, -0.47565460205078125, -0.4476318359375, -0.41960906982421875, -0.3915863037109375, -0.36356353759765625, -0.335540771484375, -0.30751800537109375, -0.2794952392578125, -0.25147247314453125, -0.22344970703125, -0.19542694091796875, -0.1674041748046875, -0.13938140869140625, -0.111358642578125, -0.08333587646484375, -0.0553131103515625, -0.02729034423828125, 0.000732421875, 0.02875518798828125, 0.0567779541015625, 0.08480072021484375, 0.112823486328125, 0.14084625244140625, 0.1688690185546875, 0.19689178466796875, 0.22491455078125, 0.25293731689453125, 0.2809600830078125, 0.30898284912109375, 0.337005615234375, 0.36502838134765625, 0.3930511474609375, 0.42107391357421875, 0.4490966796875, 0.47711944580078125, 0.5051422119140625, 0.5331649780273438, 0.561187744140625, 0.5892105102539062, 0.6172332763671875, 0.6452560424804688, 0.67327880859375, 0.7013015747070312, 0.7293243408203125, 0.7573471069335938, 0.785369873046875, 0.8133926391601562, 0.8414154052734375, 0.8694381713867188, 0.8974609375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 13.0, 13.0, 28.0, 35.0, 42.0, 63.0, 115.0, 146.0, 223.0, 331.0, 456.0, 746.0, 1070.0, 1657.0, 2500.0, 3789.0, 5844.0, 9139.0, 14025.0, 22658.0, 36649.0, 61013.0, 103994.0, 176672.0, 1269919.0, 155068.0, 90264.0, 53379.0, 32201.0, 19736.0, 12219.0, 7871.0, 5125.0, 3354.0, 2220.0, 1408.0, 994.0, 679.0, 475.0, 355.0, 225.0, 132.0, 92.0, 58.0, 52.0, 43.0, 20.0, 8.0, 6.0, 2.0, 4.0, 3.0, 6.0, 0.0, 0.0, 1.0], "bins": [-0.145751953125, -0.1412487030029297, -0.13674545288085938, -0.13224220275878906, -0.12773895263671875, -0.12323570251464844, -0.11873245239257812, -0.11422920227050781, -0.1097259521484375, -0.10522270202636719, -0.10071945190429688, -0.09621620178222656, -0.09171295166015625, -0.08720970153808594, -0.08270645141601562, -0.07820320129394531, -0.073699951171875, -0.06919670104980469, -0.06469345092773438, -0.06019020080566406, -0.05568695068359375, -0.05118370056152344, -0.046680450439453125, -0.04217720031738281, -0.0376739501953125, -0.03317070007324219, -0.028667449951171875, -0.024164199829101562, -0.01966094970703125, -0.015157699584960938, -0.010654449462890625, -0.0061511993408203125, -0.00164794921875, 0.0028553009033203125, 0.007358551025390625, 0.011861801147460938, 0.01636505126953125, 0.020868301391601562, 0.025371551513671875, 0.029874801635742188, 0.0343780517578125, 0.03888130187988281, 0.043384552001953125, 0.04788780212402344, 0.05239105224609375, 0.05689430236816406, 0.061397552490234375, 0.06590080261230469, 0.070404052734375, 0.07490730285644531, 0.07941055297851562, 0.08391380310058594, 0.08841705322265625, 0.09292030334472656, 0.09742355346679688, 0.10192680358886719, 0.1064300537109375, 0.11093330383300781, 0.11543655395507812, 0.11993980407714844, 0.12444305419921875, 0.12894630432128906, 0.13344955444335938, 0.1379528045654297, 0.1424560546875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 7.0, 5.0, 7.0, 4.0, 8.0, 4.0, 7.0, 6.0, 12.0, 14.0, 9.0, 12.0, 24.0, 20.0, 33.0, 38.0, 40.0, 56.0, 49.0, 63.0, 61.0, 59.0, 50.0, 62.0, 46.0, 35.0, 55.0, 32.0, 27.0, 24.0, 19.0, 18.0, 16.0, 16.0, 13.0, 10.0, 7.0, 5.0, 5.0, 3.0, 3.0, 3.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0005083084106445312, -0.0004926994442939758, -0.0004770904779434204, -0.000461481511592865, -0.00044587254524230957, -0.00043026357889175415, -0.00041465461254119873, -0.0003990456461906433, -0.0003834366798400879, -0.00036782771348953247, -0.00035221874713897705, -0.00033660978078842163, -0.0003210008144378662, -0.0003053918480873108, -0.00028978288173675537, -0.00027417391538619995, -0.00025856494903564453, -0.0002429559826850891, -0.0002273470163345337, -0.00021173804998397827, -0.00019612908363342285, -0.00018052011728286743, -0.000164911150932312, -0.0001493021845817566, -0.00013369321823120117, -0.00011808425188064575, -0.00010247528553009033, -8.686631917953491e-05, -7.125735282897949e-05, -5.564838647842407e-05, -4.003942012786865e-05, -2.4430453777313232e-05, -8.821487426757812e-06, 6.787478923797607e-06, 2.2396445274353027e-05, 3.800541162490845e-05, 5.361437797546387e-05, 6.922334432601929e-05, 8.483231067657471e-05, 0.00010044127702713013, 0.00011605024337768555, 0.00013165920972824097, 0.0001472681760787964, 0.0001628771424293518, 0.00017848610877990723, 0.00019409507513046265, 0.00020970404148101807, 0.00022531300783157349, 0.0002409219741821289, 0.0002565309405326843, 0.00027213990688323975, 0.00028774887323379517, 0.0003033578395843506, 0.000318966805934906, 0.0003345757722854614, 0.00035018473863601685, 0.00036579370498657227, 0.0003814026713371277, 0.0003970116376876831, 0.0004126206040382385, 0.00042822957038879395, 0.00044383853673934937, 0.0004594475030899048, 0.0004750564694404602, 0.0004906654357910156]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 4.0, 5.0, 4.0, 5.0, 4.0, 10.0, 20.0, 17.0, 37.0, 36.0, 45.0, 83.0, 143.0, 219.0, 470.0, 1595.0, 882784.0, 161042.0, 1024.0, 388.0, 217.0, 131.0, 73.0, 44.0, 37.0, 19.0, 15.0, 14.0, 11.0, 11.0, 4.0, 8.0, 4.0, 5.0, 6.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01273345947265625, -0.01229238510131836, -0.011851310729980469, -0.011410236358642578, -0.010969161987304688, -0.010528087615966797, -0.010087013244628906, -0.009645938873291016, -0.009204864501953125, -0.008763790130615234, -0.008322715759277344, -0.007881641387939453, -0.0074405670166015625, -0.006999492645263672, -0.006558418273925781, -0.006117343902587891, -0.00567626953125, -0.005235195159912109, -0.004794120788574219, -0.004353046417236328, -0.0039119720458984375, -0.003470897674560547, -0.0030298233032226562, -0.0025887489318847656, -0.002147674560546875, -0.0017066001892089844, -0.0012655258178710938, -0.0008244514465332031, -0.0003833770751953125, 5.7697296142578125e-05, 0.0004987716674804688, 0.0009398460388183594, 0.00138092041015625, 0.0018219947814941406, 0.0022630691528320312, 0.002704143524169922, 0.0031452178955078125, 0.003586292266845703, 0.004027366638183594, 0.004468441009521484, 0.004909515380859375, 0.005350589752197266, 0.005791664123535156, 0.006232738494873047, 0.0066738128662109375, 0.007114887237548828, 0.007555961608886719, 0.00799703598022461, 0.0084381103515625, 0.00887918472290039, 0.009320259094238281, 0.009761333465576172, 0.010202407836914062, 0.010643482208251953, 0.011084556579589844, 0.011525630950927734, 0.011966705322265625, 0.012407779693603516, 0.012848854064941406, 0.013289928436279297, 0.013731002807617188, 0.014172077178955078, 0.014613151550292969, 0.01505422592163086, 0.01549530029296875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 20.0, 404.0, 551.0, 41.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0037929017562419176, -0.003706950694322586, -0.003620999399572611, -0.0035350483376532793, -0.003449097042903304, -0.0033631459809839725, -0.0032771946862339973, -0.003191243624314666, -0.0031052925623953342, -0.0030193415004760027, -0.0029333902057260275, -0.002847439143806696, -0.0027614878490567207, -0.002675536787137389, -0.0025895857252180576, -0.0025036344304680824, -0.0024176831357181072, -0.0023317320737987757, -0.0022457807790488005, -0.002159829717129469, -0.0020738784223794937, -0.001987927360460162, -0.0019019761821255088, -0.0018160250037908554, -0.001730073825456202, -0.0016441226471215487, -0.0015581714687868953, -0.001472220290452242, -0.0013862692285329103, -0.0013003179337829351, -0.0012143668718636036, -0.0011284156935289502, -0.0010424646316096187, -0.0009565134532749653, -0.0008705622749403119, -0.0007846111548133194, -0.0006986599764786661, -0.0006127087981440127, -0.0005267576780170202, -0.00044080649968236685, -0.00035485532134771347, -0.0002689041430130601, -0.00018295299378223717, -9.700184455141425e-05, -1.1050666216760874e-05, 7.49005121178925e-05, 0.00016085163224488497, 0.00024680281057953835, 0.0003327539889141917, 0.0004187051672488451, 0.0005046563455834985, 0.0005906074657104909, 0.0006765586440451443, 0.0007625098223797977, 0.0008484609425067902, 0.0009344121208414435, 0.001020363299176097, 0.0011063144775107503, 0.0011922656558454037, 0.0012782167177647352, 0.0013641680125147104, 0.001450119074434042, 0.0015360702527686954, 0.0016220214311033487, 0.0017079726094380021]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 1.0, 4.0, 4.0, 8.0, 8.0, 14.0, 5.0, 14.0, 14.0, 16.0, 18.0, 22.0, 32.0, 34.0, 30.0, 23.0, 32.0, 41.0, 32.0, 46.0, 48.0, 49.0, 33.0, 47.0, 41.0, 42.0, 38.0, 42.0, 32.0, 30.0, 31.0, 25.0, 18.0, 19.0, 15.0, 21.0, 10.0, 13.0, 15.0, 9.0, 6.0, 6.0, 4.0, 2.0, 1.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00027120113372802734, -0.0002622026950120926, -0.00025320425629615784, -0.0002442058175802231, -0.00023520737886428833, -0.00022620894014835358, -0.00021721050143241882, -0.00020821206271648407, -0.00019921362400054932, -0.00019021518528461456, -0.0001812167465686798, -0.00017221830785274506, -0.0001632198691368103, -0.00015422143042087555, -0.0001452229917049408, -0.00013622455298900604, -0.0001272261142730713, -0.00011822767555713654, -0.00010922923684120178, -0.00010023079812526703, -9.123235940933228e-05, -8.223392069339752e-05, -7.323548197746277e-05, -6.423704326152802e-05, -5.523860454559326e-05, -4.624016582965851e-05, -3.7241727113723755e-05, -2.8243288397789e-05, -1.9244849681854248e-05, -1.0246410965919495e-05, -1.2479722499847412e-06, 7.750466465950012e-06, 1.6748905181884766e-05, 2.574734389781952e-05, 3.474578261375427e-05, 4.3744221329689026e-05, 5.274266004562378e-05, 6.174109876155853e-05, 7.073953747749329e-05, 7.973797619342804e-05, 8.873641490936279e-05, 9.773485362529755e-05, 0.0001067332923412323, 0.00011573173105716705, 0.0001247301697731018, 0.00013372860848903656, 0.0001427270472049713, 0.00015172548592090607, 0.00016072392463684082, 0.00016972236335277557, 0.00017872080206871033, 0.00018771924078464508, 0.00019671767950057983, 0.0002057161182165146, 0.00021471455693244934, 0.0002237129956483841, 0.00023271143436431885, 0.0002417098730802536, 0.00025070831179618835, 0.0002597067505121231, 0.00026870518922805786, 0.0002777036279439926, 0.00028670206665992737, 0.0002957005053758621, 0.0003046989440917969]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 10.0, 2.0, 4.0, 12.0, 12.0, 14.0, 12.0, 19.0, 19.0, 19.0, 23.0, 14.0, 32.0, 29.0, 40.0, 39.0, 25.0, 49.0, 41.0, 51.0, 36.0, 38.0, 36.0, 37.0, 36.0, 45.0, 32.0, 37.0, 33.0, 41.0, 23.0, 23.0, 17.0, 17.0, 12.0, 12.0, 10.0, 9.0, 10.0, 9.0, 3.0, 4.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5322265625, -1.4853363037109375, -1.438446044921875, -1.3915557861328125, -1.34466552734375, -1.2977752685546875, -1.250885009765625, -1.2039947509765625, -1.1571044921875, -1.1102142333984375, -1.063323974609375, -1.0164337158203125, -0.96954345703125, -0.9226531982421875, -0.875762939453125, -0.8288726806640625, -0.781982421875, -0.7350921630859375, -0.688201904296875, -0.6413116455078125, -0.59442138671875, -0.5475311279296875, -0.500640869140625, -0.4537506103515625, -0.4068603515625, -0.3599700927734375, -0.313079833984375, -0.2661895751953125, -0.21929931640625, -0.1724090576171875, -0.125518798828125, -0.0786285400390625, -0.03173828125, 0.0151519775390625, 0.062042236328125, 0.1089324951171875, 0.15582275390625, 0.2027130126953125, 0.249603271484375, 0.2964935302734375, 0.3433837890625, 0.3902740478515625, 0.437164306640625, 0.4840545654296875, 0.53094482421875, 0.5778350830078125, 0.624725341796875, 0.6716156005859375, 0.718505859375, 0.7653961181640625, 0.812286376953125, 0.8591766357421875, 0.90606689453125, 0.9529571533203125, 0.999847412109375, 1.0467376708984375, 1.0936279296875, 1.1405181884765625, 1.187408447265625, 1.2342987060546875, 1.28118896484375, 1.3280792236328125, 1.374969482421875, 1.4218597412109375, 1.46875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 4.0, 3.0, 2.0, 7.0, 12.0, 11.0, 13.0, 14.0, 27.0, 36.0, 47.0, 52.0, 109.0, 165.0, 270.0, 390.0, 669.0, 1139.0, 1973.0, 3481.0, 6453.0, 12397.0, 25961.0, 55279.0, 117059.0, 212650.0, 256665.0, 178235.0, 91419.0, 42281.0, 19866.0, 9766.0, 5146.0, 2797.0, 1581.0, 989.0, 574.0, 340.0, 217.0, 158.0, 108.0, 52.0, 46.0, 31.0, 24.0, 11.0, 7.0, 9.0, 5.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.119140625, -1.0809783935546875, -1.042816162109375, -1.0046539306640625, -0.96649169921875, -0.9283294677734375, -0.890167236328125, -0.8520050048828125, -0.8138427734375, -0.7756805419921875, -0.737518310546875, -0.6993560791015625, -0.66119384765625, -0.6230316162109375, -0.584869384765625, -0.5467071533203125, -0.508544921875, -0.4703826904296875, -0.432220458984375, -0.3940582275390625, -0.35589599609375, -0.3177337646484375, -0.279571533203125, -0.2414093017578125, -0.2032470703125, -0.1650848388671875, -0.126922607421875, -0.0887603759765625, -0.05059814453125, -0.0124359130859375, 0.025726318359375, 0.0638885498046875, 0.10205078125, 0.1402130126953125, 0.178375244140625, 0.2165374755859375, 0.25469970703125, 0.2928619384765625, 0.331024169921875, 0.3691864013671875, 0.4073486328125, 0.4455108642578125, 0.483673095703125, 0.5218353271484375, 0.55999755859375, 0.5981597900390625, 0.636322021484375, 0.6744842529296875, 0.712646484375, 0.7508087158203125, 0.788970947265625, 0.8271331787109375, 0.86529541015625, 0.9034576416015625, 0.941619873046875, 0.9797821044921875, 1.0179443359375, 1.0561065673828125, 1.094268798828125, 1.1324310302734375, 1.17059326171875, 1.2087554931640625, 1.246917724609375, 1.2850799560546875, 1.3232421875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 7.0, 6.0, 6.0, 9.0, 8.0, 8.0, 14.0, 16.0, 19.0, 26.0, 16.0, 27.0, 30.0, 38.0, 28.0, 39.0, 38.0, 71.0, 84.0, 213.0, 1431.0, 313.0, 146.0, 70.0, 66.0, 40.0, 38.0, 26.0, 28.0, 29.0, 28.0, 21.0, 17.0, 23.0, 11.0, 15.0, 16.0, 7.0, 9.0, 8.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.58984375, -5.41943359375, -5.2490234375, -5.07861328125, -4.908203125, -4.73779296875, -4.5673828125, -4.39697265625, -4.2265625, -4.05615234375, -3.8857421875, -3.71533203125, -3.544921875, -3.37451171875, -3.2041015625, -3.03369140625, -2.86328125, -2.69287109375, -2.5224609375, -2.35205078125, -2.181640625, -2.01123046875, -1.8408203125, -1.67041015625, -1.5, -1.32958984375, -1.1591796875, -0.98876953125, -0.818359375, -0.64794921875, -0.4775390625, -0.30712890625, -0.13671875, 0.03369140625, 0.2041015625, 0.37451171875, 0.544921875, 0.71533203125, 0.8857421875, 1.05615234375, 1.2265625, 1.39697265625, 1.5673828125, 1.73779296875, 1.908203125, 2.07861328125, 2.2490234375, 2.41943359375, 2.58984375, 2.76025390625, 2.9306640625, 3.10107421875, 3.271484375, 3.44189453125, 3.6123046875, 3.78271484375, 3.953125, 4.12353515625, 4.2939453125, 4.46435546875, 4.634765625, 4.80517578125, 4.9755859375, 5.14599609375, 5.31640625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 1.0, 4.0, 13.0, 8.0, 9.0, 21.0, 12.0, 25.0, 43.0, 32.0, 54.0, 48.0, 82.0, 76.0, 132.0, 213.0, 434.0, 1239.0, 7341.0, 228587.0, 2832601.0, 68871.0, 3798.0, 944.0, 337.0, 219.0, 139.0, 89.0, 61.0, 49.0, 51.0, 30.0, 32.0, 26.0, 13.0, 15.0, 18.0, 4.0, 8.0, 4.0, 10.0, 4.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-9.09375, -8.8211669921875, -8.548583984375, -8.2760009765625, -8.00341796875, -7.7308349609375, -7.458251953125, -7.1856689453125, -6.9130859375, -6.6405029296875, -6.367919921875, -6.0953369140625, -5.82275390625, -5.5501708984375, -5.277587890625, -5.0050048828125, -4.732421875, -4.4598388671875, -4.187255859375, -3.9146728515625, -3.64208984375, -3.3695068359375, -3.096923828125, -2.8243408203125, -2.5517578125, -2.2791748046875, -2.006591796875, -1.7340087890625, -1.46142578125, -1.1888427734375, -0.916259765625, -0.6436767578125, -0.37109375, -0.0985107421875, 0.174072265625, 0.4466552734375, 0.71923828125, 0.9918212890625, 1.264404296875, 1.5369873046875, 1.8095703125, 2.0821533203125, 2.354736328125, 2.6273193359375, 2.89990234375, 3.1724853515625, 3.445068359375, 3.7176513671875, 3.990234375, 4.2628173828125, 4.535400390625, 4.8079833984375, 5.08056640625, 5.3531494140625, 5.625732421875, 5.8983154296875, 6.1708984375, 6.4434814453125, 6.716064453125, 6.9886474609375, 7.26123046875, 7.5338134765625, 7.806396484375, 8.0789794921875, 8.3515625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 131.0, 771.0, 113.0, 2.0], "bins": [-140.50949096679688, -138.22354125976562, -135.93759155273438, -133.65164184570312, -131.36569213867188, -129.07974243164062, -126.7938003540039, -124.50785064697266, -122.2219009399414, -119.93595123291016, -117.6500015258789, -115.36405944824219, -113.07810974121094, -110.79216003417969, -108.50621032714844, -106.22026062011719, -103.93431091308594, -101.64836120605469, -99.36241149902344, -97.07646179199219, -94.79051971435547, -92.50457000732422, -90.21862030029297, -87.93267059326172, -85.646728515625, -83.36077880859375, -81.0748291015625, -78.78887939453125, -76.50293731689453, -74.21698760986328, -71.93103790283203, -69.64508819580078, -67.35913848876953, -65.07318878173828, -62.7872428894043, -60.50129318237305, -58.2153434753418, -55.92939758300781, -53.64344787597656, -51.35749816894531, -49.07155227661133, -46.78560256958008, -44.499656677246094, -42.213706970214844, -39.927757263183594, -37.641807556152344, -35.35586166381836, -33.06991195678711, -30.783966064453125, -28.498018264770508, -26.212068557739258, -23.92612075805664, -21.64017105102539, -19.354223251342773, -17.068275451660156, -14.782325744628906, -12.496376991271973, -10.210428237915039, -7.924479961395264, -5.638531684875488, -3.3525829315185547, -1.066634178161621, 1.219313621520996, 3.505263328552246, 5.791211128234863]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 1.0, 4.0, 3.0, 6.0, 5.0, 8.0, 3.0, 9.0, 11.0, 19.0, 18.0, 14.0, 24.0, 19.0, 26.0, 28.0, 42.0, 24.0, 49.0, 38.0, 35.0, 47.0, 37.0, 42.0, 39.0, 53.0, 53.0, 39.0, 42.0, 26.0, 30.0, 32.0, 26.0, 31.0, 23.0, 25.0, 9.0, 13.0, 13.0, 6.0, 6.0, 7.0, 6.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.028182983398438, -17.48043441772461, -16.932687759399414, -16.384939193725586, -15.837190628051758, -15.289443016052246, -14.741695404052734, -14.193946838378906, -13.646199226379395, -13.098451614379883, -12.550703048706055, -12.002955436706543, -11.455207824707031, -10.907459259033203, -10.359711647033691, -9.81196403503418, -9.264215469360352, -8.71646785736084, -8.168719291687012, -7.6209716796875, -7.07322359085083, -6.52547550201416, -5.977727890014648, -5.4299798011779785, -4.882231712341309, -4.334483623504639, -3.786735773086548, -3.238987922668457, -2.691239833831787, -2.143491744995117, -1.5957438945770264, -1.0479960441589355, -0.5002479553222656, 0.047500014305114746, 0.5952479839324951, 1.1429959535598755, 1.6907439231872559, 2.238492012023926, 2.7862398624420166, 3.3339877128601074, 3.8817358016967773, 4.429483890533447, 4.977231979370117, 5.524979591369629, 6.072727680206299, 6.620475769042969, 7.1682233810424805, 7.71597146987915, 8.26371955871582, 8.811467170715332, 9.35921573638916, 9.906963348388672, 10.4547119140625, 11.002459526062012, 11.550207138061523, 12.097955703735352, 12.645703315734863, 13.193450927734375, 13.741199493408203, 14.288947105407715, 14.836694717407227, 15.384443283081055, 15.932190895080566, 16.479938507080078, 17.027687072753906]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 3.0, 5.0, 4.0, 9.0, 8.0, 8.0, 11.0, 8.0, 12.0, 25.0, 14.0, 24.0, 19.0, 29.0, 22.0, 33.0, 43.0, 28.0, 41.0, 37.0, 48.0, 43.0, 38.0, 30.0, 40.0, 45.0, 37.0, 42.0, 43.0, 36.0, 29.0, 26.0, 28.0, 27.0, 16.0, 15.0, 10.0, 17.0, 16.0, 6.0, 11.0, 3.0, 3.0, 5.0, 1.0, 1.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.62890625, -1.578948974609375, -1.52899169921875, -1.479034423828125, -1.4290771484375, -1.379119873046875, -1.32916259765625, -1.279205322265625, -1.229248046875, -1.179290771484375, -1.12933349609375, -1.079376220703125, -1.0294189453125, -0.979461669921875, -0.92950439453125, -0.879547119140625, -0.82958984375, -0.779632568359375, -0.72967529296875, -0.679718017578125, -0.6297607421875, -0.579803466796875, -0.52984619140625, -0.479888916015625, -0.429931640625, -0.379974365234375, -0.33001708984375, -0.280059814453125, -0.2301025390625, -0.180145263671875, -0.13018798828125, -0.080230712890625, -0.0302734375, 0.019683837890625, 0.06964111328125, 0.119598388671875, 0.1695556640625, 0.219512939453125, 0.26947021484375, 0.319427490234375, 0.369384765625, 0.419342041015625, 0.46929931640625, 0.519256591796875, 0.5692138671875, 0.619171142578125, 0.66912841796875, 0.719085693359375, 0.76904296875, 0.819000244140625, 0.86895751953125, 0.918914794921875, 0.9688720703125, 1.018829345703125, 1.06878662109375, 1.118743896484375, 1.168701171875, 1.218658447265625, 1.26861572265625, 1.318572998046875, 1.3685302734375, 1.418487548828125, 1.46844482421875, 1.518402099609375, 1.568359375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 8.0, 6.0, 10.0, 5.0, 8.0, 10.0, 13.0, 11.0, 17.0, 20.0, 28.0, 28.0, 33.0, 55.0, 80.0, 121.0, 235.0, 510.0, 1434.0, 5189.0, 24824.0, 166595.0, 1343461.0, 2189094.0, 398327.0, 50829.0, 9285.0, 2422.0, 770.0, 315.0, 159.0, 102.0, 66.0, 40.0, 45.0, 27.0, 17.0, 24.0, 13.0, 14.0, 12.0, 5.0, 3.0, 4.0, 4.0, 2.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.00390625, -3.88330078125, -3.7626953125, -3.64208984375, -3.521484375, -3.40087890625, -3.2802734375, -3.15966796875, -3.0390625, -2.91845703125, -2.7978515625, -2.67724609375, -2.556640625, -2.43603515625, -2.3154296875, -2.19482421875, -2.07421875, -1.95361328125, -1.8330078125, -1.71240234375, -1.591796875, -1.47119140625, -1.3505859375, -1.22998046875, -1.109375, -0.98876953125, -0.8681640625, -0.74755859375, -0.626953125, -0.50634765625, -0.3857421875, -0.26513671875, -0.14453125, -0.02392578125, 0.0966796875, 0.21728515625, 0.337890625, 0.45849609375, 0.5791015625, 0.69970703125, 0.8203125, 0.94091796875, 1.0615234375, 1.18212890625, 1.302734375, 1.42333984375, 1.5439453125, 1.66455078125, 1.78515625, 1.90576171875, 2.0263671875, 2.14697265625, 2.267578125, 2.38818359375, 2.5087890625, 2.62939453125, 2.75, 2.87060546875, 2.9912109375, 3.11181640625, 3.232421875, 3.35302734375, 3.4736328125, 3.59423828125, 3.71484375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 2.0, 3.0, 5.0, 7.0, 9.0, 13.0, 11.0, 20.0, 28.0, 27.0, 36.0, 69.0, 66.0, 109.0, 135.0, 196.0, 228.0, 302.0, 366.0, 416.0, 416.0, 344.0, 310.0, 249.0, 177.0, 138.0, 109.0, 65.0, 54.0, 49.0, 38.0, 13.0, 17.0, 15.0, 9.0, 8.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.634765625, -3.509063720703125, -3.38336181640625, -3.257659912109375, -3.1319580078125, -3.006256103515625, -2.88055419921875, -2.754852294921875, -2.629150390625, -2.503448486328125, -2.37774658203125, -2.252044677734375, -2.1263427734375, -2.000640869140625, -1.87493896484375, -1.749237060546875, -1.62353515625, -1.497833251953125, -1.37213134765625, -1.246429443359375, -1.1207275390625, -0.995025634765625, -0.86932373046875, -0.743621826171875, -0.617919921875, -0.492218017578125, -0.36651611328125, -0.240814208984375, -0.1151123046875, 0.010589599609375, 0.13629150390625, 0.261993408203125, 0.3876953125, 0.513397216796875, 0.63909912109375, 0.764801025390625, 0.8905029296875, 1.016204833984375, 1.14190673828125, 1.267608642578125, 1.393310546875, 1.519012451171875, 1.64471435546875, 1.770416259765625, 1.8961181640625, 2.021820068359375, 2.14752197265625, 2.273223876953125, 2.39892578125, 2.524627685546875, 2.65032958984375, 2.776031494140625, 2.9017333984375, 3.027435302734375, 3.15313720703125, 3.278839111328125, 3.404541015625, 3.530242919921875, 3.65594482421875, 3.781646728515625, 3.9073486328125, 4.033050537109375, 4.15875244140625, 4.284454345703125, 4.41015625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 9.0, 5.0, 17.0, 28.0, 27.0, 46.0, 58.0, 71.0, 125.0, 170.0, 323.0, 569.0, 1468.0, 4415.0, 19605.0, 141518.0, 1328928.0, 2344974.0, 304018.0, 37199.0, 6875.0, 1955.0, 831.0, 382.0, 208.0, 131.0, 81.0, 60.0, 49.0, 38.0, 24.0, 21.0, 10.0, 12.0, 8.0, 7.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.20703125, -5.9942626953125, -5.781494140625, -5.5687255859375, -5.35595703125, -5.1431884765625, -4.930419921875, -4.7176513671875, -4.5048828125, -4.2921142578125, -4.079345703125, -3.8665771484375, -3.65380859375, -3.4410400390625, -3.228271484375, -3.0155029296875, -2.802734375, -2.5899658203125, -2.377197265625, -2.1644287109375, -1.95166015625, -1.7388916015625, -1.526123046875, -1.3133544921875, -1.1005859375, -0.8878173828125, -0.675048828125, -0.4622802734375, -0.24951171875, -0.0367431640625, 0.176025390625, 0.3887939453125, 0.6015625, 0.8143310546875, 1.027099609375, 1.2398681640625, 1.45263671875, 1.6654052734375, 1.878173828125, 2.0909423828125, 2.3037109375, 2.5164794921875, 2.729248046875, 2.9420166015625, 3.15478515625, 3.3675537109375, 3.580322265625, 3.7930908203125, 4.005859375, 4.2186279296875, 4.431396484375, 4.6441650390625, 4.85693359375, 5.0697021484375, 5.282470703125, 5.4952392578125, 5.7080078125, 5.9207763671875, 6.133544921875, 6.3463134765625, 6.55908203125, 6.7718505859375, 6.984619140625, 7.1973876953125, 7.41015625]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 9.0, 14.0, 25.0, 44.0, 58.0, 81.0, 111.0, 122.0, 117.0, 119.0, 113.0, 70.0, 51.0, 34.0, 18.0, 14.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.385751724243164, -11.62949275970459, -10.873233795166016, -10.116975784301758, -9.360716819763184, -8.60445785522461, -7.848199367523193, -7.091940879821777, -6.335681915283203, -5.579422950744629, -4.823164463043213, -4.066905975341797, -3.3106470108032227, -2.5543882846832275, -1.7981295585632324, -1.0418710708618164, -0.2856121063232422, 0.47064661979675293, 1.226905345916748, 1.9831640720367432, 2.7394227981567383, 3.4956815242767334, 4.2519402503967285, 5.0081987380981445, 5.764457702636719, 6.520716667175293, 7.276975154876709, 8.033233642578125, 8.7894926071167, 9.545751571655273, 10.302009582519531, 11.058268547058105, 11.814529418945312, 12.570788383483887, 13.327047348022461, 14.083305358886719, 14.839564323425293, 15.595823287963867, 16.352081298828125, 17.108341217041016, 17.864599227905273, 18.62085723876953, 19.377117156982422, 20.13337516784668, 20.889633178710938, 21.645893096923828, 22.402151107788086, 23.158409118652344, 23.914669036865234, 24.670927047729492, 25.427186965942383, 26.18344497680664, 26.93970489501953, 27.69596290588379, 28.452220916748047, 29.208480834960938, 29.964738845825195, 30.720996856689453, 31.477256774902344, 32.233516693115234, 32.98977279663086, 33.74603271484375, 34.50229263305664, 35.258548736572266, 36.014808654785156]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 4.0, 5.0, 8.0, 10.0, 5.0, 11.0, 10.0, 16.0, 12.0, 21.0, 26.0, 29.0, 35.0, 31.0, 27.0, 22.0, 33.0, 38.0, 50.0, 33.0, 48.0, 35.0, 35.0, 33.0, 43.0, 38.0, 32.0, 31.0, 36.0, 31.0, 23.0, 24.0, 24.0, 22.0, 17.0, 18.0, 9.0, 8.0, 9.0, 14.0, 9.0, 7.0, 7.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-11.570337295532227, -11.171588897705078, -10.77284049987793, -10.374092102050781, -9.975343704223633, -9.576595306396484, -9.177846908569336, -8.779098510742188, -8.380350112915039, -7.981601715087891, -7.582853317260742, -7.184104919433594, -6.785356521606445, -6.386608123779297, -5.98785924911499, -5.589110851287842, -5.190361976623535, -4.791613578796387, -4.392865180969238, -3.9941165447235107, -3.5953681468963623, -3.196619749069214, -2.7978711128234863, -2.399122714996338, -2.0003743171691895, -1.601625919342041, -1.202877402305603, -0.804128885269165, -0.4053804874420166, -0.006632089614868164, 0.3921165466308594, 0.7908649444580078, 1.1896123886108398, 1.5883607864379883, 1.9871093034744263, 2.3858578205108643, 2.7846062183380127, 3.183354616165161, 3.5821032524108887, 3.980851650238037, 4.3796000480651855, 4.778348445892334, 5.177096843719482, 5.575845718383789, 5.9745941162109375, 6.373342514038086, 6.772090911865234, 7.170839309692383, 7.569587707519531, 7.96833610534668, 8.367084503173828, 8.765832901000977, 9.164581298828125, 9.563329696655273, 9.962078094482422, 10.36082649230957, 10.759574890136719, 11.158323287963867, 11.557071685791016, 11.955820083618164, 12.354568481445312, 12.753316879272461, 13.15206527709961, 13.550813674926758, 13.949563026428223]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 5.0, 7.0, 7.0, 6.0, 6.0, 12.0, 10.0, 10.0, 18.0, 10.0, 17.0, 19.0, 23.0, 23.0, 30.0, 27.0, 28.0, 38.0, 24.0, 28.0, 47.0, 39.0, 33.0, 33.0, 54.0, 39.0, 46.0, 36.0, 30.0, 40.0, 23.0, 22.0, 31.0, 29.0, 15.0, 20.0, 10.0, 12.0, 17.0, 14.0, 8.0, 14.0, 10.0, 5.0, 7.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0], "bins": [-1.46875, -1.4231719970703125, -1.377593994140625, -1.3320159912109375, -1.28643798828125, -1.2408599853515625, -1.195281982421875, -1.1497039794921875, -1.1041259765625, -1.0585479736328125, -1.012969970703125, -0.9673919677734375, -0.92181396484375, -0.8762359619140625, -0.830657958984375, -0.7850799560546875, -0.739501953125, -0.6939239501953125, -0.648345947265625, -0.6027679443359375, -0.55718994140625, -0.5116119384765625, -0.466033935546875, -0.4204559326171875, -0.3748779296875, -0.3292999267578125, -0.283721923828125, -0.2381439208984375, -0.19256591796875, -0.1469879150390625, -0.101409912109375, -0.0558319091796875, -0.01025390625, 0.0353240966796875, 0.080902099609375, 0.1264801025390625, 0.17205810546875, 0.2176361083984375, 0.263214111328125, 0.3087921142578125, 0.3543701171875, 0.3999481201171875, 0.445526123046875, 0.4911041259765625, 0.53668212890625, 0.5822601318359375, 0.627838134765625, 0.6734161376953125, 0.718994140625, 0.7645721435546875, 0.810150146484375, 0.8557281494140625, 0.90130615234375, 0.9468841552734375, 0.992462158203125, 1.0380401611328125, 1.0836181640625, 1.1291961669921875, 1.174774169921875, 1.2203521728515625, 1.26593017578125, 1.3115081787109375, 1.357086181640625, 1.4026641845703125, 1.4482421875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 9.0, 15.0, 13.0, 40.0, 52.0, 84.0, 112.0, 169.0, 294.0, 408.0, 644.0, 1030.0, 1669.0, 2544.0, 4185.0, 6656.0, 10647.0, 17680.0, 30003.0, 53821.0, 100919.0, 194447.0, 263882.0, 163053.0, 84374.0, 45708.0, 25894.0, 15296.0, 9373.0, 5677.0, 3625.0, 2248.0, 1389.0, 895.0, 597.0, 406.0, 252.0, 148.0, 89.0, 87.0, 46.0, 24.0, 22.0, 7.0, 8.0, 5.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.243896484375, -0.2365856170654297, -0.22927474975585938, -0.22196388244628906, -0.21465301513671875, -0.20734214782714844, -0.20003128051757812, -0.1927204132080078, -0.1854095458984375, -0.1780986785888672, -0.17078781127929688, -0.16347694396972656, -0.15616607666015625, -0.14885520935058594, -0.14154434204101562, -0.1342334747314453, -0.126922607421875, -0.11961174011230469, -0.11230087280273438, -0.10499000549316406, -0.09767913818359375, -0.09036827087402344, -0.08305740356445312, -0.07574653625488281, -0.0684356689453125, -0.06112480163574219, -0.053813934326171875, -0.04650306701660156, -0.03919219970703125, -0.03188133239746094, -0.024570465087890625, -0.017259597778320312, -0.00994873046875, -0.0026378631591796875, 0.004673004150390625, 0.011983871459960938, 0.01929473876953125, 0.026605606079101562, 0.033916473388671875, 0.04122734069824219, 0.0485382080078125, 0.05584907531738281, 0.06315994262695312, 0.07047080993652344, 0.07778167724609375, 0.08509254455566406, 0.09240341186523438, 0.09971427917480469, 0.107025146484375, 0.11433601379394531, 0.12164688110351562, 0.12895774841308594, 0.13626861572265625, 0.14357948303222656, 0.15089035034179688, 0.1582012176513672, 0.1655120849609375, 0.1728229522705078, 0.18013381958007812, 0.18744468688964844, 0.19475555419921875, 0.20206642150878906, 0.20937728881835938, 0.2166881561279297, 0.2239990234375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 7.0, 1.0, 6.0, 10.0, 6.0, 10.0, 18.0, 26.0, 24.0, 18.0, 23.0, 30.0, 24.0, 29.0, 41.0, 33.0, 36.0, 33.0, 41.0, 1082.0, 45.0, 50.0, 47.0, 48.0, 46.0, 26.0, 31.0, 28.0, 26.0, 36.0, 21.0, 24.0, 17.0, 14.0, 13.0, 15.0, 7.0, 5.0, 4.0, 6.0, 5.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.1748046875, -1.1409225463867188, -1.1070404052734375, -1.0731582641601562, -1.039276123046875, -1.0053939819335938, -0.9715118408203125, -0.9376296997070312, -0.90374755859375, -0.8698654174804688, -0.8359832763671875, -0.8021011352539062, -0.768218994140625, -0.7343368530273438, -0.7004547119140625, -0.6665725708007812, -0.6326904296875, -0.5988082885742188, -0.5649261474609375, -0.5310440063476562, -0.497161865234375, -0.46327972412109375, -0.4293975830078125, -0.39551544189453125, -0.36163330078125, -0.32775115966796875, -0.2938690185546875, -0.25998687744140625, -0.226104736328125, -0.19222259521484375, -0.1583404541015625, -0.12445831298828125, -0.090576171875, -0.05669403076171875, -0.0228118896484375, 0.01107025146484375, 0.044952392578125, 0.07883453369140625, 0.1127166748046875, 0.14659881591796875, 0.18048095703125, 0.21436309814453125, 0.2482452392578125, 0.28212738037109375, 0.316009521484375, 0.34989166259765625, 0.3837738037109375, 0.41765594482421875, 0.4515380859375, 0.48542022705078125, 0.5193023681640625, 0.5531845092773438, 0.587066650390625, 0.6209487915039062, 0.6548309326171875, 0.6887130737304688, 0.72259521484375, 0.7564773559570312, 0.7903594970703125, 0.8242416381835938, 0.858123779296875, 0.8920059204101562, 0.9258880615234375, 0.9597702026367188, 0.99365234375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 9.0, 11.0, 22.0, 19.0, 28.0, 40.0, 66.0, 94.0, 119.0, 183.0, 255.0, 362.0, 568.0, 856.0, 1182.0, 1754.0, 2603.0, 3985.0, 5901.0, 9147.0, 14641.0, 22826.0, 37450.0, 63234.0, 108955.0, 190209.0, 1275113.0, 144850.0, 82674.0, 48316.0, 29522.0, 18422.0, 11648.0, 7446.0, 4751.0, 3243.0, 2124.0, 1443.0, 952.0, 618.0, 460.0, 302.0, 235.0, 158.0, 106.0, 79.0, 37.0, 40.0, 29.0, 21.0, 12.0, 9.0, 4.0, 2.0, 1.0, 3.0], "bins": [-0.1719970703125, -0.1669750213623047, -0.16195297241210938, -0.15693092346191406, -0.15190887451171875, -0.14688682556152344, -0.14186477661132812, -0.1368427276611328, -0.1318206787109375, -0.1267986297607422, -0.12177658081054688, -0.11675453186035156, -0.11173248291015625, -0.10671043395996094, -0.10168838500976562, -0.09666633605957031, -0.091644287109375, -0.08662223815917969, -0.08160018920898438, -0.07657814025878906, -0.07155609130859375, -0.06653404235839844, -0.061511993408203125, -0.05648994445800781, -0.0514678955078125, -0.04644584655761719, -0.041423797607421875, -0.03640174865722656, -0.03137969970703125, -0.026357650756835938, -0.021335601806640625, -0.016313552856445312, -0.01129150390625, -0.0062694549560546875, -0.001247406005859375, 0.0037746429443359375, 0.00879669189453125, 0.013818740844726562, 0.018840789794921875, 0.023862838745117188, 0.0288848876953125, 0.03390693664550781, 0.038928985595703125, 0.04395103454589844, 0.04897308349609375, 0.05399513244628906, 0.059017181396484375, 0.06403923034667969, 0.069061279296875, 0.07408332824707031, 0.07910537719726562, 0.08412742614746094, 0.08914947509765625, 0.09417152404785156, 0.09919357299804688, 0.10421562194824219, 0.1092376708984375, 0.11425971984863281, 0.11928176879882812, 0.12430381774902344, 0.12932586669921875, 0.13434791564941406, 0.13936996459960938, 0.1443920135498047, 0.1494140625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 1.0, 5.0, 7.0, 13.0, 7.0, 14.0, 24.0, 26.0, 38.0, 38.0, 52.0, 67.0, 85.0, 72.0, 86.0, 90.0, 64.0, 58.0, 59.0, 41.0, 28.0, 20.0, 24.0, 17.0, 11.0, 6.0, 8.0, 6.0, 9.0, 5.0, 4.0, 6.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0007219314575195312, -0.0006989911198616028, -0.0006760507822036743, -0.0006531104445457458, -0.0006301701068878174, -0.0006072297692298889, -0.0005842894315719604, -0.000561349093914032, -0.0005384087562561035, -0.000515468418598175, -0.0004925280809402466, -0.0004695877432823181, -0.00044664740562438965, -0.0004237070679664612, -0.0004007667303085327, -0.00037782639265060425, -0.0003548860549926758, -0.0003319457173347473, -0.00030900537967681885, -0.0002860650420188904, -0.0002631247043609619, -0.00024018436670303345, -0.00021724402904510498, -0.00019430369138717651, -0.00017136335372924805, -0.00014842301607131958, -0.0001254826784133911, -0.00010254234075546265, -7.960200309753418e-05, -5.666166543960571e-05, -3.3721327781677246e-05, -1.078099012374878e-05, 1.2159347534179688e-05, 3.5099685192108154e-05, 5.804002285003662e-05, 8.098036050796509e-05, 0.00010392069816589355, 0.00012686103582382202, 0.0001498013734817505, 0.00017274171113967896, 0.00019568204879760742, 0.0002186223864555359, 0.00024156272411346436, 0.0002645030617713928, 0.0002874433994293213, 0.00031038373708724976, 0.0003333240747451782, 0.0003562644124031067, 0.00037920475006103516, 0.0004021450877189636, 0.0004250854253768921, 0.00044802576303482056, 0.000470966100692749, 0.0004939064383506775, 0.000516846776008606, 0.0005397871136665344, 0.0005627274513244629, 0.0005856677889823914, 0.0006086081266403198, 0.0006315484642982483, 0.0006544888019561768, 0.0006774291396141052, 0.0007003694772720337, 0.0007233098149299622, 0.0007462501525878906]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 6.0, 7.0, 5.0, 10.0, 11.0, 6.0, 19.0, 21.0, 25.0, 52.0, 74.0, 142.0, 270.0, 622.0, 4829.0, 1028240.0, 12827.0, 654.0, 316.0, 147.0, 89.0, 61.0, 26.0, 18.0, 18.0, 9.0, 8.0, 7.0, 8.0, 4.0, 3.0, 6.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0178985595703125, -0.017365455627441406, -0.016832351684570312, -0.01629924774169922, -0.015766143798828125, -0.015233039855957031, -0.014699935913085938, -0.014166831970214844, -0.01363372802734375, -0.013100624084472656, -0.012567520141601562, -0.012034416198730469, -0.011501312255859375, -0.010968208312988281, -0.010435104370117188, -0.009902000427246094, -0.009368896484375, -0.008835792541503906, -0.008302688598632812, -0.007769584655761719, -0.007236480712890625, -0.006703376770019531, -0.0061702728271484375, -0.005637168884277344, -0.00510406494140625, -0.004570960998535156, -0.0040378570556640625, -0.0035047531127929688, -0.002971649169921875, -0.0024385452270507812, -0.0019054412841796875, -0.0013723373413085938, -0.0008392333984375, -0.00030612945556640625, 0.0002269744873046875, 0.0007600784301757812, 0.001293182373046875, 0.0018262863159179688, 0.0023593902587890625, 0.0028924942016601562, 0.00342559814453125, 0.003958702087402344, 0.0044918060302734375, 0.005024909973144531, 0.005558013916015625, 0.006091117858886719, 0.0066242218017578125, 0.007157325744628906, 0.0076904296875, 0.008223533630371094, 0.008756637573242188, 0.009289741516113281, 0.009822845458984375, 0.010355949401855469, 0.010889053344726562, 0.011422157287597656, 0.01195526123046875, 0.012488365173339844, 0.013021469116210938, 0.013554573059082031, 0.014087677001953125, 0.014620780944824219, 0.015153884887695312, 0.015686988830566406, 0.0162200927734375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 71.0, 334.0, 454.0, 137.0, 13.0, 4.0], "bins": [-0.0037722978740930557, -0.003709677839651704, -0.003647057805210352, -0.003584437770769, -0.003521817736327648, -0.0034591974690556526, -0.0033965776674449444, -0.003333957400172949, -0.003271337365731597, -0.003208717331290245, -0.003146097296848893, -0.0030834772624075413, -0.0030208572279661894, -0.0029582371935248375, -0.002895616926252842, -0.00283299689181149, -0.002770376857370138, -0.0027077568229287863, -0.0026451367884874344, -0.0025825167540460825, -0.0025198967196047306, -0.002457276452332735, -0.002394656650722027, -0.0023320363834500313, -0.002269416581839323, -0.002206796547397971, -0.0021441765129566193, -0.0020815564785152674, -0.0020189364440739155, -0.00195631617680192, -0.0018936962587758899, -0.001831076224334538, -0.001768456306308508, -0.001705836271867156, -0.0016432162374258041, -0.0015805962029844522, -0.0015179760521277785, -0.0014553560176864266, -0.0013927359832450747, -0.0013301159488037229, -0.0012674957979470491, -0.0012048757635056973, -0.0011422557290643454, -0.0010796356946229935, -0.0010170155437663198, -0.0009543955093249679, -0.000891775474883616, -0.0008291554404422641, -0.0007665353477932513, -0.0007039153133518994, -0.0006412952207028866, -0.0005786751862615347, -0.0005160551518201828, -0.00045343505917117, -0.0003908150247298181, -0.00032819496118463576, -0.0002655748976394534, -0.00020295483409427106, -0.00014033478510100394, -7.771473610773683e-05, -1.5094672562554479e-05, 4.752539098262787e-05, 0.00011014542542397976, 0.0001727654889691621, 0.00023538555251434445]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 4.0, 7.0, 10.0, 12.0, 13.0, 11.0, 27.0, 32.0, 29.0, 36.0, 39.0, 51.0, 37.0, 37.0, 51.0, 52.0, 47.0, 55.0, 54.0, 45.0, 47.0, 42.0, 37.0, 37.0, 45.0, 23.0, 23.0, 12.0, 18.0, 18.0, 14.0, 11.0, 5.0, 8.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003330707550048828, -0.0003205714747309685, -0.00030807219445705414, -0.0002955729141831398, -0.00028307363390922546, -0.0002705743536353111, -0.0002580750733613968, -0.00024557579308748245, -0.00023307651281356812, -0.00022057723253965378, -0.00020807795226573944, -0.0001955786719918251, -0.00018307939171791077, -0.00017058011144399643, -0.0001580808311700821, -0.00014558155089616776, -0.00013308227062225342, -0.00012058299034833908, -0.00010808371007442474, -9.55844298005104e-05, -8.308514952659607e-05, -7.058586925268173e-05, -5.8086588978767395e-05, -4.558730870485306e-05, -3.308802843093872e-05, -2.0588748157024384e-05, -8.089467883110046e-06, 4.409812390804291e-06, 1.6909092664718628e-05, 2.9408372938632965e-05, 4.19076532125473e-05, 5.440693348646164e-05, 6.690621376037598e-05, 7.940549403429031e-05, 9.190477430820465e-05, 0.00010440405458211899, 0.00011690333485603333, 0.00012940261512994766, 0.000141901895403862, 0.00015440117567777634, 0.00016690045595169067, 0.000179399736225605, 0.00019189901649951935, 0.00020439829677343369, 0.00021689757704734802, 0.00022939685732126236, 0.0002418961375951767, 0.00025439541786909103, 0.00026689469814300537, 0.0002793939784169197, 0.00029189325869083405, 0.0003043925389647484, 0.0003168918192386627, 0.00032939109951257706, 0.0003418903797864914, 0.00035438966006040573, 0.00036688894033432007, 0.0003793882206082344, 0.00039188750088214874, 0.0004043867811560631, 0.0004168860614299774, 0.00042938534170389175, 0.0004418846219778061, 0.00045438390225172043, 0.00046688318252563477]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 5.0, 7.0, 7.0, 6.0, 6.0, 12.0, 10.0, 10.0, 18.0, 10.0, 17.0, 19.0, 23.0, 23.0, 30.0, 27.0, 28.0, 38.0, 24.0, 28.0, 47.0, 39.0, 33.0, 33.0, 54.0, 39.0, 46.0, 36.0, 30.0, 40.0, 23.0, 22.0, 31.0, 29.0, 15.0, 20.0, 10.0, 12.0, 17.0, 14.0, 8.0, 14.0, 10.0, 5.0, 7.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0], "bins": [-1.46875, -1.4231719970703125, -1.377593994140625, -1.3320159912109375, -1.28643798828125, -1.2408599853515625, -1.195281982421875, -1.1497039794921875, -1.1041259765625, -1.0585479736328125, -1.012969970703125, -0.9673919677734375, -0.92181396484375, -0.8762359619140625, -0.830657958984375, -0.7850799560546875, -0.739501953125, -0.6939239501953125, -0.648345947265625, -0.6027679443359375, -0.55718994140625, -0.5116119384765625, -0.466033935546875, -0.4204559326171875, -0.3748779296875, -0.3292999267578125, -0.283721923828125, -0.2381439208984375, -0.19256591796875, -0.1469879150390625, -0.101409912109375, -0.0558319091796875, -0.01025390625, 0.0353240966796875, 0.080902099609375, 0.1264801025390625, 0.17205810546875, 0.2176361083984375, 0.263214111328125, 0.3087921142578125, 0.3543701171875, 0.3999481201171875, 0.445526123046875, 0.4911041259765625, 0.53668212890625, 0.5822601318359375, 0.627838134765625, 0.6734161376953125, 0.718994140625, 0.7645721435546875, 0.810150146484375, 0.8557281494140625, 0.90130615234375, 0.9468841552734375, 0.992462158203125, 1.0380401611328125, 1.0836181640625, 1.1291961669921875, 1.174774169921875, 1.2203521728515625, 1.26593017578125, 1.3115081787109375, 1.357086181640625, 1.4026641845703125, 1.4482421875]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 1.0, 3.0, 7.0, 16.0, 13.0, 18.0, 26.0, 35.0, 47.0, 71.0, 92.0, 134.0, 184.0, 270.0, 389.0, 636.0, 1155.0, 1787.0, 3395.0, 6426.0, 13177.0, 31195.0, 86137.0, 293858.0, 407911.0, 124686.0, 42007.0, 16991.0, 7915.0, 4132.0, 2237.0, 1310.0, 780.0, 511.0, 300.0, 214.0, 128.0, 113.0, 63.0, 47.0, 41.0, 26.0, 18.0, 16.0, 13.0, 7.0, 4.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.34765625, -2.272308349609375, -2.19696044921875, -2.121612548828125, -2.0462646484375, -1.970916748046875, -1.89556884765625, -1.820220947265625, -1.744873046875, -1.669525146484375, -1.59417724609375, -1.518829345703125, -1.4434814453125, -1.368133544921875, -1.29278564453125, -1.217437744140625, -1.14208984375, -1.066741943359375, -0.99139404296875, -0.916046142578125, -0.8406982421875, -0.765350341796875, -0.69000244140625, -0.614654541015625, -0.539306640625, -0.463958740234375, -0.38861083984375, -0.313262939453125, -0.2379150390625, -0.162567138671875, -0.08721923828125, -0.011871337890625, 0.0634765625, 0.138824462890625, 0.21417236328125, 0.289520263671875, 0.3648681640625, 0.440216064453125, 0.51556396484375, 0.590911865234375, 0.666259765625, 0.741607666015625, 0.81695556640625, 0.892303466796875, 0.9676513671875, 1.042999267578125, 1.11834716796875, 1.193695068359375, 1.26904296875, 1.344390869140625, 1.41973876953125, 1.495086669921875, 1.5704345703125, 1.645782470703125, 1.72113037109375, 1.796478271484375, 1.871826171875, 1.947174072265625, 2.02252197265625, 2.097869873046875, 2.1732177734375, 2.248565673828125, 2.32391357421875, 2.399261474609375, 2.474609375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 8.0, 8.0, 7.0, 10.0, 7.0, 8.0, 10.0, 13.0, 11.0, 18.0, 17.0, 18.0, 22.0, 31.0, 41.0, 26.0, 35.0, 59.0, 62.0, 73.0, 119.0, 207.0, 1390.0, 245.0, 113.0, 81.0, 57.0, 51.0, 45.0, 32.0, 30.0, 27.0, 24.0, 17.0, 22.0, 12.0, 25.0, 16.0, 11.0, 7.0, 15.0, 4.0, 2.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.46484375, -5.2918701171875, -5.118896484375, -4.9459228515625, -4.77294921875, -4.5999755859375, -4.427001953125, -4.2540283203125, -4.0810546875, -3.9080810546875, -3.735107421875, -3.5621337890625, -3.38916015625, -3.2161865234375, -3.043212890625, -2.8702392578125, -2.697265625, -2.5242919921875, -2.351318359375, -2.1783447265625, -2.00537109375, -1.8323974609375, -1.659423828125, -1.4864501953125, -1.3134765625, -1.1405029296875, -0.967529296875, -0.7945556640625, -0.62158203125, -0.4486083984375, -0.275634765625, -0.1026611328125, 0.0703125, 0.2432861328125, 0.416259765625, 0.5892333984375, 0.76220703125, 0.9351806640625, 1.108154296875, 1.2811279296875, 1.4541015625, 1.6270751953125, 1.800048828125, 1.9730224609375, 2.14599609375, 2.3189697265625, 2.491943359375, 2.6649169921875, 2.837890625, 3.0108642578125, 3.183837890625, 3.3568115234375, 3.52978515625, 3.7027587890625, 3.875732421875, 4.0487060546875, 4.2216796875, 4.3946533203125, 4.567626953125, 4.7406005859375, 4.91357421875, 5.0865478515625, 5.259521484375, 5.4324951171875, 5.60546875]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 8.0, 16.0, 16.0, 18.0, 43.0, 50.0, 80.0, 134.0, 269.0, 749.0, 7972.0, 3087682.0, 46628.0, 1194.0, 377.0, 172.0, 105.0, 69.0, 43.0, 25.0, 25.0, 10.0, 11.0, 5.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.71875, -25.925048828125, -25.13134765625, -24.337646484375, -23.5439453125, -22.750244140625, -21.95654296875, -21.162841796875, -20.369140625, -19.575439453125, -18.78173828125, -17.988037109375, -17.1943359375, -16.400634765625, -15.60693359375, -14.813232421875, -14.01953125, -13.225830078125, -12.43212890625, -11.638427734375, -10.8447265625, -10.051025390625, -9.25732421875, -8.463623046875, -7.669921875, -6.876220703125, -6.08251953125, -5.288818359375, -4.4951171875, -3.701416015625, -2.90771484375, -2.114013671875, -1.3203125, -0.526611328125, 0.26708984375, 1.060791015625, 1.8544921875, 2.648193359375, 3.44189453125, 4.235595703125, 5.029296875, 5.822998046875, 6.61669921875, 7.410400390625, 8.2041015625, 8.997802734375, 9.79150390625, 10.585205078125, 11.37890625, 12.172607421875, 12.96630859375, 13.760009765625, 14.5537109375, 15.347412109375, 16.14111328125, 16.934814453125, 17.728515625, 18.522216796875, 19.31591796875, 20.109619140625, 20.9033203125, 21.697021484375, 22.49072265625, 23.284423828125, 24.078125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 115.0, 692.0, 206.0, 0.0, 4.0], "bins": [-142.136962890625, -139.78981018066406, -137.4426727294922, -135.09552001953125, -132.7483673095703, -130.40122985839844, -128.0540771484375, -125.7069320678711, -123.35978698730469, -121.01264190673828, -118.66548919677734, -116.31834411621094, -113.97119903564453, -111.62405395507812, -109.27690124511719, -106.92975616455078, -104.58260345458984, -102.23545837402344, -99.8883056640625, -97.5411605834961, -95.19401550292969, -92.84686279296875, -90.49971771240234, -88.15257263183594, -85.805419921875, -83.4582748413086, -81.11112213134766, -78.76397705078125, -76.41683197021484, -74.06968688964844, -71.7225341796875, -69.3753890991211, -67.02824401855469, -64.68109893798828, -62.33395004272461, -59.98680114746094, -57.63965606689453, -55.29250717163086, -52.94535827636719, -50.59821319580078, -48.251060485839844, -45.90391159057617, -43.556766510009766, -41.209617614746094, -38.86247253417969, -36.515323638916016, -34.168174743652344, -31.821027755737305, -29.473880767822266, -27.126733779907227, -24.779586791992188, -22.432437896728516, -20.085290908813477, -17.738143920898438, -15.390995979309082, -13.043848037719727, -10.696701049804688, -8.349554061889648, -6.002406120300293, -3.6552586555480957, -1.3081111907958984, 1.0390357971191406, 3.386183738708496, 5.733331680297852, 8.08047866821289]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 6.0, 6.0, 7.0, 8.0, 10.0, 6.0, 6.0, 9.0, 6.0, 18.0, 18.0, 20.0, 23.0, 22.0, 20.0, 30.0, 21.0, 32.0, 28.0, 22.0, 32.0, 26.0, 36.0, 36.0, 35.0, 24.0, 29.0, 50.0, 38.0, 48.0, 41.0, 27.0, 25.0, 32.0, 21.0, 25.0, 27.0, 20.0, 24.0, 15.0, 12.0, 10.0, 11.0, 11.0, 0.0, 7.0, 6.0, 6.0, 7.0, 4.0, 4.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.860115051269531, -13.372802734375, -12.885491371154785, -12.39818000793457, -11.910867691040039, -11.423555374145508, -10.936244010925293, -10.448932647705078, -9.961620330810547, -9.474308013916016, -8.9869966506958, -8.499685287475586, -8.012372970581055, -7.525061130523682, -7.037749290466309, -6.5504374504089355, -6.0631256103515625, -5.5758137702941895, -5.088501930236816, -4.601190090179443, -4.11387825012207, -3.6265664100646973, -3.139254570007324, -2.651942729949951, -2.164630889892578, -1.677319049835205, -1.190007209777832, -0.702695369720459, -0.21538352966308594, 0.2719283103942871, 0.7592401504516602, 1.2465519905090332, 1.7338638305664062, 2.2211756706237793, 2.7084875106811523, 3.1957993507385254, 3.6831111907958984, 4.1704230308532715, 4.6577348709106445, 5.145046710968018, 5.632358551025391, 6.119670391082764, 6.606982231140137, 7.09429407119751, 7.581605911254883, 8.068918228149414, 8.556229591369629, 9.043540954589844, 9.530853271484375, 10.018165588378906, 10.505476951599121, 10.992788314819336, 11.480100631713867, 11.967412948608398, 12.454724311828613, 12.942035675048828, 13.42934799194336, 13.91666030883789, 14.403971672058105, 14.89128303527832, 15.378595352172852, 15.865907669067383, 16.35321807861328, 16.840530395507812, 17.327842712402344]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 6.0, 2.0, 4.0, 4.0, 10.0, 4.0, 10.0, 10.0, 12.0, 13.0, 6.0, 15.0, 19.0, 26.0, 23.0, 22.0, 25.0, 29.0, 23.0, 33.0, 44.0, 33.0, 33.0, 47.0, 39.0, 42.0, 45.0, 43.0, 39.0, 31.0, 39.0, 25.0, 26.0, 34.0, 24.0, 21.0, 20.0, 19.0, 16.0, 16.0, 13.0, 14.0, 9.0, 8.0, 7.0, 10.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.6572265625, -1.6068878173828125, -1.556549072265625, -1.5062103271484375, -1.45587158203125, -1.4055328369140625, -1.355194091796875, -1.3048553466796875, -1.2545166015625, -1.2041778564453125, -1.153839111328125, -1.1035003662109375, -1.05316162109375, -1.0028228759765625, -0.952484130859375, -0.9021453857421875, -0.851806640625, -0.8014678955078125, -0.751129150390625, -0.7007904052734375, -0.65045166015625, -0.6001129150390625, -0.549774169921875, -0.4994354248046875, -0.4490966796875, -0.3987579345703125, -0.348419189453125, -0.2980804443359375, -0.24774169921875, -0.1974029541015625, -0.147064208984375, -0.0967254638671875, -0.04638671875, 0.0039520263671875, 0.054290771484375, 0.1046295166015625, 0.15496826171875, 0.2053070068359375, 0.255645751953125, 0.3059844970703125, 0.3563232421875, 0.4066619873046875, 0.457000732421875, 0.5073394775390625, 0.55767822265625, 0.6080169677734375, 0.658355712890625, 0.7086944580078125, 0.759033203125, 0.8093719482421875, 0.859710693359375, 0.9100494384765625, 0.96038818359375, 1.0107269287109375, 1.061065673828125, 1.1114044189453125, 1.1617431640625, 1.2120819091796875, 1.262420654296875, 1.3127593994140625, 1.36309814453125, 1.4134368896484375, 1.463775634765625, 1.5141143798828125, 1.564453125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 6.0, 4.0, 5.0, 12.0, 11.0, 14.0, 15.0, 27.0, 18.0, 28.0, 51.0, 69.0, 100.0, 130.0, 206.0, 367.0, 647.0, 1141.0, 2390.0, 5170.0, 12430.0, 32695.0, 92402.0, 285713.0, 786094.0, 1355849.0, 997766.0, 409716.0, 135200.0, 45424.0, 16840.0, 7032.0, 3128.0, 1549.0, 794.0, 401.0, 273.0, 186.0, 99.0, 76.0, 47.0, 35.0, 34.0, 30.0, 13.0, 20.0, 6.0, 2.0, 4.0, 6.0, 6.0, 4.0, 3.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.115234375, -2.05047607421875, -1.9857177734375, -1.92095947265625, -1.856201171875, -1.79144287109375, -1.7266845703125, -1.66192626953125, -1.59716796875, -1.53240966796875, -1.4676513671875, -1.40289306640625, -1.338134765625, -1.27337646484375, -1.2086181640625, -1.14385986328125, -1.0791015625, -1.01434326171875, -0.9495849609375, -0.88482666015625, -0.820068359375, -0.75531005859375, -0.6905517578125, -0.62579345703125, -0.56103515625, -0.49627685546875, -0.4315185546875, -0.36676025390625, -0.302001953125, -0.23724365234375, -0.1724853515625, -0.10772705078125, -0.04296875, 0.02178955078125, 0.0865478515625, 0.15130615234375, 0.216064453125, 0.28082275390625, 0.3455810546875, 0.41033935546875, 0.47509765625, 0.53985595703125, 0.6046142578125, 0.66937255859375, 0.734130859375, 0.79888916015625, 0.8636474609375, 0.92840576171875, 0.9931640625, 1.05792236328125, 1.1226806640625, 1.18743896484375, 1.252197265625, 1.31695556640625, 1.3817138671875, 1.44647216796875, 1.51123046875, 1.57598876953125, 1.6407470703125, 1.70550537109375, 1.770263671875, 1.83502197265625, 1.8997802734375, 1.96453857421875, 2.029296875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 9.0, 6.0, 7.0, 3.0, 12.0, 9.0, 19.0, 14.0, 27.0, 33.0, 42.0, 67.0, 90.0, 114.0, 136.0, 164.0, 219.0, 254.0, 352.0, 321.0, 370.0, 349.0, 270.0, 255.0, 221.0, 165.0, 117.0, 107.0, 81.0, 52.0, 44.0, 37.0, 31.0, 20.0, 13.0, 14.0, 8.0, 7.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.95703125, -3.841827392578125, -3.72662353515625, -3.611419677734375, -3.4962158203125, -3.381011962890625, -3.26580810546875, -3.150604248046875, -3.035400390625, -2.920196533203125, -2.80499267578125, -2.689788818359375, -2.5745849609375, -2.459381103515625, -2.34417724609375, -2.228973388671875, -2.11376953125, -1.998565673828125, -1.88336181640625, -1.768157958984375, -1.6529541015625, -1.537750244140625, -1.42254638671875, -1.307342529296875, -1.192138671875, -1.076934814453125, -0.96173095703125, -0.846527099609375, -0.7313232421875, -0.616119384765625, -0.50091552734375, -0.385711669921875, -0.2705078125, -0.155303955078125, -0.04010009765625, 0.075103759765625, 0.1903076171875, 0.305511474609375, 0.42071533203125, 0.535919189453125, 0.651123046875, 0.766326904296875, 0.88153076171875, 0.996734619140625, 1.1119384765625, 1.227142333984375, 1.34234619140625, 1.457550048828125, 1.57275390625, 1.687957763671875, 1.80316162109375, 1.918365478515625, 2.0335693359375, 2.148773193359375, 2.26397705078125, 2.379180908203125, 2.494384765625, 2.609588623046875, 2.72479248046875, 2.839996337890625, 2.9552001953125, 3.070404052734375, 3.18560791015625, 3.300811767578125, 3.416015625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 4.0, 5.0, 16.0, 19.0, 22.0, 44.0, 58.0, 67.0, 96.0, 131.0, 260.0, 577.0, 1574.0, 6323.0, 40973.0, 402640.0, 2652225.0, 979291.0, 93953.0, 11799.0, 2429.0, 824.0, 376.0, 200.0, 104.0, 75.0, 51.0, 37.0, 28.0, 20.0, 13.0, 15.0, 9.0, 3.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.49609375, -6.2696533203125, -6.043212890625, -5.8167724609375, -5.59033203125, -5.3638916015625, -5.137451171875, -4.9110107421875, -4.6845703125, -4.4581298828125, -4.231689453125, -4.0052490234375, -3.77880859375, -3.5523681640625, -3.325927734375, -3.0994873046875, -2.873046875, -2.6466064453125, -2.420166015625, -2.1937255859375, -1.96728515625, -1.7408447265625, -1.514404296875, -1.2879638671875, -1.0615234375, -0.8350830078125, -0.608642578125, -0.3822021484375, -0.15576171875, 0.0706787109375, 0.297119140625, 0.5235595703125, 0.75, 0.9764404296875, 1.202880859375, 1.4293212890625, 1.65576171875, 1.8822021484375, 2.108642578125, 2.3350830078125, 2.5615234375, 2.7879638671875, 3.014404296875, 3.2408447265625, 3.46728515625, 3.6937255859375, 3.920166015625, 4.1466064453125, 4.373046875, 4.5994873046875, 4.825927734375, 5.0523681640625, 5.27880859375, 5.5052490234375, 5.731689453125, 5.9581298828125, 6.1845703125, 6.4110107421875, 6.637451171875, 6.8638916015625, 7.09033203125, 7.3167724609375, 7.543212890625, 7.7696533203125, 7.99609375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 7.0, 26.0, 68.0, 147.0, 224.0, 245.0, 174.0, 82.0, 31.0, 9.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.302536010742188, -8.842288970947266, -7.3820414543151855, -5.9217939376831055, -4.461546897888184, -3.0012998580932617, -1.5410518646240234, -0.08080482482910156, 1.3794422149658203, 2.8396894931793213, 4.299936771392822, 5.760184288024902, 7.220431327819824, 8.680678367614746, 10.140926361083984, 11.601173400878906, 13.061420440673828, 14.52166748046875, 15.981914520263672, 17.442161560058594, 18.902408599853516, 20.362655639648438, 21.822904586791992, 23.283151626586914, 24.743398666381836, 26.203645706176758, 27.66389274597168, 29.124141693115234, 30.584388732910156, 32.04463577270508, 33.5048828125, 34.96512985229492, 36.425376892089844, 37.885623931884766, 39.34587097167969, 40.80611801147461, 42.26636505126953, 43.72661209106445, 45.186859130859375, 46.64710998535156, 48.10735321044922, 49.56760025024414, 51.02784729003906, 52.488094329833984, 53.948341369628906, 55.40858840942383, 56.86883544921875, 58.32908630371094, 59.78933334350586, 61.24958038330078, 62.7098274230957, 64.17007446289062, 65.63032531738281, 67.09056854248047, 68.55081939697266, 70.01106262207031, 71.4713134765625, 72.93156433105469, 74.39180755615234, 75.85205841064453, 77.31230163574219, 78.77255249023438, 80.23279571533203, 81.69304656982422, 83.15328979492188]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 8.0, 10.0, 15.0, 13.0, 14.0, 6.0, 21.0, 16.0, 19.0, 28.0, 30.0, 32.0, 40.0, 34.0, 45.0, 45.0, 47.0, 38.0, 40.0, 41.0, 58.0, 44.0, 36.0, 34.0, 36.0, 28.0, 24.0, 30.0, 24.0, 24.0, 23.0, 19.0, 18.0, 14.0, 15.0, 5.0, 8.0, 9.0, 5.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.236427307128906, -15.772708892822266, -15.308990478515625, -14.8452730178833, -14.38155460357666, -13.91783618927002, -13.454117774963379, -12.990400314331055, -12.526681900024414, -12.062963485717773, -11.599245071411133, -11.135527610778809, -10.671809196472168, -10.208090782165527, -9.744372367858887, -9.280654907226562, -8.816936492919922, -8.353218078613281, -7.889500141143799, -7.425781726837158, -6.962063789367676, -6.498345375061035, -6.0346269607543945, -5.570909023284912, -5.107190132141113, -4.643471717834473, -4.17975378036499, -3.7160353660583496, -3.252317428588867, -2.7885990142822266, -2.324880838394165, -1.8611626625061035, -1.397444725036621, -0.9337265491485596, -0.47000831365585327, -0.006290078163146973, 0.45742809772491455, 0.9211463928222656, 1.3848645687103271, 1.8485827445983887, 2.31230092048645, 2.7760190963745117, 3.2397372722625732, 3.7034554481506348, 4.167173862457275, 4.630891799926758, 5.094610214233398, 5.558328628540039, 6.0220465660095215, 6.485764980316162, 6.9494829177856445, 7.413201332092285, 7.876919269561768, 8.34063720703125, 8.80435562133789, 9.268074035644531, 9.731792449951172, 10.195510864257812, 10.659229278564453, 11.122946739196777, 11.586665153503418, 12.050383567810059, 12.5141019821167, 12.977819442749023, 13.441537857055664]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 0.0, 8.0, 6.0, 13.0, 4.0, 4.0, 11.0, 13.0, 10.0, 23.0, 26.0, 23.0, 23.0, 29.0, 27.0, 35.0, 41.0, 33.0, 37.0, 36.0, 41.0, 40.0, 45.0, 38.0, 45.0, 45.0, 45.0, 35.0, 31.0, 40.0, 23.0, 19.0, 19.0, 21.0, 18.0, 16.0, 13.0, 12.0, 11.0, 7.0, 3.0, 6.0, 4.0, 2.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.658203125, -1.6042938232421875, -1.550384521484375, -1.4964752197265625, -1.44256591796875, -1.3886566162109375, -1.334747314453125, -1.2808380126953125, -1.2269287109375, -1.1730194091796875, -1.119110107421875, -1.0652008056640625, -1.01129150390625, -0.9573822021484375, -0.903472900390625, -0.8495635986328125, -0.795654296875, -0.7417449951171875, -0.687835693359375, -0.6339263916015625, -0.58001708984375, -0.5261077880859375, -0.472198486328125, -0.4182891845703125, -0.3643798828125, -0.3104705810546875, -0.256561279296875, -0.2026519775390625, -0.14874267578125, -0.0948333740234375, -0.040924072265625, 0.0129852294921875, 0.06689453125, 0.1208038330078125, 0.174713134765625, 0.2286224365234375, 0.28253173828125, 0.3364410400390625, 0.390350341796875, 0.4442596435546875, 0.4981689453125, 0.5520782470703125, 0.605987548828125, 0.6598968505859375, 0.71380615234375, 0.7677154541015625, 0.821624755859375, 0.8755340576171875, 0.929443359375, 0.9833526611328125, 1.037261962890625, 1.0911712646484375, 1.14508056640625, 1.1989898681640625, 1.252899169921875, 1.3068084716796875, 1.3607177734375, 1.4146270751953125, 1.468536376953125, 1.5224456787109375, 1.57635498046875, 1.6302642822265625, 1.684173583984375, 1.7380828857421875, 1.7919921875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 7.0, 11.0, 14.0, 21.0, 29.0, 54.0, 67.0, 94.0, 171.0, 253.0, 321.0, 497.0, 800.0, 1140.0, 1722.0, 2495.0, 3814.0, 5843.0, 8904.0, 14292.0, 23064.0, 38850.0, 69216.0, 132918.0, 247915.0, 225332.0, 116475.0, 61082.0, 34957.0, 21040.0, 12980.0, 8284.0, 5285.0, 3477.0, 2410.0, 1548.0, 1001.0, 686.0, 531.0, 285.0, 210.0, 151.0, 112.0, 70.0, 42.0, 32.0, 20.0, 16.0, 8.0, 7.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2420654296875, -0.23423194885253906, -0.22639846801757812, -0.2185649871826172, -0.21073150634765625, -0.2028980255126953, -0.19506454467773438, -0.18723106384277344, -0.1793975830078125, -0.17156410217285156, -0.16373062133789062, -0.1558971405029297, -0.14806365966796875, -0.1402301788330078, -0.13239669799804688, -0.12456321716308594, -0.116729736328125, -0.10889625549316406, -0.10106277465820312, -0.09322929382324219, -0.08539581298828125, -0.07756233215332031, -0.06972885131835938, -0.06189537048339844, -0.0540618896484375, -0.04622840881347656, -0.038394927978515625, -0.030561447143554688, -0.02272796630859375, -0.014894485473632812, -0.007061004638671875, 0.0007724761962890625, 0.00860595703125, 0.016439437866210938, 0.024272918701171875, 0.03210639953613281, 0.03993988037109375, 0.04777336120605469, 0.055606842041015625, 0.06344032287597656, 0.0712738037109375, 0.07910728454589844, 0.08694076538085938, 0.09477424621582031, 0.10260772705078125, 0.11044120788574219, 0.11827468872070312, 0.12610816955566406, 0.133941650390625, 0.14177513122558594, 0.14960861206054688, 0.1574420928955078, 0.16527557373046875, 0.1731090545654297, 0.18094253540039062, 0.18877601623535156, 0.1966094970703125, 0.20444297790527344, 0.21227645874023438, 0.2201099395751953, 0.22794342041015625, 0.2357769012451172, 0.24361038208007812, 0.25144386291503906, 0.25927734375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 11.0, 5.0, 15.0, 15.0, 16.0, 16.0, 11.0, 20.0, 24.0, 32.0, 36.0, 35.0, 37.0, 30.0, 53.0, 35.0, 34.0, 43.0, 1061.0, 40.0, 45.0, 39.0, 42.0, 39.0, 31.0, 41.0, 30.0, 31.0, 34.0, 32.0, 14.0, 9.0, 16.0, 10.0, 15.0, 6.0, 8.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.2939453125, -1.2555999755859375, -1.217254638671875, -1.1789093017578125, -1.14056396484375, -1.1022186279296875, -1.063873291015625, -1.0255279541015625, -0.9871826171875, -0.9488372802734375, -0.910491943359375, -0.8721466064453125, -0.83380126953125, -0.7954559326171875, -0.757110595703125, -0.7187652587890625, -0.680419921875, -0.6420745849609375, -0.603729248046875, -0.5653839111328125, -0.52703857421875, -0.4886932373046875, -0.450347900390625, -0.4120025634765625, -0.3736572265625, -0.3353118896484375, -0.296966552734375, -0.2586212158203125, -0.22027587890625, -0.1819305419921875, -0.143585205078125, -0.1052398681640625, -0.06689453125, -0.0285491943359375, 0.009796142578125, 0.0481414794921875, 0.08648681640625, 0.1248321533203125, 0.163177490234375, 0.2015228271484375, 0.2398681640625, 0.2782135009765625, 0.316558837890625, 0.3549041748046875, 0.39324951171875, 0.4315948486328125, 0.469940185546875, 0.5082855224609375, 0.546630859375, 0.5849761962890625, 0.623321533203125, 0.6616668701171875, 0.70001220703125, 0.7383575439453125, 0.776702880859375, 0.8150482177734375, 0.8533935546875, 0.8917388916015625, 0.930084228515625, 0.9684295654296875, 1.00677490234375, 1.0451202392578125, 1.083465576171875, 1.1218109130859375, 1.16015625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 5.0, 11.0, 14.0, 21.0, 29.0, 56.0, 68.0, 97.0, 154.0, 186.0, 269.0, 404.0, 641.0, 850.0, 1348.0, 2073.0, 3263.0, 5138.0, 8063.0, 13326.0, 22475.0, 38225.0, 67067.0, 124130.0, 235823.0, 1261601.0, 135348.0, 73457.0, 40880.0, 23580.0, 14064.0, 8700.0, 5497.0, 3390.0, 2288.0, 1509.0, 994.0, 677.0, 448.0, 303.0, 222.0, 143.0, 88.0, 73.0, 40.0, 30.0, 22.0, 21.0, 11.0, 3.0, 5.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.202880859375, -0.19692611694335938, -0.19097137451171875, -0.18501663208007812, -0.1790618896484375, -0.17310714721679688, -0.16715240478515625, -0.16119766235351562, -0.155242919921875, -0.14928817749023438, -0.14333343505859375, -0.13737869262695312, -0.1314239501953125, -0.12546920776367188, -0.11951446533203125, -0.11355972290039062, -0.10760498046875, -0.10165023803710938, -0.09569549560546875, -0.08974075317382812, -0.0837860107421875, -0.07783126831054688, -0.07187652587890625, -0.06592178344726562, -0.059967041015625, -0.054012298583984375, -0.04805755615234375, -0.042102813720703125, -0.0361480712890625, -0.030193328857421875, -0.02423858642578125, -0.018283843994140625, -0.0123291015625, -0.006374359130859375, -0.00041961669921875, 0.005535125732421875, 0.0114898681640625, 0.017444610595703125, 0.02339935302734375, 0.029354095458984375, 0.035308837890625, 0.041263580322265625, 0.04721832275390625, 0.053173065185546875, 0.0591278076171875, 0.06508255004882812, 0.07103729248046875, 0.07699203491210938, 0.08294677734375, 0.08890151977539062, 0.09485626220703125, 0.10081100463867188, 0.1067657470703125, 0.11272048950195312, 0.11867523193359375, 0.12462997436523438, 0.130584716796875, 0.13653945922851562, 0.14249420166015625, 0.14844894409179688, 0.1544036865234375, 0.16035842895507812, 0.16631317138671875, 0.17226791381835938, 0.17822265625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 6.0, 3.0, 9.0, 14.0, 9.0, 20.0, 17.0, 9.0, 23.0, 34.0, 56.0, 51.0, 74.0, 77.0, 78.0, 79.0, 68.0, 57.0, 57.0, 42.0, 38.0, 36.0, 20.0, 18.0, 13.0, 19.0, 9.0, 10.0, 6.0, 6.0, 7.0, 9.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00090789794921875, -0.000881493091583252, -0.0008550882339477539, -0.0008286833763122559, -0.0008022785186767578, -0.0007758736610412598, -0.0007494688034057617, -0.0007230639457702637, -0.0006966590881347656, -0.0006702542304992676, -0.0006438493728637695, -0.0006174445152282715, -0.0005910396575927734, -0.0005646347999572754, -0.0005382299423217773, -0.0005118250846862793, -0.00048542022705078125, -0.0004590153694152832, -0.00043261051177978516, -0.0004062056541442871, -0.00037980079650878906, -0.000353395938873291, -0.00032699108123779297, -0.0003005862236022949, -0.0002741813659667969, -0.00024777650833129883, -0.00022137165069580078, -0.00019496679306030273, -0.0001685619354248047, -0.00014215707778930664, -0.0001157522201538086, -8.934736251831055e-05, -6.29425048828125e-05, -3.653764724731445e-05, -1.0132789611816406e-05, 1.627206802368164e-05, 4.267692565917969e-05, 6.908178329467773e-05, 9.548664093017578e-05, 0.00012189149856567383, 0.00014829635620117188, 0.00017470121383666992, 0.00020110607147216797, 0.00022751092910766602, 0.00025391578674316406, 0.0002803206443786621, 0.00030672550201416016, 0.0003331303596496582, 0.00035953521728515625, 0.0003859400749206543, 0.00041234493255615234, 0.0004387497901916504, 0.00046515464782714844, 0.0004915595054626465, 0.0005179643630981445, 0.0005443692207336426, 0.0005707740783691406, 0.0005971789360046387, 0.0006235837936401367, 0.0006499886512756348, 0.0006763935089111328, 0.0007027983665466309, 0.0007292032241821289, 0.000755608081817627, 0.000782012939453125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 8.0, 4.0, 9.0, 5.0, 9.0, 10.0, 18.0, 28.0, 32.0, 32.0, 56.0, 86.0, 114.0, 225.0, 409.0, 1133.0, 181806.0, 861221.0, 2049.0, 519.0, 266.0, 153.0, 107.0, 62.0, 46.0, 26.0, 25.0, 17.0, 13.0, 12.0, 10.0, 6.0, 9.0, 4.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01611328125, -0.015560150146484375, -0.01500701904296875, -0.014453887939453125, -0.0139007568359375, -0.013347625732421875, -0.01279449462890625, -0.012241363525390625, -0.011688232421875, -0.011135101318359375, -0.01058197021484375, -0.010028839111328125, -0.0094757080078125, -0.008922576904296875, -0.00836944580078125, -0.007816314697265625, -0.00726318359375, -0.006710052490234375, -0.00615692138671875, -0.005603790283203125, -0.0050506591796875, -0.004497528076171875, -0.00394439697265625, -0.003391265869140625, -0.002838134765625, -0.002285003662109375, -0.00173187255859375, -0.001178741455078125, -0.0006256103515625, -7.2479248046875e-05, 0.00048065185546875, 0.001033782958984375, 0.0015869140625, 0.002140045166015625, 0.00269317626953125, 0.003246307373046875, 0.0037994384765625, 0.004352569580078125, 0.00490570068359375, 0.005458831787109375, 0.006011962890625, 0.006565093994140625, 0.00711822509765625, 0.007671356201171875, 0.0082244873046875, 0.008777618408203125, 0.00933074951171875, 0.009883880615234375, 0.01043701171875, 0.010990142822265625, 0.01154327392578125, 0.012096405029296875, 0.0126495361328125, 0.013202667236328125, 0.01375579833984375, 0.014308929443359375, 0.014862060546875, 0.015415191650390625, 0.01596832275390625, 0.016521453857421875, 0.0170745849609375, 0.017627716064453125, 0.01818084716796875, 0.018733978271484375, 0.019287109375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 48.0, 219.0, 397.0, 262.0, 62.0, 19.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0022262653801590204, -0.002165293786674738, -0.0021043221931904554, -0.0020433503668755293, -0.001982378773391247, -0.0019214071799069643, -0.0018604355864226818, -0.0017994639929383993, -0.001738492283038795, -0.0016775206895545125, -0.0016165489796549082, -0.0015555773861706257, -0.0014946057926863432, -0.0014336340827867389, -0.0013726624893024564, -0.001311690779402852, -0.0012507191859185696, -0.001189747592434287, -0.0011287758825346828, -0.0010678042890504003, -0.001006832579150796, -0.0009458609856665134, -0.000884889392182231, -0.0008239177404902875, -0.0007629460887983441, -0.0007019744371064007, -0.0006410027854144573, -0.0005800311919301748, -0.0005190595402382314, -0.000458087888546288, -0.00039711626595817506, -0.0003361446433700621, -0.00027517310809344053, -0.00021420147095341235, -0.00015322983381338418, -9.2258196673356e-05, -3.128655953332782e-05, 2.968509215861559e-05, 9.065671474672854e-05, 0.0001516283373348415, 0.0002125999890267849, 0.0002735716407187283, 0.00033454326330684125, 0.0003955148858949542, 0.0004564865375868976, 0.000517458189278841, 0.0005784297827631235, 0.0006394014344550669, 0.0007003730861470103, 0.0007613447378389537, 0.0008223163895308971, 0.0008832879830151796, 0.000944259634707123, 0.0010052312863990664, 0.001066202879883349, 0.0011271745897829533, 0.0011881461832672358, 0.0012491177767515182, 0.0013100894866511226, 0.001371061080135405, 0.0014320327900350094, 0.0014930043835192919, 0.0015539759770035744, 0.0016149475704878569, 0.0016759192803874612]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 6.0, 6.0, 9.0, 6.0, 5.0, 7.0, 4.0, 14.0, 10.0, 10.0, 18.0, 18.0, 29.0, 22.0, 18.0, 30.0, 26.0, 31.0, 40.0, 21.0, 36.0, 50.0, 45.0, 52.0, 48.0, 37.0, 47.0, 27.0, 39.0, 35.0, 35.0, 35.0, 25.0, 22.0, 25.0, 18.0, 27.0, 13.0, 7.0, 11.0, 9.0, 8.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.0003914833068847656, -0.0003781011328101158, -0.000364718958735466, -0.0003513367846608162, -0.0003379546105861664, -0.00032457243651151657, -0.00031119026243686676, -0.00029780808836221695, -0.00028442591428756714, -0.00027104374021291733, -0.0002576615661382675, -0.0002442793920636177, -0.0002308972179889679, -0.00021751504391431808, -0.00020413286983966827, -0.00019075069576501846, -0.00017736852169036865, -0.00016398634761571884, -0.00015060417354106903, -0.00013722199946641922, -0.0001238398253917694, -0.0001104576513171196, -9.707547724246979e-05, -8.369330316781998e-05, -7.031112909317017e-05, -5.6928955018520355e-05, -4.3546780943870544e-05, -3.0164606869220734e-05, -1.6782432794570923e-05, -3.400258719921112e-06, 9.981915354728699e-06, 2.336408942937851e-05, 3.674626350402832e-05, 5.012843757867813e-05, 6.351061165332794e-05, 7.689278572797775e-05, 9.027495980262756e-05, 0.00010365713387727737, 0.00011703930795192719, 0.000130421482026577, 0.0001438036561012268, 0.00015718583017587662, 0.00017056800425052643, 0.00018395017832517624, 0.00019733235239982605, 0.00021071452647447586, 0.00022409670054912567, 0.00023747887462377548, 0.0002508610486984253, 0.0002642432227730751, 0.0002776253968477249, 0.0002910075709223747, 0.00030438974499702454, 0.00031777191907167435, 0.00033115409314632416, 0.00034453626722097397, 0.0003579184412956238, 0.0003713006153702736, 0.0003846827894449234, 0.0003980649635195732, 0.000411447137594223, 0.00042482931166887283, 0.00043821148574352264, 0.00045159365981817245, 0.00046497583389282227]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 0.0, 8.0, 6.0, 13.0, 4.0, 4.0, 11.0, 13.0, 10.0, 23.0, 26.0, 23.0, 23.0, 29.0, 27.0, 35.0, 41.0, 33.0, 37.0, 36.0, 41.0, 40.0, 45.0, 38.0, 45.0, 45.0, 45.0, 35.0, 31.0, 40.0, 23.0, 19.0, 19.0, 21.0, 18.0, 16.0, 13.0, 12.0, 11.0, 7.0, 3.0, 6.0, 4.0, 2.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.658203125, -1.6042938232421875, -1.550384521484375, -1.4964752197265625, -1.44256591796875, -1.3886566162109375, -1.334747314453125, -1.2808380126953125, -1.2269287109375, -1.1730194091796875, -1.119110107421875, -1.0652008056640625, -1.01129150390625, -0.9573822021484375, -0.903472900390625, -0.8495635986328125, -0.795654296875, -0.7417449951171875, -0.687835693359375, -0.6339263916015625, -0.58001708984375, -0.5261077880859375, -0.472198486328125, -0.4182891845703125, -0.3643798828125, -0.3104705810546875, -0.256561279296875, -0.2026519775390625, -0.14874267578125, -0.0948333740234375, -0.040924072265625, 0.0129852294921875, 0.06689453125, 0.1208038330078125, 0.174713134765625, 0.2286224365234375, 0.28253173828125, 0.3364410400390625, 0.390350341796875, 0.4442596435546875, 0.4981689453125, 0.5520782470703125, 0.605987548828125, 0.6598968505859375, 0.71380615234375, 0.7677154541015625, 0.821624755859375, 0.8755340576171875, 0.929443359375, 0.9833526611328125, 1.037261962890625, 1.0911712646484375, 1.14508056640625, 1.1989898681640625, 1.252899169921875, 1.3068084716796875, 1.3607177734375, 1.4146270751953125, 1.468536376953125, 1.5224456787109375, 1.57635498046875, 1.6302642822265625, 1.684173583984375, 1.7380828857421875, 1.7919921875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 9.0, 4.0, 7.0, 10.0, 8.0, 25.0, 31.0, 43.0, 61.0, 74.0, 107.0, 191.0, 266.0, 412.0, 634.0, 1019.0, 1639.0, 3078.0, 5166.0, 9586.0, 19286.0, 44239.0, 118925.0, 316471.0, 319434.0, 121476.0, 44417.0, 19305.0, 9746.0, 5309.0, 2953.0, 1771.0, 1005.0, 634.0, 388.0, 263.0, 166.0, 123.0, 74.0, 58.0, 36.0, 32.0, 20.0, 14.0, 9.0, 8.0, 11.0, 6.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.9658203125, -1.9024200439453125, -1.839019775390625, -1.7756195068359375, -1.71221923828125, -1.6488189697265625, -1.585418701171875, -1.5220184326171875, -1.4586181640625, -1.3952178955078125, -1.331817626953125, -1.2684173583984375, -1.20501708984375, -1.1416168212890625, -1.078216552734375, -1.0148162841796875, -0.951416015625, -0.8880157470703125, -0.824615478515625, -0.7612152099609375, -0.69781494140625, -0.6344146728515625, -0.571014404296875, -0.5076141357421875, -0.4442138671875, -0.3808135986328125, -0.317413330078125, -0.2540130615234375, -0.19061279296875, -0.1272125244140625, -0.063812255859375, -0.0004119873046875, 0.06298828125, 0.1263885498046875, 0.189788818359375, 0.2531890869140625, 0.31658935546875, 0.3799896240234375, 0.443389892578125, 0.5067901611328125, 0.5701904296875, 0.6335906982421875, 0.696990966796875, 0.7603912353515625, 0.82379150390625, 0.8871917724609375, 0.950592041015625, 1.0139923095703125, 1.077392578125, 1.1407928466796875, 1.204193115234375, 1.2675933837890625, 1.33099365234375, 1.3943939208984375, 1.457794189453125, 1.5211944580078125, 1.5845947265625, 1.6479949951171875, 1.711395263671875, 1.7747955322265625, 1.83819580078125, 1.9015960693359375, 1.964996337890625, 2.0283966064453125, 2.091796875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 0.0, 5.0, 6.0, 6.0, 4.0, 10.0, 10.0, 9.0, 9.0, 16.0, 18.0, 18.0, 25.0, 39.0, 27.0, 36.0, 53.0, 53.0, 65.0, 79.0, 174.0, 1390.0, 330.0, 181.0, 81.0, 51.0, 47.0, 43.0, 44.0, 31.0, 35.0, 27.0, 24.0, 18.0, 15.0, 12.0, 11.0, 6.0, 9.0, 8.0, 6.0, 7.0, 5.0, 3.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.85546875, -6.6341552734375, -6.412841796875, -6.1915283203125, -5.97021484375, -5.7489013671875, -5.527587890625, -5.3062744140625, -5.0849609375, -4.8636474609375, -4.642333984375, -4.4210205078125, -4.19970703125, -3.9783935546875, -3.757080078125, -3.5357666015625, -3.314453125, -3.0931396484375, -2.871826171875, -2.6505126953125, -2.42919921875, -2.2078857421875, -1.986572265625, -1.7652587890625, -1.5439453125, -1.3226318359375, -1.101318359375, -0.8800048828125, -0.65869140625, -0.4373779296875, -0.216064453125, 0.0052490234375, 0.2265625, 0.4478759765625, 0.669189453125, 0.8905029296875, 1.11181640625, 1.3331298828125, 1.554443359375, 1.7757568359375, 1.9970703125, 2.2183837890625, 2.439697265625, 2.6610107421875, 2.88232421875, 3.1036376953125, 3.324951171875, 3.5462646484375, 3.767578125, 3.9888916015625, 4.210205078125, 4.4315185546875, 4.65283203125, 4.8741455078125, 5.095458984375, 5.3167724609375, 5.5380859375, 5.7593994140625, 5.980712890625, 6.2020263671875, 6.42333984375, 6.6446533203125, 6.865966796875, 7.0872802734375, 7.30859375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 5.0, 8.0, 22.0, 20.0, 30.0, 41.0, 74.0, 109.0, 157.0, 315.0, 814.0, 7764.0, 3101311.0, 33003.0, 1127.0, 367.0, 182.0, 122.0, 63.0, 56.0, 31.0, 16.0, 19.0, 16.0, 9.0, 3.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-33.59375, -32.74609375, -31.8984375, -31.05078125, -30.203125, -29.35546875, -28.5078125, -27.66015625, -26.8125, -25.96484375, -25.1171875, -24.26953125, -23.421875, -22.57421875, -21.7265625, -20.87890625, -20.03125, -19.18359375, -18.3359375, -17.48828125, -16.640625, -15.79296875, -14.9453125, -14.09765625, -13.25, -12.40234375, -11.5546875, -10.70703125, -9.859375, -9.01171875, -8.1640625, -7.31640625, -6.46875, -5.62109375, -4.7734375, -3.92578125, -3.078125, -2.23046875, -1.3828125, -0.53515625, 0.3125, 1.16015625, 2.0078125, 2.85546875, 3.703125, 4.55078125, 5.3984375, 6.24609375, 7.09375, 7.94140625, 8.7890625, 9.63671875, 10.484375, 11.33203125, 12.1796875, 13.02734375, 13.875, 14.72265625, 15.5703125, 16.41796875, 17.265625, 18.11328125, 18.9609375, 19.80859375, 20.65625]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [859.0, 155.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.426872730255127, 1.045492172241211, 5.517857074737549, 9.990222930908203, 14.462587356567383, 18.934951782226562, 23.407318115234375, 27.879682540893555, 32.352046966552734, 36.82441329956055, 41.296775817871094, 45.769142150878906, 50.24150848388672, 54.713871002197266, 59.18623733520508, 63.658599853515625, 68.13096618652344, 72.60333251953125, 77.07569885253906, 81.54806518554688, 86.02042388916016, 90.49279022216797, 94.96515655517578, 99.4375228881836, 103.90988159179688, 108.38224792480469, 112.8546142578125, 117.32698059082031, 121.7993392944336, 126.2717056274414, 130.74407958984375, 135.2164306640625, 139.6887969970703, 144.16116333007812, 148.63352966308594, 153.10589599609375, 157.57826232910156, 162.05062866210938, 166.52297973632812, 170.99534606933594, 175.46771240234375, 179.94007873535156, 184.41244506835938, 188.8848114013672, 193.357177734375, 197.82952880859375, 202.30191040039062, 206.77426147460938, 211.24664306640625, 215.71900939941406, 220.19137573242188, 224.6637420654297, 229.1361083984375, 233.60845947265625, 238.08084106445312, 242.55319213867188, 247.0255584716797, 251.4979248046875, 255.9702911376953, 260.4426574707031, 264.9150085449219, 269.38739013671875, 273.8597412109375, 278.3321228027344, 282.8044738769531]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 5.0, 13.0, 10.0, 9.0, 11.0, 16.0, 11.0, 21.0, 17.0, 19.0, 23.0, 24.0, 24.0, 26.0, 36.0, 27.0, 35.0, 40.0, 29.0, 39.0, 42.0, 39.0, 40.0, 46.0, 37.0, 32.0, 35.0, 22.0, 18.0, 38.0, 24.0, 30.0, 23.0, 27.0, 14.0, 17.0, 13.0, 8.0, 11.0, 8.0, 7.0, 8.0, 4.0, 4.0, 4.0, 5.0, 2.0, 1.0, 4.0, 3.0, 2.0, 0.0, 2.0], "bins": [-16.991905212402344, -16.486116409301758, -15.980329513549805, -15.474541664123535, -14.968753814697266, -14.46296501159668, -13.95717716217041, -13.45138931274414, -12.945601463317871, -12.439813613891602, -11.934025764465332, -11.428237915039062, -10.922449111938477, -10.416662216186523, -9.910873413085938, -9.405085563659668, -8.899297714233398, -8.393509864807129, -7.887722015380859, -7.381933689117432, -6.876145839691162, -6.370357990264893, -5.864569664001465, -5.358781814575195, -4.852993965148926, -4.347206115722656, -3.8414180278778076, -3.335629940032959, -2.8298420906066895, -2.32405424118042, -1.8182661533355713, -1.3124780654907227, -0.8066921234130859, -0.30090415477752686, 0.20488381385803223, 0.7106717824935913, 1.2164597511291504, 1.72224760055542, 2.2280356884002686, 2.733823776245117, 3.2396116256713867, 3.7453994750976562, 4.251187324523926, 4.7569756507873535, 5.262763500213623, 5.768551349639893, 6.27433967590332, 6.78012752532959, 7.285915374755859, 7.791703224182129, 8.297491073608398, 8.803278923034668, 9.309066772460938, 9.814855575561523, 10.320643424987793, 10.826431274414062, 11.332219123840332, 11.838006973266602, 12.343794822692871, 12.84958267211914, 13.355371475219727, 13.86115837097168, 14.366947174072266, 14.872735023498535, 15.378522872924805]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 6.0, 3.0, 5.0, 7.0, 9.0, 10.0, 8.0, 18.0, 8.0, 19.0, 21.0, 25.0, 19.0, 21.0, 31.0, 33.0, 26.0, 33.0, 36.0, 35.0, 34.0, 41.0, 36.0, 41.0, 34.0, 47.0, 45.0, 41.0, 41.0, 38.0, 40.0, 26.0, 27.0, 20.0, 10.0, 14.0, 14.0, 21.0, 10.0, 11.0, 5.0, 4.0, 7.0, 6.0, 6.0, 2.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.697265625, -1.640472412109375, -1.58367919921875, -1.526885986328125, -1.4700927734375, -1.413299560546875, -1.35650634765625, -1.299713134765625, -1.242919921875, -1.186126708984375, -1.12933349609375, -1.072540283203125, -1.0157470703125, -0.958953857421875, -0.90216064453125, -0.845367431640625, -0.78857421875, -0.731781005859375, -0.67498779296875, -0.618194580078125, -0.5614013671875, -0.504608154296875, -0.44781494140625, -0.391021728515625, -0.334228515625, -0.277435302734375, -0.22064208984375, -0.163848876953125, -0.1070556640625, -0.050262451171875, 0.00653076171875, 0.063323974609375, 0.1201171875, 0.176910400390625, 0.23370361328125, 0.290496826171875, 0.3472900390625, 0.404083251953125, 0.46087646484375, 0.517669677734375, 0.574462890625, 0.631256103515625, 0.68804931640625, 0.744842529296875, 0.8016357421875, 0.858428955078125, 0.91522216796875, 0.972015380859375, 1.02880859375, 1.085601806640625, 1.14239501953125, 1.199188232421875, 1.2559814453125, 1.312774658203125, 1.36956787109375, 1.426361083984375, 1.483154296875, 1.539947509765625, 1.59674072265625, 1.653533935546875, 1.7103271484375, 1.767120361328125, 1.82391357421875, 1.880706787109375, 1.9375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 2.0, 4.0, 5.0, 4.0, 6.0, 6.0, 7.0, 12.0, 8.0, 13.0, 25.0, 20.0, 24.0, 28.0, 41.0, 45.0, 40.0, 54.0, 58.0, 70.0, 112.0, 176.0, 405.0, 1579.0, 14027.0, 453125.0, 3371785.0, 338773.0, 11274.0, 1398.0, 374.0, 196.0, 140.0, 86.0, 61.0, 44.0, 32.0, 33.0, 39.0, 35.0, 29.0, 10.0, 10.0, 13.0, 17.0, 8.0, 14.0, 3.0, 7.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.1171875, -6.8756103515625, -6.634033203125, -6.3924560546875, -6.15087890625, -5.9093017578125, -5.667724609375, -5.4261474609375, -5.1845703125, -4.9429931640625, -4.701416015625, -4.4598388671875, -4.21826171875, -3.9766845703125, -3.735107421875, -3.4935302734375, -3.251953125, -3.0103759765625, -2.768798828125, -2.5272216796875, -2.28564453125, -2.0440673828125, -1.802490234375, -1.5609130859375, -1.3193359375, -1.0777587890625, -0.836181640625, -0.5946044921875, -0.35302734375, -0.1114501953125, 0.130126953125, 0.3717041015625, 0.61328125, 0.8548583984375, 1.096435546875, 1.3380126953125, 1.57958984375, 1.8211669921875, 2.062744140625, 2.3043212890625, 2.5458984375, 2.7874755859375, 3.029052734375, 3.2706298828125, 3.51220703125, 3.7537841796875, 3.995361328125, 4.2369384765625, 4.478515625, 4.7200927734375, 4.961669921875, 5.2032470703125, 5.44482421875, 5.6864013671875, 5.927978515625, 6.1695556640625, 6.4111328125, 6.6527099609375, 6.894287109375, 7.1358642578125, 7.37744140625, 7.6190185546875, 7.860595703125, 8.1021728515625, 8.34375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 12.0, 10.0, 9.0, 23.0, 32.0, 51.0, 63.0, 95.0, 127.0, 194.0, 256.0, 388.0, 441.0, 514.0, 464.0, 426.0, 303.0, 207.0, 136.0, 97.0, 70.0, 49.0, 34.0, 26.0, 17.0, 9.0, 6.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.29296875, -5.1197509765625, -4.946533203125, -4.7733154296875, -4.60009765625, -4.4268798828125, -4.253662109375, -4.0804443359375, -3.9072265625, -3.7340087890625, -3.560791015625, -3.3875732421875, -3.21435546875, -3.0411376953125, -2.867919921875, -2.6947021484375, -2.521484375, -2.3482666015625, -2.175048828125, -2.0018310546875, -1.82861328125, -1.6553955078125, -1.482177734375, -1.3089599609375, -1.1357421875, -0.9625244140625, -0.789306640625, -0.6160888671875, -0.44287109375, -0.2696533203125, -0.096435546875, 0.0767822265625, 0.25, 0.4232177734375, 0.596435546875, 0.7696533203125, 0.94287109375, 1.1160888671875, 1.289306640625, 1.4625244140625, 1.6357421875, 1.8089599609375, 1.982177734375, 2.1553955078125, 2.32861328125, 2.5018310546875, 2.675048828125, 2.8482666015625, 3.021484375, 3.1947021484375, 3.367919921875, 3.5411376953125, 3.71435546875, 3.8875732421875, 4.060791015625, 4.2340087890625, 4.4072265625, 4.5804443359375, 4.753662109375, 4.9268798828125, 5.10009765625, 5.2733154296875, 5.446533203125, 5.6197509765625, 5.79296875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 2.0, 10.0, 13.0, 22.0, 34.0, 41.0, 74.0, 99.0, 182.0, 266.0, 509.0, 1590.0, 23170.0, 2131487.0, 2012358.0, 21617.0, 1606.0, 487.0, 259.0, 149.0, 94.0, 77.0, 49.0, 23.0, 24.0, 11.0, 8.0, 10.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.4296875, -14.9473876953125, -14.465087890625, -13.9827880859375, -13.50048828125, -13.0181884765625, -12.535888671875, -12.0535888671875, -11.5712890625, -11.0889892578125, -10.606689453125, -10.1243896484375, -9.64208984375, -9.1597900390625, -8.677490234375, -8.1951904296875, -7.712890625, -7.2305908203125, -6.748291015625, -6.2659912109375, -5.78369140625, -5.3013916015625, -4.819091796875, -4.3367919921875, -3.8544921875, -3.3721923828125, -2.889892578125, -2.4075927734375, -1.92529296875, -1.4429931640625, -0.960693359375, -0.4783935546875, 0.00390625, 0.4862060546875, 0.968505859375, 1.4508056640625, 1.93310546875, 2.4154052734375, 2.897705078125, 3.3800048828125, 3.8623046875, 4.3446044921875, 4.826904296875, 5.3092041015625, 5.79150390625, 6.2738037109375, 6.756103515625, 7.2384033203125, 7.720703125, 8.2030029296875, 8.685302734375, 9.1676025390625, 9.64990234375, 10.1322021484375, 10.614501953125, 11.0968017578125, 11.5791015625, 12.0614013671875, 12.543701171875, 13.0260009765625, 13.50830078125, 13.9906005859375, 14.472900390625, 14.9552001953125, 15.4375]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 7.0, 185.0, 674.0, 148.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-193.9256134033203, -189.0108642578125, -184.09613037109375, -179.18138122558594, -174.26663208007812, -169.3518829345703, -164.4371337890625, -159.52239990234375, -154.60765075683594, -149.69290161132812, -144.77816772460938, -139.86341857910156, -134.94866943359375, -130.03392028808594, -125.11917877197266, -120.20443725585938, -115.28968811035156, -110.37493896484375, -105.46019744873047, -100.54545593261719, -95.63070678710938, -90.71595764160156, -85.80121612548828, -80.886474609375, -75.97172546386719, -71.05697631835938, -66.1422348022461, -61.22748947143555, -56.312744140625, -51.39799880981445, -46.483253479003906, -41.56850814819336, -36.65374755859375, -31.739002227783203, -26.824256896972656, -21.90951156616211, -16.994766235351562, -12.080020904541016, -7.165275573730469, -2.250530242919922, 2.664215087890625, 7.578960418701172, 12.493705749511719, 17.408451080322266, 22.323196411132812, 27.23794174194336, 32.152687072753906, 37.06743240356445, 41.982177734375, 46.89692306518555, 51.811668395996094, 56.72641372680664, 61.64115905761719, 66.555908203125, 71.47064971923828, 76.38539123535156, 81.30014038085938, 86.21488952636719, 91.12963104248047, 96.04437255859375, 100.95912170410156, 105.87387084960938, 110.78861236572266, 115.70335388183594, 120.61810302734375]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 6.0, 8.0, 6.0, 6.0, 9.0, 15.0, 15.0, 15.0, 18.0, 24.0, 25.0, 20.0, 26.0, 28.0, 36.0, 41.0, 44.0, 40.0, 51.0, 48.0, 41.0, 47.0, 36.0, 30.0, 45.0, 35.0, 34.0, 43.0, 36.0, 32.0, 22.0, 25.0, 23.0, 19.0, 7.0, 6.0, 9.0, 11.0, 6.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.537100791931152, -15.014609336853027, -14.492117881774902, -13.969627380371094, -13.447135925292969, -12.924644470214844, -12.402153015136719, -11.879661560058594, -11.357170104980469, -10.834678649902344, -10.312187194824219, -9.789695739746094, -9.267205238342285, -8.74471378326416, -8.222222328186035, -7.69973087310791, -7.177240371704102, -6.654748916625977, -6.13225793838501, -5.609766483306885, -5.087275505065918, -4.564784049987793, -4.042292594909668, -3.519801378250122, -2.997310161590576, -2.4748189449310303, -1.9523276090621948, -1.4298362731933594, -0.9073450565338135, -0.3848538398742676, 0.13763761520385742, 0.6601288318634033, 1.1826190948486328, 1.7051103115081787, 2.2276015281677246, 2.7500929832458496, 3.2725841999053955, 3.7950754165649414, 4.317566871643066, 4.840058326721191, 5.362549304962158, 5.885040760040283, 6.40753173828125, 6.930023193359375, 7.4525146484375, 7.975005626678467, 8.49749755859375, 9.019988059997559, 9.542479515075684, 10.064970970153809, 10.587462425231934, 11.109952926635742, 11.632444381713867, 12.154935836791992, 12.677427291870117, 13.199918746948242, 13.722410202026367, 14.244901657104492, 14.767393112182617, 15.289884567260742, 15.81237506866455, 16.33486557006836, 16.857357025146484, 17.37984848022461, 17.902339935302734]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 4.0, 5.0, 4.0, 0.0, 6.0, 6.0, 7.0, 8.0, 12.0, 10.0, 13.0, 13.0, 19.0, 17.0, 22.0, 19.0, 23.0, 25.0, 29.0, 30.0, 37.0, 50.0, 37.0, 38.0, 50.0, 42.0, 31.0, 39.0, 44.0, 47.0, 30.0, 39.0, 37.0, 19.0, 27.0, 24.0, 26.0, 21.0, 16.0, 16.0, 13.0, 10.0, 6.0, 8.0, 2.0, 3.0, 6.0, 3.0, 3.0, 3.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.654296875, -1.596221923828125, -1.53814697265625, -1.480072021484375, -1.4219970703125, -1.363922119140625, -1.30584716796875, -1.247772216796875, -1.189697265625, -1.131622314453125, -1.07354736328125, -1.015472412109375, -0.9573974609375, -0.899322509765625, -0.84124755859375, -0.783172607421875, -0.72509765625, -0.667022705078125, -0.60894775390625, -0.550872802734375, -0.4927978515625, -0.434722900390625, -0.37664794921875, -0.318572998046875, -0.260498046875, -0.202423095703125, -0.14434814453125, -0.086273193359375, -0.0281982421875, 0.029876708984375, 0.08795166015625, 0.146026611328125, 0.2041015625, 0.262176513671875, 0.32025146484375, 0.378326416015625, 0.4364013671875, 0.494476318359375, 0.55255126953125, 0.610626220703125, 0.668701171875, 0.726776123046875, 0.78485107421875, 0.842926025390625, 0.9010009765625, 0.959075927734375, 1.01715087890625, 1.075225830078125, 1.13330078125, 1.191375732421875, 1.24945068359375, 1.307525634765625, 1.3656005859375, 1.423675537109375, 1.48175048828125, 1.539825439453125, 1.597900390625, 1.655975341796875, 1.71405029296875, 1.772125244140625, 1.8302001953125, 1.888275146484375, 1.94635009765625, 2.004425048828125, 2.0625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 3.0, 8.0, 4.0, 8.0, 12.0, 17.0, 43.0, 54.0, 62.0, 106.0, 164.0, 245.0, 329.0, 528.0, 795.0, 1192.0, 1809.0, 2693.0, 4110.0, 6046.0, 9370.0, 14634.0, 23034.0, 38353.0, 65895.0, 115754.0, 205618.0, 228907.0, 135649.0, 75413.0, 43918.0, 26431.0, 16602.0, 10506.0, 6838.0, 4444.0, 2986.0, 2001.0, 1329.0, 851.0, 583.0, 388.0, 292.0, 184.0, 137.0, 70.0, 43.0, 35.0, 27.0, 13.0, 15.0, 6.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.236083984375, -0.22824859619140625, -0.2204132080078125, -0.21257781982421875, -0.204742431640625, -0.19690704345703125, -0.1890716552734375, -0.18123626708984375, -0.17340087890625, -0.16556549072265625, -0.1577301025390625, -0.14989471435546875, -0.142059326171875, -0.13422393798828125, -0.1263885498046875, -0.11855316162109375, -0.1107177734375, -0.10288238525390625, -0.0950469970703125, -0.08721160888671875, -0.079376220703125, -0.07154083251953125, -0.0637054443359375, -0.05587005615234375, -0.04803466796875, -0.04019927978515625, -0.0323638916015625, -0.02452850341796875, -0.016693115234375, -0.00885772705078125, -0.0010223388671875, 0.00681304931640625, 0.0146484375, 0.02248382568359375, 0.0303192138671875, 0.03815460205078125, 0.045989990234375, 0.05382537841796875, 0.0616607666015625, 0.06949615478515625, 0.07733154296875, 0.08516693115234375, 0.0930023193359375, 0.10083770751953125, 0.108673095703125, 0.11650848388671875, 0.1243438720703125, 0.13217926025390625, 0.1400146484375, 0.14785003662109375, 0.1556854248046875, 0.16352081298828125, 0.171356201171875, 0.17919158935546875, 0.1870269775390625, 0.19486236572265625, 0.20269775390625, 0.21053314208984375, 0.2183685302734375, 0.22620391845703125, 0.234039306640625, 0.24187469482421875, 0.2497100830078125, 0.25754547119140625, 0.265380859375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 7.0, 5.0, 6.0, 7.0, 4.0, 8.0, 7.0, 23.0, 16.0, 18.0, 11.0, 21.0, 23.0, 25.0, 32.0, 26.0, 24.0, 52.0, 27.0, 38.0, 47.0, 38.0, 1077.0, 46.0, 37.0, 38.0, 41.0, 28.0, 29.0, 28.0, 33.0, 22.0, 25.0, 16.0, 10.0, 18.0, 17.0, 22.0, 19.0, 12.0, 14.0, 11.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-1.19921875, -1.1625823974609375, -1.125946044921875, -1.0893096923828125, -1.05267333984375, -1.0160369873046875, -0.979400634765625, -0.9427642822265625, -0.9061279296875, -0.8694915771484375, -0.832855224609375, -0.7962188720703125, -0.75958251953125, -0.7229461669921875, -0.686309814453125, -0.6496734619140625, -0.613037109375, -0.5764007568359375, -0.539764404296875, -0.5031280517578125, -0.46649169921875, -0.4298553466796875, -0.393218994140625, -0.3565826416015625, -0.3199462890625, -0.2833099365234375, -0.246673583984375, -0.2100372314453125, -0.17340087890625, -0.1367645263671875, -0.100128173828125, -0.0634918212890625, -0.02685546875, 0.0097808837890625, 0.046417236328125, 0.0830535888671875, 0.11968994140625, 0.1563262939453125, 0.192962646484375, 0.2295989990234375, 0.2662353515625, 0.3028717041015625, 0.339508056640625, 0.3761444091796875, 0.41278076171875, 0.4494171142578125, 0.486053466796875, 0.5226898193359375, 0.559326171875, 0.5959625244140625, 0.632598876953125, 0.6692352294921875, 0.70587158203125, 0.7425079345703125, 0.779144287109375, 0.8157806396484375, 0.8524169921875, 0.8890533447265625, 0.925689697265625, 0.9623260498046875, 0.99896240234375, 1.0355987548828125, 1.072235107421875, 1.1088714599609375, 1.1455078125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 7.0, 6.0, 9.0, 6.0, 8.0, 17.0, 30.0, 49.0, 62.0, 86.0, 166.0, 188.0, 310.0, 452.0, 657.0, 925.0, 1395.0, 2117.0, 3123.0, 4918.0, 7487.0, 12000.0, 19623.0, 32488.0, 56605.0, 101934.0, 185783.0, 1290428.0, 161598.0, 88096.0, 49161.0, 28970.0, 17335.0, 11016.0, 7035.0, 4480.0, 2894.0, 1869.0, 1218.0, 864.0, 555.0, 349.0, 259.0, 187.0, 90.0, 102.0, 59.0, 37.0, 24.0, 21.0, 16.0, 10.0, 6.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1943359375, -0.1881427764892578, -0.18194961547851562, -0.17575645446777344, -0.16956329345703125, -0.16337013244628906, -0.15717697143554688, -0.1509838104248047, -0.1447906494140625, -0.1385974884033203, -0.13240432739257812, -0.12621116638183594, -0.12001800537109375, -0.11382484436035156, -0.10763168334960938, -0.10143852233886719, -0.095245361328125, -0.08905220031738281, -0.08285903930664062, -0.07666587829589844, -0.07047271728515625, -0.06427955627441406, -0.058086395263671875, -0.05189323425292969, -0.0457000732421875, -0.03950691223144531, -0.033313751220703125, -0.027120590209960938, -0.02092742919921875, -0.014734268188476562, -0.008541107177734375, -0.0023479461669921875, 0.00384521484375, 0.010038375854492188, 0.016231536865234375, 0.022424697875976562, 0.02861785888671875, 0.03481101989746094, 0.041004180908203125, 0.04719734191894531, 0.0533905029296875, 0.05958366394042969, 0.06577682495117188, 0.07196998596191406, 0.07816314697265625, 0.08435630798339844, 0.09054946899414062, 0.09674263000488281, 0.102935791015625, 0.10912895202636719, 0.11532211303710938, 0.12151527404785156, 0.12770843505859375, 0.13390159606933594, 0.14009475708007812, 0.1462879180908203, 0.1524810791015625, 0.1586742401123047, 0.16486740112304688, 0.17106056213378906, 0.17725372314453125, 0.18344688415527344, 0.18964004516601562, 0.1958332061767578, 0.2020263671875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 5.0, 5.0, 5.0, 8.0, 13.0, 9.0, 16.0, 22.0, 18.0, 15.0, 27.0, 39.0, 49.0, 48.0, 54.0, 68.0, 55.0, 71.0, 64.0, 61.0, 49.0, 58.0, 51.0, 41.0, 21.0, 20.0, 20.0, 12.0, 20.0, 11.0, 13.0, 5.0, 3.0, 5.0, 5.0, 3.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009546279907226562, -0.0009261369705200195, -0.0008976459503173828, -0.0008691549301147461, -0.0008406639099121094, -0.0008121728897094727, -0.0007836818695068359, -0.0007551908493041992, -0.0007266998291015625, -0.0006982088088989258, -0.0006697177886962891, -0.0006412267684936523, -0.0006127357482910156, -0.0005842447280883789, -0.0005557537078857422, -0.0005272626876831055, -0.0004987716674804688, -0.00047028064727783203, -0.0004417896270751953, -0.0004132986068725586, -0.0003848075866699219, -0.00035631656646728516, -0.00032782554626464844, -0.0002993345260620117, -0.000270843505859375, -0.00024235248565673828, -0.00021386146545410156, -0.00018537044525146484, -0.00015687942504882812, -0.0001283884048461914, -9.989738464355469e-05, -7.140636444091797e-05, -4.291534423828125e-05, -1.4424324035644531e-05, 1.4066696166992188e-05, 4.2557716369628906e-05, 7.104873657226562e-05, 9.953975677490234e-05, 0.00012803077697753906, 0.00015652179718017578, 0.0001850128173828125, 0.00021350383758544922, 0.00024199485778808594, 0.00027048587799072266, 0.0002989768981933594, 0.0003274679183959961, 0.0003559589385986328, 0.00038444995880126953, 0.00041294097900390625, 0.00044143199920654297, 0.0004699230194091797, 0.0004984140396118164, 0.0005269050598144531, 0.0005553960800170898, 0.0005838871002197266, 0.0006123781204223633, 0.000640869140625, 0.0006693601608276367, 0.0006978511810302734, 0.0007263422012329102, 0.0007548332214355469, 0.0007833242416381836, 0.0008118152618408203, 0.000840306282043457, 0.0008687973022460938]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 7.0, 4.0, 3.0, 5.0, 12.0, 12.0, 15.0, 16.0, 31.0, 30.0, 46.0, 72.0, 121.0, 177.0, 384.0, 917.0, 44090.0, 997996.0, 3301.0, 554.0, 292.0, 157.0, 93.0, 56.0, 38.0, 18.0, 26.0, 15.0, 15.0, 18.0, 4.0, 8.0, 10.0, 4.0, 1.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0197601318359375, -0.019107580184936523, -0.018455028533935547, -0.01780247688293457, -0.017149925231933594, -0.016497373580932617, -0.01584482192993164, -0.015192270278930664, -0.014539718627929688, -0.013887166976928711, -0.013234615325927734, -0.012582063674926758, -0.011929512023925781, -0.011276960372924805, -0.010624408721923828, -0.009971857070922852, -0.009319305419921875, -0.008666753768920898, -0.008014202117919922, -0.007361650466918945, -0.006709098815917969, -0.006056547164916992, -0.005403995513916016, -0.004751443862915039, -0.0040988922119140625, -0.003446340560913086, -0.0027937889099121094, -0.002141237258911133, -0.0014886856079101562, -0.0008361339569091797, -0.00018358230590820312, 0.00046896934509277344, 0.00112152099609375, 0.0017740726470947266, 0.002426624298095703, 0.0030791759490966797, 0.0037317276000976562, 0.004384279251098633, 0.005036830902099609, 0.005689382553100586, 0.0063419342041015625, 0.006994485855102539, 0.007647037506103516, 0.008299589157104492, 0.008952140808105469, 0.009604692459106445, 0.010257244110107422, 0.010909795761108398, 0.011562347412109375, 0.012214899063110352, 0.012867450714111328, 0.013520002365112305, 0.014172554016113281, 0.014825105667114258, 0.015477657318115234, 0.01613020896911621, 0.016782760620117188, 0.017435312271118164, 0.01808786392211914, 0.018740415573120117, 0.019392967224121094, 0.02004551887512207, 0.020698070526123047, 0.021350622177124023, 0.022003173828125]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 10.0, 72.0, 304.0, 390.0, 195.0, 38.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00043118110625073314, -0.00036270642885938287, -0.00029423178057186306, -0.00022575711773242801, -0.00015728245489299297, -8.88077775016427e-05, -2.033312921412289e-05, 4.814151907339692e-05, 0.00011661619646474719, 0.00018509085930418223, 0.00025356552214361727, 0.0003220401704311371, 0.00039051484782248735, 0.0004589895252138376, 0.0005274642026051879, 0.0005959388217888772, 0.0006644134991802275, 0.0007328881765715778, 0.0008013627957552671, 0.0008698374731466174, 0.0009383121505379677, 0.001006786827929318, 0.0010752615053206682, 0.0011437360662966967, 0.0012122108601033688, 0.001280685537494719, 0.0013491602148860693, 0.0014176348922774196, 0.0014861095696687698, 0.0015545841306447983, 0.0016230588080361485, 0.0016915334854274988, 0.001760008279234171, 0.0018284829566255212, 0.0018969576340168715, 0.0019654321949929, 0.002033906988799572, 0.0021023815497756004, 0.0021708563435822725, 0.002239330904558301, 0.002307805698364973, 0.0023762802593410015, 0.0024447550531476736, 0.002513229614123702, 0.002581704407930374, 0.0026501789689064026, 0.0027186537627130747, 0.002787128323689103, 0.0028556028846651316, 0.00292407744564116, 0.002992552239447832, 0.0030610268004238605, 0.0031295015942305326, 0.003197976155206561, 0.003266450949013233, 0.0033349255099892616, 0.00340340007096529, 0.0034718746319413185, 0.0035403494257479906, 0.003608823986724019, 0.003677298780530691, 0.0037457733415067196, 0.0038142481353133917, 0.00388272269628942, 0.003951197490096092]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 10.0, 8.0, 8.0, 10.0, 13.0, 11.0, 17.0, 16.0, 19.0, 30.0, 25.0, 29.0, 18.0, 35.0, 36.0, 30.0, 40.0, 49.0, 43.0, 37.0, 48.0, 40.0, 51.0, 43.0, 39.0, 34.0, 42.0, 28.0, 28.0, 37.0, 22.0, 9.0, 14.0, 16.0, 17.0, 10.0, 3.0, 9.0, 7.0, 5.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004521012306213379, -0.0004372112452983856, -0.00042232125997543335, -0.0004074312746524811, -0.0003925412893295288, -0.00037765130400657654, -0.00036276131868362427, -0.000347871333360672, -0.0003329813480377197, -0.00031809136271476746, -0.0003032013773918152, -0.0002883113920688629, -0.00027342140674591064, -0.0002585314214229584, -0.0002436414361000061, -0.00022875145077705383, -0.00021386146545410156, -0.0001989714801311493, -0.00018408149480819702, -0.00016919150948524475, -0.00015430152416229248, -0.0001394115388393402, -0.00012452155351638794, -0.00010963156819343567, -9.47415828704834e-05, -7.985159754753113e-05, -6.496161222457886e-05, -5.007162690162659e-05, -3.5181641578674316e-05, -2.0291656255722046e-05, -5.401670932769775e-06, 9.488314390182495e-06, 2.4378299713134766e-05, 3.9268285036087036e-05, 5.415827035903931e-05, 6.904825568199158e-05, 8.393824100494385e-05, 9.882822632789612e-05, 0.00011371821165084839, 0.00012860819697380066, 0.00014349818229675293, 0.0001583881676197052, 0.00017327815294265747, 0.00018816813826560974, 0.000203058123588562, 0.00021794810891151428, 0.00023283809423446655, 0.0002477280795574188, 0.0002626180648803711, 0.00027750805020332336, 0.00029239803552627563, 0.0003072880208492279, 0.0003221780061721802, 0.00033706799149513245, 0.0003519579768180847, 0.000366847962141037, 0.00038173794746398926, 0.00039662793278694153, 0.0004115179181098938, 0.00042640790343284607, 0.00044129788875579834, 0.0004561878740787506, 0.0004710778594017029, 0.00048596784472465515, 0.0005008578300476074]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 4.0, 5.0, 4.0, 0.0, 6.0, 6.0, 7.0, 8.0, 12.0, 10.0, 13.0, 13.0, 19.0, 17.0, 22.0, 19.0, 23.0, 25.0, 29.0, 30.0, 37.0, 50.0, 37.0, 38.0, 50.0, 42.0, 31.0, 39.0, 44.0, 47.0, 30.0, 39.0, 36.0, 20.0, 27.0, 24.0, 26.0, 21.0, 16.0, 16.0, 13.0, 10.0, 6.0, 8.0, 2.0, 3.0, 6.0, 3.0, 3.0, 3.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.654296875, -1.596221923828125, -1.53814697265625, -1.480072021484375, -1.4219970703125, -1.363922119140625, -1.30584716796875, -1.247772216796875, -1.189697265625, -1.131622314453125, -1.07354736328125, -1.015472412109375, -0.9573974609375, -0.899322509765625, -0.84124755859375, -0.783172607421875, -0.72509765625, -0.667022705078125, -0.60894775390625, -0.550872802734375, -0.4927978515625, -0.434722900390625, -0.37664794921875, -0.318572998046875, -0.260498046875, -0.202423095703125, -0.14434814453125, -0.086273193359375, -0.0281982421875, 0.029876708984375, 0.08795166015625, 0.146026611328125, 0.2041015625, 0.262176513671875, 0.32025146484375, 0.378326416015625, 0.4364013671875, 0.494476318359375, 0.55255126953125, 0.610626220703125, 0.668701171875, 0.726776123046875, 0.78485107421875, 0.842926025390625, 0.9010009765625, 0.959075927734375, 1.01715087890625, 1.075225830078125, 1.13330078125, 1.191375732421875, 1.24945068359375, 1.307525634765625, 1.3656005859375, 1.423675537109375, 1.48175048828125, 1.539825439453125, 1.597900390625, 1.655975341796875, 1.71405029296875, 1.772125244140625, 1.8302001953125, 1.888275146484375, 1.94635009765625, 2.004425048828125, 2.0625]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 5.0, 4.0, 5.0, 9.0, 6.0, 6.0, 14.0, 15.0, 22.0, 26.0, 45.0, 73.0, 100.0, 197.0, 312.0, 514.0, 996.0, 1812.0, 3534.0, 6667.0, 12217.0, 22818.0, 43328.0, 90691.0, 219645.0, 325898.0, 170288.0, 72083.0, 35679.0, 19255.0, 10399.0, 5458.0, 2883.0, 1521.0, 811.0, 477.0, 246.0, 160.0, 108.0, 52.0, 52.0, 31.0, 21.0, 20.0, 12.0, 15.0, 8.0, 3.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0], "bins": [-1.779296875, -1.7259521484375, -1.672607421875, -1.6192626953125, -1.56591796875, -1.5125732421875, -1.459228515625, -1.4058837890625, -1.3525390625, -1.2991943359375, -1.245849609375, -1.1925048828125, -1.13916015625, -1.0858154296875, -1.032470703125, -0.9791259765625, -0.92578125, -0.8724365234375, -0.819091796875, -0.7657470703125, -0.71240234375, -0.6590576171875, -0.605712890625, -0.5523681640625, -0.4990234375, -0.4456787109375, -0.392333984375, -0.3389892578125, -0.28564453125, -0.2322998046875, -0.178955078125, -0.1256103515625, -0.072265625, -0.0189208984375, 0.034423828125, 0.0877685546875, 0.14111328125, 0.1944580078125, 0.247802734375, 0.3011474609375, 0.3544921875, 0.4078369140625, 0.461181640625, 0.5145263671875, 0.56787109375, 0.6212158203125, 0.674560546875, 0.7279052734375, 0.78125, 0.8345947265625, 0.887939453125, 0.9412841796875, 0.99462890625, 1.0479736328125, 1.101318359375, 1.1546630859375, 1.2080078125, 1.2613525390625, 1.314697265625, 1.3680419921875, 1.42138671875, 1.4747314453125, 1.528076171875, 1.5814208984375, 1.634765625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 3.0, 5.0, 7.0, 5.0, 9.0, 9.0, 14.0, 14.0, 14.0, 10.0, 18.0, 19.0, 32.0, 31.0, 34.0, 40.0, 24.0, 44.0, 45.0, 69.0, 96.0, 195.0, 1428.0, 273.0, 144.0, 73.0, 59.0, 41.0, 27.0, 28.0, 24.0, 31.0, 25.0, 21.0, 28.0, 18.0, 18.0, 13.0, 11.0, 5.0, 12.0, 7.0, 6.0, 5.0, 8.0, 3.0, 1.0, 0.0, 4.0, 4.0, 0.0, 3.0, 1.0], "bins": [-7.39453125, -7.1751708984375, -6.955810546875, -6.7364501953125, -6.51708984375, -6.2977294921875, -6.078369140625, -5.8590087890625, -5.6396484375, -5.4202880859375, -5.200927734375, -4.9815673828125, -4.76220703125, -4.5428466796875, -4.323486328125, -4.1041259765625, -3.884765625, -3.6654052734375, -3.446044921875, -3.2266845703125, -3.00732421875, -2.7879638671875, -2.568603515625, -2.3492431640625, -2.1298828125, -1.9105224609375, -1.691162109375, -1.4718017578125, -1.25244140625, -1.0330810546875, -0.813720703125, -0.5943603515625, -0.375, -0.1556396484375, 0.063720703125, 0.2830810546875, 0.50244140625, 0.7218017578125, 0.941162109375, 1.1605224609375, 1.3798828125, 1.5992431640625, 1.818603515625, 2.0379638671875, 2.25732421875, 2.4766845703125, 2.696044921875, 2.9154052734375, 3.134765625, 3.3541259765625, 3.573486328125, 3.7928466796875, 4.01220703125, 4.2315673828125, 4.450927734375, 4.6702880859375, 4.8896484375, 5.1090087890625, 5.328369140625, 5.5477294921875, 5.76708984375, 5.9864501953125, 6.205810546875, 6.4251708984375, 6.64453125]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 2.0, 15.0, 18.0, 20.0, 27.0, 31.0, 55.0, 83.0, 146.0, 211.0, 370.0, 979.0, 14682.0, 3114621.0, 12549.0, 922.0, 352.0, 208.0, 103.0, 80.0, 62.0, 29.0, 26.0, 23.0, 16.0, 11.0, 10.0, 10.0, 4.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.609375, -27.6708984375, -26.732421875, -25.7939453125, -24.85546875, -23.9169921875, -22.978515625, -22.0400390625, -21.1015625, -20.1630859375, -19.224609375, -18.2861328125, -17.34765625, -16.4091796875, -15.470703125, -14.5322265625, -13.59375, -12.6552734375, -11.716796875, -10.7783203125, -9.83984375, -8.9013671875, -7.962890625, -7.0244140625, -6.0859375, -5.1474609375, -4.208984375, -3.2705078125, -2.33203125, -1.3935546875, -0.455078125, 0.4833984375, 1.421875, 2.3603515625, 3.298828125, 4.2373046875, 5.17578125, 6.1142578125, 7.052734375, 7.9912109375, 8.9296875, 9.8681640625, 10.806640625, 11.7451171875, 12.68359375, 13.6220703125, 14.560546875, 15.4990234375, 16.4375, 17.3759765625, 18.314453125, 19.2529296875, 20.19140625, 21.1298828125, 22.068359375, 23.0068359375, 23.9453125, 24.8837890625, 25.822265625, 26.7607421875, 27.69921875, 28.6376953125, 29.576171875, 30.5146484375, 31.453125]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 96.0, 681.0, 233.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.49155330657959, -13.164342880249023, -10.83713150024414, -8.509920120239258, -6.182709693908691, -3.8554983139038086, -1.5282878875732422, 0.7989225387573242, 3.126133918762207, 5.453344821929932, 7.780555725097656, 10.107767105102539, 12.434977531433105, 14.762188911437988, 17.089399337768555, 19.416610717773438, 21.743820190429688, 24.07103157043457, 26.398242950439453, 28.725452423095703, 31.052663803100586, 33.37987518310547, 35.70708465576172, 38.03429412841797, 40.361507415771484, 42.688716888427734, 45.01593017578125, 47.3431396484375, 49.67034912109375, 51.997562408447266, 54.324771881103516, 56.65198516845703, 58.97920227050781, 61.30641174316406, 63.63362503051758, 65.9608383178711, 68.28804779052734, 70.6152572631836, 72.94246673583984, 75.2696762084961, 77.59689331054688, 79.92410278320312, 82.25131225585938, 84.57852935791016, 86.9057388305664, 89.23294830322266, 91.5601577758789, 93.88736724853516, 96.2145767211914, 98.54178619384766, 100.8689956665039, 103.19621276855469, 105.52342224121094, 107.85063171386719, 110.17784118652344, 112.50505065917969, 114.83226013183594, 117.15946960449219, 119.48667907714844, 121.81389617919922, 124.14110565185547, 126.46831512451172, 128.7955322265625, 131.12274169921875, 133.449951171875]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 6.0, 6.0, 9.0, 12.0, 15.0, 9.0, 22.0, 17.0, 19.0, 16.0, 18.0, 27.0, 26.0, 27.0, 33.0, 37.0, 37.0, 33.0, 31.0, 50.0, 26.0, 37.0, 35.0, 38.0, 32.0, 33.0, 32.0, 28.0, 23.0, 27.0, 36.0, 34.0, 24.0, 18.0, 25.0, 22.0, 16.0, 15.0, 9.0, 7.0, 7.0, 7.0, 7.0, 3.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0], "bins": [-21.65027618408203, -21.046649932861328, -20.443025588989258, -19.839399337768555, -19.235774993896484, -18.63214874267578, -18.02852439880371, -17.424898147583008, -16.821273803710938, -16.217647552490234, -15.614023208618164, -15.010397911071777, -14.40677261352539, -13.803146362304688, -13.1995210647583, -12.595895767211914, -11.992269515991211, -11.388644218444824, -10.785018920898438, -10.18139362335205, -9.577768325805664, -8.974142074584961, -8.370516777038574, -7.7668914794921875, -7.163266181945801, -6.559640884399414, -5.956015586853027, -5.352389812469482, -4.748764514923096, -4.145139217376709, -3.541513681411743, -2.9378881454467773, -2.3342628479003906, -1.7306374311447144, -1.127012014389038, -0.5233865976333618, 0.08023881912231445, 0.6838641166687012, 1.287489652633667, 1.8911151885986328, 2.4947404861450195, 3.0983657836914062, 3.701991319656372, 4.305616855621338, 4.909242153167725, 5.512867450714111, 6.116493225097656, 6.720118522644043, 7.32374382019043, 7.927369117736816, 8.530994415283203, 9.13461971282959, 9.738245010375977, 10.34187126159668, 10.945496559143066, 11.549121856689453, 12.15274715423584, 12.756372451782227, 13.359997749328613, 13.963623046875, 14.567249298095703, 15.170873641967773, 15.774499893188477, 16.378124237060547, 16.98175048828125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 2.0, 5.0, 8.0, 7.0, 7.0, 5.0, 12.0, 15.0, 12.0, 14.0, 19.0, 32.0, 19.0, 27.0, 27.0, 37.0, 23.0, 31.0, 41.0, 47.0, 39.0, 38.0, 53.0, 49.0, 36.0, 39.0, 27.0, 44.0, 50.0, 29.0, 29.0, 19.0, 26.0, 19.0, 14.0, 17.0, 12.0, 11.0, 15.0, 6.0, 5.0, 4.0, 4.0, 2.0, 8.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.9814453125, -1.9159698486328125, -1.850494384765625, -1.7850189208984375, -1.71954345703125, -1.6540679931640625, -1.588592529296875, -1.5231170654296875, -1.4576416015625, -1.3921661376953125, -1.326690673828125, -1.2612152099609375, -1.19573974609375, -1.1302642822265625, -1.064788818359375, -0.9993133544921875, -0.933837890625, -0.8683624267578125, -0.802886962890625, -0.7374114990234375, -0.67193603515625, -0.6064605712890625, -0.540985107421875, -0.4755096435546875, -0.4100341796875, -0.3445587158203125, -0.279083251953125, -0.2136077880859375, -0.14813232421875, -0.0826568603515625, -0.017181396484375, 0.0482940673828125, 0.11376953125, 0.1792449951171875, 0.244720458984375, 0.3101959228515625, 0.37567138671875, 0.4411468505859375, 0.506622314453125, 0.5720977783203125, 0.6375732421875, 0.7030487060546875, 0.768524169921875, 0.8339996337890625, 0.89947509765625, 0.9649505615234375, 1.030426025390625, 1.0959014892578125, 1.161376953125, 1.2268524169921875, 1.292327880859375, 1.3578033447265625, 1.42327880859375, 1.4887542724609375, 1.554229736328125, 1.6197052001953125, 1.6851806640625, 1.7506561279296875, 1.816131591796875, 1.8816070556640625, 1.94708251953125, 2.0125579833984375, 2.078033447265625, 2.1435089111328125, 2.208984375]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 2.0, 7.0, 12.0, 8.0, 12.0, 9.0, 15.0, 23.0, 26.0, 53.0, 64.0, 103.0, 179.0, 304.0, 768.0, 2298.0, 10786.0, 75396.0, 616280.0, 2169328.0, 1132248.0, 159843.0, 20477.0, 3820.0, 1115.0, 445.0, 228.0, 136.0, 88.0, 64.0, 35.0, 29.0, 17.0, 5.0, 9.0, 9.0, 14.0, 4.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.3828125, -4.24444580078125, -4.1060791015625, -3.96771240234375, -3.829345703125, -3.69097900390625, -3.5526123046875, -3.41424560546875, -3.27587890625, -3.13751220703125, -2.9991455078125, -2.86077880859375, -2.722412109375, -2.58404541015625, -2.4456787109375, -2.30731201171875, -2.1689453125, -2.03057861328125, -1.8922119140625, -1.75384521484375, -1.615478515625, -1.47711181640625, -1.3387451171875, -1.20037841796875, -1.06201171875, -0.92364501953125, -0.7852783203125, -0.64691162109375, -0.508544921875, -0.37017822265625, -0.2318115234375, -0.09344482421875, 0.044921875, 0.18328857421875, 0.3216552734375, 0.46002197265625, 0.598388671875, 0.73675537109375, 0.8751220703125, 1.01348876953125, 1.15185546875, 1.29022216796875, 1.4285888671875, 1.56695556640625, 1.705322265625, 1.84368896484375, 1.9820556640625, 2.12042236328125, 2.2587890625, 2.39715576171875, 2.5355224609375, 2.67388916015625, 2.812255859375, 2.95062255859375, 3.0889892578125, 3.22735595703125, 3.36572265625, 3.50408935546875, 3.6424560546875, 3.78082275390625, 3.919189453125, 4.05755615234375, 4.1959228515625, 4.33428955078125, 4.47265625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 7.0, 8.0, 10.0, 22.0, 31.0, 56.0, 69.0, 97.0, 172.0, 216.0, 281.0, 384.0, 461.0, 486.0, 459.0, 379.0, 304.0, 195.0, 129.0, 98.0, 73.0, 40.0, 28.0, 12.0, 23.0, 12.0, 7.0, 6.0, 0.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.51171875, -5.32403564453125, -5.1363525390625, -4.94866943359375, -4.760986328125, -4.57330322265625, -4.3856201171875, -4.19793701171875, -4.01025390625, -3.82257080078125, -3.6348876953125, -3.44720458984375, -3.259521484375, -3.07183837890625, -2.8841552734375, -2.69647216796875, -2.5087890625, -2.32110595703125, -2.1334228515625, -1.94573974609375, -1.758056640625, -1.57037353515625, -1.3826904296875, -1.19500732421875, -1.00732421875, -0.81964111328125, -0.6319580078125, -0.44427490234375, -0.256591796875, -0.06890869140625, 0.1187744140625, 0.30645751953125, 0.494140625, 0.68182373046875, 0.8695068359375, 1.05718994140625, 1.244873046875, 1.43255615234375, 1.6202392578125, 1.80792236328125, 1.99560546875, 2.18328857421875, 2.3709716796875, 2.55865478515625, 2.746337890625, 2.93402099609375, 3.1217041015625, 3.30938720703125, 3.4970703125, 3.68475341796875, 3.8724365234375, 4.06011962890625, 4.247802734375, 4.43548583984375, 4.6231689453125, 4.81085205078125, 4.99853515625, 5.18621826171875, 5.3739013671875, 5.56158447265625, 5.749267578125, 5.93695068359375, 6.1246337890625, 6.31231689453125, 6.5]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 8.0, 4.0, 6.0, 9.0, 12.0, 11.0, 25.0, 40.0, 47.0, 92.0, 115.0, 188.0, 266.0, 558.0, 1612.0, 12970.0, 397612.0, 3414644.0, 351602.0, 11605.0, 1512.0, 509.0, 295.0, 180.0, 115.0, 81.0, 74.0, 34.0, 15.0, 16.0, 16.0, 9.0, 5.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0859375, -11.7249755859375, -11.364013671875, -11.0030517578125, -10.64208984375, -10.2811279296875, -9.920166015625, -9.5592041015625, -9.1982421875, -8.8372802734375, -8.476318359375, -8.1153564453125, -7.75439453125, -7.3934326171875, -7.032470703125, -6.6715087890625, -6.310546875, -5.9495849609375, -5.588623046875, -5.2276611328125, -4.86669921875, -4.5057373046875, -4.144775390625, -3.7838134765625, -3.4228515625, -3.0618896484375, -2.700927734375, -2.3399658203125, -1.97900390625, -1.6180419921875, -1.257080078125, -0.8961181640625, -0.53515625, -0.1741943359375, 0.186767578125, 0.5477294921875, 0.90869140625, 1.2696533203125, 1.630615234375, 1.9915771484375, 2.3525390625, 2.7135009765625, 3.074462890625, 3.4354248046875, 3.79638671875, 4.1573486328125, 4.518310546875, 4.8792724609375, 5.240234375, 5.6011962890625, 5.962158203125, 6.3231201171875, 6.68408203125, 7.0450439453125, 7.406005859375, 7.7669677734375, 8.1279296875, 8.4888916015625, 8.849853515625, 9.2108154296875, 9.57177734375, 9.9327392578125, 10.293701171875, 10.6546630859375, 11.015625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 12.0, 24.0, 58.0, 107.0, 172.0, 194.0, 185.0, 127.0, 77.0, 35.0, 14.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.13328552246094, -35.83259582519531, -34.53190231323242, -33.2312126159668, -31.93052101135254, -30.62982940673828, -29.329137802124023, -28.028446197509766, -26.72775650024414, -25.427064895629883, -24.126373291015625, -22.82568359375, -21.524991989135742, -20.224300384521484, -18.923608779907227, -17.62291717529297, -16.32222557067871, -15.021533966064453, -13.720843315124512, -12.420151710510254, -11.119461059570312, -9.818769454956055, -8.518077850341797, -7.2173871994018555, -5.916695594787598, -4.616004467010498, -3.3153131008148193, -2.0146217346191406, -0.713930606842041, 0.5867605209350586, 1.8874521255493164, 3.188142776489258, 4.488834381103516, 5.789525508880615, 7.090216636657715, 8.390908241271973, 9.691598892211914, 10.992290496826172, 12.29298210144043, 13.593672752380371, 14.894364356994629, 16.19505500793457, 17.495746612548828, 18.796438217163086, 20.097129821777344, 21.39781951904297, 22.69851303100586, 23.999202728271484, 25.299894332885742, 26.6005859375, 27.901277542114258, 29.201969146728516, 30.50265884399414, 31.8033504486084, 33.104042053222656, 34.40473175048828, 35.70542526245117, 37.0061149597168, 38.30680847167969, 39.60749816894531, 40.9081916809082, 42.20888137817383, 43.50957489013672, 44.810264587402344, 46.11095428466797]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 4.0, 3.0, 4.0, 1.0, 15.0, 20.0, 18.0, 21.0, 22.0, 26.0, 19.0, 29.0, 29.0, 33.0, 25.0, 48.0, 40.0, 42.0, 32.0, 37.0, 55.0, 41.0, 32.0, 44.0, 34.0, 35.0, 31.0, 31.0, 22.0, 24.0, 25.0, 26.0, 19.0, 19.0, 17.0, 16.0, 14.0, 8.0, 10.0, 6.0, 6.0, 9.0, 1.0, 2.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.19491195678711, -15.685200691223145, -15.17548942565918, -14.665778160095215, -14.15606689453125, -13.646355628967285, -13.13664436340332, -12.626934051513672, -12.11722183227539, -11.607510566711426, -11.097799301147461, -10.588088035583496, -10.078376770019531, -9.568665504455566, -9.058954238891602, -8.549243927001953, -8.039532661437988, -7.529821395874023, -7.020110130310059, -6.510398864746094, -6.000687599182129, -5.490976333618164, -4.981265544891357, -4.471554279327393, -3.9618430137634277, -3.452131748199463, -2.942420482635498, -2.4327094554901123, -1.9229981899261475, -1.4132869243621826, -0.9035758972167969, -0.39386463165283203, 0.11584663391113281, 0.6255578398704529, 1.135269045829773, 1.6449801921844482, 2.154691457748413, 2.664402723312378, 3.1741137504577637, 3.6838250160217285, 4.193536281585693, 4.703247547149658, 5.212958812713623, 5.72266960144043, 6.2323808670043945, 6.742092132568359, 7.251803398132324, 7.761514663696289, 8.271225929260254, 8.780937194824219, 9.290648460388184, 9.800359725952148, 10.310070991516113, 10.819782257080078, 11.329492568969727, 11.839204788208008, 12.348915100097656, 12.858626365661621, 13.368337631225586, 13.87804889678955, 14.387760162353516, 14.89747142791748, 15.407182693481445, 15.916893005371094, 16.426605224609375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 3.0, 4.0, 9.0, 6.0, 8.0, 7.0, 12.0, 13.0, 19.0, 22.0, 13.0, 18.0, 22.0, 36.0, 23.0, 34.0, 31.0, 46.0, 43.0, 46.0, 36.0, 53.0, 56.0, 44.0, 53.0, 34.0, 35.0, 33.0, 32.0, 22.0, 28.0, 30.0, 19.0, 23.0, 19.0, 11.0, 12.0, 14.0, 5.0, 3.0, 8.0, 3.0, 4.0, 0.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.03125, -1.9627685546875, -1.894287109375, -1.8258056640625, -1.75732421875, -1.6888427734375, -1.620361328125, -1.5518798828125, -1.4833984375, -1.4149169921875, -1.346435546875, -1.2779541015625, -1.20947265625, -1.1409912109375, -1.072509765625, -1.0040283203125, -0.935546875, -0.8670654296875, -0.798583984375, -0.7301025390625, -0.66162109375, -0.5931396484375, -0.524658203125, -0.4561767578125, -0.3876953125, -0.3192138671875, -0.250732421875, -0.1822509765625, -0.11376953125, -0.0452880859375, 0.023193359375, 0.0916748046875, 0.16015625, 0.2286376953125, 0.297119140625, 0.3656005859375, 0.43408203125, 0.5025634765625, 0.571044921875, 0.6395263671875, 0.7080078125, 0.7764892578125, 0.844970703125, 0.9134521484375, 0.98193359375, 1.0504150390625, 1.118896484375, 1.1873779296875, 1.255859375, 1.3243408203125, 1.392822265625, 1.4613037109375, 1.52978515625, 1.5982666015625, 1.666748046875, 1.7352294921875, 1.8037109375, 1.8721923828125, 1.940673828125, 2.0091552734375, 2.07763671875, 2.1461181640625, 2.214599609375, 2.2830810546875, 2.3515625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 6.0, 12.0, 7.0, 24.0, 26.0, 43.0, 52.0, 86.0, 121.0, 176.0, 272.0, 351.0, 531.0, 707.0, 920.0, 1200.0, 1723.0, 2340.0, 3199.0, 4396.0, 5937.0, 8251.0, 11825.0, 17268.0, 25045.0, 37923.0, 58458.0, 93772.0, 151606.0, 197186.0, 151366.0, 93065.0, 57825.0, 38042.0, 25449.0, 17096.0, 11863.0, 8216.0, 5936.0, 4360.0, 3289.0, 2283.0, 1784.0, 1266.0, 919.0, 684.0, 533.0, 340.0, 259.0, 163.0, 110.0, 93.0, 64.0, 34.0, 23.0, 20.0, 6.0, 6.0, 7.0, 4.0, 4.0], "bins": [-0.2230224609375, -0.21615982055664062, -0.20929718017578125, -0.20243453979492188, -0.1955718994140625, -0.18870925903320312, -0.18184661865234375, -0.17498397827148438, -0.168121337890625, -0.16125869750976562, -0.15439605712890625, -0.14753341674804688, -0.1406707763671875, -0.13380813598632812, -0.12694549560546875, -0.12008285522460938, -0.11322021484375, -0.10635757446289062, -0.09949493408203125, -0.09263229370117188, -0.0857696533203125, -0.07890701293945312, -0.07204437255859375, -0.06518173217773438, -0.058319091796875, -0.051456451416015625, -0.04459381103515625, -0.037731170654296875, -0.0308685302734375, -0.024005889892578125, -0.01714324951171875, -0.010280609130859375, -0.00341796875, 0.003444671630859375, 0.01030731201171875, 0.017169952392578125, 0.0240325927734375, 0.030895233154296875, 0.03775787353515625, 0.044620513916015625, 0.051483154296875, 0.058345794677734375, 0.06520843505859375, 0.07207107543945312, 0.0789337158203125, 0.08579635620117188, 0.09265899658203125, 0.09952163696289062, 0.10638427734375, 0.11324691772460938, 0.12010955810546875, 0.12697219848632812, 0.1338348388671875, 0.14069747924804688, 0.14756011962890625, 0.15442276000976562, 0.161285400390625, 0.16814804077148438, 0.17501068115234375, 0.18187332153320312, 0.1887359619140625, 0.19559860229492188, 0.20246124267578125, 0.20932388305664062, 0.2161865234375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 3.0, 6.0, 6.0, 4.0, 10.0, 8.0, 17.0, 13.0, 21.0, 22.0, 30.0, 22.0, 26.0, 39.0, 37.0, 29.0, 45.0, 43.0, 42.0, 37.0, 41.0, 1064.0, 33.0, 41.0, 33.0, 44.0, 40.0, 28.0, 26.0, 31.0, 27.0, 20.0, 17.0, 20.0, 12.0, 17.0, 13.0, 8.0, 9.0, 6.0, 9.0, 9.0, 7.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 4.0], "bins": [-1.4765625, -1.43438720703125, -1.3922119140625, -1.35003662109375, -1.307861328125, -1.26568603515625, -1.2235107421875, -1.18133544921875, -1.13916015625, -1.09698486328125, -1.0548095703125, -1.01263427734375, -0.970458984375, -0.92828369140625, -0.8861083984375, -0.84393310546875, -0.8017578125, -0.75958251953125, -0.7174072265625, -0.67523193359375, -0.633056640625, -0.59088134765625, -0.5487060546875, -0.50653076171875, -0.46435546875, -0.42218017578125, -0.3800048828125, -0.33782958984375, -0.295654296875, -0.25347900390625, -0.2113037109375, -0.16912841796875, -0.126953125, -0.08477783203125, -0.0426025390625, -0.00042724609375, 0.041748046875, 0.08392333984375, 0.1260986328125, 0.16827392578125, 0.21044921875, 0.25262451171875, 0.2947998046875, 0.33697509765625, 0.379150390625, 0.42132568359375, 0.4635009765625, 0.50567626953125, 0.5478515625, 0.59002685546875, 0.6322021484375, 0.67437744140625, 0.716552734375, 0.75872802734375, 0.8009033203125, 0.84307861328125, 0.88525390625, 0.92742919921875, 0.9696044921875, 1.01177978515625, 1.053955078125, 1.09613037109375, 1.1383056640625, 1.18048095703125, 1.22265625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 1.0, 8.0, 8.0, 15.0, 24.0, 27.0, 43.0, 61.0, 81.0, 113.0, 177.0, 225.0, 364.0, 430.0, 617.0, 915.0, 1299.0, 1775.0, 2525.0, 3736.0, 5452.0, 7891.0, 11719.0, 17535.0, 26914.0, 42264.0, 66631.0, 108256.0, 168829.0, 1244070.0, 140097.0, 86953.0, 54551.0, 34594.0, 22237.0, 14992.0, 9844.0, 6634.0, 4579.0, 3250.0, 2206.0, 1569.0, 1063.0, 750.0, 544.0, 376.0, 266.0, 207.0, 135.0, 92.0, 70.0, 43.0, 24.0, 26.0, 13.0, 12.0, 8.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1856689453125, -0.1799163818359375, -0.174163818359375, -0.1684112548828125, -0.16265869140625, -0.1569061279296875, -0.151153564453125, -0.1454010009765625, -0.1396484375, -0.1338958740234375, -0.128143310546875, -0.1223907470703125, -0.11663818359375, -0.1108856201171875, -0.105133056640625, -0.0993804931640625, -0.0936279296875, -0.0878753662109375, -0.082122802734375, -0.0763702392578125, -0.07061767578125, -0.0648651123046875, -0.059112548828125, -0.0533599853515625, -0.047607421875, -0.0418548583984375, -0.036102294921875, -0.0303497314453125, -0.02459716796875, -0.0188446044921875, -0.013092041015625, -0.0073394775390625, -0.0015869140625, 0.0041656494140625, 0.009918212890625, 0.0156707763671875, 0.02142333984375, 0.0271759033203125, 0.032928466796875, 0.0386810302734375, 0.04443359375, 0.0501861572265625, 0.055938720703125, 0.0616912841796875, 0.06744384765625, 0.0731964111328125, 0.078948974609375, 0.0847015380859375, 0.0904541015625, 0.0962066650390625, 0.101959228515625, 0.1077117919921875, 0.11346435546875, 0.1192169189453125, 0.124969482421875, 0.1307220458984375, 0.136474609375, 0.1422271728515625, 0.147979736328125, 0.1537322998046875, 0.15948486328125, 0.1652374267578125, 0.170989990234375, 0.1767425537109375, 0.1824951171875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 2.0, 6.0, 5.0, 4.0, 11.0, 18.0, 13.0, 15.0, 28.0, 23.0, 30.0, 48.0, 65.0, 87.0, 104.0, 109.0, 85.0, 68.0, 65.0, 47.0, 36.0, 25.0, 20.0, 19.0, 21.0, 15.0, 9.0, 6.0, 3.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010929107666015625, -0.0010569244623184204, -0.0010209381580352783, -0.0009849518537521362, -0.0009489655494689941, -0.000912979245185852, -0.00087699294090271, -0.0008410066366195679, -0.0008050203323364258, -0.0007690340280532837, -0.0007330477237701416, -0.0006970614194869995, -0.0006610751152038574, -0.0006250888109207153, -0.0005891025066375732, -0.0005531162023544312, -0.0005171298980712891, -0.00048114359378814697, -0.0004451572895050049, -0.0004091709852218628, -0.0003731846809387207, -0.0003371983766555786, -0.0003012120723724365, -0.00026522576808929443, -0.00022923946380615234, -0.00019325315952301025, -0.00015726685523986816, -0.00012128055095672607, -8.529424667358398e-05, -4.9307942390441895e-05, -1.3321638107299805e-05, 2.2664666175842285e-05, 5.8650970458984375e-05, 9.463727474212646e-05, 0.00013062357902526855, 0.00016660988330841064, 0.00020259618759155273, 0.00023858249187469482, 0.0002745687961578369, 0.000310555100440979, 0.0003465414047241211, 0.0003825277090072632, 0.0004185140132904053, 0.00045450031757354736, 0.0004904866218566895, 0.0005264729261398315, 0.0005624592304229736, 0.0005984455347061157, 0.0006344318389892578, 0.0006704181432723999, 0.000706404447555542, 0.0007423907518386841, 0.0007783770561218262, 0.0008143633604049683, 0.0008503496646881104, 0.0008863359689712524, 0.0009223222732543945, 0.0009583085775375366, 0.0009942948818206787, 0.0010302811861038208, 0.0010662674903869629, 0.001102253794670105, 0.001138240098953247, 0.0011742264032363892, 0.0012102127075195312]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 9.0, 6.0, 5.0, 15.0, 13.0, 27.0, 31.0, 40.0, 53.0, 91.0, 178.0, 281.0, 709.0, 15805.0, 1026283.0, 3773.0, 587.0, 245.0, 141.0, 61.0, 50.0, 40.0, 33.0, 17.0, 16.0, 12.0, 10.0, 5.0, 3.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0250701904296875, -0.024319171905517578, -0.023568153381347656, -0.022817134857177734, -0.022066116333007812, -0.02131509780883789, -0.02056407928466797, -0.019813060760498047, -0.019062042236328125, -0.018311023712158203, -0.01756000518798828, -0.01680898666381836, -0.016057968139648438, -0.015306949615478516, -0.014555931091308594, -0.013804912567138672, -0.01305389404296875, -0.012302875518798828, -0.011551856994628906, -0.010800838470458984, -0.010049819946289062, -0.00929880142211914, -0.008547782897949219, -0.007796764373779297, -0.007045745849609375, -0.006294727325439453, -0.005543708801269531, -0.004792690277099609, -0.0040416717529296875, -0.0032906532287597656, -0.0025396347045898438, -0.0017886161804199219, -0.00103759765625, -0.0002865791320800781, 0.00046443939208984375, 0.0012154579162597656, 0.0019664764404296875, 0.0027174949645996094, 0.0034685134887695312, 0.004219532012939453, 0.004970550537109375, 0.005721569061279297, 0.006472587585449219, 0.007223606109619141, 0.007974624633789062, 0.008725643157958984, 0.009476661682128906, 0.010227680206298828, 0.01097869873046875, 0.011729717254638672, 0.012480735778808594, 0.013231754302978516, 0.013982772827148438, 0.01473379135131836, 0.015484809875488281, 0.016235828399658203, 0.016986846923828125, 0.017737865447998047, 0.01848888397216797, 0.01923990249633789, 0.019990921020507812, 0.020741939544677734, 0.021492958068847656, 0.022243976593017578, 0.0229949951171875]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 14.0, 130.0, 458.0, 361.0, 51.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009727643919177353, -0.0008826218545436859, -0.0007924793171696365, -0.0007023367797955871, -0.0006121943006291986, -0.0005220517050474882, -0.0004319092258810997, -0.0003417666885070503, -0.00025162415113300085, -0.00016148161375895143, -7.133909093681723e-05, 1.8803431885316968e-05, 0.00010894596925936639, 0.00019908850663341582, 0.0002892310149036348, 0.0003793735522776842, 0.00046951608965173364, 0.0005596586270257831, 0.0006498011643998325, 0.0007399437017738819, 0.0008300861809402704, 0.0009202287765219808, 0.0010103712556883693, 0.0011005138512700796, 0.0011906563304364681, 0.0012807988096028566, 0.001370941405184567, 0.0014610838843509555, 0.0015512264799326658, 0.0016413689590990543, 0.0017315114382654428, 0.0018216540338471532, 0.0019117963965982199, 0.0020019388757646084, 0.002092081354930997, 0.002182224066928029, 0.0022723665460944176, 0.002362509025260806, 0.0024526515044271946, 0.0025427942164242268, 0.0026329366955906153, 0.002723079174757004, 0.0028132216539233923, 0.0029033643659204245, 0.002993506845086813, 0.0030836493242532015, 0.00317379180341959, 0.003263934515416622, 0.003354076761752367, 0.0034442192409187555, 0.003534361720085144, 0.003624504432082176, 0.0037146469112485647, 0.0038047893904149532, 0.0038949318695813417, 0.00398507434874773, 0.004075217060744762, 0.004165359772741795, 0.0042555020190775394, 0.004345644731074572, 0.0044357869774103165, 0.004525929689407349, 0.004616072401404381, 0.004706214647740126, 0.004796357359737158]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 4.0, 3.0, 10.0, 9.0, 3.0, 18.0, 18.0, 18.0, 20.0, 27.0, 32.0, 39.0, 41.0, 45.0, 27.0, 49.0, 59.0, 49.0, 52.0, 59.0, 60.0, 52.0, 41.0, 53.0, 33.0, 30.0, 36.0, 22.0, 20.0, 18.0, 21.0, 17.0, 10.0, 3.0, 2.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0006871223449707031, -0.0006687510758638382, -0.0006503798067569733, -0.0006320085376501083, -0.0006136372685432434, -0.0005952659994363785, -0.0005768947303295135, -0.0005585234612226486, -0.0005401521921157837, -0.0005217809230089188, -0.0005034096539020538, -0.0004850383847951889, -0.000466667115688324, -0.00044829584658145905, -0.0004299245774745941, -0.0004115533083677292, -0.00039318203926086426, -0.00037481077015399933, -0.0003564395010471344, -0.00033806823194026947, -0.00031969696283340454, -0.0003013256937265396, -0.0002829544246196747, -0.00026458315551280975, -0.0002462118864059448, -0.0002278406172990799, -0.00020946934819221497, -0.00019109807908535004, -0.0001727268099784851, -0.00015435554087162018, -0.00013598427176475525, -0.00011761300265789032, -9.924173355102539e-05, -8.087046444416046e-05, -6.249919533729553e-05, -4.41279262304306e-05, -2.5756657123565674e-05, -7.385388016700745e-06, 1.0985881090164185e-05, 2.9357150197029114e-05, 4.772841930389404e-05, 6.609968841075897e-05, 8.44709575176239e-05, 0.00010284222662448883, 0.00012121349573135376, 0.0001395847648382187, 0.00015795603394508362, 0.00017632730305194855, 0.00019469857215881348, 0.0002130698412656784, 0.00023144111037254333, 0.00024981237947940826, 0.0002681836485862732, 0.0002865549176931381, 0.00030492618680000305, 0.000323297455906868, 0.0003416687250137329, 0.00036003999412059784, 0.00037841126322746277, 0.0003967825323343277, 0.0004151538014411926, 0.00043352507054805756, 0.0004518963396549225, 0.0004702676087617874, 0.0004886388778686523]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 3.0, 4.0, 9.0, 6.0, 8.0, 7.0, 12.0, 13.0, 19.0, 22.0, 13.0, 18.0, 22.0, 36.0, 23.0, 34.0, 31.0, 46.0, 45.0, 44.0, 36.0, 54.0, 55.0, 44.0, 53.0, 34.0, 35.0, 33.0, 32.0, 23.0, 28.0, 30.0, 18.0, 24.0, 18.0, 11.0, 12.0, 14.0, 5.0, 3.0, 8.0, 3.0, 4.0, 0.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.03125, -1.962738037109375, -1.89422607421875, -1.825714111328125, -1.7572021484375, -1.688690185546875, -1.62017822265625, -1.551666259765625, -1.483154296875, -1.414642333984375, -1.34613037109375, -1.277618408203125, -1.2091064453125, -1.140594482421875, -1.07208251953125, -1.003570556640625, -0.93505859375, -0.866546630859375, -0.79803466796875, -0.729522705078125, -0.6610107421875, -0.592498779296875, -0.52398681640625, -0.455474853515625, -0.386962890625, -0.318450927734375, -0.24993896484375, -0.181427001953125, -0.1129150390625, -0.044403076171875, 0.02410888671875, 0.092620849609375, 0.1611328125, 0.229644775390625, 0.29815673828125, 0.366668701171875, 0.4351806640625, 0.503692626953125, 0.57220458984375, 0.640716552734375, 0.709228515625, 0.777740478515625, 0.84625244140625, 0.914764404296875, 0.9832763671875, 1.051788330078125, 1.12030029296875, 1.188812255859375, 1.25732421875, 1.325836181640625, 1.39434814453125, 1.462860107421875, 1.5313720703125, 1.599884033203125, 1.66839599609375, 1.736907958984375, 1.805419921875, 1.873931884765625, 1.94244384765625, 2.010955810546875, 2.0794677734375, 2.147979736328125, 2.21649169921875, 2.285003662109375, 2.353515625]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 6.0, 22.0, 22.0, 42.0, 60.0, 98.0, 136.0, 241.0, 507.0, 953.0, 2226.0, 5386.0, 12818.0, 29801.0, 69575.0, 166032.0, 315143.0, 250713.0, 112400.0, 46729.0, 20403.0, 8569.0, 3505.0, 1589.0, 717.0, 349.0, 196.0, 127.0, 76.0, 42.0, 29.0, 15.0, 11.0, 9.0, 7.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.607421875, -2.53021240234375, -2.4530029296875, -2.37579345703125, -2.298583984375, -2.22137451171875, -2.1441650390625, -2.06695556640625, -1.98974609375, -1.91253662109375, -1.8353271484375, -1.75811767578125, -1.680908203125, -1.60369873046875, -1.5264892578125, -1.44927978515625, -1.3720703125, -1.29486083984375, -1.2176513671875, -1.14044189453125, -1.063232421875, -0.98602294921875, -0.9088134765625, -0.83160400390625, -0.75439453125, -0.67718505859375, -0.5999755859375, -0.52276611328125, -0.445556640625, -0.36834716796875, -0.2911376953125, -0.21392822265625, -0.13671875, -0.05950927734375, 0.0177001953125, 0.09490966796875, 0.172119140625, 0.24932861328125, 0.3265380859375, 0.40374755859375, 0.48095703125, 0.55816650390625, 0.6353759765625, 0.71258544921875, 0.789794921875, 0.86700439453125, 0.9442138671875, 1.02142333984375, 1.0986328125, 1.17584228515625, 1.2530517578125, 1.33026123046875, 1.407470703125, 1.48468017578125, 1.5618896484375, 1.63909912109375, 1.71630859375, 1.79351806640625, 1.8707275390625, 1.94793701171875, 2.025146484375, 2.10235595703125, 2.1795654296875, 2.25677490234375, 2.333984375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 9.0, 14.0, 17.0, 10.0, 21.0, 18.0, 34.0, 33.0, 31.0, 39.0, 59.0, 52.0, 79.0, 153.0, 392.0, 1466.0, 184.0, 93.0, 50.0, 51.0, 39.0, 46.0, 37.0, 27.0, 24.0, 16.0, 12.0, 8.0, 13.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-14.0546875, -13.71246337890625, -13.3702392578125, -13.02801513671875, -12.685791015625, -12.34356689453125, -12.0013427734375, -11.65911865234375, -11.31689453125, -10.97467041015625, -10.6324462890625, -10.29022216796875, -9.947998046875, -9.60577392578125, -9.2635498046875, -8.92132568359375, -8.5791015625, -8.23687744140625, -7.8946533203125, -7.55242919921875, -7.210205078125, -6.86798095703125, -6.5257568359375, -6.18353271484375, -5.84130859375, -5.49908447265625, -5.1568603515625, -4.81463623046875, -4.472412109375, -4.13018798828125, -3.7879638671875, -3.44573974609375, -3.103515625, -2.76129150390625, -2.4190673828125, -2.07684326171875, -1.734619140625, -1.39239501953125, -1.0501708984375, -0.70794677734375, -0.36572265625, -0.02349853515625, 0.3187255859375, 0.66094970703125, 1.003173828125, 1.34539794921875, 1.6876220703125, 2.02984619140625, 2.3720703125, 2.71429443359375, 3.0565185546875, 3.39874267578125, 3.740966796875, 4.08319091796875, 4.4254150390625, 4.76763916015625, 5.10986328125, 5.45208740234375, 5.7943115234375, 6.13653564453125, 6.478759765625, 6.82098388671875, 7.1632080078125, 7.50543212890625, 7.84765625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 6.0, 2.0, 3.0, 4.0, 7.0, 13.0, 6.0, 7.0, 13.0, 16.0, 19.0, 34.0, 41.0, 60.0, 80.0, 103.0, 165.0, 219.0, 427.0, 950.0, 17031.0, 3086127.0, 37811.0, 1225.0, 452.0, 257.0, 168.0, 106.0, 93.0, 58.0, 51.0, 27.0, 27.0, 26.0, 24.0, 19.0, 12.0, 7.0, 7.0, 5.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.484375, -17.665283203125, -16.84619140625, -16.027099609375, -15.2080078125, -14.388916015625, -13.56982421875, -12.750732421875, -11.931640625, -11.112548828125, -10.29345703125, -9.474365234375, -8.6552734375, -7.836181640625, -7.01708984375, -6.197998046875, -5.37890625, -4.559814453125, -3.74072265625, -2.921630859375, -2.1025390625, -1.283447265625, -0.46435546875, 0.354736328125, 1.173828125, 1.992919921875, 2.81201171875, 3.631103515625, 4.4501953125, 5.269287109375, 6.08837890625, 6.907470703125, 7.7265625, 8.545654296875, 9.36474609375, 10.183837890625, 11.0029296875, 11.822021484375, 12.64111328125, 13.460205078125, 14.279296875, 15.098388671875, 15.91748046875, 16.736572265625, 17.5556640625, 18.374755859375, 19.19384765625, 20.012939453125, 20.83203125, 21.651123046875, 22.47021484375, 23.289306640625, 24.1083984375, 24.927490234375, 25.74658203125, 26.565673828125, 27.384765625, 28.203857421875, 29.02294921875, 29.842041015625, 30.6611328125, 31.480224609375, 32.29931640625, 33.118408203125, 33.9375]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 25.0, 43.0, 127.0, 242.0, 283.0, 157.0, 92.0, 29.0, 9.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.05703353881836, -29.151933670043945, -28.246835708618164, -27.34173583984375, -26.436635971069336, -25.531536102294922, -24.62643814086914, -23.721338272094727, -22.816238403320312, -21.9111385345459, -21.006040573120117, -20.100940704345703, -19.19584083557129, -18.290740966796875, -17.385643005371094, -16.48054313659668, -15.575444221496582, -14.670345306396484, -13.76524543762207, -12.860146522521973, -11.955046653747559, -11.049947738647461, -10.144847869873047, -9.23974895477295, -8.334650039672852, -7.429550647735596, -6.52445125579834, -5.619352340698242, -4.714252471923828, -3.8091535568237305, -2.9040541648864746, -1.9989547729492188, -1.0938549041748047, -0.1887555718421936, 0.7163437604904175, 1.6214430332183838, 2.5265424251556396, 3.4316415786743164, 4.336740970611572, 5.241840362548828, 6.146939754486084, 7.05203914642334, 7.957138538360596, 8.862237930297852, 9.76733684539795, 10.672435760498047, 11.577535629272461, 12.482635498046875, 13.387734413146973, 14.29283332824707, 15.197933197021484, 16.1030330657959, 17.00813102722168, 17.913230895996094, 18.818330764770508, 19.723430633544922, 20.628528594970703, 21.533628463745117, 22.4387264251709, 23.343826293945312, 24.248926162719727, 25.15402603149414, 26.059123992919922, 26.964223861694336, 27.86932373046875]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 6.0, 15.0, 9.0, 9.0, 15.0, 10.0, 15.0, 14.0, 21.0, 18.0, 27.0, 28.0, 19.0, 38.0, 37.0, 34.0, 31.0, 44.0, 41.0, 45.0, 47.0, 46.0, 52.0, 38.0, 29.0, 36.0, 32.0, 27.0, 23.0, 28.0, 30.0, 26.0, 28.0, 15.0, 12.0, 15.0, 7.0, 9.0, 7.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-20.2705135345459, -19.670528411865234, -19.070541381835938, -18.47055435180664, -17.870569229125977, -17.270584106445312, -16.670597076416016, -16.07061004638672, -15.470624923706055, -14.870638847351074, -14.270652770996094, -13.670666694641113, -13.070680618286133, -12.470694541931152, -11.870708465576172, -11.270722389221191, -10.670736312866211, -10.07075023651123, -9.47076416015625, -8.87077808380127, -8.270792007446289, -7.670805931091309, -7.070819854736328, -6.470833778381348, -5.870847702026367, -5.270861625671387, -4.670875549316406, -4.070889472961426, -3.4709033966064453, -2.870917320251465, -2.2709312438964844, -1.670945167541504, -1.0709609985351562, -0.4709749221801758, 0.1290111541748047, 0.7289972305297852, 1.3289833068847656, 1.928969383239746, 2.5289554595947266, 3.128941535949707, 3.7289276123046875, 4.328913688659668, 4.928899765014648, 5.528885841369629, 6.128871917724609, 6.72885799407959, 7.32884407043457, 7.928830146789551, 8.528816223144531, 9.128802299499512, 9.728788375854492, 10.328774452209473, 10.928760528564453, 11.528746604919434, 12.128732681274414, 12.728718757629395, 13.328704833984375, 13.928690910339355, 14.528676986694336, 15.128663063049316, 15.728649139404297, 16.328636169433594, 16.928621292114258, 17.528606414794922, 18.12859344482422]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 3.0, 6.0, 6.0, 3.0, 5.0, 4.0, 12.0, 13.0, 10.0, 21.0, 16.0, 17.0, 25.0, 41.0, 25.0, 19.0, 22.0, 30.0, 33.0, 36.0, 51.0, 35.0, 49.0, 51.0, 40.0, 41.0, 37.0, 39.0, 33.0, 38.0, 21.0, 25.0, 21.0, 26.0, 18.0, 23.0, 22.0, 12.0, 11.0, 11.0, 11.0, 6.0, 6.0, 4.0, 5.0, 3.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.349609375, -2.2789306640625, -2.208251953125, -2.1375732421875, -2.06689453125, -1.9962158203125, -1.925537109375, -1.8548583984375, -1.7841796875, -1.7135009765625, -1.642822265625, -1.5721435546875, -1.50146484375, -1.4307861328125, -1.360107421875, -1.2894287109375, -1.21875, -1.1480712890625, -1.077392578125, -1.0067138671875, -0.93603515625, -0.8653564453125, -0.794677734375, -0.7239990234375, -0.6533203125, -0.5826416015625, -0.511962890625, -0.4412841796875, -0.37060546875, -0.2999267578125, -0.229248046875, -0.1585693359375, -0.087890625, -0.0172119140625, 0.053466796875, 0.1241455078125, 0.19482421875, 0.2655029296875, 0.336181640625, 0.4068603515625, 0.4775390625, 0.5482177734375, 0.618896484375, 0.6895751953125, 0.76025390625, 0.8309326171875, 0.901611328125, 0.9722900390625, 1.04296875, 1.1136474609375, 1.184326171875, 1.2550048828125, 1.32568359375, 1.3963623046875, 1.467041015625, 1.5377197265625, 1.6083984375, 1.6790771484375, 1.749755859375, 1.8204345703125, 1.89111328125, 1.9617919921875, 2.032470703125, 2.1031494140625, 2.173828125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 6.0, 4.0, 4.0, 4.0, 9.0, 9.0, 11.0, 10.0, 17.0, 16.0, 24.0, 24.0, 27.0, 28.0, 30.0, 44.0, 74.0, 146.0, 309.0, 830.0, 4011.0, 59946.0, 1382138.0, 2531140.0, 203804.0, 9246.0, 1366.0, 409.0, 198.0, 92.0, 51.0, 32.0, 34.0, 17.0, 28.0, 26.0, 18.0, 15.0, 11.0, 13.0, 7.0, 6.0, 11.0, 8.0, 7.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0], "bins": [-7.53515625, -7.30804443359375, -7.0809326171875, -6.85382080078125, -6.626708984375, -6.39959716796875, -6.1724853515625, -5.94537353515625, -5.71826171875, -5.49114990234375, -5.2640380859375, -5.03692626953125, -4.809814453125, -4.58270263671875, -4.3555908203125, -4.12847900390625, -3.9013671875, -3.67425537109375, -3.4471435546875, -3.22003173828125, -2.992919921875, -2.76580810546875, -2.5386962890625, -2.31158447265625, -2.08447265625, -1.85736083984375, -1.6302490234375, -1.40313720703125, -1.176025390625, -0.94891357421875, -0.7218017578125, -0.49468994140625, -0.267578125, -0.04046630859375, 0.1866455078125, 0.41375732421875, 0.640869140625, 0.86798095703125, 1.0950927734375, 1.32220458984375, 1.54931640625, 1.77642822265625, 2.0035400390625, 2.23065185546875, 2.457763671875, 2.68487548828125, 2.9119873046875, 3.13909912109375, 3.3662109375, 3.59332275390625, 3.8204345703125, 4.04754638671875, 4.274658203125, 4.50177001953125, 4.7288818359375, 4.95599365234375, 5.18310546875, 5.41021728515625, 5.6373291015625, 5.86444091796875, 6.091552734375, 6.31866455078125, 6.5457763671875, 6.77288818359375, 7.0]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 15.0, 5.0, 11.0, 16.0, 30.0, 35.0, 40.0, 42.0, 66.0, 91.0, 100.0, 154.0, 170.0, 224.0, 254.0, 317.0, 305.0, 411.0, 329.0, 310.0, 259.0, 197.0, 158.0, 118.0, 88.0, 75.0, 47.0, 55.0, 29.0, 26.0, 21.0, 18.0, 13.0, 14.0, 9.0, 10.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.65234375, -4.516357421875, -4.38037109375, -4.244384765625, -4.1083984375, -3.972412109375, -3.83642578125, -3.700439453125, -3.564453125, -3.428466796875, -3.29248046875, -3.156494140625, -3.0205078125, -2.884521484375, -2.74853515625, -2.612548828125, -2.4765625, -2.340576171875, -2.20458984375, -2.068603515625, -1.9326171875, -1.796630859375, -1.66064453125, -1.524658203125, -1.388671875, -1.252685546875, -1.11669921875, -0.980712890625, -0.8447265625, -0.708740234375, -0.57275390625, -0.436767578125, -0.30078125, -0.164794921875, -0.02880859375, 0.107177734375, 0.2431640625, 0.379150390625, 0.51513671875, 0.651123046875, 0.787109375, 0.923095703125, 1.05908203125, 1.195068359375, 1.3310546875, 1.467041015625, 1.60302734375, 1.739013671875, 1.875, 2.010986328125, 2.14697265625, 2.282958984375, 2.4189453125, 2.554931640625, 2.69091796875, 2.826904296875, 2.962890625, 3.098876953125, 3.23486328125, 3.370849609375, 3.5068359375, 3.642822265625, 3.77880859375, 3.914794921875, 4.05078125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 5.0, 11.0, 15.0, 16.0, 17.0, 24.0, 29.0, 39.0, 55.0, 59.0, 91.0, 98.0, 120.0, 145.0, 246.0, 305.0, 732.0, 3084.0, 36187.0, 758349.0, 3046357.0, 328036.0, 16664.0, 1878.0, 580.0, 287.0, 201.0, 164.0, 118.0, 96.0, 60.0, 53.0, 43.0, 29.0, 29.0, 15.0, 19.0, 6.0, 5.0, 9.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0, -8.6934814453125, -8.386962890625, -8.0804443359375, -7.77392578125, -7.4674072265625, -7.160888671875, -6.8543701171875, -6.5478515625, -6.2413330078125, -5.934814453125, -5.6282958984375, -5.32177734375, -5.0152587890625, -4.708740234375, -4.4022216796875, -4.095703125, -3.7891845703125, -3.482666015625, -3.1761474609375, -2.86962890625, -2.5631103515625, -2.256591796875, -1.9500732421875, -1.6435546875, -1.3370361328125, -1.030517578125, -0.7239990234375, -0.41748046875, -0.1109619140625, 0.195556640625, 0.5020751953125, 0.80859375, 1.1151123046875, 1.421630859375, 1.7281494140625, 2.03466796875, 2.3411865234375, 2.647705078125, 2.9542236328125, 3.2607421875, 3.5672607421875, 3.873779296875, 4.1802978515625, 4.48681640625, 4.7933349609375, 5.099853515625, 5.4063720703125, 5.712890625, 6.0194091796875, 6.325927734375, 6.6324462890625, 6.93896484375, 7.2454833984375, 7.552001953125, 7.8585205078125, 8.1650390625, 8.4715576171875, 8.778076171875, 9.0845947265625, 9.39111328125, 9.6976318359375, 10.004150390625, 10.3106689453125, 10.6171875]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 9.0, 10.0, 36.0, 49.0, 51.0, 86.0, 104.0, 119.0, 141.0, 119.0, 108.0, 82.0, 40.0, 28.0, 18.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.795066833496094, -28.9697265625, -28.144386291503906, -27.319046020507812, -26.49370574951172, -25.668365478515625, -24.8430233001709, -24.017683029174805, -23.19234275817871, -22.367002487182617, -21.541662216186523, -20.71632194519043, -19.890979766845703, -19.06563949584961, -18.240299224853516, -17.414958953857422, -16.589618682861328, -15.764278411865234, -14.93893814086914, -14.11359691619873, -13.288256645202637, -12.462916374206543, -11.637575149536133, -10.812234878540039, -9.986894607543945, -9.161554336547852, -8.336214065551758, -7.510872840881348, -6.685532569885254, -5.86019229888916, -5.034851551055908, -4.209510803222656, -3.3841705322265625, -2.5588300228118896, -1.7334895133972168, -0.908149003982544, -0.0828084945678711, 0.7425317764282227, 1.5678725242614746, 2.3932132720947266, 3.2185535430908203, 4.043893814086914, 4.869234561920166, 5.694575309753418, 6.519915580749512, 7.3452558517456055, 8.170597076416016, 8.99593734741211, 9.821277618408203, 10.646617889404297, 11.47195816040039, 12.2972993850708, 13.122639656066895, 13.947979927062988, 14.773321151733398, 15.598661422729492, 16.424001693725586, 17.24934196472168, 18.074682235717773, 18.900022506713867, 19.725364685058594, 20.550704956054688, 21.37604522705078, 22.201385498046875, 23.02672576904297]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 13.0, 20.0, 19.0, 19.0, 16.0, 32.0, 23.0, 29.0, 47.0, 35.0, 34.0, 37.0, 47.0, 50.0, 38.0, 50.0, 43.0, 49.0, 47.0, 29.0, 48.0, 34.0, 38.0, 32.0, 24.0, 26.0, 31.0, 10.0, 14.0, 11.0, 12.0, 9.0, 8.0, 1.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.86268424987793, -18.28342628479004, -17.70416831970215, -17.124910354614258, -16.545652389526367, -15.966394424438477, -15.387136459350586, -14.807878494262695, -14.228620529174805, -13.649362564086914, -13.070104598999023, -12.490846633911133, -11.911588668823242, -11.332330703735352, -10.753072738647461, -10.17381477355957, -9.594555854797363, -9.015297889709473, -8.436039924621582, -7.856781959533691, -7.277523994445801, -6.69826602935791, -6.119007587432861, -5.539749622344971, -4.96049165725708, -4.3812336921691895, -3.801975727081299, -3.222717523574829, -2.6434595584869385, -2.064201593399048, -1.4849433898925781, -0.9056854248046875, -0.3264274597167969, 0.2528305649757385, 0.8320885896682739, 1.411346673965454, 1.9906046390533447, 2.5698626041412354, 3.149120807647705, 3.7283787727355957, 4.307636737823486, 4.886894702911377, 5.466152667999268, 6.045411109924316, 6.624669075012207, 7.203927040100098, 7.783185005187988, 8.362442970275879, 8.94170093536377, 9.52095890045166, 10.10021686553955, 10.679474830627441, 11.258732795715332, 11.837990760803223, 12.41724967956543, 12.99650764465332, 13.575765609741211, 14.155023574829102, 14.734281539916992, 15.313539505004883, 15.892797470092773, 16.472055435180664, 17.051313400268555, 17.630571365356445, 18.209829330444336]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 11.0, 4.0, 1.0, 5.0, 6.0, 5.0, 12.0, 13.0, 13.0, 12.0, 18.0, 20.0, 23.0, 24.0, 24.0, 16.0, 26.0, 23.0, 25.0, 41.0, 37.0, 51.0, 43.0, 50.0, 36.0, 26.0, 39.0, 32.0, 25.0, 26.0, 36.0, 30.0, 31.0, 21.0, 20.0, 21.0, 19.0, 18.0, 17.0, 17.0, 12.0, 18.0, 10.0, 15.0, 4.0, 6.0, 4.0, 5.0, 2.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0], "bins": [-2.005859375, -1.94427490234375, -1.8826904296875, -1.82110595703125, -1.759521484375, -1.69793701171875, -1.6363525390625, -1.57476806640625, -1.51318359375, -1.45159912109375, -1.3900146484375, -1.32843017578125, -1.266845703125, -1.20526123046875, -1.1436767578125, -1.08209228515625, -1.0205078125, -0.95892333984375, -0.8973388671875, -0.83575439453125, -0.774169921875, -0.71258544921875, -0.6510009765625, -0.58941650390625, -0.52783203125, -0.46624755859375, -0.4046630859375, -0.34307861328125, -0.281494140625, -0.21990966796875, -0.1583251953125, -0.09674072265625, -0.03515625, 0.02642822265625, 0.0880126953125, 0.14959716796875, 0.211181640625, 0.27276611328125, 0.3343505859375, 0.39593505859375, 0.45751953125, 0.51910400390625, 0.5806884765625, 0.64227294921875, 0.703857421875, 0.76544189453125, 0.8270263671875, 0.88861083984375, 0.9501953125, 1.01177978515625, 1.0733642578125, 1.13494873046875, 1.196533203125, 1.25811767578125, 1.3197021484375, 1.38128662109375, 1.44287109375, 1.50445556640625, 1.5660400390625, 1.62762451171875, 1.689208984375, 1.75079345703125, 1.8123779296875, 1.87396240234375, 1.935546875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 9.0, 8.0, 19.0, 28.0, 38.0, 58.0, 111.0, 156.0, 209.0, 338.0, 448.0, 660.0, 1018.0, 1431.0, 1991.0, 2743.0, 4053.0, 5821.0, 8684.0, 12682.0, 19424.0, 30736.0, 50101.0, 86332.0, 159693.0, 241872.0, 173924.0, 94783.0, 54303.0, 33035.0, 20898.0, 13584.0, 9150.0, 6216.0, 4207.0, 2997.0, 2099.0, 1460.0, 1003.0, 717.0, 487.0, 336.0, 228.0, 159.0, 100.0, 74.0, 49.0, 34.0, 19.0, 9.0, 10.0, 6.0, 5.0, 0.0, 4.0, 0.0, 1.0], "bins": [-0.290283203125, -0.2813720703125, -0.2724609375, -0.2635498046875, -0.254638671875, -0.2457275390625, -0.23681640625, -0.2279052734375, -0.218994140625, -0.2100830078125, -0.201171875, -0.1922607421875, -0.183349609375, -0.1744384765625, -0.16552734375, -0.1566162109375, -0.147705078125, -0.1387939453125, -0.1298828125, -0.1209716796875, -0.112060546875, -0.1031494140625, -0.09423828125, -0.0853271484375, -0.076416015625, -0.0675048828125, -0.05859375, -0.0496826171875, -0.040771484375, -0.0318603515625, -0.02294921875, -0.0140380859375, -0.005126953125, 0.0037841796875, 0.0126953125, 0.0216064453125, 0.030517578125, 0.0394287109375, 0.04833984375, 0.0572509765625, 0.066162109375, 0.0750732421875, 0.083984375, 0.0928955078125, 0.101806640625, 0.1107177734375, 0.11962890625, 0.1285400390625, 0.137451171875, 0.1463623046875, 0.1552734375, 0.1641845703125, 0.173095703125, 0.1820068359375, 0.19091796875, 0.1998291015625, 0.208740234375, 0.2176513671875, 0.2265625, 0.2354736328125, 0.244384765625, 0.2532958984375, 0.26220703125, 0.2711181640625, 0.280029296875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 7.0, 13.0, 10.0, 14.0, 11.0, 30.0, 19.0, 39.0, 30.0, 36.0, 32.0, 39.0, 33.0, 38.0, 55.0, 60.0, 1078.0, 37.0, 51.0, 50.0, 45.0, 38.0, 34.0, 36.0, 37.0, 22.0, 23.0, 22.0, 23.0, 6.0, 12.0, 7.0, 9.0, 10.0, 2.0, 2.0, 0.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.634765625, -1.5842742919921875, -1.533782958984375, -1.4832916259765625, -1.43280029296875, -1.3823089599609375, -1.331817626953125, -1.2813262939453125, -1.2308349609375, -1.1803436279296875, -1.129852294921875, -1.0793609619140625, -1.02886962890625, -0.9783782958984375, -0.927886962890625, -0.8773956298828125, -0.826904296875, -0.7764129638671875, -0.725921630859375, -0.6754302978515625, -0.62493896484375, -0.5744476318359375, -0.523956298828125, -0.4734649658203125, -0.4229736328125, -0.3724822998046875, -0.321990966796875, -0.2714996337890625, -0.22100830078125, -0.1705169677734375, -0.120025634765625, -0.0695343017578125, -0.01904296875, 0.0314483642578125, 0.081939697265625, 0.1324310302734375, 0.18292236328125, 0.2334136962890625, 0.283905029296875, 0.3343963623046875, 0.3848876953125, 0.4353790283203125, 0.485870361328125, 0.5363616943359375, 0.58685302734375, 0.6373443603515625, 0.687835693359375, 0.7383270263671875, 0.788818359375, 0.8393096923828125, 0.889801025390625, 0.9402923583984375, 0.99078369140625, 1.0412750244140625, 1.091766357421875, 1.1422576904296875, 1.1927490234375, 1.2432403564453125, 1.293731689453125, 1.3442230224609375, 1.39471435546875, 1.4452056884765625, 1.495697021484375, 1.5461883544921875, 1.5966796875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 8.0, 9.0, 20.0, 32.0, 44.0, 52.0, 93.0, 117.0, 153.0, 277.0, 339.0, 532.0, 814.0, 1127.0, 1698.0, 2561.0, 3962.0, 6056.0, 9765.0, 15651.0, 25211.0, 41603.0, 72262.0, 130433.0, 1225153.0, 260528.0, 124095.0, 68784.0, 40169.0, 24068.0, 14710.0, 9196.0, 5926.0, 3782.0, 2614.0, 1662.0, 1160.0, 806.0, 539.0, 343.0, 236.0, 174.0, 109.0, 80.0, 66.0, 38.0, 28.0, 15.0, 14.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.248779296875, -0.2409954071044922, -0.23321151733398438, -0.22542762756347656, -0.21764373779296875, -0.20985984802246094, -0.20207595825195312, -0.1942920684814453, -0.1865081787109375, -0.1787242889404297, -0.17094039916992188, -0.16315650939941406, -0.15537261962890625, -0.14758872985839844, -0.13980484008789062, -0.1320209503173828, -0.124237060546875, -0.11645317077636719, -0.10866928100585938, -0.10088539123535156, -0.09310150146484375, -0.08531761169433594, -0.07753372192382812, -0.06974983215332031, -0.0619659423828125, -0.05418205261230469, -0.046398162841796875, -0.03861427307128906, -0.03083038330078125, -0.023046493530273438, -0.015262603759765625, -0.0074787139892578125, 0.00030517578125, 0.008089065551757812, 0.015872955322265625, 0.023656845092773438, 0.03144073486328125, 0.03922462463378906, 0.047008514404296875, 0.05479240417480469, 0.0625762939453125, 0.07036018371582031, 0.07814407348632812, 0.08592796325683594, 0.09371185302734375, 0.10149574279785156, 0.10927963256835938, 0.11706352233886719, 0.124847412109375, 0.1326313018798828, 0.14041519165039062, 0.14819908142089844, 0.15598297119140625, 0.16376686096191406, 0.17155075073242188, 0.1793346405029297, 0.1871185302734375, 0.1949024200439453, 0.20268630981445312, 0.21047019958496094, 0.21825408935546875, 0.22603797912597656, 0.23382186889648438, 0.2416057586669922, 0.2493896484375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 7.0, 2.0, 6.0, 8.0, 12.0, 7.0, 12.0, 19.0, 18.0, 38.0, 38.0, 50.0, 39.0, 61.0, 57.0, 64.0, 68.0, 74.0, 65.0, 55.0, 57.0, 41.0, 36.0, 25.0, 29.0, 22.0, 13.0, 16.0, 17.0, 11.0, 8.0, 7.0, 8.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007238388061523438, -0.0006979629397392273, -0.0006720870733261108, -0.0006462112069129944, -0.0006203353404998779, -0.0005944594740867615, -0.000568583607673645, -0.0005427077412605286, -0.0005168318748474121, -0.0004909560084342957, -0.0004650801420211792, -0.00043920427560806274, -0.0004133284091949463, -0.00038745254278182983, -0.0003615766763687134, -0.0003357008099555969, -0.00030982494354248047, -0.000283949077129364, -0.00025807321071624756, -0.0002321973443031311, -0.00020632147789001465, -0.0001804456114768982, -0.00015456974506378174, -0.00012869387865066528, -0.00010281801223754883, -7.694214582443237e-05, -5.106627941131592e-05, -2.5190412998199463e-05, 6.854534149169922e-07, 2.6561319828033447e-05, 5.24371862411499e-05, 7.831305265426636e-05, 0.00010418891906738281, 0.00013006478548049927, 0.00015594065189361572, 0.00018181651830673218, 0.00020769238471984863, 0.0002335682511329651, 0.00025944411754608154, 0.000285319983959198, 0.00031119585037231445, 0.0003370717167854309, 0.00036294758319854736, 0.0003888234496116638, 0.0004146993160247803, 0.00044057518243789673, 0.0004664510488510132, 0.0004923269152641296, 0.0005182027816772461, 0.0005440786480903625, 0.000569954514503479, 0.0005958303809165955, 0.0006217062473297119, 0.0006475821137428284, 0.0006734579801559448, 0.0006993338465690613, 0.0007252097129821777, 0.0007510855793952942, 0.0007769614458084106, 0.0008028373122215271, 0.0008287131786346436, 0.00085458904504776, 0.0008804649114608765, 0.0009063407778739929, 0.0009322166442871094]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 7.0, 11.0, 11.0, 14.0, 13.0, 15.0, 18.0, 19.0, 34.0, 35.0, 57.0, 94.0, 131.0, 224.0, 475.0, 1967.0, 275847.0, 764663.0, 3525.0, 611.0, 272.0, 148.0, 79.0, 61.0, 54.0, 42.0, 25.0, 21.0, 19.0, 8.0, 18.0, 4.0, 4.0, 2.0, 5.0, 8.0, 2.0, 1.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01666259765625, -0.0161435604095459, -0.015624523162841797, -0.015105485916137695, -0.014586448669433594, -0.014067411422729492, -0.01354837417602539, -0.013029336929321289, -0.012510299682617188, -0.011991262435913086, -0.011472225189208984, -0.010953187942504883, -0.010434150695800781, -0.00991511344909668, -0.009396076202392578, -0.008877038955688477, -0.008358001708984375, -0.007838964462280273, -0.007319927215576172, -0.00680088996887207, -0.006281852722167969, -0.005762815475463867, -0.005243778228759766, -0.004724740982055664, -0.0042057037353515625, -0.003686666488647461, -0.0031676292419433594, -0.002648591995239258, -0.0021295547485351562, -0.0016105175018310547, -0.0010914802551269531, -0.0005724430084228516, -5.340576171875e-05, 0.00046563148498535156, 0.0009846687316894531, 0.0015037059783935547, 0.0020227432250976562, 0.002541780471801758, 0.0030608177185058594, 0.003579854965209961, 0.0040988922119140625, 0.004617929458618164, 0.005136966705322266, 0.005656003952026367, 0.006175041198730469, 0.00669407844543457, 0.007213115692138672, 0.0077321529388427734, 0.008251190185546875, 0.008770227432250977, 0.009289264678955078, 0.00980830192565918, 0.010327339172363281, 0.010846376419067383, 0.011365413665771484, 0.011884450912475586, 0.012403488159179688, 0.012922525405883789, 0.01344156265258789, 0.013960599899291992, 0.014479637145996094, 0.014998674392700195, 0.015517711639404297, 0.0160367488861084, 0.0165557861328125]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 8.0, 29.0, 87.0, 207.0, 318.0, 223.0, 99.0, 29.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00032286858186125755, -0.0002732789143919945, -0.00022368927602656186, -0.000174099623109214, -0.00012450997019186616, -7.492030272260308e-05, -2.5330664357170463e-05, 2.4258974008262157e-05, 7.384864147752523e-05, 0.00012343829439487308, 0.00017302794731222093, 0.00022261760022956878, 0.00027220725314691663, 0.0003217969206161797, 0.0003713865589816123, 0.00042097619734704494, 0.000470565864816308, 0.0005201555322855711, 0.0005697451997548342, 0.0006193348090164363, 0.0006689244764856994, 0.0007185141439549625, 0.0007681037532165647, 0.0008176934206858277, 0.0008672830881550908, 0.0009168727556243539, 0.000966462423093617, 0.00101605209056288, 0.0010656416416168213, 0.0011152313090860844, 0.0011648209765553474, 0.0012144106440246105, 0.0012640003114938736, 0.0013135899789631367, 0.0013631796464323997, 0.0014127693139016628, 0.001462358981370926, 0.001511948648840189, 0.0015615381998941302, 0.0016111278673633933, 0.0016607175348326564, 0.0017103072023019195, 0.0017598968697711825, 0.0018094865372404456, 0.0018590760882943869, 0.00190866575576365, 0.001958255423232913, 0.002007845090702176, 0.002057434758171439, 0.0021070244256407022, 0.0021566140931099653, 0.0022062037605792284, 0.0022557934280484915, 0.0023053830955177546, 0.0023549727629870176, 0.002404562197625637, 0.0024541518650949, 0.002503741532564163, 0.0025533312000334263, 0.0026029208675026894, 0.0026525105349719524, 0.0027021002024412155, 0.0027516898699104786, 0.0028012795373797417, 0.0028508692048490047]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 6.0, 6.0, 9.0, 4.0, 10.0, 18.0, 16.0, 18.0, 17.0, 23.0, 30.0, 28.0, 32.0, 42.0, 28.0, 35.0, 43.0, 45.0, 46.0, 49.0, 42.0, 40.0, 39.0, 37.0, 30.0, 34.0, 40.0, 30.0, 24.0, 22.0, 29.0, 14.0, 25.0, 16.0, 19.0, 7.0, 9.0, 12.0, 6.0, 10.0, 3.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00043070316314697266, -0.00041798409074544907, -0.0004052650183439255, -0.0003925459459424019, -0.0003798268735408783, -0.0003671078011393547, -0.0003543887287378311, -0.0003416696563363075, -0.00032895058393478394, -0.00031623151153326035, -0.00030351243913173676, -0.00029079336673021317, -0.0002780742943286896, -0.000265355221927166, -0.0002526361495256424, -0.0002399170771241188, -0.00022719800472259521, -0.00021447893232107162, -0.00020175985991954803, -0.00018904078751802444, -0.00017632171511650085, -0.00016360264271497726, -0.00015088357031345367, -0.00013816449791193008, -0.0001254454255104065, -0.0001127263531088829, -0.00010000728070735931, -8.728820830583572e-05, -7.456913590431213e-05, -6.185006350278854e-05, -4.9130991101264954e-05, -3.6411918699741364e-05, -2.3692846298217773e-05, -1.0973773896694183e-05, 1.7452985048294067e-06, 1.4464370906352997e-05, 2.7183443307876587e-05, 3.990251570940018e-05, 5.262158811092377e-05, 6.534066051244736e-05, 7.805973291397095e-05, 9.077880531549454e-05, 0.00010349787771701813, 0.00011621695011854172, 0.0001289360225200653, 0.0001416550949215889, 0.0001543741673231125, 0.00016709323972463608, 0.00017981231212615967, 0.00019253138452768326, 0.00020525045692920685, 0.00021796952933073044, 0.00023068860173225403, 0.00024340767413377762, 0.0002561267465353012, 0.0002688458189368248, 0.0002815648913383484, 0.000294283963739872, 0.00030700303614139557, 0.00031972210854291916, 0.00033244118094444275, 0.00034516025334596634, 0.00035787932574748993, 0.0003705983981490135, 0.0003833174705505371]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 11.0, 4.0, 1.0, 5.0, 6.0, 5.0, 12.0, 13.0, 13.0, 12.0, 19.0, 20.0, 24.0, 22.0, 24.0, 16.0, 27.0, 26.0, 22.0, 40.0, 38.0, 50.0, 44.0, 50.0, 35.0, 29.0, 36.0, 32.0, 25.0, 27.0, 35.0, 30.0, 32.0, 21.0, 19.0, 21.0, 19.0, 18.0, 17.0, 17.0, 12.0, 18.0, 10.0, 15.0, 4.0, 6.0, 4.0, 5.0, 2.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0], "bins": [-2.00390625, -1.942352294921875, -1.88079833984375, -1.819244384765625, -1.7576904296875, -1.696136474609375, -1.63458251953125, -1.573028564453125, -1.511474609375, -1.449920654296875, -1.38836669921875, -1.326812744140625, -1.2652587890625, -1.203704833984375, -1.14215087890625, -1.080596923828125, -1.01904296875, -0.957489013671875, -0.89593505859375, -0.834381103515625, -0.7728271484375, -0.711273193359375, -0.64971923828125, -0.588165283203125, -0.526611328125, -0.465057373046875, -0.40350341796875, -0.341949462890625, -0.2803955078125, -0.218841552734375, -0.15728759765625, -0.095733642578125, -0.0341796875, 0.027374267578125, 0.08892822265625, 0.150482177734375, 0.2120361328125, 0.273590087890625, 0.33514404296875, 0.396697998046875, 0.458251953125, 0.519805908203125, 0.58135986328125, 0.642913818359375, 0.7044677734375, 0.766021728515625, 0.82757568359375, 0.889129638671875, 0.95068359375, 1.012237548828125, 1.07379150390625, 1.135345458984375, 1.1968994140625, 1.258453369140625, 1.32000732421875, 1.381561279296875, 1.443115234375, 1.504669189453125, 1.56622314453125, 1.627777099609375, 1.6893310546875, 1.750885009765625, 1.81243896484375, 1.873992919921875, 1.935546875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 4.0, 12.0, 16.0, 28.0, 50.0, 90.0, 135.0, 231.0, 475.0, 1185.0, 3176.0, 8944.0, 26030.0, 67175.0, 167149.0, 363285.0, 246029.0, 101755.0, 39787.0, 14649.0, 5124.0, 1756.0, 735.0, 319.0, 165.0, 96.0, 46.0, 42.0, 24.0, 8.0, 6.0, 7.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.908203125, -2.8165283203125, -2.724853515625, -2.6331787109375, -2.54150390625, -2.4498291015625, -2.358154296875, -2.2664794921875, -2.1748046875, -2.0831298828125, -1.991455078125, -1.8997802734375, -1.80810546875, -1.7164306640625, -1.624755859375, -1.5330810546875, -1.44140625, -1.3497314453125, -1.258056640625, -1.1663818359375, -1.07470703125, -0.9830322265625, -0.891357421875, -0.7996826171875, -0.7080078125, -0.6163330078125, -0.524658203125, -0.4329833984375, -0.34130859375, -0.2496337890625, -0.157958984375, -0.0662841796875, 0.025390625, 0.1170654296875, 0.208740234375, 0.3004150390625, 0.39208984375, 0.4837646484375, 0.575439453125, 0.6671142578125, 0.7587890625, 0.8504638671875, 0.942138671875, 1.0338134765625, 1.12548828125, 1.2171630859375, 1.308837890625, 1.4005126953125, 1.4921875, 1.5838623046875, 1.675537109375, 1.7672119140625, 1.85888671875, 1.9505615234375, 2.042236328125, 2.1339111328125, 2.2255859375, 2.3172607421875, 2.408935546875, 2.5006103515625, 2.59228515625, 2.6839599609375, 2.775634765625, 2.8673095703125, 2.958984375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 17.0, 8.0, 15.0, 21.0, 18.0, 15.0, 25.0, 29.0, 47.0, 42.0, 33.0, 57.0, 73.0, 117.0, 349.0, 1450.0, 210.0, 111.0, 55.0, 44.0, 43.0, 37.0, 37.0, 38.0, 27.0, 23.0, 25.0, 13.0, 6.0, 16.0, 11.0, 10.0, 6.0, 5.0, 5.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.77734375, -6.49725341796875, -6.2171630859375, -5.93707275390625, -5.656982421875, -5.37689208984375, -5.0968017578125, -4.81671142578125, -4.53662109375, -4.25653076171875, -3.9764404296875, -3.69635009765625, -3.416259765625, -3.13616943359375, -2.8560791015625, -2.57598876953125, -2.2958984375, -2.01580810546875, -1.7357177734375, -1.45562744140625, -1.175537109375, -0.89544677734375, -0.6153564453125, -0.33526611328125, -0.05517578125, 0.22491455078125, 0.5050048828125, 0.78509521484375, 1.065185546875, 1.34527587890625, 1.6253662109375, 1.90545654296875, 2.185546875, 2.46563720703125, 2.7457275390625, 3.02581787109375, 3.305908203125, 3.58599853515625, 3.8660888671875, 4.14617919921875, 4.42626953125, 4.70635986328125, 4.9864501953125, 5.26654052734375, 5.546630859375, 5.82672119140625, 6.1068115234375, 6.38690185546875, 6.6669921875, 6.94708251953125, 7.2271728515625, 7.50726318359375, 7.787353515625, 8.06744384765625, 8.3475341796875, 8.62762451171875, 8.90771484375, 9.18780517578125, 9.4678955078125, 9.74798583984375, 10.028076171875, 10.30816650390625, 10.5882568359375, 10.86834716796875, 11.1484375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 6.0, 11.0, 10.0, 11.0, 11.0, 24.0, 28.0, 27.0, 41.0, 48.0, 63.0, 83.0, 138.0, 153.0, 250.0, 489.0, 1411.0, 84413.0, 3049230.0, 7396.0, 798.0, 337.0, 206.0, 130.0, 96.0, 71.0, 55.0, 40.0, 31.0, 14.0, 21.0, 7.0, 21.0, 7.0, 9.0, 4.0, 4.0, 2.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.875, -24.05419921875, -23.2333984375, -22.41259765625, -21.591796875, -20.77099609375, -19.9501953125, -19.12939453125, -18.30859375, -17.48779296875, -16.6669921875, -15.84619140625, -15.025390625, -14.20458984375, -13.3837890625, -12.56298828125, -11.7421875, -10.92138671875, -10.1005859375, -9.27978515625, -8.458984375, -7.63818359375, -6.8173828125, -5.99658203125, -5.17578125, -4.35498046875, -3.5341796875, -2.71337890625, -1.892578125, -1.07177734375, -0.2509765625, 0.56982421875, 1.390625, 2.21142578125, 3.0322265625, 3.85302734375, 4.673828125, 5.49462890625, 6.3154296875, 7.13623046875, 7.95703125, 8.77783203125, 9.5986328125, 10.41943359375, 11.240234375, 12.06103515625, 12.8818359375, 13.70263671875, 14.5234375, 15.34423828125, 16.1650390625, 16.98583984375, 17.806640625, 18.62744140625, 19.4482421875, 20.26904296875, 21.08984375, 21.91064453125, 22.7314453125, 23.55224609375, 24.373046875, 25.19384765625, 26.0146484375, 26.83544921875, 27.65625]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 74.0, 632.0, 299.0, 11.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.503320693969727, -18.72210121154785, -15.94088363647461, -13.159664154052734, -10.378445625305176, -7.597227096557617, -4.816007614135742, -2.0347900390625, 0.746429443359375, 3.5276482105255127, 6.30886697769165, 9.090085983276367, 11.871304512023926, 14.652523040771484, 17.43374252319336, 20.2149600982666, 22.996179580688477, 25.77739906311035, 28.558616638183594, 31.33983612060547, 34.121055603027344, 36.90227508544922, 39.683494567871094, 42.4647102355957, 45.24592971801758, 48.02714920043945, 50.80836868286133, 53.58958435058594, 56.37080383300781, 59.15202331542969, 61.93324279785156, 64.71446228027344, 67.49567413330078, 70.27689361572266, 73.05811309814453, 75.8393325805664, 78.62055206298828, 81.40176391601562, 84.1829833984375, 86.96420288085938, 89.74542236328125, 92.52664184570312, 95.307861328125, 98.08908081054688, 100.87030029296875, 103.65151977539062, 106.4327392578125, 109.21395111083984, 111.99517822265625, 114.77639770507812, 117.5576171875, 120.33883666992188, 123.12005615234375, 125.90127563476562, 128.6824951171875, 131.46371459960938, 134.2449188232422, 137.02613830566406, 139.80735778808594, 142.5885772705078, 145.3697967529297, 148.15101623535156, 150.93223571777344, 153.7134552001953, 156.4946746826172]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 8.0, 6.0, 8.0, 10.0, 12.0, 17.0, 15.0, 18.0, 17.0, 13.0, 28.0, 24.0, 35.0, 41.0, 31.0, 40.0, 38.0, 47.0, 38.0, 47.0, 30.0, 42.0, 33.0, 39.0, 37.0, 32.0, 35.0, 35.0, 29.0, 25.0, 22.0, 34.0, 20.0, 18.0, 13.0, 17.0, 11.0, 4.0, 6.0, 5.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-22.69818878173828, -22.0194034576416, -21.340618133544922, -20.66183090209961, -19.98304557800293, -19.30426025390625, -18.62547492980957, -17.94668960571289, -17.267902374267578, -16.5891170501709, -15.910330772399902, -15.231545448303223, -14.552759170532227, -13.873973846435547, -13.195188522338867, -12.516403198242188, -11.837617874145508, -11.158832550048828, -10.480046272277832, -9.801260948181152, -9.122474670410156, -8.443689346313477, -7.764904022216797, -7.086118221282959, -6.407332420349121, -5.728546619415283, -5.049760818481445, -4.370975494384766, -3.6921896934509277, -3.01340389251709, -2.33461856842041, -1.6558327674865723, -0.9770450592041016, -0.2982593774795532, 0.3805263042449951, 1.059311866760254, 1.7380976676940918, 2.4168834686279297, 3.0956687927246094, 3.7744545936584473, 4.453240394592285, 5.132026195526123, 5.810811996459961, 6.489597320556641, 7.1683831214904785, 7.847168922424316, 8.525954246520996, 9.204740524291992, 9.883525848388672, 10.562311172485352, 11.241097450256348, 11.919882774353027, 12.598669052124023, 13.277454376220703, 13.956239700317383, 14.635025024414062, 15.313811302185059, 15.992596626281738, 16.671382904052734, 17.350168228149414, 18.028953552246094, 18.707740783691406, 19.386524200439453, 20.065311431884766, 20.744096755981445]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 4.0, 2.0, 3.0, 3.0, 6.0, 2.0, 8.0, 9.0, 11.0, 12.0, 22.0, 20.0, 13.0, 18.0, 27.0, 17.0, 27.0, 30.0, 33.0, 35.0, 37.0, 33.0, 45.0, 49.0, 43.0, 27.0, 40.0, 42.0, 35.0, 26.0, 38.0, 34.0, 27.0, 23.0, 24.0, 24.0, 12.0, 22.0, 15.0, 17.0, 19.0, 13.0, 8.0, 13.0, 6.0, 11.0, 3.0, 3.0, 4.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.271484375, -2.198577880859375, -2.12567138671875, -2.052764892578125, -1.9798583984375, -1.906951904296875, -1.83404541015625, -1.761138916015625, -1.688232421875, -1.615325927734375, -1.54241943359375, -1.469512939453125, -1.3966064453125, -1.323699951171875, -1.25079345703125, -1.177886962890625, -1.10498046875, -1.032073974609375, -0.95916748046875, -0.886260986328125, -0.8133544921875, -0.740447998046875, -0.66754150390625, -0.594635009765625, -0.521728515625, -0.448822021484375, -0.37591552734375, -0.303009033203125, -0.2301025390625, -0.157196044921875, -0.08428955078125, -0.011383056640625, 0.0615234375, 0.134429931640625, 0.20733642578125, 0.280242919921875, 0.3531494140625, 0.426055908203125, 0.49896240234375, 0.571868896484375, 0.644775390625, 0.717681884765625, 0.79058837890625, 0.863494873046875, 0.9364013671875, 1.009307861328125, 1.08221435546875, 1.155120849609375, 1.22802734375, 1.300933837890625, 1.37384033203125, 1.446746826171875, 1.5196533203125, 1.592559814453125, 1.66546630859375, 1.738372802734375, 1.811279296875, 1.884185791015625, 1.95709228515625, 2.029998779296875, 2.1029052734375, 2.175811767578125, 2.24871826171875, 2.321624755859375, 2.39453125]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 3.0, 2.0, 2.0, 6.0, 3.0, 5.0, 4.0, 8.0, 14.0, 11.0, 11.0, 8.0, 21.0, 22.0, 26.0, 27.0, 33.0, 48.0, 52.0, 89.0, 157.0, 279.0, 788.0, 3331.0, 35439.0, 697934.0, 2756964.0, 660153.0, 33588.0, 3312.0, 916.0, 379.0, 195.0, 107.0, 65.0, 58.0, 27.0, 33.0, 20.0, 25.0, 11.0, 28.0, 17.0, 10.0, 9.0, 8.0, 8.0, 7.0, 6.0, 3.0, 1.0, 4.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0], "bins": [-7.1171875, -6.89813232421875, -6.6790771484375, -6.46002197265625, -6.240966796875, -6.02191162109375, -5.8028564453125, -5.58380126953125, -5.36474609375, -5.14569091796875, -4.9266357421875, -4.70758056640625, -4.488525390625, -4.26947021484375, -4.0504150390625, -3.83135986328125, -3.6123046875, -3.39324951171875, -3.1741943359375, -2.95513916015625, -2.736083984375, -2.51702880859375, -2.2979736328125, -2.07891845703125, -1.85986328125, -1.64080810546875, -1.4217529296875, -1.20269775390625, -0.983642578125, -0.76458740234375, -0.5455322265625, -0.32647705078125, -0.107421875, 0.11163330078125, 0.3306884765625, 0.54974365234375, 0.768798828125, 0.98785400390625, 1.2069091796875, 1.42596435546875, 1.64501953125, 1.86407470703125, 2.0831298828125, 2.30218505859375, 2.521240234375, 2.74029541015625, 2.9593505859375, 3.17840576171875, 3.3974609375, 3.61651611328125, 3.8355712890625, 4.05462646484375, 4.273681640625, 4.49273681640625, 4.7117919921875, 4.93084716796875, 5.14990234375, 5.36895751953125, 5.5880126953125, 5.80706787109375, 6.026123046875, 6.24517822265625, 6.4642333984375, 6.68328857421875, 6.90234375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 10.0, 5.0, 8.0, 11.0, 16.0, 20.0, 27.0, 25.0, 38.0, 41.0, 79.0, 79.0, 121.0, 141.0, 194.0, 253.0, 254.0, 309.0, 346.0, 358.0, 300.0, 285.0, 270.0, 201.0, 136.0, 124.0, 80.0, 102.0, 55.0, 42.0, 31.0, 23.0, 22.0, 14.0, 16.0, 12.0, 4.0, 4.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.13671875, -3.9947509765625, -3.852783203125, -3.7108154296875, -3.56884765625, -3.4268798828125, -3.284912109375, -3.1429443359375, -3.0009765625, -2.8590087890625, -2.717041015625, -2.5750732421875, -2.43310546875, -2.2911376953125, -2.149169921875, -2.0072021484375, -1.865234375, -1.7232666015625, -1.581298828125, -1.4393310546875, -1.29736328125, -1.1553955078125, -1.013427734375, -0.8714599609375, -0.7294921875, -0.5875244140625, -0.445556640625, -0.3035888671875, -0.16162109375, -0.0196533203125, 0.122314453125, 0.2642822265625, 0.40625, 0.5482177734375, 0.690185546875, 0.8321533203125, 0.97412109375, 1.1160888671875, 1.258056640625, 1.4000244140625, 1.5419921875, 1.6839599609375, 1.825927734375, 1.9678955078125, 2.10986328125, 2.2518310546875, 2.393798828125, 2.5357666015625, 2.677734375, 2.8197021484375, 2.961669921875, 3.1036376953125, 3.24560546875, 3.3875732421875, 3.529541015625, 3.6715087890625, 3.8134765625, 3.9554443359375, 4.097412109375, 4.2393798828125, 4.38134765625, 4.5233154296875, 4.665283203125, 4.8072509765625, 4.94921875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 3.0, 5.0, 9.0, 9.0, 21.0, 18.0, 19.0, 28.0, 54.0, 64.0, 94.0, 117.0, 155.0, 212.0, 340.0, 536.0, 1627.0, 37059.0, 2948143.0, 1191465.0, 11810.0, 1041.0, 426.0, 293.0, 186.0, 149.0, 92.0, 82.0, 52.0, 40.0, 26.0, 26.0, 21.0, 16.0, 12.0, 4.0, 8.0, 9.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.21875, -15.709716796875, -15.20068359375, -14.691650390625, -14.1826171875, -13.673583984375, -13.16455078125, -12.655517578125, -12.146484375, -11.637451171875, -11.12841796875, -10.619384765625, -10.1103515625, -9.601318359375, -9.09228515625, -8.583251953125, -8.07421875, -7.565185546875, -7.05615234375, -6.547119140625, -6.0380859375, -5.529052734375, -5.02001953125, -4.510986328125, -4.001953125, -3.492919921875, -2.98388671875, -2.474853515625, -1.9658203125, -1.456787109375, -0.94775390625, -0.438720703125, 0.0703125, 0.579345703125, 1.08837890625, 1.597412109375, 2.1064453125, 2.615478515625, 3.12451171875, 3.633544921875, 4.142578125, 4.651611328125, 5.16064453125, 5.669677734375, 6.1787109375, 6.687744140625, 7.19677734375, 7.705810546875, 8.21484375, 8.723876953125, 9.23291015625, 9.741943359375, 10.2509765625, 10.760009765625, 11.26904296875, 11.778076171875, 12.287109375, 12.796142578125, 13.30517578125, 13.814208984375, 14.3232421875, 14.832275390625, 15.34130859375, 15.850341796875, 16.359375]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 22.0, 189.0, 453.0, 294.0, 54.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.65222930908203, -100.47725677490234, -97.30227661132812, -94.12730407714844, -90.95233154296875, -87.77735900878906, -84.60238647460938, -81.42740631103516, -78.25243377685547, -75.07746124267578, -71.90248107910156, -68.72750854492188, -65.55253601074219, -62.3775634765625, -59.20258712768555, -56.027610778808594, -52.852638244628906, -49.67766571044922, -46.502689361572266, -43.32771301269531, -40.152740478515625, -36.97776794433594, -33.802791595458984, -30.627817153930664, -27.452842712402344, -24.277868270874023, -21.102893829345703, -17.927919387817383, -14.752944946289062, -11.577970504760742, -8.402996063232422, -5.228021621704102, -2.0530548095703125, 1.1219196319580078, 4.296894073486328, 7.471868515014648, 10.646842956542969, 13.821817398071289, 16.99679183959961, 20.17176628112793, 23.34674072265625, 26.52171516418457, 29.69668960571289, 32.871665954589844, 36.04663848876953, 39.22161102294922, 42.39658737182617, 45.571563720703125, 48.74653625488281, 51.9215087890625, 55.09648513793945, 58.271461486816406, 61.446434020996094, 64.62140655517578, 67.79638671875, 70.97135925292969, 74.14633178710938, 77.32130432128906, 80.49627685546875, 83.67125701904297, 86.84622955322266, 90.02120208740234, 93.19618225097656, 96.37115478515625, 99.54612731933594]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 1.0, 3.0, 5.0, 6.0, 8.0, 7.0, 8.0, 12.0, 9.0, 16.0, 29.0, 14.0, 16.0, 25.0, 31.0, 33.0, 36.0, 37.0, 36.0, 47.0, 38.0, 35.0, 37.0, 35.0, 34.0, 39.0, 42.0, 40.0, 40.0, 38.0, 31.0, 30.0, 28.0, 29.0, 16.0, 13.0, 14.0, 16.0, 8.0, 12.0, 14.0, 9.0, 7.0, 10.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.75714874267578, -16.243026733398438, -15.728904724121094, -15.214783668518066, -14.700661659240723, -14.186539649963379, -13.672418594360352, -13.158296585083008, -12.644174575805664, -12.13005256652832, -11.615930557250977, -11.10180950164795, -10.587687492370605, -10.073565483093262, -9.559444427490234, -9.04532241821289, -8.531200408935547, -8.017078399658203, -7.502956867218018, -6.988835334777832, -6.474713325500488, -5.9605913162231445, -5.446469783782959, -4.932348251342773, -4.41822624206543, -3.904104471206665, -3.3899827003479004, -2.8758609294891357, -2.361739158630371, -1.8476173877716064, -1.3334956169128418, -0.8193738460540771, -0.3052520751953125, 0.20886969566345215, 0.7229914665222168, 1.2371132373809814, 1.751235008239746, 2.2653567790985107, 2.7794785499572754, 3.29360032081604, 3.8077220916748047, 4.321844100952148, 4.835965633392334, 5.3500871658325195, 5.864209175109863, 6.378331184387207, 6.892452716827393, 7.406574249267578, 7.920696258544922, 8.434818267822266, 8.94894027709961, 9.463061332702637, 9.97718334197998, 10.491305351257324, 11.005426406860352, 11.519548416137695, 12.033670425415039, 12.547792434692383, 13.061914443969727, 13.576035499572754, 14.090157508850098, 14.604279518127441, 15.118400573730469, 15.632522583007812, 16.146644592285156]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 3.0, 20.0, 19.0, 22.0, 19.0, 26.0, 17.0, 29.0, 28.0, 33.0, 42.0, 33.0, 52.0, 51.0, 38.0, 40.0, 29.0, 41.0, 59.0, 33.0, 34.0, 25.0, 32.0, 45.0, 31.0, 27.0, 29.0, 23.0, 16.0, 15.0, 14.0, 12.0, 8.0, 10.0, 3.0, 4.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.53125, -2.452484130859375, -2.37371826171875, -2.294952392578125, -2.2161865234375, -2.137420654296875, -2.05865478515625, -1.979888916015625, -1.901123046875, -1.822357177734375, -1.74359130859375, -1.664825439453125, -1.5860595703125, -1.507293701171875, -1.42852783203125, -1.349761962890625, -1.27099609375, -1.192230224609375, -1.11346435546875, -1.034698486328125, -0.9559326171875, -0.877166748046875, -0.79840087890625, -0.719635009765625, -0.640869140625, -0.562103271484375, -0.48333740234375, -0.404571533203125, -0.3258056640625, -0.247039794921875, -0.16827392578125, -0.089508056640625, -0.0107421875, 0.068023681640625, 0.14678955078125, 0.225555419921875, 0.3043212890625, 0.383087158203125, 0.46185302734375, 0.540618896484375, 0.619384765625, 0.698150634765625, 0.77691650390625, 0.855682373046875, 0.9344482421875, 1.013214111328125, 1.09197998046875, 1.170745849609375, 1.24951171875, 1.328277587890625, 1.40704345703125, 1.485809326171875, 1.5645751953125, 1.643341064453125, 1.72210693359375, 1.800872802734375, 1.879638671875, 1.958404541015625, 2.03717041015625, 2.115936279296875, 2.1947021484375, 2.273468017578125, 2.35223388671875, 2.430999755859375, 2.509765625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 12.0, 12.0, 13.0, 31.0, 29.0, 55.0, 73.0, 108.0, 160.0, 250.0, 378.0, 539.0, 810.0, 1215.0, 1800.0, 2649.0, 4187.0, 6282.0, 10189.0, 16053.0, 26407.0, 45285.0, 80965.0, 152999.0, 254476.0, 196662.0, 104464.0, 56403.0, 32263.0, 19568.0, 11920.0, 7757.0, 5008.0, 3216.0, 2114.0, 1366.0, 929.0, 585.0, 437.0, 289.0, 178.0, 148.0, 78.0, 70.0, 40.0, 27.0, 22.0, 13.0, 11.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.3486328125, -0.3379707336425781, -0.32730865478515625, -0.3166465759277344, -0.3059844970703125, -0.2953224182128906, -0.28466033935546875, -0.2739982604980469, -0.263336181640625, -0.2526741027832031, -0.24201202392578125, -0.23134994506835938, -0.2206878662109375, -0.21002578735351562, -0.19936370849609375, -0.18870162963867188, -0.17803955078125, -0.16737747192382812, -0.15671539306640625, -0.14605331420898438, -0.1353912353515625, -0.12472915649414062, -0.11406707763671875, -0.10340499877929688, -0.092742919921875, -0.08208084106445312, -0.07141876220703125, -0.060756683349609375, -0.0500946044921875, -0.039432525634765625, -0.02877044677734375, -0.018108367919921875, -0.0074462890625, 0.003215789794921875, 0.01387786865234375, 0.024539947509765625, 0.0352020263671875, 0.045864105224609375, 0.05652618408203125, 0.06718826293945312, 0.077850341796875, 0.08851242065429688, 0.09917449951171875, 0.10983657836914062, 0.1204986572265625, 0.13116073608398438, 0.14182281494140625, 0.15248489379882812, 0.16314697265625, 0.17380905151367188, 0.18447113037109375, 0.19513320922851562, 0.2057952880859375, 0.21645736694335938, 0.22711944580078125, 0.23778152465820312, 0.248443603515625, 0.2591056823730469, 0.26976776123046875, 0.2804298400878906, 0.2910919189453125, 0.3017539978027344, 0.31241607666015625, 0.3230781555175781, 0.333740234375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 3.0, 8.0, 11.0, 7.0, 18.0, 18.0, 13.0, 13.0, 19.0, 23.0, 28.0, 19.0, 36.0, 26.0, 29.0, 32.0, 49.0, 34.0, 37.0, 46.0, 39.0, 1060.0, 34.0, 37.0, 35.0, 35.0, 40.0, 31.0, 35.0, 38.0, 23.0, 23.0, 13.0, 11.0, 16.0, 15.0, 11.0, 12.0, 15.0, 5.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0], "bins": [-1.654296875, -1.6084747314453125, -1.562652587890625, -1.5168304443359375, -1.47100830078125, -1.4251861572265625, -1.379364013671875, -1.3335418701171875, -1.2877197265625, -1.2418975830078125, -1.196075439453125, -1.1502532958984375, -1.10443115234375, -1.0586090087890625, -1.012786865234375, -0.9669647216796875, -0.921142578125, -0.8753204345703125, -0.829498291015625, -0.7836761474609375, -0.73785400390625, -0.6920318603515625, -0.646209716796875, -0.6003875732421875, -0.5545654296875, -0.5087432861328125, -0.462921142578125, -0.4170989990234375, -0.37127685546875, -0.3254547119140625, -0.279632568359375, -0.2338104248046875, -0.18798828125, -0.1421661376953125, -0.096343994140625, -0.0505218505859375, -0.00469970703125, 0.0411224365234375, 0.086944580078125, 0.1327667236328125, 0.1785888671875, 0.2244110107421875, 0.270233154296875, 0.3160552978515625, 0.36187744140625, 0.4076995849609375, 0.453521728515625, 0.4993438720703125, 0.545166015625, 0.5909881591796875, 0.636810302734375, 0.6826324462890625, 0.72845458984375, 0.7742767333984375, 0.820098876953125, 0.8659210205078125, 0.9117431640625, 0.9575653076171875, 1.003387451171875, 1.0492095947265625, 1.09503173828125, 1.1408538818359375, 1.186676025390625, 1.2324981689453125, 1.2783203125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 5.0, 7.0, 9.0, 18.0, 30.0, 51.0, 59.0, 86.0, 141.0, 203.0, 292.0, 441.0, 610.0, 845.0, 1360.0, 1963.0, 2870.0, 4421.0, 6768.0, 10332.0, 15876.0, 25939.0, 42274.0, 70788.0, 121251.0, 207640.0, 1246425.0, 133525.0, 78430.0, 46582.0, 28083.0, 17512.0, 10855.0, 7127.0, 4622.0, 3114.0, 2064.0, 1396.0, 932.0, 701.0, 464.0, 321.0, 244.0, 144.0, 111.0, 59.0, 48.0, 41.0, 17.0, 17.0, 11.0, 8.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2425537109375, -0.23499488830566406, -0.22743606567382812, -0.2198772430419922, -0.21231842041015625, -0.2047595977783203, -0.19720077514648438, -0.18964195251464844, -0.1820831298828125, -0.17452430725097656, -0.16696548461914062, -0.1594066619873047, -0.15184783935546875, -0.1442890167236328, -0.13673019409179688, -0.12917137145996094, -0.121612548828125, -0.11405372619628906, -0.10649490356445312, -0.09893608093261719, -0.09137725830078125, -0.08381843566894531, -0.07625961303710938, -0.06870079040527344, -0.0611419677734375, -0.05358314514160156, -0.046024322509765625, -0.03846549987792969, -0.03090667724609375, -0.023347854614257812, -0.015789031982421875, -0.008230209350585938, -0.00067138671875, 0.0068874359130859375, 0.014446258544921875, 0.022005081176757812, 0.02956390380859375, 0.03712272644042969, 0.044681549072265625, 0.05224037170410156, 0.0597991943359375, 0.06735801696777344, 0.07491683959960938, 0.08247566223144531, 0.09003448486328125, 0.09759330749511719, 0.10515213012695312, 0.11271095275878906, 0.120269775390625, 0.12782859802246094, 0.13538742065429688, 0.1429462432861328, 0.15050506591796875, 0.1580638885498047, 0.16562271118164062, 0.17318153381347656, 0.1807403564453125, 0.18829917907714844, 0.19585800170898438, 0.2034168243408203, 0.21097564697265625, 0.2185344696044922, 0.22609329223632812, 0.23365211486816406, 0.2412109375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 5.0, 5.0, 7.0, 2.0, 5.0, 21.0, 11.0, 21.0, 27.0, 39.0, 54.0, 65.0, 95.0, 94.0, 101.0, 99.0, 93.0, 78.0, 44.0, 38.0, 23.0, 27.0, 15.0, 7.0, 4.0, 6.0, 7.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00135040283203125, -0.0013047903776168823, -0.0012591779232025146, -0.001213565468788147, -0.0011679530143737793, -0.0011223405599594116, -0.001076728105545044, -0.0010311156511306763, -0.0009855031967163086, -0.0009398907423019409, -0.0008942782878875732, -0.0008486658334732056, -0.0008030533790588379, -0.0007574409246444702, -0.0007118284702301025, -0.0006662160158157349, -0.0006206035614013672, -0.0005749911069869995, -0.0005293786525726318, -0.00048376619815826416, -0.0004381537437438965, -0.0003925412893295288, -0.00034692883491516113, -0.00030131638050079346, -0.0002557039260864258, -0.0002100914716720581, -0.00016447901725769043, -0.00011886656284332275, -7.325410842895508e-05, -2.7641654014587402e-05, 1.7970800399780273e-05, 6.358325481414795e-05, 0.00010919570922851562, 0.0001548081636428833, 0.00020042061805725098, 0.00024603307247161865, 0.00029164552688598633, 0.000337257981300354, 0.0003828704357147217, 0.00042848289012908936, 0.00047409534454345703, 0.0005197077989578247, 0.0005653202533721924, 0.0006109327077865601, 0.0006565451622009277, 0.0007021576166152954, 0.0007477700710296631, 0.0007933825254440308, 0.0008389949798583984, 0.0008846074342727661, 0.0009302198886871338, 0.0009758323431015015, 0.0010214447975158691, 0.0010670572519302368, 0.0011126697063446045, 0.0011582821607589722, 0.0012038946151733398, 0.0012495070695877075, 0.0012951195240020752, 0.0013407319784164429, 0.0013863444328308105, 0.0014319568872451782, 0.001477569341659546, 0.0015231817960739136, 0.0015687942504882812]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 5.0, 8.0, 5.0, 5.0, 13.0, 25.0, 38.0, 60.0, 107.0, 191.0, 463.0, 4357.0, 1039744.0, 2642.0, 421.0, 188.0, 81.0, 58.0, 41.0, 23.0, 24.0, 13.0, 11.0, 4.0, 7.0, 5.0, 4.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03558349609375, -0.03455066680908203, -0.03351783752441406, -0.032485008239746094, -0.031452178955078125, -0.030419349670410156, -0.029386520385742188, -0.02835369110107422, -0.02732086181640625, -0.02628803253173828, -0.025255203247070312, -0.024222373962402344, -0.023189544677734375, -0.022156715393066406, -0.021123886108398438, -0.02009105682373047, -0.0190582275390625, -0.01802539825439453, -0.016992568969726562, -0.015959739685058594, -0.014926910400390625, -0.013894081115722656, -0.012861251831054688, -0.011828422546386719, -0.01079559326171875, -0.009762763977050781, -0.008729934692382812, -0.007697105407714844, -0.006664276123046875, -0.005631446838378906, -0.0045986175537109375, -0.0035657882690429688, -0.002532958984375, -0.0015001296997070312, -0.0004673004150390625, 0.0005655288696289062, 0.001598358154296875, 0.0026311874389648438, 0.0036640167236328125, 0.004696846008300781, 0.00572967529296875, 0.006762504577636719, 0.0077953338623046875, 0.008828163146972656, 0.009860992431640625, 0.010893821716308594, 0.011926651000976562, 0.012959480285644531, 0.0139923095703125, 0.015025138854980469, 0.016057968139648438, 0.017090797424316406, 0.018123626708984375, 0.019156455993652344, 0.020189285278320312, 0.02122211456298828, 0.02225494384765625, 0.02328777313232422, 0.024320602416992188, 0.025353431701660156, 0.026386260986328125, 0.027419090270996094, 0.028451919555664062, 0.02948474884033203, 0.030517578125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 31.0, 246.0, 491.0, 220.0, 24.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009341160766780376, -0.0008362005464732647, -0.0007382850162684917, -0.0006403694860637188, -0.0005424539558589458, -0.000444538367446512, -0.00034662283724173903, -0.0002487073070369661, -0.00015079177683219314, -5.287623935146257e-05, 4.503929812926799e-05, 0.00014295484288595617, 0.00024087037309072912, 0.0003387859323993325, 0.00043670146260410547, 0.0005346169928088784, 0.0006325325230136514, 0.0007304480532184243, 0.0008283635834231973, 0.0009262791136279702, 0.0010241946438327432, 0.001122110290452838, 0.001220025820657611, 0.0013179413508623838, 0.0014158568810671568, 0.0015137724112719297, 0.0016116879414767027, 0.0017096034716814756, 0.0018075190018862486, 0.0019054345320910215, 0.0020033500622957945, 0.0021012655925005674, 0.0021991811227053404, 0.0022970966529101133, 0.0023950121831148863, 0.0024929277133196592, 0.002590843243524432, 0.002688758773729205, 0.002786674303933978, 0.002884589834138751, 0.002982505364343524, 0.003080420894548297, 0.00317833642475307, 0.003276251954957843, 0.0033741674851626158, 0.0034720830153673887, 0.0035699985455721617, 0.0036679140757769346, 0.0037658298388123512, 0.003863745369017124, 0.003961660899221897, 0.00405957642942667, 0.004157491959631443, 0.004255407489836216, 0.004353323020040989, 0.004451238550245762, 0.004549154080450535, 0.004647069610655308, 0.004744985140860081, 0.004842900671064854, 0.004940816201269627, 0.0050387317314744, 0.0051366472616791725, 0.0052345627918839455, 0.005332478322088718]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 6.0, 7.0, 8.0, 6.0, 2.0, 12.0, 4.0, 17.0, 21.0, 18.0, 23.0, 16.0, 26.0, 20.0, 29.0, 26.0, 45.0, 34.0, 38.0, 41.0, 35.0, 36.0, 29.0, 41.0, 44.0, 34.0, 32.0, 29.0, 34.0, 37.0, 32.0, 23.0, 21.0, 32.0, 23.0, 16.0, 24.0, 18.0, 11.0, 18.0, 9.0, 5.0, 8.0, 5.0, 6.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0005388259887695312, -0.0005229907110333443, -0.0005071554332971573, -0.0004913201555609703, -0.0004754848778247833, -0.00045964960008859634, -0.00044381432235240936, -0.0004279790446162224, -0.0004121437668800354, -0.0003963084891438484, -0.00038047321140766144, -0.00036463793367147446, -0.0003488026559352875, -0.0003329673781991005, -0.0003171321004629135, -0.00030129682272672653, -0.00028546154499053955, -0.00026962626725435257, -0.0002537909895181656, -0.0002379557117819786, -0.00022212043404579163, -0.00020628515630960464, -0.00019044987857341766, -0.00017461460083723068, -0.0001587793231010437, -0.00014294404536485672, -0.00012710876762866974, -0.00011127348989248276, -9.543821215629578e-05, -7.96029344201088e-05, -6.376765668392181e-05, -4.793237894773483e-05, -3.209710121154785e-05, -1.626182347536087e-05, -4.2654573917388916e-07, 1.5408731997013092e-05, 3.124400973320007e-05, 4.7079287469387054e-05, 6.291456520557404e-05, 7.874984294176102e-05, 9.4585120677948e-05, 0.00011042039841413498, 0.00012625567615032196, 0.00014209095388650894, 0.00015792623162269592, 0.0001737615093588829, 0.00018959678709506989, 0.00020543206483125687, 0.00022126734256744385, 0.00023710262030363083, 0.0002529378980398178, 0.0002687731757760048, 0.00028460845351219177, 0.00030044373124837875, 0.00031627900898456573, 0.0003321142867207527, 0.0003479495644569397, 0.0003637848421931267, 0.00037962011992931366, 0.00039545539766550064, 0.0004112906754016876, 0.0004271259531378746, 0.0004429612308740616, 0.00045879650861024857, 0.00047463178634643555]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 3.0, 20.0, 19.0, 22.0, 19.0, 26.0, 17.0, 29.0, 28.0, 33.0, 42.0, 33.0, 52.0, 51.0, 38.0, 40.0, 29.0, 41.0, 59.0, 33.0, 34.0, 25.0, 32.0, 45.0, 31.0, 27.0, 29.0, 23.0, 16.0, 15.0, 14.0, 12.0, 8.0, 10.0, 3.0, 4.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.53125, -2.452484130859375, -2.37371826171875, -2.294952392578125, -2.2161865234375, -2.137420654296875, -2.05865478515625, -1.979888916015625, -1.901123046875, -1.822357177734375, -1.74359130859375, -1.664825439453125, -1.5860595703125, -1.507293701171875, -1.42852783203125, -1.349761962890625, -1.27099609375, -1.192230224609375, -1.11346435546875, -1.034698486328125, -0.9559326171875, -0.877166748046875, -0.79840087890625, -0.719635009765625, -0.640869140625, -0.562103271484375, -0.48333740234375, -0.404571533203125, -0.3258056640625, -0.247039794921875, -0.16827392578125, -0.089508056640625, -0.0107421875, 0.068023681640625, 0.14678955078125, 0.225555419921875, 0.3043212890625, 0.383087158203125, 0.46185302734375, 0.540618896484375, 0.619384765625, 0.698150634765625, 0.77691650390625, 0.855682373046875, 0.9344482421875, 1.013214111328125, 1.09197998046875, 1.170745849609375, 1.24951171875, 1.328277587890625, 1.40704345703125, 1.485809326171875, 1.5645751953125, 1.643341064453125, 1.72210693359375, 1.800872802734375, 1.879638671875, 1.958404541015625, 2.03717041015625, 2.115936279296875, 2.1947021484375, 2.273468017578125, 2.35223388671875, 2.430999755859375, 2.509765625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 5.0, 7.0, 6.0, 6.0, 11.0, 22.0, 21.0, 26.0, 39.0, 60.0, 87.0, 144.0, 205.0, 331.0, 616.0, 1255.0, 2853.0, 6790.0, 16787.0, 43972.0, 114215.0, 288325.0, 345738.0, 138439.0, 53407.0, 20507.0, 8003.0, 3343.0, 1516.0, 763.0, 379.0, 257.0, 125.0, 75.0, 77.0, 38.0, 30.0, 31.0, 13.0, 11.0, 5.0, 9.0, 3.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.912109375, -2.81536865234375, -2.7186279296875, -2.62188720703125, -2.525146484375, -2.42840576171875, -2.3316650390625, -2.23492431640625, -2.13818359375, -2.04144287109375, -1.9447021484375, -1.84796142578125, -1.751220703125, -1.65447998046875, -1.5577392578125, -1.46099853515625, -1.3642578125, -1.26751708984375, -1.1707763671875, -1.07403564453125, -0.977294921875, -0.88055419921875, -0.7838134765625, -0.68707275390625, -0.59033203125, -0.49359130859375, -0.3968505859375, -0.30010986328125, -0.203369140625, -0.10662841796875, -0.0098876953125, 0.08685302734375, 0.18359375, 0.28033447265625, 0.3770751953125, 0.47381591796875, 0.570556640625, 0.66729736328125, 0.7640380859375, 0.86077880859375, 0.95751953125, 1.05426025390625, 1.1510009765625, 1.24774169921875, 1.344482421875, 1.44122314453125, 1.5379638671875, 1.63470458984375, 1.7314453125, 1.82818603515625, 1.9249267578125, 2.02166748046875, 2.118408203125, 2.21514892578125, 2.3118896484375, 2.40863037109375, 2.50537109375, 2.60211181640625, 2.6988525390625, 2.79559326171875, 2.892333984375, 2.98907470703125, 3.0858154296875, 3.18255615234375, 3.279296875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 10.0, 6.0, 3.0, 10.0, 7.0, 18.0, 21.0, 24.0, 29.0, 32.0, 36.0, 53.0, 52.0, 67.0, 80.0, 160.0, 338.0, 1468.0, 188.0, 89.0, 75.0, 60.0, 40.0, 34.0, 28.0, 24.0, 24.0, 17.0, 11.0, 12.0, 10.0, 10.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.328125, -10.9864501953125, -10.644775390625, -10.3031005859375, -9.96142578125, -9.6197509765625, -9.278076171875, -8.9364013671875, -8.5947265625, -8.2530517578125, -7.911376953125, -7.5697021484375, -7.22802734375, -6.8863525390625, -6.544677734375, -6.2030029296875, -5.861328125, -5.5196533203125, -5.177978515625, -4.8363037109375, -4.49462890625, -4.1529541015625, -3.811279296875, -3.4696044921875, -3.1279296875, -2.7862548828125, -2.444580078125, -2.1029052734375, -1.76123046875, -1.4195556640625, -1.077880859375, -0.7362060546875, -0.39453125, -0.0528564453125, 0.288818359375, 0.6304931640625, 0.97216796875, 1.3138427734375, 1.655517578125, 1.9971923828125, 2.3388671875, 2.6805419921875, 3.022216796875, 3.3638916015625, 3.70556640625, 4.0472412109375, 4.388916015625, 4.7305908203125, 5.072265625, 5.4139404296875, 5.755615234375, 6.0972900390625, 6.43896484375, 6.7806396484375, 7.122314453125, 7.4639892578125, 7.8056640625, 8.1473388671875, 8.489013671875, 8.8306884765625, 9.17236328125, 9.5140380859375, 9.855712890625, 10.1973876953125, 10.5390625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 3.0, 8.0, 6.0, 3.0, 10.0, 6.0, 11.0, 13.0, 33.0, 27.0, 48.0, 63.0, 101.0, 158.0, 273.0, 576.0, 3309.0, 3104145.0, 34732.0, 1105.0, 437.0, 214.0, 152.0, 81.0, 57.0, 41.0, 19.0, 16.0, 11.0, 12.0, 15.0, 8.0, 4.0, 2.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-50.6875, -49.22802734375, -47.7685546875, -46.30908203125, -44.849609375, -43.39013671875, -41.9306640625, -40.47119140625, -39.01171875, -37.55224609375, -36.0927734375, -34.63330078125, -33.173828125, -31.71435546875, -30.2548828125, -28.79541015625, -27.3359375, -25.87646484375, -24.4169921875, -22.95751953125, -21.498046875, -20.03857421875, -18.5791015625, -17.11962890625, -15.66015625, -14.20068359375, -12.7412109375, -11.28173828125, -9.822265625, -8.36279296875, -6.9033203125, -5.44384765625, -3.984375, -2.52490234375, -1.0654296875, 0.39404296875, 1.853515625, 3.31298828125, 4.7724609375, 6.23193359375, 7.69140625, 9.15087890625, 10.6103515625, 12.06982421875, 13.529296875, 14.98876953125, 16.4482421875, 17.90771484375, 19.3671875, 20.82666015625, 22.2861328125, 23.74560546875, 25.205078125, 26.66455078125, 28.1240234375, 29.58349609375, 31.04296875, 32.50244140625, 33.9619140625, 35.42138671875, 36.880859375, 38.34033203125, 39.7998046875, 41.25927734375, 42.71875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 85.0, 391.0, 415.0, 107.0, 9.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.1226806640625, -78.42129516601562, -76.71990203857422, -75.01851654052734, -73.31712341308594, -71.61573791503906, -69.91435241699219, -68.21295928955078, -66.5115737915039, -64.81018829345703, -63.108795166015625, -61.40740966796875, -59.70602035522461, -58.00463104248047, -56.303245544433594, -54.60185623168945, -52.90046691894531, -51.19907760620117, -49.49768829345703, -47.796302795410156, -46.094913482666016, -44.393524169921875, -42.692138671875, -40.99074935913086, -39.28936004638672, -37.58797073364258, -35.88658142089844, -34.18519592285156, -32.48380661010742, -30.78241729736328, -29.081029891967773, -27.379642486572266, -25.67825698852539, -23.97686767578125, -22.275480270385742, -20.574092864990234, -18.872703552246094, -17.171314239501953, -15.469926834106445, -13.768538475036621, -12.067150115966797, -10.365761756896973, -8.664373397827148, -6.962985038757324, -5.2615966796875, -3.560208320617676, -1.8588199615478516, -0.15743160247802734, 1.5439567565917969, 3.245345115661621, 4.946733474731445, 6.6481218338012695, 8.349510192871094, 10.050898551940918, 11.752286911010742, 13.453675270080566, 15.15506362915039, 16.85645294189453, 18.55784034729004, 20.259227752685547, 21.960617065429688, 23.662006378173828, 25.363393783569336, 27.064781188964844, 28.766170501708984]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 6.0, 4.0, 4.0, 5.0, 4.0, 13.0, 16.0, 14.0, 15.0, 18.0, 27.0, 27.0, 21.0, 48.0, 43.0, 31.0, 47.0, 28.0, 43.0, 46.0, 53.0, 58.0, 39.0, 40.0, 53.0, 47.0, 45.0, 36.0, 30.0, 23.0, 21.0, 23.0, 15.0, 14.0, 12.0, 8.0, 11.0, 9.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.709001541137695, -24.9377384185791, -24.166475296020508, -23.395212173461914, -22.62394905090332, -21.852684020996094, -21.0814208984375, -20.310157775878906, -19.538894653320312, -18.76763153076172, -17.996368408203125, -17.22510528564453, -16.453842163085938, -15.682578086853027, -14.911314964294434, -14.140050888061523, -13.368788719177246, -12.597525596618652, -11.826262474060059, -11.054998397827148, -10.283735275268555, -9.512472152709961, -8.741209030151367, -7.969945430755615, -7.1986823081970215, -6.427419185638428, -5.656155586242676, -4.884892463684082, -4.113629341125488, -3.3423657417297363, -2.5711026191711426, -1.7998390197753906, -1.0285758972167969, -0.2573125958442688, 0.5139507055282593, 1.2852139472961426, 2.0564773082733154, 2.8277406692504883, 3.599003791809082, 4.370267391204834, 5.141530513763428, 5.9127936363220215, 6.684057235717773, 7.455320358276367, 8.226583480834961, 8.997846603393555, 9.769109725952148, 10.540373802185059, 11.311636924743652, 12.082900047302246, 12.85416316986084, 13.62542724609375, 14.396690368652344, 15.167953491210938, 15.939216613769531, 16.710479736328125, 17.48174285888672, 18.253005981445312, 19.024269104003906, 19.7955322265625, 20.566795349121094, 21.338058471679688, 22.10932159423828, 22.880586624145508, 23.6518497467041]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 1.0, 4.0, 9.0, 8.0, 8.0, 8.0, 11.0, 11.0, 15.0, 26.0, 23.0, 23.0, 36.0, 34.0, 36.0, 34.0, 41.0, 43.0, 41.0, 55.0, 34.0, 50.0, 45.0, 34.0, 35.0, 39.0, 45.0, 33.0, 35.0, 37.0, 28.0, 25.0, 15.0, 13.0, 15.0, 12.0, 8.0, 2.0, 8.0, 11.0, 7.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.26171875, -3.168243408203125, -3.07476806640625, -2.981292724609375, -2.8878173828125, -2.794342041015625, -2.70086669921875, -2.607391357421875, -2.513916015625, -2.420440673828125, -2.32696533203125, -2.233489990234375, -2.1400146484375, -2.046539306640625, -1.95306396484375, -1.859588623046875, -1.76611328125, -1.672637939453125, -1.57916259765625, -1.485687255859375, -1.3922119140625, -1.298736572265625, -1.20526123046875, -1.111785888671875, -1.018310546875, -0.924835205078125, -0.83135986328125, -0.737884521484375, -0.6444091796875, -0.550933837890625, -0.45745849609375, -0.363983154296875, -0.2705078125, -0.177032470703125, -0.08355712890625, 0.009918212890625, 0.1033935546875, 0.196868896484375, 0.29034423828125, 0.383819580078125, 0.477294921875, 0.570770263671875, 0.66424560546875, 0.757720947265625, 0.8511962890625, 0.944671630859375, 1.03814697265625, 1.131622314453125, 1.22509765625, 1.318572998046875, 1.41204833984375, 1.505523681640625, 1.5989990234375, 1.692474365234375, 1.78594970703125, 1.879425048828125, 1.972900390625, 2.066375732421875, 2.15985107421875, 2.253326416015625, 2.3468017578125, 2.440277099609375, 2.53375244140625, 2.627227783203125, 2.720703125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 9.0, 5.0, 7.0, 9.0, 9.0, 11.0, 16.0, 19.0, 28.0, 30.0, 42.0, 65.0, 104.0, 176.0, 278.0, 574.0, 1880.0, 12743.0, 169219.0, 1567401.0, 2091644.0, 321558.0, 23367.0, 3103.0, 893.0, 416.0, 199.0, 146.0, 107.0, 60.0, 39.0, 32.0, 20.0, 14.0, 16.0, 11.0, 12.0, 3.0, 8.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.26171875, -7.06610107421875, -6.8704833984375, -6.67486572265625, -6.479248046875, -6.28363037109375, -6.0880126953125, -5.89239501953125, -5.69677734375, -5.50115966796875, -5.3055419921875, -5.10992431640625, -4.914306640625, -4.71868896484375, -4.5230712890625, -4.32745361328125, -4.1318359375, -3.93621826171875, -3.7406005859375, -3.54498291015625, -3.349365234375, -3.15374755859375, -2.9581298828125, -2.76251220703125, -2.56689453125, -2.37127685546875, -2.1756591796875, -1.98004150390625, -1.784423828125, -1.58880615234375, -1.3931884765625, -1.19757080078125, -1.001953125, -0.80633544921875, -0.6107177734375, -0.41510009765625, -0.219482421875, -0.02386474609375, 0.1717529296875, 0.36737060546875, 0.56298828125, 0.75860595703125, 0.9542236328125, 1.14984130859375, 1.345458984375, 1.54107666015625, 1.7366943359375, 1.93231201171875, 2.1279296875, 2.32354736328125, 2.5191650390625, 2.71478271484375, 2.910400390625, 3.10601806640625, 3.3016357421875, 3.49725341796875, 3.69287109375, 3.88848876953125, 4.0841064453125, 4.27972412109375, 4.475341796875, 4.67095947265625, 4.8665771484375, 5.06219482421875, 5.2578125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 5.0, 10.0, 16.0, 14.0, 18.0, 25.0, 31.0, 35.0, 60.0, 78.0, 95.0, 119.0, 152.0, 217.0, 262.0, 345.0, 346.0, 355.0, 401.0, 316.0, 279.0, 211.0, 169.0, 126.0, 79.0, 75.0, 52.0, 47.0, 28.0, 28.0, 22.0, 17.0, 7.0, 9.0, 7.0, 5.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5703125, -4.40985107421875, -4.2493896484375, -4.08892822265625, -3.928466796875, -3.76800537109375, -3.6075439453125, -3.44708251953125, -3.28662109375, -3.12615966796875, -2.9656982421875, -2.80523681640625, -2.644775390625, -2.48431396484375, -2.3238525390625, -2.16339111328125, -2.0029296875, -1.84246826171875, -1.6820068359375, -1.52154541015625, -1.361083984375, -1.20062255859375, -1.0401611328125, -0.87969970703125, -0.71923828125, -0.55877685546875, -0.3983154296875, -0.23785400390625, -0.077392578125, 0.08306884765625, 0.2435302734375, 0.40399169921875, 0.564453125, 0.72491455078125, 0.8853759765625, 1.04583740234375, 1.206298828125, 1.36676025390625, 1.5272216796875, 1.68768310546875, 1.84814453125, 2.00860595703125, 2.1690673828125, 2.32952880859375, 2.489990234375, 2.65045166015625, 2.8109130859375, 2.97137451171875, 3.1318359375, 3.29229736328125, 3.4527587890625, 3.61322021484375, 3.773681640625, 3.93414306640625, 4.0946044921875, 4.25506591796875, 4.41552734375, 4.57598876953125, 4.7364501953125, 4.89691162109375, 5.057373046875, 5.21783447265625, 5.3782958984375, 5.53875732421875, 5.69921875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 2.0, 9.0, 6.0, 11.0, 13.0, 11.0, 25.0, 40.0, 38.0, 45.0, 75.0, 98.0, 122.0, 188.0, 262.0, 370.0, 643.0, 5744.0, 677859.0, 3456165.0, 49792.0, 1229.0, 449.0, 301.0, 202.0, 140.0, 114.0, 90.0, 65.0, 44.0, 32.0, 21.0, 26.0, 15.0, 13.0, 7.0, 8.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-20.125, -19.5697021484375, -19.014404296875, -18.4591064453125, -17.90380859375, -17.3485107421875, -16.793212890625, -16.2379150390625, -15.6826171875, -15.1273193359375, -14.572021484375, -14.0167236328125, -13.46142578125, -12.9061279296875, -12.350830078125, -11.7955322265625, -11.240234375, -10.6849365234375, -10.129638671875, -9.5743408203125, -9.01904296875, -8.4637451171875, -7.908447265625, -7.3531494140625, -6.7978515625, -6.2425537109375, -5.687255859375, -5.1319580078125, -4.57666015625, -4.0213623046875, -3.466064453125, -2.9107666015625, -2.35546875, -1.8001708984375, -1.244873046875, -0.6895751953125, -0.13427734375, 0.4210205078125, 0.976318359375, 1.5316162109375, 2.0869140625, 2.6422119140625, 3.197509765625, 3.7528076171875, 4.30810546875, 4.8634033203125, 5.418701171875, 5.9739990234375, 6.529296875, 7.0845947265625, 7.639892578125, 8.1951904296875, 8.75048828125, 9.3057861328125, 9.861083984375, 10.4163818359375, 10.9716796875, 11.5269775390625, 12.082275390625, 12.6375732421875, 13.19287109375, 13.7481689453125, 14.303466796875, 14.8587646484375, 15.4140625]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 6.0, 21.0, 27.0, 43.0, 74.0, 119.0, 122.0, 125.0, 112.0, 106.0, 85.0, 62.0, 51.0, 27.0, 11.0, 11.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.96943664550781, -38.07806396484375, -37.18669509887695, -36.29532241821289, -35.403953552246094, -34.51258087158203, -33.621212005615234, -32.72983932495117, -31.838468551635742, -30.947097778320312, -30.055727005004883, -29.164356231689453, -28.27298355102539, -27.381614685058594, -26.49024200439453, -25.5988712310791, -24.707500457763672, -23.816129684448242, -22.924758911132812, -22.033388137817383, -21.142017364501953, -20.25064468383789, -19.35927391052246, -18.46790313720703, -17.5765323638916, -16.685161590576172, -15.793790817260742, -14.902419090270996, -14.011048316955566, -13.119677543640137, -12.22830581665039, -11.336935043334961, -10.445564270019531, -9.554193496704102, -8.662822723388672, -7.771450996398926, -6.880080223083496, -5.988709449768066, -5.0973381996154785, -4.205966949462891, -3.314596176147461, -2.423225164413452, -1.5318541526794434, -0.6404831409454346, 0.2508878707885742, 1.142258644104004, 2.033629894256592, 2.9250011444091797, 3.8163719177246094, 4.707742691040039, 5.599113941192627, 6.490485191345215, 7.3818559646606445, 8.273226737976074, 9.16459846496582, 10.05596923828125, 10.94734001159668, 11.83871078491211, 12.730081558227539, 13.621453285217285, 14.512824058532715, 15.404194831848145, 16.29556655883789, 17.18693733215332, 18.07830810546875]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 8.0, 8.0, 11.0, 6.0, 12.0, 17.0, 16.0, 16.0, 28.0, 17.0, 19.0, 23.0, 31.0, 22.0, 35.0, 34.0, 49.0, 43.0, 49.0, 35.0, 43.0, 44.0, 50.0, 62.0, 31.0, 42.0, 45.0, 31.0, 26.0, 23.0, 35.0, 26.0, 14.0, 16.0, 8.0, 5.0, 6.0, 9.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.916261672973633, -19.291183471679688, -18.666105270385742, -18.041027069091797, -17.41594886779785, -16.790870666503906, -16.16579246520996, -15.5407133102417, -14.915635108947754, -14.290556907653809, -13.665478706359863, -13.040400505065918, -12.415321350097656, -11.790243148803711, -11.165164947509766, -10.54008674621582, -9.915008544921875, -9.28993034362793, -8.664852142333984, -8.039773941040039, -7.4146952629089355, -6.78961706161499, -6.164538383483887, -5.539460182189941, -4.914381980895996, -4.289303779602051, -3.6642253398895264, -3.039146900177002, -2.4140686988830566, -1.7889904975891113, -1.163912057876587, -0.5388336181640625, 0.08624267578125, 0.7113209962844849, 1.3363993167877197, 1.9614776372909546, 2.5865559577941895, 3.2116341590881348, 3.836712598800659, 4.461791038513184, 5.086869239807129, 5.711947441101074, 6.3370256423950195, 6.962104320526123, 7.587182521820068, 8.212261199951172, 8.837339401245117, 9.462417602539062, 10.087495803833008, 10.712574005126953, 11.337652206420898, 11.962730407714844, 12.587808609008789, 13.212886810302734, 13.837965965270996, 14.463044166564941, 15.088122367858887, 15.713200569152832, 16.338279724121094, 16.96335792541504, 17.588436126708984, 18.21351432800293, 18.838592529296875, 19.46367073059082, 20.088748931884766]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 10.0, 9.0, 9.0, 14.0, 17.0, 24.0, 20.0, 23.0, 14.0, 29.0, 30.0, 40.0, 27.0, 43.0, 30.0, 35.0, 59.0, 45.0, 45.0, 47.0, 41.0, 37.0, 33.0, 29.0, 36.0, 38.0, 37.0, 19.0, 29.0, 20.0, 15.0, 23.0, 17.0, 5.0, 10.0, 9.0, 4.0, 10.0, 6.0, 2.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.91796875, -2.833221435546875, -2.74847412109375, -2.663726806640625, -2.5789794921875, -2.494232177734375, -2.40948486328125, -2.324737548828125, -2.239990234375, -2.155242919921875, -2.07049560546875, -1.985748291015625, -1.9010009765625, -1.816253662109375, -1.73150634765625, -1.646759033203125, -1.56201171875, -1.477264404296875, -1.39251708984375, -1.307769775390625, -1.2230224609375, -1.138275146484375, -1.05352783203125, -0.968780517578125, -0.884033203125, -0.799285888671875, -0.71453857421875, -0.629791259765625, -0.5450439453125, -0.460296630859375, -0.37554931640625, -0.290802001953125, -0.2060546875, -0.121307373046875, -0.03656005859375, 0.048187255859375, 0.1329345703125, 0.217681884765625, 0.30242919921875, 0.387176513671875, 0.471923828125, 0.556671142578125, 0.64141845703125, 0.726165771484375, 0.8109130859375, 0.895660400390625, 0.98040771484375, 1.065155029296875, 1.14990234375, 1.234649658203125, 1.31939697265625, 1.404144287109375, 1.4888916015625, 1.573638916015625, 1.65838623046875, 1.743133544921875, 1.827880859375, 1.912628173828125, 1.99737548828125, 2.082122802734375, 2.1668701171875, 2.251617431640625, 2.33636474609375, 2.421112060546875, 2.505859375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 9.0, 8.0, 4.0, 10.0, 7.0, 23.0, 22.0, 48.0, 48.0, 96.0, 156.0, 240.0, 376.0, 583.0, 945.0, 1602.0, 2642.0, 4175.0, 7143.0, 12092.0, 21835.0, 40398.0, 78425.0, 161323.0, 285185.0, 212234.0, 102817.0, 51582.0, 27411.0, 15127.0, 8773.0, 5137.0, 3120.0, 1864.0, 1135.0, 702.0, 450.0, 269.0, 199.0, 104.0, 82.0, 51.0, 43.0, 27.0, 15.0, 11.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.403564453125, -0.3904151916503906, -0.37726593017578125, -0.3641166687011719, -0.3509674072265625, -0.3378181457519531, -0.32466888427734375, -0.3115196228027344, -0.298370361328125, -0.2852210998535156, -0.27207183837890625, -0.2589225769042969, -0.2457733154296875, -0.23262405395507812, -0.21947479248046875, -0.20632553100585938, -0.19317626953125, -0.18002700805664062, -0.16687774658203125, -0.15372848510742188, -0.1405792236328125, -0.12742996215820312, -0.11428070068359375, -0.10113143920898438, -0.087982177734375, -0.07483291625976562, -0.06168365478515625, -0.048534393310546875, -0.0353851318359375, -0.022235870361328125, -0.00908660888671875, 0.004062652587890625, 0.0172119140625, 0.030361175537109375, 0.04351043701171875, 0.056659698486328125, 0.0698089599609375, 0.08295822143554688, 0.09610748291015625, 0.10925674438476562, 0.122406005859375, 0.13555526733398438, 0.14870452880859375, 0.16185379028320312, 0.1750030517578125, 0.18815231323242188, 0.20130157470703125, 0.21445083618164062, 0.22760009765625, 0.24074935913085938, 0.25389862060546875, 0.2670478820800781, 0.2801971435546875, 0.2933464050292969, 0.30649566650390625, 0.3196449279785156, 0.332794189453125, 0.3459434509277344, 0.35909271240234375, 0.3722419738769531, 0.3853912353515625, 0.3985404968261719, 0.41168975830078125, 0.4248390197753906, 0.43798828125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 2.0, 6.0, 2.0, 7.0, 2.0, 11.0, 4.0, 7.0, 8.0, 13.0, 19.0, 22.0, 16.0, 24.0, 33.0, 27.0, 30.0, 30.0, 27.0, 29.0, 32.0, 29.0, 30.0, 55.0, 1065.0, 42.0, 36.0, 38.0, 31.0, 32.0, 35.0, 34.0, 30.0, 34.0, 29.0, 26.0, 19.0, 22.0, 22.0, 11.0, 16.0, 9.0, 7.0, 7.0, 8.0, 3.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.66015625, -1.6111907958984375, -1.562225341796875, -1.5132598876953125, -1.46429443359375, -1.4153289794921875, -1.366363525390625, -1.3173980712890625, -1.2684326171875, -1.2194671630859375, -1.170501708984375, -1.1215362548828125, -1.07257080078125, -1.0236053466796875, -0.974639892578125, -0.9256744384765625, -0.876708984375, -0.8277435302734375, -0.778778076171875, -0.7298126220703125, -0.68084716796875, -0.6318817138671875, -0.582916259765625, -0.5339508056640625, -0.4849853515625, -0.4360198974609375, -0.387054443359375, -0.3380889892578125, -0.28912353515625, -0.2401580810546875, -0.191192626953125, -0.1422271728515625, -0.09326171875, -0.0442962646484375, 0.004669189453125, 0.0536346435546875, 0.10260009765625, 0.1515655517578125, 0.200531005859375, 0.2494964599609375, 0.2984619140625, 0.3474273681640625, 0.396392822265625, 0.4453582763671875, 0.49432373046875, 0.5432891845703125, 0.592254638671875, 0.6412200927734375, 0.690185546875, 0.7391510009765625, 0.788116455078125, 0.8370819091796875, 0.88604736328125, 0.9350128173828125, 0.983978271484375, 1.0329437255859375, 1.0819091796875, 1.1308746337890625, 1.179840087890625, 1.2288055419921875, 1.27777099609375, 1.3267364501953125, 1.375701904296875, 1.4246673583984375, 1.4736328125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 11.0, 9.0, 10.0, 18.0, 13.0, 28.0, 43.0, 43.0, 68.0, 103.0, 140.0, 199.0, 258.0, 361.0, 525.0, 785.0, 1067.0, 1631.0, 2263.0, 3392.0, 5170.0, 7298.0, 11029.0, 16830.0, 25805.0, 40403.0, 64591.0, 106233.0, 169144.0, 1248722.0, 145965.0, 89408.0, 54448.0, 34423.0, 21934.0, 14374.0, 9681.0, 6307.0, 4352.0, 3106.0, 2057.0, 1479.0, 1068.0, 682.0, 517.0, 375.0, 254.0, 171.0, 117.0, 94.0, 51.0, 33.0, 22.0, 8.0, 13.0, 7.0, 1.0, 2.0, 3.0], "bins": [-0.2403564453125, -0.2333545684814453, -0.22635269165039062, -0.21935081481933594, -0.21234893798828125, -0.20534706115722656, -0.19834518432617188, -0.1913433074951172, -0.1843414306640625, -0.1773395538330078, -0.17033767700195312, -0.16333580017089844, -0.15633392333984375, -0.14933204650878906, -0.14233016967773438, -0.1353282928466797, -0.128326416015625, -0.12132453918457031, -0.11432266235351562, -0.10732078552246094, -0.10031890869140625, -0.09331703186035156, -0.08631515502929688, -0.07931327819824219, -0.0723114013671875, -0.06530952453613281, -0.058307647705078125, -0.05130577087402344, -0.04430389404296875, -0.03730201721191406, -0.030300140380859375, -0.023298263549804688, -0.01629638671875, -0.009294509887695312, -0.002292633056640625, 0.0047092437744140625, 0.01171112060546875, 0.018712997436523438, 0.025714874267578125, 0.03271675109863281, 0.0397186279296875, 0.04672050476074219, 0.053722381591796875, 0.06072425842285156, 0.06772613525390625, 0.07472801208496094, 0.08172988891601562, 0.08873176574707031, 0.095733642578125, 0.10273551940917969, 0.10973739624023438, 0.11673927307128906, 0.12374114990234375, 0.13074302673339844, 0.13774490356445312, 0.1447467803955078, 0.1517486572265625, 0.1587505340576172, 0.16575241088867188, 0.17275428771972656, 0.17975616455078125, 0.18675804138183594, 0.19375991821289062, 0.2007617950439453, 0.207763671875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 12.0, 9.0, 24.0, 20.0, 27.0, 30.0, 46.0, 58.0, 58.0, 58.0, 65.0, 73.0, 66.0, 65.0, 59.0, 47.0, 58.0, 43.0, 31.0, 24.0, 31.0, 23.0, 15.0, 13.0, 10.0, 6.0, 4.0, 4.0, 2.0, 1.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009121894836425781, -0.0008810833096504211, -0.0008499771356582642, -0.0008188709616661072, -0.0007877647876739502, -0.0007566586136817932, -0.0007255524396896362, -0.0006944462656974792, -0.0006633400917053223, -0.0006322339177131653, -0.0006011277437210083, -0.0005700215697288513, -0.0005389153957366943, -0.0005078092217445374, -0.00047670304775238037, -0.0004455968737602234, -0.0004144906997680664, -0.0003833845257759094, -0.00035227835178375244, -0.00032117217779159546, -0.0002900660037994385, -0.0002589598298072815, -0.0002278536558151245, -0.00019674748182296753, -0.00016564130783081055, -0.00013453513383865356, -0.00010342895984649658, -7.23227858543396e-05, -4.121661186218262e-05, -1.0110437870025635e-05, 2.0995736122131348e-05, 5.210191011428833e-05, 8.320808410644531e-05, 0.0001143142580986023, 0.00014542043209075928, 0.00017652660608291626, 0.00020763278007507324, 0.00023873895406723022, 0.0002698451280593872, 0.0003009513020515442, 0.00033205747604370117, 0.00036316365003585815, 0.00039426982402801514, 0.0004253759980201721, 0.0004564821720123291, 0.0004875883460044861, 0.0005186945199966431, 0.0005498006939888, 0.000580906867980957, 0.000612013041973114, 0.000643119215965271, 0.000674225389957428, 0.000705331563949585, 0.0007364377379417419, 0.0007675439119338989, 0.0007986500859260559, 0.0008297562599182129, 0.0008608624339103699, 0.0008919686079025269, 0.0009230747818946838, 0.0009541809558868408, 0.0009852871298789978, 0.0010163933038711548, 0.0010474994778633118, 0.0010786056518554688]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 4.0, 4.0, 7.0, 19.0, 16.0, 21.0, 32.0, 31.0, 54.0, 84.0, 112.0, 187.0, 304.0, 967.0, 75129.0, 967083.0, 3248.0, 553.0, 221.0, 141.0, 95.0, 61.0, 51.0, 37.0, 23.0, 17.0, 10.0, 10.0, 7.0, 6.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0228118896484375, -0.022145509719848633, -0.021479129791259766, -0.0208127498626709, -0.02014636993408203, -0.019479990005493164, -0.018813610076904297, -0.01814723014831543, -0.017480850219726562, -0.016814470291137695, -0.016148090362548828, -0.015481710433959961, -0.014815330505371094, -0.014148950576782227, -0.01348257064819336, -0.012816190719604492, -0.012149810791015625, -0.011483430862426758, -0.01081705093383789, -0.010150671005249023, -0.009484291076660156, -0.008817911148071289, -0.008151531219482422, -0.007485151290893555, -0.0068187713623046875, -0.00615239143371582, -0.005486011505126953, -0.004819631576538086, -0.004153251647949219, -0.0034868717193603516, -0.0028204917907714844, -0.002154111862182617, -0.00148773193359375, -0.0008213520050048828, -0.00015497207641601562, 0.0005114078521728516, 0.0011777877807617188, 0.001844167709350586, 0.002510547637939453, 0.0031769275665283203, 0.0038433074951171875, 0.004509687423706055, 0.005176067352294922, 0.005842447280883789, 0.006508827209472656, 0.0071752071380615234, 0.00784158706665039, 0.008507966995239258, 0.009174346923828125, 0.009840726852416992, 0.01050710678100586, 0.011173486709594727, 0.011839866638183594, 0.012506246566772461, 0.013172626495361328, 0.013839006423950195, 0.014505386352539062, 0.01517176628112793, 0.015838146209716797, 0.016504526138305664, 0.01717090606689453, 0.0178372859954834, 0.018503665924072266, 0.019170045852661133, 0.01983642578125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 35.0, 86.0, 156.0, 219.0, 240.0, 146.0, 62.0, 35.0, 15.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0021842936985194683, -0.0021414197981357574, -0.0020985458977520466, -0.002055671764537692, -0.002012797864153981, -0.0019699239637702703, -0.0019270499469712377, -0.001884175930172205, -0.0018413020297884941, -0.0017984281294047832, -0.0017555541126057506, -0.0017126800958067179, -0.001669806195423007, -0.0016269322950392962, -0.0015840582782402635, -0.0015411842614412308, -0.00149831036105752, -0.001455436460673809, -0.0014125624438747764, -0.0013696884270757437, -0.0013268145266920328, -0.001283940626308322, -0.0012410666095092893, -0.0011981925927102566, -0.0011553186923265457, -0.0011124447919428349, -0.0010695707751438022, -0.0010266967583447695, -0.0009838228579610586, -0.0009409488993696868, -0.0008980749407783151, -0.0008552009821869433, -0.0008123270235955715, -0.0007694530650041997, -0.000726579106412828, -0.0006837051478214562, -0.0006408311892300844, -0.0005979572306387126, -0.0005550832720473409, -0.0005122093134559691, -0.0004693353548645973, -0.00042646139627322555, -0.00038358743768185377, -0.000340713479090482, -0.0002978395204991102, -0.00025496556190773845, -0.00021209160331636667, -0.0001692176447249949, -0.00012634368613362312, -8.346972754225135e-05, -4.0595768950879574e-05, 2.278189640492201e-06, 4.5152148231863976e-05, 8.802610682323575e-05, 0.00013090006541460752, 0.0001737740240059793, 0.00021664798259735107, 0.00025952194118872285, 0.0003023958997800946, 0.0003452698583714664, 0.0003881438169628382, 0.00043101777555420995, 0.0004738917341455817, 0.0005167656927369535, 0.0005596396513283253]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 8.0, 6.0, 8.0, 6.0, 9.0, 11.0, 12.0, 15.0, 15.0, 31.0, 20.0, 26.0, 25.0, 29.0, 29.0, 43.0, 45.0, 35.0, 37.0, 45.0, 42.0, 36.0, 39.0, 34.0, 34.0, 42.0, 34.0, 27.0, 54.0, 29.0, 19.0, 20.0, 17.0, 11.0, 22.0, 16.0, 9.0, 13.0, 14.0, 6.0, 8.0, 4.0, 2.0, 5.0, 6.0, 3.0, 1.0, 2.0, 4.0], "bins": [-0.0004981160163879395, -0.00048444420099258423, -0.000470772385597229, -0.0004571005702018738, -0.00044342875480651855, -0.00042975693941116333, -0.0004160851240158081, -0.0004024133086204529, -0.00038874149322509766, -0.00037506967782974243, -0.0003613978624343872, -0.000347726047039032, -0.00033405423164367676, -0.00032038241624832153, -0.0003067106008529663, -0.0002930387854576111, -0.00027936697006225586, -0.00026569515466690063, -0.0002520233392715454, -0.00023835152387619019, -0.00022467970848083496, -0.00021100789308547974, -0.0001973360776901245, -0.0001836642622947693, -0.00016999244689941406, -0.00015632063150405884, -0.0001426488161087036, -0.0001289770007133484, -0.00011530518531799316, -0.00010163336992263794, -8.796155452728271e-05, -7.428973913192749e-05, -6.0617923736572266e-05, -4.694610834121704e-05, -3.3274292945861816e-05, -1.9602477550506592e-05, -5.930662155151367e-06, 7.741153240203857e-06, 2.1412968635559082e-05, 3.508478403091431e-05, 4.875659942626953e-05, 6.242841482162476e-05, 7.610023021697998e-05, 8.97720456123352e-05, 0.00010344386100769043, 0.00011711567640304565, 0.00013078749179840088, 0.0001444593071937561, 0.00015813112258911133, 0.00017180293798446655, 0.00018547475337982178, 0.000199146568775177, 0.00021281838417053223, 0.00022649019956588745, 0.00024016201496124268, 0.0002538338303565979, 0.0002675056457519531, 0.00028117746114730835, 0.0002948492765426636, 0.0003085210919380188, 0.000322192907333374, 0.00033586472272872925, 0.00034953653812408447, 0.0003632083535194397, 0.0003768801689147949]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 10.0, 9.0, 9.0, 14.0, 17.0, 24.0, 20.0, 23.0, 14.0, 29.0, 30.0, 40.0, 27.0, 43.0, 30.0, 35.0, 59.0, 45.0, 45.0, 47.0, 41.0, 37.0, 33.0, 29.0, 36.0, 38.0, 37.0, 19.0, 29.0, 20.0, 15.0, 23.0, 17.0, 5.0, 10.0, 9.0, 4.0, 10.0, 6.0, 2.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.91796875, -2.833221435546875, -2.74847412109375, -2.663726806640625, -2.5789794921875, -2.494232177734375, -2.40948486328125, -2.324737548828125, -2.239990234375, -2.155242919921875, -2.07049560546875, -1.985748291015625, -1.9010009765625, -1.816253662109375, -1.73150634765625, -1.646759033203125, -1.56201171875, -1.477264404296875, -1.39251708984375, -1.307769775390625, -1.2230224609375, -1.138275146484375, -1.05352783203125, -0.968780517578125, -0.884033203125, -0.799285888671875, -0.71453857421875, -0.629791259765625, -0.5450439453125, -0.460296630859375, -0.37554931640625, -0.290802001953125, -0.2060546875, -0.121307373046875, -0.03656005859375, 0.048187255859375, 0.1329345703125, 0.217681884765625, 0.30242919921875, 0.387176513671875, 0.471923828125, 0.556671142578125, 0.64141845703125, 0.726165771484375, 0.8109130859375, 0.895660400390625, 0.98040771484375, 1.065155029296875, 1.14990234375, 1.234649658203125, 1.31939697265625, 1.404144287109375, 1.4888916015625, 1.573638916015625, 1.65838623046875, 1.743133544921875, 1.827880859375, 1.912628173828125, 1.99737548828125, 2.082122802734375, 2.1668701171875, 2.251617431640625, 2.33636474609375, 2.421112060546875, 2.505859375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 4.0, 13.0, 10.0, 27.0, 30.0, 36.0, 45.0, 57.0, 92.0, 146.0, 226.0, 287.0, 516.0, 859.0, 1723.0, 3544.0, 7670.0, 17826.0, 43080.0, 100576.0, 223185.0, 359306.0, 162182.0, 72278.0, 30401.0, 12850.0, 5663.0, 2611.0, 1343.0, 711.0, 431.0, 238.0, 172.0, 107.0, 76.0, 53.0, 47.0, 38.0, 32.0, 19.0, 12.0, 9.0, 8.0, 6.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.8203125, -2.735626220703125, -2.65093994140625, -2.566253662109375, -2.4815673828125, -2.396881103515625, -2.31219482421875, -2.227508544921875, -2.142822265625, -2.058135986328125, -1.97344970703125, -1.888763427734375, -1.8040771484375, -1.719390869140625, -1.63470458984375, -1.550018310546875, -1.46533203125, -1.380645751953125, -1.29595947265625, -1.211273193359375, -1.1265869140625, -1.041900634765625, -0.95721435546875, -0.872528076171875, -0.787841796875, -0.703155517578125, -0.61846923828125, -0.533782958984375, -0.4490966796875, -0.364410400390625, -0.27972412109375, -0.195037841796875, -0.1103515625, -0.025665283203125, 0.05902099609375, 0.143707275390625, 0.2283935546875, 0.313079833984375, 0.39776611328125, 0.482452392578125, 0.567138671875, 0.651824951171875, 0.73651123046875, 0.821197509765625, 0.9058837890625, 0.990570068359375, 1.07525634765625, 1.159942626953125, 1.24462890625, 1.329315185546875, 1.41400146484375, 1.498687744140625, 1.5833740234375, 1.668060302734375, 1.75274658203125, 1.837432861328125, 1.922119140625, 2.006805419921875, 2.09149169921875, 2.176177978515625, 2.2608642578125, 2.345550537109375, 2.43023681640625, 2.514923095703125, 2.599609375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 4.0, 10.0, 10.0, 11.0, 6.0, 16.0, 21.0, 11.0, 13.0, 27.0, 28.0, 29.0, 31.0, 45.0, 33.0, 69.0, 76.0, 109.0, 244.0, 1452.0, 238.0, 109.0, 59.0, 53.0, 39.0, 54.0, 30.0, 23.0, 32.0, 29.0, 24.0, 20.0, 20.0, 14.0, 8.0, 7.0, 9.0, 3.0, 5.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.109375, -8.820556640625, -8.53173828125, -8.242919921875, -7.9541015625, -7.665283203125, -7.37646484375, -7.087646484375, -6.798828125, -6.510009765625, -6.22119140625, -5.932373046875, -5.6435546875, -5.354736328125, -5.06591796875, -4.777099609375, -4.48828125, -4.199462890625, -3.91064453125, -3.621826171875, -3.3330078125, -3.044189453125, -2.75537109375, -2.466552734375, -2.177734375, -1.888916015625, -1.60009765625, -1.311279296875, -1.0224609375, -0.733642578125, -0.44482421875, -0.156005859375, 0.1328125, 0.421630859375, 0.71044921875, 0.999267578125, 1.2880859375, 1.576904296875, 1.86572265625, 2.154541015625, 2.443359375, 2.732177734375, 3.02099609375, 3.309814453125, 3.5986328125, 3.887451171875, 4.17626953125, 4.465087890625, 4.75390625, 5.042724609375, 5.33154296875, 5.620361328125, 5.9091796875, 6.197998046875, 6.48681640625, 6.775634765625, 7.064453125, 7.353271484375, 7.64208984375, 7.930908203125, 8.2197265625, 8.508544921875, 8.79736328125, 9.086181640625, 9.375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 1.0, 6.0, 7.0, 6.0, 14.0, 12.0, 19.0, 23.0, 35.0, 57.0, 82.0, 123.0, 238.0, 557.0, 2886.0, 3120670.0, 19133.0, 978.0, 337.0, 189.0, 98.0, 80.0, 39.0, 40.0, 24.0, 21.0, 14.0, 1.0, 7.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.6875, -61.953125, -60.21875, -58.484375, -56.75, -55.015625, -53.28125, -51.546875, -49.8125, -48.078125, -46.34375, -44.609375, -42.875, -41.140625, -39.40625, -37.671875, -35.9375, -34.203125, -32.46875, -30.734375, -29.0, -27.265625, -25.53125, -23.796875, -22.0625, -20.328125, -18.59375, -16.859375, -15.125, -13.390625, -11.65625, -9.921875, -8.1875, -6.453125, -4.71875, -2.984375, -1.25, 0.484375, 2.21875, 3.953125, 5.6875, 7.421875, 9.15625, 10.890625, 12.625, 14.359375, 16.09375, 17.828125, 19.5625, 21.296875, 23.03125, 24.765625, 26.5, 28.234375, 29.96875, 31.703125, 33.4375, 35.171875, 36.90625, 38.640625, 40.375, 42.109375, 43.84375, 45.578125, 47.3125]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 20.0, 102.0, 234.0, 331.0, 227.0, 79.0, 15.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-54.53334045410156, -53.475311279296875, -52.41728210449219, -51.359256744384766, -50.30122756958008, -49.24319839477539, -48.18517303466797, -47.12714385986328, -46.069114685058594, -45.011085510253906, -43.95305633544922, -42.8950309753418, -41.83700180053711, -40.77897262573242, -39.720947265625, -38.66291809082031, -37.604888916015625, -36.54685974121094, -35.48883056640625, -34.43080520629883, -33.37277603149414, -32.31474685668945, -31.2567195892334, -30.198692321777344, -29.140663146972656, -28.08263397216797, -27.024606704711914, -25.96657943725586, -24.908550262451172, -23.850521087646484, -22.79249382019043, -21.734466552734375, -20.676433563232422, -19.618404388427734, -18.56037712097168, -17.502349853515625, -16.444320678710938, -15.386292457580566, -14.328264236450195, -13.270236015319824, -12.21220874786377, -11.154180526733398, -10.096152305603027, -9.038124084472656, -7.980095863342285, -6.922067642211914, -5.864039421081543, -4.806011199951172, -3.747982978820801, -2.6899547576904297, -1.6319265365600586, -0.5738983154296875, 0.4841299057006836, 1.5421581268310547, 2.600186347961426, 3.658214569091797, 4.716242790222168, 5.774271011352539, 6.83229923248291, 7.890327453613281, 8.948355674743652, 10.006383895874023, 11.064412117004395, 12.122440338134766, 13.180468559265137]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 3.0, 6.0, 2.0, 3.0, 2.0, 6.0, 5.0, 13.0, 6.0, 13.0, 11.0, 10.0, 12.0, 13.0, 19.0, 19.0, 22.0, 29.0, 28.0, 27.0, 31.0, 33.0, 34.0, 47.0, 33.0, 43.0, 31.0, 39.0, 34.0, 31.0, 34.0, 40.0, 40.0, 25.0, 26.0, 31.0, 31.0, 24.0, 32.0, 20.0, 17.0, 17.0, 15.0, 14.0, 12.0, 9.0, 5.0, 5.0, 7.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-18.148656845092773, -17.512428283691406, -16.876201629638672, -16.239973068237305, -15.60374641418457, -14.967517852783203, -14.331290245056152, -13.695062637329102, -13.05883502960205, -12.422607421875, -11.78637981414795, -11.150152206420898, -10.513923645019531, -9.877696990966797, -9.24146842956543, -8.605240821838379, -7.969013214111328, -7.332785606384277, -6.696557998657227, -6.060329914093018, -5.424102306365967, -4.787874698638916, -4.151646614074707, -3.5154190063476562, -2.8791913986206055, -2.2429637908935547, -1.6067359447479248, -0.9705082178115845, -0.33428049087524414, 0.30194711685180664, 0.9381749629974365, 1.5744028091430664, 2.2106285095214844, 2.846856117248535, 3.483083963394165, 4.119311809539795, 4.755539417266846, 5.3917670249938965, 6.0279951095581055, 6.664222717285156, 7.300450325012207, 7.936677932739258, 8.572905540466309, 9.20913314819336, 9.845361709594727, 10.481588363647461, 11.117816925048828, 11.754044532775879, 12.39027214050293, 13.02649974822998, 13.662727355957031, 14.298954963684082, 14.935182571411133, 15.5714111328125, 16.207637786865234, 16.8438663482666, 17.48009490966797, 18.116323471069336, 18.75255012512207, 19.388778686523438, 20.025005340576172, 20.66123390197754, 21.297460556030273, 21.93368911743164, 22.569915771484375]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 5.0, 12.0, 17.0, 8.0, 15.0, 17.0, 29.0, 25.0, 22.0, 26.0, 32.0, 34.0, 30.0, 22.0, 42.0, 37.0, 43.0, 42.0, 36.0, 37.0, 44.0, 47.0, 36.0, 36.0, 25.0, 26.0, 29.0, 30.0, 31.0, 20.0, 21.0, 17.0, 16.0, 17.0, 9.0, 13.0, 5.0, 12.0, 7.0, 5.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-3.021484375, -2.93450927734375, -2.8475341796875, -2.76055908203125, -2.673583984375, -2.58660888671875, -2.4996337890625, -2.41265869140625, -2.32568359375, -2.23870849609375, -2.1517333984375, -2.06475830078125, -1.977783203125, -1.89080810546875, -1.8038330078125, -1.71685791015625, -1.6298828125, -1.54290771484375, -1.4559326171875, -1.36895751953125, -1.281982421875, -1.19500732421875, -1.1080322265625, -1.02105712890625, -0.93408203125, -0.84710693359375, -0.7601318359375, -0.67315673828125, -0.586181640625, -0.49920654296875, -0.4122314453125, -0.32525634765625, -0.23828125, -0.15130615234375, -0.0643310546875, 0.02264404296875, 0.109619140625, 0.19659423828125, 0.2835693359375, 0.37054443359375, 0.45751953125, 0.54449462890625, 0.6314697265625, 0.71844482421875, 0.805419921875, 0.89239501953125, 0.9793701171875, 1.06634521484375, 1.1533203125, 1.24029541015625, 1.3272705078125, 1.41424560546875, 1.501220703125, 1.58819580078125, 1.6751708984375, 1.76214599609375, 1.84912109375, 1.93609619140625, 2.0230712890625, 2.11004638671875, 2.197021484375, 2.28399658203125, 2.3709716796875, 2.45794677734375, 2.544921875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 0.0, 3.0, 3.0, 4.0, 4.0, 4.0, 5.0, 4.0, 20.0, 15.0, 16.0, 38.0, 22.0, 36.0, 41.0, 50.0, 76.0, 79.0, 108.0, 159.0, 247.0, 465.0, 1298.0, 6214.0, 50612.0, 516483.0, 2097913.0, 1316783.0, 180541.0, 18091.0, 3013.0, 802.0, 364.0, 185.0, 121.0, 77.0, 64.0, 67.0, 42.0, 38.0, 39.0, 25.0, 29.0, 16.0, 14.0, 19.0, 9.0, 7.0, 4.0, 5.0, 6.0, 4.0, 6.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.05078125, -5.87158203125, -5.6923828125, -5.51318359375, -5.333984375, -5.15478515625, -4.9755859375, -4.79638671875, -4.6171875, -4.43798828125, -4.2587890625, -4.07958984375, -3.900390625, -3.72119140625, -3.5419921875, -3.36279296875, -3.18359375, -3.00439453125, -2.8251953125, -2.64599609375, -2.466796875, -2.28759765625, -2.1083984375, -1.92919921875, -1.75, -1.57080078125, -1.3916015625, -1.21240234375, -1.033203125, -0.85400390625, -0.6748046875, -0.49560546875, -0.31640625, -0.13720703125, 0.0419921875, 0.22119140625, 0.400390625, 0.57958984375, 0.7587890625, 0.93798828125, 1.1171875, 1.29638671875, 1.4755859375, 1.65478515625, 1.833984375, 2.01318359375, 2.1923828125, 2.37158203125, 2.55078125, 2.72998046875, 2.9091796875, 3.08837890625, 3.267578125, 3.44677734375, 3.6259765625, 3.80517578125, 3.984375, 4.16357421875, 4.3427734375, 4.52197265625, 4.701171875, 4.88037109375, 5.0595703125, 5.23876953125, 5.41796875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 7.0, 7.0, 11.0, 11.0, 24.0, 22.0, 30.0, 55.0, 75.0, 101.0, 114.0, 164.0, 201.0, 246.0, 346.0, 389.0, 393.0, 375.0, 333.0, 273.0, 216.0, 166.0, 118.0, 88.0, 77.0, 54.0, 50.0, 41.0, 20.0, 9.0, 11.0, 11.0, 6.0, 10.0, 10.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.18359375, -6.01031494140625, -5.8370361328125, -5.66375732421875, -5.490478515625, -5.31719970703125, -5.1439208984375, -4.97064208984375, -4.79736328125, -4.62408447265625, -4.4508056640625, -4.27752685546875, -4.104248046875, -3.93096923828125, -3.7576904296875, -3.58441162109375, -3.4111328125, -3.23785400390625, -3.0645751953125, -2.89129638671875, -2.718017578125, -2.54473876953125, -2.3714599609375, -2.19818115234375, -2.02490234375, -1.85162353515625, -1.6783447265625, -1.50506591796875, -1.331787109375, -1.15850830078125, -0.9852294921875, -0.81195068359375, -0.638671875, -0.46539306640625, -0.2921142578125, -0.11883544921875, 0.054443359375, 0.22772216796875, 0.4010009765625, 0.57427978515625, 0.74755859375, 0.92083740234375, 1.0941162109375, 1.26739501953125, 1.440673828125, 1.61395263671875, 1.7872314453125, 1.96051025390625, 2.1337890625, 2.30706787109375, 2.4803466796875, 2.65362548828125, 2.826904296875, 3.00018310546875, 3.1734619140625, 3.34674072265625, 3.52001953125, 3.69329833984375, 3.8665771484375, 4.03985595703125, 4.213134765625, 4.38641357421875, 4.5596923828125, 4.73297119140625, 4.90625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 9.0, 10.0, 8.0, 13.0, 10.0, 13.0, 32.0, 47.0, 46.0, 74.0, 84.0, 107.0, 208.0, 260.0, 415.0, 907.0, 46598.0, 4069328.0, 73743.0, 989.0, 403.0, 254.0, 204.0, 156.0, 111.0, 76.0, 50.0, 32.0, 26.0, 18.0, 16.0, 10.0, 9.0, 7.0, 1.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.265625, -22.4501953125, -21.634765625, -20.8193359375, -20.00390625, -19.1884765625, -18.373046875, -17.5576171875, -16.7421875, -15.9267578125, -15.111328125, -14.2958984375, -13.48046875, -12.6650390625, -11.849609375, -11.0341796875, -10.21875, -9.4033203125, -8.587890625, -7.7724609375, -6.95703125, -6.1416015625, -5.326171875, -4.5107421875, -3.6953125, -2.8798828125, -2.064453125, -1.2490234375, -0.43359375, 0.3818359375, 1.197265625, 2.0126953125, 2.828125, 3.6435546875, 4.458984375, 5.2744140625, 6.08984375, 6.9052734375, 7.720703125, 8.5361328125, 9.3515625, 10.1669921875, 10.982421875, 11.7978515625, 12.61328125, 13.4287109375, 14.244140625, 15.0595703125, 15.875, 16.6904296875, 17.505859375, 18.3212890625, 19.13671875, 19.9521484375, 20.767578125, 21.5830078125, 22.3984375, 23.2138671875, 24.029296875, 24.8447265625, 25.66015625, 26.4755859375, 27.291015625, 28.1064453125, 28.921875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 19.0, 134.0, 324.0, 352.0, 157.0, 24.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.35829162597656, -31.74428939819336, -29.130285263061523, -26.516281127929688, -23.902278900146484, -21.28827667236328, -18.674272537231445, -16.06026840209961, -13.446266174316406, -10.832262992858887, -8.218259811401367, -5.604256629943848, -2.990253448486328, -0.3762502670288086, 2.237752914428711, 4.851757049560547, 7.46575927734375, 10.07976245880127, 12.693765640258789, 15.307768821716309, 17.921772003173828, 20.53577423095703, 23.149778366088867, 25.763782501220703, 28.377784729003906, 30.99178695678711, 33.60578918457031, 36.21979522705078, 38.833797454833984, 41.44779968261719, 44.061805725097656, 46.67580795288086, 49.28981018066406, 51.903812408447266, 54.51781463623047, 57.13182067871094, 59.74582290649414, 62.359825134277344, 64.97383117675781, 67.58782958984375, 70.20183563232422, 72.81584167480469, 75.42984008789062, 78.0438461303711, 80.65785217285156, 83.2718505859375, 85.88585662841797, 88.49986267089844, 91.11386108398438, 93.72786712646484, 96.34186553955078, 98.95587158203125, 101.56986999511719, 104.18387603759766, 106.79788208007812, 109.41188049316406, 112.02588653564453, 114.639892578125, 117.25389099121094, 119.8678970336914, 122.48190307617188, 125.09590148925781, 127.70990753173828, 130.32391357421875, 132.9379119873047]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 0.0, 2.0, 6.0, 8.0, 3.0, 8.0, 11.0, 16.0, 17.0, 16.0, 16.0, 17.0, 20.0, 19.0, 26.0, 32.0, 32.0, 40.0, 37.0, 35.0, 39.0, 41.0, 35.0, 51.0, 32.0, 38.0, 40.0, 33.0, 40.0, 34.0, 36.0, 33.0, 27.0, 22.0, 21.0, 20.0, 13.0, 21.0, 14.0, 5.0, 10.0, 6.0, 8.0, 7.0, 10.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-17.020042419433594, -16.443592071533203, -15.867141723632812, -15.290691375732422, -14.714241027832031, -14.13779067993164, -13.561339378356934, -12.984889030456543, -12.408438682556152, -11.831988334655762, -11.255537986755371, -10.67908763885498, -10.102636337280273, -9.526185989379883, -8.949735641479492, -8.373285293579102, -7.796834945678711, -7.22038459777832, -6.64393424987793, -6.067483425140381, -5.49103307723999, -4.9145827293396, -4.338131904602051, -3.76168155670166, -3.1852312088012695, -2.608780860900879, -2.032330274581909, -1.455879807472229, -0.8794293403625488, -0.3029789924621582, 0.2734715938568115, 0.8499221801757812, 1.4263725280761719, 2.0028228759765625, 2.5792734622955322, 3.155724048614502, 3.7321743965148926, 4.308624744415283, 4.885075569152832, 5.461525917053223, 6.037976264953613, 6.614426612854004, 7.1908769607543945, 7.767327785491943, 8.343778610229492, 8.920228958129883, 9.496679306030273, 10.073129653930664, 10.649580001831055, 11.226030349731445, 11.802480697631836, 12.378931045532227, 12.955381393432617, 13.531831741333008, 14.108283042907715, 14.684733390808105, 15.261183738708496, 15.837634086608887, 16.414085388183594, 16.990535736083984, 17.566986083984375, 18.143436431884766, 18.719886779785156, 19.296337127685547, 19.872787475585938]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 4.0, 6.0, 3.0, 4.0, 10.0, 15.0, 26.0, 15.0, 11.0, 22.0, 19.0, 24.0, 25.0, 30.0, 35.0, 42.0, 22.0, 39.0, 38.0, 45.0, 46.0, 28.0, 33.0, 42.0, 38.0, 41.0, 31.0, 40.0, 40.0, 22.0, 23.0, 32.0, 21.0, 19.0, 17.0, 10.0, 16.0, 13.0, 15.0, 6.0, 7.0, 6.0, 5.0, 6.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-2.833984375, -2.75152587890625, -2.6690673828125, -2.58660888671875, -2.504150390625, -2.42169189453125, -2.3392333984375, -2.25677490234375, -2.17431640625, -2.09185791015625, -2.0093994140625, -1.92694091796875, -1.844482421875, -1.76202392578125, -1.6795654296875, -1.59710693359375, -1.5146484375, -1.43218994140625, -1.3497314453125, -1.26727294921875, -1.184814453125, -1.10235595703125, -1.0198974609375, -0.93743896484375, -0.85498046875, -0.77252197265625, -0.6900634765625, -0.60760498046875, -0.525146484375, -0.44268798828125, -0.3602294921875, -0.27777099609375, -0.1953125, -0.11285400390625, -0.0303955078125, 0.05206298828125, 0.134521484375, 0.21697998046875, 0.2994384765625, 0.38189697265625, 0.46435546875, 0.54681396484375, 0.6292724609375, 0.71173095703125, 0.794189453125, 0.87664794921875, 0.9591064453125, 1.04156494140625, 1.1240234375, 1.20648193359375, 1.2889404296875, 1.37139892578125, 1.453857421875, 1.53631591796875, 1.6187744140625, 1.70123291015625, 1.78369140625, 1.86614990234375, 1.9486083984375, 2.03106689453125, 2.113525390625, 2.19598388671875, 2.2784423828125, 2.36090087890625, 2.443359375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 10.0, 22.0, 20.0, 26.0, 37.0, 57.0, 92.0, 124.0, 184.0, 252.0, 387.0, 592.0, 884.0, 1289.0, 1925.0, 2863.0, 4443.0, 6885.0, 10743.0, 16792.0, 27475.0, 45970.0, 79915.0, 143819.0, 227885.0, 196974.0, 114408.0, 63987.0, 37382.0, 22788.0, 14172.0, 8959.0, 5974.0, 3828.0, 2449.0, 1568.0, 1084.0, 738.0, 447.0, 330.0, 242.0, 183.0, 136.0, 68.0, 40.0, 30.0, 21.0, 28.0, 8.0, 5.0, 5.0, 1.0, 6.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.31884765625, -0.3088226318359375, -0.298797607421875, -0.2887725830078125, -0.27874755859375, -0.2687225341796875, -0.258697509765625, -0.2486724853515625, -0.2386474609375, -0.2286224365234375, -0.218597412109375, -0.2085723876953125, -0.19854736328125, -0.1885223388671875, -0.178497314453125, -0.1684722900390625, -0.158447265625, -0.1484222412109375, -0.138397216796875, -0.1283721923828125, -0.11834716796875, -0.1083221435546875, -0.098297119140625, -0.0882720947265625, -0.0782470703125, -0.0682220458984375, -0.058197021484375, -0.0481719970703125, -0.03814697265625, -0.0281219482421875, -0.018096923828125, -0.0080718994140625, 0.001953125, 0.0119781494140625, 0.022003173828125, 0.0320281982421875, 0.04205322265625, 0.0520782470703125, 0.062103271484375, 0.0721282958984375, 0.0821533203125, 0.0921783447265625, 0.102203369140625, 0.1122283935546875, 0.12225341796875, 0.1322784423828125, 0.142303466796875, 0.1523284912109375, 0.162353515625, 0.1723785400390625, 0.182403564453125, 0.1924285888671875, 0.20245361328125, 0.2124786376953125, 0.222503662109375, 0.2325286865234375, 0.2425537109375, 0.2525787353515625, 0.262603759765625, 0.2726287841796875, 0.28265380859375, 0.2926788330078125, 0.302703857421875, 0.3127288818359375, 0.32275390625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 9.0, 4.0, 5.0, 3.0, 8.0, 3.0, 9.0, 12.0, 6.0, 17.0, 16.0, 20.0, 24.0, 28.0, 25.0, 38.0, 28.0, 39.0, 36.0, 25.0, 36.0, 42.0, 36.0, 1066.0, 42.0, 44.0, 36.0, 33.0, 38.0, 36.0, 34.0, 33.0, 29.0, 32.0, 25.0, 13.0, 16.0, 16.0, 8.0, 13.0, 15.0, 6.0, 9.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.6328125, -1.579132080078125, -1.52545166015625, -1.471771240234375, -1.4180908203125, -1.364410400390625, -1.31072998046875, -1.257049560546875, -1.203369140625, -1.149688720703125, -1.09600830078125, -1.042327880859375, -0.9886474609375, -0.934967041015625, -0.88128662109375, -0.827606201171875, -0.77392578125, -0.720245361328125, -0.66656494140625, -0.612884521484375, -0.5592041015625, -0.505523681640625, -0.45184326171875, -0.398162841796875, -0.344482421875, -0.290802001953125, -0.23712158203125, -0.183441162109375, -0.1297607421875, -0.076080322265625, -0.02239990234375, 0.031280517578125, 0.0849609375, 0.138641357421875, 0.19232177734375, 0.246002197265625, 0.2996826171875, 0.353363037109375, 0.40704345703125, 0.460723876953125, 0.514404296875, 0.568084716796875, 0.62176513671875, 0.675445556640625, 0.7291259765625, 0.782806396484375, 0.83648681640625, 0.890167236328125, 0.94384765625, 0.997528076171875, 1.05120849609375, 1.104888916015625, 1.1585693359375, 1.212249755859375, 1.26593017578125, 1.319610595703125, 1.373291015625, 1.426971435546875, 1.48065185546875, 1.534332275390625, 1.5880126953125, 1.641693115234375, 1.69537353515625, 1.749053955078125, 1.802734375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 4.0, 4.0, 5.0, 11.0, 15.0, 17.0, 30.0, 40.0, 56.0, 78.0, 109.0, 193.0, 216.0, 364.0, 487.0, 671.0, 951.0, 1406.0, 2045.0, 3070.0, 4458.0, 6407.0, 9639.0, 14495.0, 21632.0, 33349.0, 52822.0, 86331.0, 141654.0, 1253132.0, 172750.0, 107142.0, 64629.0, 40288.0, 26121.0, 17019.0, 11353.0, 7640.0, 5096.0, 3433.0, 2444.0, 1663.0, 1147.0, 809.0, 564.0, 423.0, 274.0, 193.0, 150.0, 113.0, 71.0, 39.0, 21.0, 28.0, 19.0, 11.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.235595703125, -0.22792434692382812, -0.22025299072265625, -0.21258163452148438, -0.2049102783203125, -0.19723892211914062, -0.18956756591796875, -0.18189620971679688, -0.174224853515625, -0.16655349731445312, -0.15888214111328125, -0.15121078491210938, -0.1435394287109375, -0.13586807250976562, -0.12819671630859375, -0.12052536010742188, -0.11285400390625, -0.10518264770507812, -0.09751129150390625, -0.08983993530273438, -0.0821685791015625, -0.07449722290039062, -0.06682586669921875, -0.059154510498046875, -0.051483154296875, -0.043811798095703125, -0.03614044189453125, -0.028469085693359375, -0.0207977294921875, -0.013126373291015625, -0.00545501708984375, 0.002216339111328125, 0.0098876953125, 0.017559051513671875, 0.02523040771484375, 0.032901763916015625, 0.0405731201171875, 0.048244476318359375, 0.05591583251953125, 0.06358718872070312, 0.071258544921875, 0.07892990112304688, 0.08660125732421875, 0.09427261352539062, 0.1019439697265625, 0.10961532592773438, 0.11728668212890625, 0.12495803833007812, 0.13262939453125, 0.14030075073242188, 0.14797210693359375, 0.15564346313476562, 0.1633148193359375, 0.17098617553710938, 0.17865753173828125, 0.18632888793945312, 0.194000244140625, 0.20167160034179688, 0.20934295654296875, 0.21701431274414062, 0.2246856689453125, 0.23235702514648438, 0.24002838134765625, 0.24769973754882812, 0.25537109375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 8.0, 8.0, 10.0, 6.0, 12.0, 20.0, 18.0, 20.0, 46.0, 44.0, 49.0, 58.0, 54.0, 56.0, 83.0, 79.0, 67.0, 52.0, 60.0, 52.0, 41.0, 37.0, 19.0, 15.0, 17.0, 11.0, 11.0, 5.0, 7.0, 9.0, 7.0, 1.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.001087188720703125, -0.0010554268956184387, -0.0010236650705337524, -0.0009919032454490662, -0.0009601414203643799, -0.0009283795952796936, -0.0008966177701950073, -0.000864855945110321, -0.0008330941200256348, -0.0008013322949409485, -0.0007695704698562622, -0.0007378086447715759, -0.0007060468196868896, -0.0006742849946022034, -0.0006425231695175171, -0.0006107613444328308, -0.0005789995193481445, -0.0005472376942634583, -0.000515475869178772, -0.0004837140440940857, -0.0004519522190093994, -0.00042019039392471313, -0.00038842856884002686, -0.0003566667437553406, -0.0003249049186706543, -0.000293143093585968, -0.00026138126850128174, -0.00022961944341659546, -0.00019785761833190918, -0.0001660957932472229, -0.00013433396816253662, -0.00010257214307785034, -7.081031799316406e-05, -3.904849290847778e-05, -7.286667823791504e-06, 2.4475157260894775e-05, 5.6236982345581055e-05, 8.799880743026733e-05, 0.00011976063251495361, 0.0001515224575996399, 0.00018328428268432617, 0.00021504610776901245, 0.00024680793285369873, 0.000278569757938385, 0.0003103315830230713, 0.00034209340810775757, 0.00037385523319244385, 0.0004056170582771301, 0.0004373788833618164, 0.0004691407084465027, 0.000500902533531189, 0.0005326643586158752, 0.0005644261837005615, 0.0005961880087852478, 0.0006279498338699341, 0.0006597116589546204, 0.0006914734840393066, 0.0007232353091239929, 0.0007549971342086792, 0.0007867589592933655, 0.0008185207843780518, 0.000850282609462738, 0.0008820444345474243, 0.0009138062596321106, 0.0009455680847167969]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 5.0, 9.0, 10.0, 12.0, 11.0, 17.0, 32.0, 31.0, 36.0, 62.0, 81.0, 153.0, 265.0, 536.0, 4799.0, 1021433.0, 19499.0, 676.0, 332.0, 148.0, 102.0, 79.0, 71.0, 27.0, 30.0, 16.0, 19.0, 16.0, 8.0, 13.0, 5.0, 2.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020721435546875, -0.020021677017211914, -0.019321918487548828, -0.018622159957885742, -0.017922401428222656, -0.01722264289855957, -0.016522884368896484, -0.0158231258392334, -0.015123367309570312, -0.014423608779907227, -0.01372385025024414, -0.013024091720581055, -0.012324333190917969, -0.011624574661254883, -0.010924816131591797, -0.010225057601928711, -0.009525299072265625, -0.008825540542602539, -0.008125782012939453, -0.007426023483276367, -0.006726264953613281, -0.006026506423950195, -0.005326747894287109, -0.0046269893646240234, -0.0039272308349609375, -0.0032274723052978516, -0.0025277137756347656, -0.0018279552459716797, -0.0011281967163085938, -0.0004284381866455078, 0.0002713203430175781, 0.0009710788726806641, 0.00167083740234375, 0.002370595932006836, 0.003070354461669922, 0.003770112991333008, 0.004469871520996094, 0.00516963005065918, 0.005869388580322266, 0.0065691471099853516, 0.0072689056396484375, 0.007968664169311523, 0.00866842269897461, 0.009368181228637695, 0.010067939758300781, 0.010767698287963867, 0.011467456817626953, 0.012167215347290039, 0.012866973876953125, 0.013566732406616211, 0.014266490936279297, 0.014966249465942383, 0.01566600799560547, 0.016365766525268555, 0.01706552505493164, 0.017765283584594727, 0.018465042114257812, 0.0191648006439209, 0.019864559173583984, 0.02056431770324707, 0.021264076232910156, 0.021963834762573242, 0.022663593292236328, 0.023363351821899414, 0.0240631103515625]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 27.0, 93.0, 206.0, 281.0, 229.0, 114.0, 42.0, 14.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0026760930195450783, -0.0026253708638250828, -0.002574648940935731, -0.002523927018046379, -0.0024732048623263836, -0.002422482706606388, -0.0023717607837170362, -0.0023210388608276844, -0.002270316705107689, -0.0022195945493876934, -0.0021688726264983416, -0.0021181507036089897, -0.0020674285478889942, -0.0020167063921689987, -0.001965984469279647, -0.0019152624299749732, -0.0018645403906702995, -0.0018138183513656259, -0.0017630963120609522, -0.0017123742727562785, -0.0016616522334516048, -0.0016109301941469312, -0.0015602081548422575, -0.0015094861155375838, -0.0014587640762329102, -0.0014080420369282365, -0.0013573199976235628, -0.0013065979583188891, -0.0012558759190142155, -0.0012051538797095418, -0.0011544318404048681, -0.0011037098011001945, -0.0010529878782108426, -0.001002265838906169, -0.0009515437996014953, -0.0009008217602968216, -0.0008500997209921479, -0.0007993776816874743, -0.0007486556423828006, -0.0006979336030781269, -0.0006472115637734532, -0.0005964895244687796, -0.0005457674851641059, -0.0004950454458594322, -0.00044432340655475855, -0.0003936013672500849, -0.0003428793279454112, -0.00029215728864073753, -0.00024143524933606386, -0.0001907132100313902, -0.00013999117072671652, -8.926913142204285e-05, -3.8547092117369175e-05, 1.2174947187304497e-05, 6.289698649197817e-05, 0.00011361902579665184, 0.0001643410651013255, 0.00021506310440599918, 0.00026578514371067286, 0.0003165071830153465, 0.0003672292223200202, 0.00041795126162469387, 0.00046867330092936754, 0.0005193953402340412, 0.0005701173795387149]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 5.0, 7.0, 5.0, 7.0, 14.0, 6.0, 16.0, 16.0, 18.0, 18.0, 24.0, 23.0, 28.0, 28.0, 27.0, 27.0, 33.0, 30.0, 28.0, 39.0, 41.0, 38.0, 34.0, 35.0, 37.0, 38.0, 30.0, 38.0, 31.0, 36.0, 22.0, 33.0, 25.0, 20.0, 20.0, 26.0, 20.0, 9.0, 14.0, 17.0, 8.0, 7.0, 7.0, 3.0, 1.0, 6.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0004534125328063965, -0.00043966155499219894, -0.0004259105771780014, -0.00041215959936380386, -0.0003984086215496063, -0.0003846576437354088, -0.00037090666592121124, -0.0003571556881070137, -0.00034340471029281616, -0.0003296537324786186, -0.0003159027546644211, -0.00030215177685022354, -0.000288400799036026, -0.00027464982122182846, -0.0002608988434076309, -0.0002471478655934334, -0.00023339688777923584, -0.0002196459099650383, -0.00020589493215084076, -0.00019214395433664322, -0.00017839297652244568, -0.00016464199870824814, -0.0001508910208940506, -0.00013714004307985306, -0.00012338906526565552, -0.00010963808745145798, -9.588710963726044e-05, -8.21361318230629e-05, -6.838515400886536e-05, -5.4634176194667816e-05, -4.0883198380470276e-05, -2.7132220566272736e-05, -1.3381242752075195e-05, 3.6973506212234497e-07, 1.4120712876319885e-05, 2.7871690690517426e-05, 4.1622668504714966e-05, 5.5373646318912506e-05, 6.912462413311005e-05, 8.287560194730759e-05, 9.662657976150513e-05, 0.00011037755757570267, 0.0001241285353899002, 0.00013787951320409775, 0.0001516304910182953, 0.00016538146883249283, 0.00017913244664669037, 0.0001928834244608879, 0.00020663440227508545, 0.000220385380089283, 0.00023413635790348053, 0.00024788733571767807, 0.0002616383135318756, 0.00027538929134607315, 0.0002891402691602707, 0.00030289124697446823, 0.00031664222478866577, 0.0003303932026028633, 0.00034414418041706085, 0.0003578951582312584, 0.00037164613604545593, 0.0003853971138596535, 0.000399148091673851, 0.00041289906948804855, 0.0004266500473022461]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 4.0, 6.0, 3.0, 4.0, 10.0, 15.0, 26.0, 15.0, 11.0, 22.0, 19.0, 24.0, 25.0, 30.0, 35.0, 42.0, 22.0, 39.0, 38.0, 45.0, 46.0, 28.0, 33.0, 42.0, 38.0, 41.0, 31.0, 40.0, 40.0, 22.0, 23.0, 32.0, 21.0, 19.0, 17.0, 10.0, 16.0, 13.0, 15.0, 6.0, 7.0, 6.0, 5.0, 6.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-2.833984375, -2.75152587890625, -2.6690673828125, -2.58660888671875, -2.504150390625, -2.42169189453125, -2.3392333984375, -2.25677490234375, -2.17431640625, -2.09185791015625, -2.0093994140625, -1.92694091796875, -1.844482421875, -1.76202392578125, -1.6795654296875, -1.59710693359375, -1.5146484375, -1.43218994140625, -1.3497314453125, -1.26727294921875, -1.184814453125, -1.10235595703125, -1.0198974609375, -0.93743896484375, -0.85498046875, -0.77252197265625, -0.6900634765625, -0.60760498046875, -0.525146484375, -0.44268798828125, -0.3602294921875, -0.27777099609375, -0.1953125, -0.11285400390625, -0.0303955078125, 0.05206298828125, 0.134521484375, 0.21697998046875, 0.2994384765625, 0.38189697265625, 0.46435546875, 0.54681396484375, 0.6292724609375, 0.71173095703125, 0.794189453125, 0.87664794921875, 0.9591064453125, 1.04156494140625, 1.1240234375, 1.20648193359375, 1.2889404296875, 1.37139892578125, 1.453857421875, 1.53631591796875, 1.6187744140625, 1.70123291015625, 1.78369140625, 1.86614990234375, 1.9486083984375, 2.03106689453125, 2.113525390625, 2.19598388671875, 2.2784423828125, 2.36090087890625, 2.443359375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 7.0, 5.0, 6.0, 10.0, 10.0, 10.0, 21.0, 24.0, 35.0, 44.0, 79.0, 156.0, 293.0, 597.0, 1229.0, 2636.0, 5509.0, 11063.0, 23081.0, 53299.0, 138717.0, 345721.0, 282609.0, 104967.0, 41867.0, 18889.0, 8974.0, 4486.0, 2056.0, 1050.0, 483.0, 232.0, 147.0, 79.0, 42.0, 42.0, 24.0, 13.0, 12.0, 12.0, 8.0, 2.0, 3.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.810546875, -2.713165283203125, -2.61578369140625, -2.518402099609375, -2.4210205078125, -2.323638916015625, -2.22625732421875, -2.128875732421875, -2.031494140625, -1.934112548828125, -1.83673095703125, -1.739349365234375, -1.6419677734375, -1.544586181640625, -1.44720458984375, -1.349822998046875, -1.25244140625, -1.155059814453125, -1.05767822265625, -0.960296630859375, -0.8629150390625, -0.765533447265625, -0.66815185546875, -0.570770263671875, -0.473388671875, -0.376007080078125, -0.27862548828125, -0.181243896484375, -0.0838623046875, 0.013519287109375, 0.11090087890625, 0.208282470703125, 0.3056640625, 0.403045654296875, 0.50042724609375, 0.597808837890625, 0.6951904296875, 0.792572021484375, 0.88995361328125, 0.987335205078125, 1.084716796875, 1.182098388671875, 1.27947998046875, 1.376861572265625, 1.4742431640625, 1.571624755859375, 1.66900634765625, 1.766387939453125, 1.86376953125, 1.961151123046875, 2.05853271484375, 2.155914306640625, 2.2532958984375, 2.350677490234375, 2.44805908203125, 2.545440673828125, 2.642822265625, 2.740203857421875, 2.83758544921875, 2.934967041015625, 3.0323486328125, 3.129730224609375, 3.22711181640625, 3.324493408203125, 3.421875]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 9.0, 3.0, 7.0, 10.0, 12.0, 15.0, 11.0, 12.0, 14.0, 25.0, 26.0, 38.0, 35.0, 39.0, 36.0, 58.0, 59.0, 89.0, 170.0, 1421.0, 374.0, 146.0, 78.0, 43.0, 37.0, 43.0, 38.0, 25.0, 27.0, 29.0, 14.0, 20.0, 16.0, 18.0, 10.0, 5.0, 9.0, 10.0, 11.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.09375, -11.747802734375, -11.40185546875, -11.055908203125, -10.7099609375, -10.364013671875, -10.01806640625, -9.672119140625, -9.326171875, -8.980224609375, -8.63427734375, -8.288330078125, -7.9423828125, -7.596435546875, -7.25048828125, -6.904541015625, -6.55859375, -6.212646484375, -5.86669921875, -5.520751953125, -5.1748046875, -4.828857421875, -4.48291015625, -4.136962890625, -3.791015625, -3.445068359375, -3.09912109375, -2.753173828125, -2.4072265625, -2.061279296875, -1.71533203125, -1.369384765625, -1.0234375, -0.677490234375, -0.33154296875, 0.014404296875, 0.3603515625, 0.706298828125, 1.05224609375, 1.398193359375, 1.744140625, 2.090087890625, 2.43603515625, 2.781982421875, 3.1279296875, 3.473876953125, 3.81982421875, 4.165771484375, 4.51171875, 4.857666015625, 5.20361328125, 5.549560546875, 5.8955078125, 6.241455078125, 6.58740234375, 6.933349609375, 7.279296875, 7.625244140625, 7.97119140625, 8.317138671875, 8.6630859375, 9.009033203125, 9.35498046875, 9.700927734375, 10.046875]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 3.0, 11.0, 9.0, 8.0, 18.0, 23.0, 26.0, 37.0, 44.0, 64.0, 85.0, 116.0, 242.0, 394.0, 807.0, 18580.0, 3116954.0, 6564.0, 700.0, 322.0, 208.0, 157.0, 84.0, 65.0, 48.0, 47.0, 22.0, 21.0, 19.0, 4.0, 5.0, 4.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-41.6875, -40.43994140625, -39.1923828125, -37.94482421875, -36.697265625, -35.44970703125, -34.2021484375, -32.95458984375, -31.70703125, -30.45947265625, -29.2119140625, -27.96435546875, -26.716796875, -25.46923828125, -24.2216796875, -22.97412109375, -21.7265625, -20.47900390625, -19.2314453125, -17.98388671875, -16.736328125, -15.48876953125, -14.2412109375, -12.99365234375, -11.74609375, -10.49853515625, -9.2509765625, -8.00341796875, -6.755859375, -5.50830078125, -4.2607421875, -3.01318359375, -1.765625, -0.51806640625, 0.7294921875, 1.97705078125, 3.224609375, 4.47216796875, 5.7197265625, 6.96728515625, 8.21484375, 9.46240234375, 10.7099609375, 11.95751953125, 13.205078125, 14.45263671875, 15.7001953125, 16.94775390625, 18.1953125, 19.44287109375, 20.6904296875, 21.93798828125, 23.185546875, 24.43310546875, 25.6806640625, 26.92822265625, 28.17578125, 29.42333984375, 30.6708984375, 31.91845703125, 33.166015625, 34.41357421875, 35.6611328125, 36.90869140625, 38.15625]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 34.0, 307.0, 502.0, 153.0, 14.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.717714309692383, -29.986541748046875, -28.255369186401367, -26.52419662475586, -24.793025970458984, -23.061851501464844, -21.33068084716797, -19.59950828552246, -17.868335723876953, -16.137163162231445, -14.405990600585938, -12.674818992614746, -10.943646430969238, -9.21247386932373, -7.481302261352539, -5.750129699707031, -4.018957138061523, -2.2877848148345947, -0.556612491607666, 1.1745595932006836, 2.9057321548461914, 4.636904716491699, 6.368076324462891, 8.099248886108398, 9.830421447753906, 11.561594009399414, 13.292766571044922, 15.023938179016113, 16.755111694335938, 18.486282348632812, 20.21745491027832, 21.948627471923828, 23.67980194091797, 25.410974502563477, 27.142147064208984, 28.87331771850586, 30.6044921875, 32.335662841796875, 34.06683349609375, 35.79800796508789, 37.52918243408203, 39.260353088378906, 40.99152755737305, 42.72269821166992, 44.45387268066406, 46.18504333496094, 47.91621398925781, 49.64738845825195, 51.37855911254883, 53.1097297668457, 54.840904235839844, 56.57207489013672, 58.30324935913086, 60.034420013427734, 61.765594482421875, 63.49676513671875, 65.22793579101562, 66.9591064453125, 68.69027709960938, 70.42145538330078, 72.15262603759766, 73.88379669189453, 75.6149673461914, 77.34614562988281, 79.07731628417969]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 7.0, 5.0, 6.0, 3.0, 9.0, 9.0, 10.0, 14.0, 17.0, 19.0, 21.0, 26.0, 20.0, 23.0, 22.0, 22.0, 23.0, 33.0, 36.0, 36.0, 46.0, 30.0, 42.0, 31.0, 39.0, 51.0, 46.0, 34.0, 53.0, 33.0, 35.0, 36.0, 30.0, 22.0, 21.0, 11.0, 16.0, 17.0, 8.0, 11.0, 5.0, 4.0, 9.0, 6.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.147106170654297, -22.370359420776367, -21.593612670898438, -20.816865921020508, -20.040119171142578, -19.263370513916016, -18.486623764038086, -17.709877014160156, -16.933130264282227, -16.156383514404297, -15.379636764526367, -14.602889060974121, -13.826142311096191, -13.049395561218262, -12.272647857666016, -11.495901107788086, -10.719154357910156, -9.942407608032227, -9.165660858154297, -8.38891315460205, -7.612166404724121, -6.835419654846191, -6.0586724281311035, -5.281925201416016, -4.505178451538086, -3.728431463241577, -2.9516844749450684, -2.1749374866485596, -1.3981904983520508, -0.621443510055542, 0.1553034782409668, 0.9320507049560547, 1.7087955474853516, 2.4855425357818604, 3.262289524078369, 4.039036750793457, 4.815783500671387, 5.592530250549316, 6.369277477264404, 7.146024703979492, 7.922771453857422, 8.699518203735352, 9.476264953613281, 10.253012657165527, 11.029759407043457, 11.806506156921387, 12.583253860473633, 13.360000610351562, 14.136747360229492, 14.913494110107422, 15.690240859985352, 16.46698760986328, 17.243736267089844, 18.020483016967773, 18.797229766845703, 19.573976516723633, 20.350723266601562, 21.127470016479492, 21.904216766357422, 22.68096351623535, 23.45771026611328, 24.234458923339844, 25.011205673217773, 25.787952423095703, 26.564699172973633]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 7.0, 4.0, 4.0, 3.0, 6.0, 7.0, 15.0, 8.0, 10.0, 26.0, 18.0, 19.0, 16.0, 27.0, 35.0, 25.0, 28.0, 39.0, 42.0, 30.0, 38.0, 33.0, 40.0, 46.0, 45.0, 32.0, 41.0, 44.0, 39.0, 40.0, 34.0, 28.0, 26.0, 23.0, 19.0, 20.0, 12.0, 13.0, 15.0, 14.0, 6.0, 3.0, 8.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.123046875, -3.028045654296875, -2.93304443359375, -2.838043212890625, -2.7430419921875, -2.648040771484375, -2.55303955078125, -2.458038330078125, -2.363037109375, -2.268035888671875, -2.17303466796875, -2.078033447265625, -1.9830322265625, -1.888031005859375, -1.79302978515625, -1.698028564453125, -1.60302734375, -1.508026123046875, -1.41302490234375, -1.318023681640625, -1.2230224609375, -1.128021240234375, -1.03302001953125, -0.938018798828125, -0.843017578125, -0.748016357421875, -0.65301513671875, -0.558013916015625, -0.4630126953125, -0.368011474609375, -0.27301025390625, -0.178009033203125, -0.0830078125, 0.011993408203125, 0.10699462890625, 0.201995849609375, 0.2969970703125, 0.391998291015625, 0.48699951171875, 0.582000732421875, 0.677001953125, 0.772003173828125, 0.86700439453125, 0.962005615234375, 1.0570068359375, 1.152008056640625, 1.24700927734375, 1.342010498046875, 1.43701171875, 1.532012939453125, 1.62701416015625, 1.722015380859375, 1.8170166015625, 1.912017822265625, 2.00701904296875, 2.102020263671875, 2.197021484375, 2.292022705078125, 2.38702392578125, 2.482025146484375, 2.5770263671875, 2.672027587890625, 2.76702880859375, 2.862030029296875, 2.95703125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 7.0, 7.0, 7.0, 8.0, 7.0, 13.0, 22.0, 26.0, 22.0, 29.0, 44.0, 56.0, 55.0, 66.0, 122.0, 148.0, 278.0, 700.0, 2958.0, 33146.0, 696111.0, 2847844.0, 580774.0, 27539.0, 2674.0, 705.0, 269.0, 156.0, 101.0, 82.0, 69.0, 42.0, 45.0, 27.0, 31.0, 23.0, 14.0, 16.0, 6.0, 11.0, 7.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.046875, -7.7911376953125, -7.535400390625, -7.2796630859375, -7.02392578125, -6.7681884765625, -6.512451171875, -6.2567138671875, -6.0009765625, -5.7452392578125, -5.489501953125, -5.2337646484375, -4.97802734375, -4.7222900390625, -4.466552734375, -4.2108154296875, -3.955078125, -3.6993408203125, -3.443603515625, -3.1878662109375, -2.93212890625, -2.6763916015625, -2.420654296875, -2.1649169921875, -1.9091796875, -1.6534423828125, -1.397705078125, -1.1419677734375, -0.88623046875, -0.6304931640625, -0.374755859375, -0.1190185546875, 0.13671875, 0.3924560546875, 0.648193359375, 0.9039306640625, 1.15966796875, 1.4154052734375, 1.671142578125, 1.9268798828125, 2.1826171875, 2.4383544921875, 2.694091796875, 2.9498291015625, 3.20556640625, 3.4613037109375, 3.717041015625, 3.9727783203125, 4.228515625, 4.4842529296875, 4.739990234375, 4.9957275390625, 5.25146484375, 5.5072021484375, 5.762939453125, 6.0186767578125, 6.2744140625, 6.5301513671875, 6.785888671875, 7.0416259765625, 7.29736328125, 7.5531005859375, 7.808837890625, 8.0645751953125, 8.3203125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 8.0, 4.0, 11.0, 9.0, 16.0, 22.0, 34.0, 58.0, 75.0, 99.0, 141.0, 182.0, 278.0, 335.0, 463.0, 460.0, 446.0, 376.0, 316.0, 184.0, 162.0, 113.0, 77.0, 48.0, 49.0, 34.0, 21.0, 14.0, 14.0, 8.0, 8.0, 9.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.98046875, -5.7786865234375, -5.576904296875, -5.3751220703125, -5.17333984375, -4.9715576171875, -4.769775390625, -4.5679931640625, -4.3662109375, -4.1644287109375, -3.962646484375, -3.7608642578125, -3.55908203125, -3.3572998046875, -3.155517578125, -2.9537353515625, -2.751953125, -2.5501708984375, -2.348388671875, -2.1466064453125, -1.94482421875, -1.7430419921875, -1.541259765625, -1.3394775390625, -1.1376953125, -0.9359130859375, -0.734130859375, -0.5323486328125, -0.33056640625, -0.1287841796875, 0.072998046875, 0.2747802734375, 0.4765625, 0.6783447265625, 0.880126953125, 1.0819091796875, 1.28369140625, 1.4854736328125, 1.687255859375, 1.8890380859375, 2.0908203125, 2.2926025390625, 2.494384765625, 2.6961669921875, 2.89794921875, 3.0997314453125, 3.301513671875, 3.5032958984375, 3.705078125, 3.9068603515625, 4.108642578125, 4.3104248046875, 4.51220703125, 4.7139892578125, 4.915771484375, 5.1175537109375, 5.3193359375, 5.5211181640625, 5.722900390625, 5.9246826171875, 6.12646484375, 6.3282470703125, 6.530029296875, 6.7318115234375, 6.93359375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 5.0, 7.0, 8.0, 6.0, 15.0, 14.0, 20.0, 34.0, 49.0, 54.0, 70.0, 132.0, 174.0, 249.0, 394.0, 781.0, 31086.0, 4094991.0, 64070.0, 875.0, 435.0, 255.0, 172.0, 132.0, 76.0, 61.0, 40.0, 26.0, 21.0, 14.0, 7.0, 4.0, 7.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.5625, -31.646484375, -30.73046875, -29.814453125, -28.8984375, -27.982421875, -27.06640625, -26.150390625, -25.234375, -24.318359375, -23.40234375, -22.486328125, -21.5703125, -20.654296875, -19.73828125, -18.822265625, -17.90625, -16.990234375, -16.07421875, -15.158203125, -14.2421875, -13.326171875, -12.41015625, -11.494140625, -10.578125, -9.662109375, -8.74609375, -7.830078125, -6.9140625, -5.998046875, -5.08203125, -4.166015625, -3.25, -2.333984375, -1.41796875, -0.501953125, 0.4140625, 1.330078125, 2.24609375, 3.162109375, 4.078125, 4.994140625, 5.91015625, 6.826171875, 7.7421875, 8.658203125, 9.57421875, 10.490234375, 11.40625, 12.322265625, 13.23828125, 14.154296875, 15.0703125, 15.986328125, 16.90234375, 17.818359375, 18.734375, 19.650390625, 20.56640625, 21.482421875, 22.3984375, 23.314453125, 24.23046875, 25.146484375, 26.0625]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 55.0, 224.0, 390.0, 271.0, 57.0, 10.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.12668228149414, -26.58468246459961, -24.04268455505371, -21.50068473815918, -18.95868682861328, -16.41668701171875, -13.874687194824219, -11.33268928527832, -8.790689468383789, -6.248690605163574, -3.706691265106201, -1.1646919250488281, 1.3773069381713867, 3.9193058013916016, 6.461305618286133, 9.003303527832031, 11.545303344726562, 14.087302207946777, 16.629301071166992, 19.171300888061523, 21.713298797607422, 24.255298614501953, 26.797298431396484, 29.339296340942383, 31.881296157836914, 34.42329406738281, 36.965293884277344, 39.507293701171875, 42.049293518066406, 44.59129333496094, 47.13329315185547, 49.675289154052734, 52.21729278564453, 54.75929260253906, 57.301292419433594, 59.843292236328125, 62.38528823852539, 64.92729187011719, 67.46928405761719, 70.01128387451172, 72.55328369140625, 75.09528350830078, 77.63728332519531, 80.17928314208984, 82.72128295898438, 85.26327514648438, 87.80528259277344, 90.34727478027344, 92.8892822265625, 95.43128204345703, 97.97328186035156, 100.5152816772461, 103.05728149414062, 105.59927368164062, 108.14128112792969, 110.68327331542969, 113.22527313232422, 115.76727294921875, 118.30927276611328, 120.85127258300781, 123.39327239990234, 125.93527221679688, 128.47726440429688, 131.01927185058594, 133.56126403808594]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 6.0, 5.0, 5.0, 6.0, 4.0, 9.0, 10.0, 9.0, 17.0, 12.0, 6.0, 19.0, 30.0, 33.0, 38.0, 36.0, 34.0, 33.0, 48.0, 38.0, 42.0, 40.0, 49.0, 48.0, 41.0, 51.0, 31.0, 42.0, 31.0, 24.0, 40.0, 19.0, 24.0, 25.0, 18.0, 12.0, 15.0, 11.0, 12.0, 8.0, 9.0, 6.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.853904724121094, -18.2478084564209, -17.641714096069336, -17.03561782836914, -16.429523468017578, -15.823427200317383, -15.217331886291504, -14.611236572265625, -14.00514030456543, -13.39904499053955, -12.792949676513672, -12.186853408813477, -11.580758094787598, -10.974662780761719, -10.36856746673584, -9.762472152709961, -9.156376838684082, -8.550281524658203, -7.944185733795166, -7.338090419769287, -6.73199462890625, -6.125899314880371, -5.519804000854492, -4.913708209991455, -4.307612895965576, -3.701517343521118, -3.09542179107666, -2.4893264770507812, -1.8832309246063232, -1.2771353721618652, -0.6710400581359863, -0.06494426727294922, 0.5411510467529297, 1.1472465991973877, 1.7533420324325562, 2.3594374656677246, 2.9655330181121826, 3.5716285705566406, 4.1777238845825195, 4.783819675445557, 5.3899149894714355, 5.9960103034973145, 6.602106094360352, 7.2082014083862305, 7.814296722412109, 8.420392990112305, 9.026487350463867, 9.632583618164062, 10.238678932189941, 10.84477424621582, 11.4508695602417, 12.056964874267578, 12.663061141967773, 13.269156455993652, 13.875251770019531, 14.481348037719727, 15.087442398071289, 15.693537712097168, 16.299633026123047, 16.905729293823242, 17.511823654174805, 18.117919921875, 18.724014282226562, 19.330110549926758, 19.936206817626953]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 11.0, 7.0, 5.0, 6.0, 8.0, 7.0, 16.0, 22.0, 14.0, 29.0, 25.0, 26.0, 32.0, 33.0, 33.0, 45.0, 44.0, 41.0, 44.0, 39.0, 39.0, 47.0, 34.0, 45.0, 28.0, 31.0, 36.0, 35.0, 29.0, 40.0, 34.0, 19.0, 14.0, 14.0, 15.0, 10.0, 13.0, 9.0, 3.0, 7.0, 3.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.328125, -3.236297607421875, -3.14447021484375, -3.052642822265625, -2.9608154296875, -2.868988037109375, -2.77716064453125, -2.685333251953125, -2.593505859375, -2.501678466796875, -2.40985107421875, -2.318023681640625, -2.2261962890625, -2.134368896484375, -2.04254150390625, -1.950714111328125, -1.85888671875, -1.767059326171875, -1.67523193359375, -1.583404541015625, -1.4915771484375, -1.399749755859375, -1.30792236328125, -1.216094970703125, -1.124267578125, -1.032440185546875, -0.94061279296875, -0.848785400390625, -0.7569580078125, -0.665130615234375, -0.57330322265625, -0.481475830078125, -0.3896484375, -0.297821044921875, -0.20599365234375, -0.114166259765625, -0.0223388671875, 0.069488525390625, 0.16131591796875, 0.253143310546875, 0.344970703125, 0.436798095703125, 0.52862548828125, 0.620452880859375, 0.7122802734375, 0.804107666015625, 0.89593505859375, 0.987762451171875, 1.07958984375, 1.171417236328125, 1.26324462890625, 1.355072021484375, 1.4468994140625, 1.538726806640625, 1.63055419921875, 1.722381591796875, 1.814208984375, 1.906036376953125, 1.99786376953125, 2.089691162109375, 2.1815185546875, 2.273345947265625, 2.36517333984375, 2.457000732421875, 2.548828125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 0.0, 6.0, 5.0, 5.0, 16.0, 14.0, 33.0, 46.0, 50.0, 104.0, 140.0, 173.0, 279.0, 405.0, 568.0, 916.0, 1438.0, 2182.0, 3184.0, 4859.0, 7624.0, 11832.0, 18857.0, 30888.0, 50218.0, 85151.0, 145657.0, 223175.0, 184707.0, 108962.0, 63364.0, 38649.0, 23642.0, 14626.0, 9249.0, 5920.0, 3981.0, 2586.0, 1657.0, 1128.0, 751.0, 487.0, 345.0, 219.0, 144.0, 112.0, 60.0, 46.0, 36.0, 32.0, 8.0, 6.0, 12.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.309814453125, -0.2997322082519531, -0.28964996337890625, -0.2795677185058594, -0.2694854736328125, -0.2594032287597656, -0.24932098388671875, -0.23923873901367188, -0.229156494140625, -0.21907424926757812, -0.20899200439453125, -0.19890975952148438, -0.1888275146484375, -0.17874526977539062, -0.16866302490234375, -0.15858078002929688, -0.14849853515625, -0.13841629028320312, -0.12833404541015625, -0.11825180053710938, -0.1081695556640625, -0.09808731079101562, -0.08800506591796875, -0.07792282104492188, -0.067840576171875, -0.057758331298828125, -0.04767608642578125, -0.037593841552734375, -0.0275115966796875, -0.017429351806640625, -0.00734710693359375, 0.002735137939453125, 0.0128173828125, 0.022899627685546875, 0.03298187255859375, 0.043064117431640625, 0.0531463623046875, 0.06322860717773438, 0.07331085205078125, 0.08339309692382812, 0.093475341796875, 0.10355758666992188, 0.11363983154296875, 0.12372207641601562, 0.1338043212890625, 0.14388656616210938, 0.15396881103515625, 0.16405105590820312, 0.17413330078125, 0.18421554565429688, 0.19429779052734375, 0.20438003540039062, 0.2144622802734375, 0.22454452514648438, 0.23462677001953125, 0.24470901489257812, 0.254791259765625, 0.2648735046386719, 0.27495574951171875, 0.2850379943847656, 0.2951202392578125, 0.3052024841308594, 0.31528472900390625, 0.3253669738769531, 0.33544921875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 5.0, 1.0, 3.0, 5.0, 7.0, 5.0, 6.0, 7.0, 11.0, 15.0, 4.0, 12.0, 16.0, 21.0, 16.0, 25.0, 32.0, 24.0, 27.0, 31.0, 33.0, 38.0, 38.0, 39.0, 52.0, 1060.0, 51.0, 50.0, 32.0, 35.0, 30.0, 35.0, 32.0, 32.0, 31.0, 30.0, 20.0, 13.0, 24.0, 17.0, 14.0, 14.0, 9.0, 8.0, 9.0, 6.0, 6.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.560546875, -1.505767822265625, -1.45098876953125, -1.396209716796875, -1.3414306640625, -1.286651611328125, -1.23187255859375, -1.177093505859375, -1.122314453125, -1.067535400390625, -1.01275634765625, -0.957977294921875, -0.9031982421875, -0.848419189453125, -0.79364013671875, -0.738861083984375, -0.68408203125, -0.629302978515625, -0.57452392578125, -0.519744873046875, -0.4649658203125, -0.410186767578125, -0.35540771484375, -0.300628662109375, -0.245849609375, -0.191070556640625, -0.13629150390625, -0.081512451171875, -0.0267333984375, 0.028045654296875, 0.08282470703125, 0.137603759765625, 0.1923828125, 0.247161865234375, 0.30194091796875, 0.356719970703125, 0.4114990234375, 0.466278076171875, 0.52105712890625, 0.575836181640625, 0.630615234375, 0.685394287109375, 0.74017333984375, 0.794952392578125, 0.8497314453125, 0.904510498046875, 0.95928955078125, 1.014068603515625, 1.06884765625, 1.123626708984375, 1.17840576171875, 1.233184814453125, 1.2879638671875, 1.342742919921875, 1.39752197265625, 1.452301025390625, 1.507080078125, 1.561859130859375, 1.61663818359375, 1.671417236328125, 1.7261962890625, 1.780975341796875, 1.83575439453125, 1.890533447265625, 1.9453125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 5.0, 10.0, 16.0, 21.0, 23.0, 35.0, 56.0, 83.0, 146.0, 188.0, 272.0, 468.0, 659.0, 972.0, 1508.0, 2353.0, 3640.0, 5671.0, 8999.0, 14453.0, 23474.0, 39214.0, 66121.0, 115581.0, 199311.0, 1273222.0, 140118.0, 79842.0, 46663.0, 27699.0, 16856.0, 10501.0, 6723.0, 4253.0, 2718.0, 1809.0, 1200.0, 790.0, 489.0, 343.0, 225.0, 151.0, 90.0, 57.0, 38.0, 27.0, 20.0, 14.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.305908203125, -0.2969551086425781, -0.28800201416015625, -0.2790489196777344, -0.2700958251953125, -0.2611427307128906, -0.25218963623046875, -0.24323654174804688, -0.234283447265625, -0.22533035278320312, -0.21637725830078125, -0.20742416381835938, -0.1984710693359375, -0.18951797485351562, -0.18056488037109375, -0.17161178588867188, -0.16265869140625, -0.15370559692382812, -0.14475250244140625, -0.13579940795898438, -0.1268463134765625, -0.11789321899414062, -0.10894012451171875, -0.09998703002929688, -0.091033935546875, -0.08208084106445312, -0.07312774658203125, -0.06417465209960938, -0.0552215576171875, -0.046268463134765625, -0.03731536865234375, -0.028362274169921875, -0.0194091796875, -0.010456085205078125, -0.00150299072265625, 0.007450103759765625, 0.0164031982421875, 0.025356292724609375, 0.03430938720703125, 0.043262481689453125, 0.052215576171875, 0.061168670654296875, 0.07012176513671875, 0.07907485961914062, 0.0880279541015625, 0.09698104858398438, 0.10593414306640625, 0.11488723754882812, 0.12384033203125, 0.13279342651367188, 0.14174652099609375, 0.15069961547851562, 0.1596527099609375, 0.16860580444335938, 0.17755889892578125, 0.18651199340820312, 0.195465087890625, 0.20441818237304688, 0.21337127685546875, 0.22232437133789062, 0.2312774658203125, 0.24023056030273438, 0.24918365478515625, 0.2581367492675781, 0.26708984375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 9.0, 9.0, 13.0, 23.0, 30.0, 38.0, 20.0, 35.0, 45.0, 44.0, 44.0, 66.0, 55.0, 60.0, 51.0, 57.0, 67.0, 45.0, 50.0, 37.0, 29.0, 36.0, 30.0, 20.0, 13.0, 15.0, 10.0, 14.0, 5.0, 6.0, 5.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008945465087890625, -0.000864759087562561, -0.0008349716663360596, -0.0008051842451095581, -0.0007753968238830566, -0.0007456094026565552, -0.0007158219814300537, -0.0006860345602035522, -0.0006562471389770508, -0.0006264597177505493, -0.0005966722965240479, -0.0005668848752975464, -0.0005370974540710449, -0.0005073100328445435, -0.000477522611618042, -0.00044773519039154053, -0.00041794776916503906, -0.0003881603479385376, -0.00035837292671203613, -0.00032858550548553467, -0.0002987980842590332, -0.00026901066303253174, -0.00023922324180603027, -0.0002094358205795288, -0.00017964839935302734, -0.00014986097812652588, -0.00012007355690002441, -9.028613567352295e-05, -6.0498714447021484e-05, -3.071129322052002e-05, -9.238719940185547e-07, 2.886354923248291e-05, 5.8650970458984375e-05, 8.843839168548584e-05, 0.0001182258129119873, 0.00014801323413848877, 0.00017780065536499023, 0.0002075880765914917, 0.00023737549781799316, 0.00026716291904449463, 0.0002969503402709961, 0.00032673776149749756, 0.000356525182723999, 0.0003863126039505005, 0.00041610002517700195, 0.0004458874464035034, 0.0004756748676300049, 0.0005054622888565063, 0.0005352497100830078, 0.0005650371313095093, 0.0005948245525360107, 0.0006246119737625122, 0.0006543993949890137, 0.0006841868162155151, 0.0007139742374420166, 0.0007437616586685181, 0.0007735490798950195, 0.000803336501121521, 0.0008331239223480225, 0.0008629113435745239, 0.0008926987648010254, 0.0009224861860275269, 0.0009522736072540283, 0.0009820610284805298, 0.0010118484497070312]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 0.0, 6.0, 4.0, 8.0, 13.0, 13.0, 16.0, 13.0, 26.0, 36.0, 45.0, 61.0, 71.0, 96.0, 146.0, 291.0, 746.0, 10334.0, 1016861.0, 18014.0, 844.0, 299.0, 150.0, 115.0, 88.0, 65.0, 51.0, 47.0, 25.0, 19.0, 12.0, 9.0, 10.0, 9.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0223541259765625, -0.02170705795288086, -0.02105998992919922, -0.020412921905517578, -0.019765853881835938, -0.019118785858154297, -0.018471717834472656, -0.017824649810791016, -0.017177581787109375, -0.016530513763427734, -0.015883445739746094, -0.015236377716064453, -0.014589309692382812, -0.013942241668701172, -0.013295173645019531, -0.01264810562133789, -0.01200103759765625, -0.01135396957397461, -0.010706901550292969, -0.010059833526611328, -0.009412765502929688, -0.008765697479248047, -0.008118629455566406, -0.007471561431884766, -0.006824493408203125, -0.006177425384521484, -0.005530357360839844, -0.004883289337158203, -0.0042362213134765625, -0.003589153289794922, -0.0029420852661132812, -0.0022950172424316406, -0.00164794921875, -0.0010008811950683594, -0.00035381317138671875, 0.0002932548522949219, 0.0009403228759765625, 0.0015873908996582031, 0.0022344589233398438, 0.0028815269470214844, 0.003528594970703125, 0.004175662994384766, 0.004822731018066406, 0.005469799041748047, 0.0061168670654296875, 0.006763935089111328, 0.007411003112792969, 0.00805807113647461, 0.00870513916015625, 0.00935220718383789, 0.009999275207519531, 0.010646343231201172, 0.011293411254882812, 0.011940479278564453, 0.012587547302246094, 0.013234615325927734, 0.013881683349609375, 0.014528751373291016, 0.015175819396972656, 0.015822887420654297, 0.016469955444335938, 0.017117023468017578, 0.01776409149169922, 0.01841115951538086, 0.0190582275390625]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 9.0, 51.0, 178.0, 325.0, 273.0, 135.0, 32.0, 9.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00036826252471655607, -0.0003052189131267369, -0.00024217528698500246, -0.00017913166084326804, -0.00011608804925344884, -5.304443766362965e-05, 9.999203030019999e-06, 7.304281461983919e-05, 0.00013608642620965838, 0.00019913003779947758, 0.00026217364938929677, 0.0003252172900829464, 0.0003882609016727656, 0.0004513045132625848, 0.0005143481539562345, 0.0005773917655460536, 0.0006404353771358728, 0.000703478988725692, 0.0007665226003155112, 0.0008295662701129913, 0.0008926098234951496, 0.0009556534932926297, 0.0010186971630901098, 0.001081740716472268, 0.0011447842698544264, 0.0012078279396519065, 0.0012708714930340648, 0.0013339151628315449, 0.0013969587162137032, 0.0014600023860111833, 0.0015230460558086634, 0.0015860896091908216, 0.0016491333954036236, 0.0017121770652011037, 0.001775220618583262, 0.001838264288380742, 0.0019013078417629004, 0.0019643513951450586, 0.0020273951813578606, 0.002090438734740019, 0.002153482288122177, 0.0022165258415043354, 0.0022795696277171373, 0.0023426131810992956, 0.002405656734481454, 0.002468700287863612, 0.002531744074076414, 0.0025947876274585724, 0.0026578311808407307, 0.002720874734222889, 0.002783918520435691, 0.002846962073817849, 0.0029100056272000074, 0.0029730491805821657, 0.0030360929667949677, 0.003099136520177126, 0.003162180306389928, 0.003225223859772086, 0.003288267645984888, 0.0033513111993670464, 0.0034143547527492046, 0.003477398306131363, 0.003540442092344165, 0.003603485645726323, 0.0036665291991084814]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 2.0, 3.0, 4.0, 7.0, 16.0, 15.0, 12.0, 20.0, 19.0, 28.0, 27.0, 30.0, 25.0, 35.0, 38.0, 41.0, 38.0, 33.0, 39.0, 33.0, 33.0, 45.0, 43.0, 46.0, 32.0, 48.0, 29.0, 34.0, 33.0, 32.0, 24.0, 22.0, 16.0, 25.0, 10.0, 13.0, 7.0, 9.0, 6.0, 4.0, 3.0, 9.0, 7.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0004811286926269531, -0.0004660738632082939, -0.0004510190337896347, -0.0004359642043709755, -0.0004209093749523163, -0.0004058545455336571, -0.00039079971611499786, -0.00037574488669633865, -0.00036069005727767944, -0.00034563522785902023, -0.000330580398440361, -0.0003155255690217018, -0.0003004707396030426, -0.0002854159101843834, -0.0002703610807657242, -0.00025530625134706497, -0.00024025142192840576, -0.00022519659250974655, -0.00021014176309108734, -0.00019508693367242813, -0.00018003210425376892, -0.0001649772748351097, -0.0001499224454164505, -0.0001348676159977913, -0.00011981278657913208, -0.00010475795716047287, -8.970312774181366e-05, -7.464829832315445e-05, -5.959346890449524e-05, -4.453863948583603e-05, -2.948381006717682e-05, -1.4428980648517609e-05, 6.258487701416016e-07, 1.5680678188800812e-05, 3.073550760746002e-05, 4.579033702611923e-05, 6.084516644477844e-05, 7.589999586343765e-05, 9.095482528209686e-05, 0.00010600965470075607, 0.00012106448411941528, 0.0001361193135380745, 0.0001511741429567337, 0.00016622897237539291, 0.00018128380179405212, 0.00019633863121271133, 0.00021139346063137054, 0.00022644829005002975, 0.00024150311946868896, 0.0002565579488873482, 0.0002716127783060074, 0.0002866676077246666, 0.0003017224371433258, 0.000316777266561985, 0.0003318320959806442, 0.00034688692539930344, 0.00036194175481796265, 0.00037699658423662186, 0.00039205141365528107, 0.0004071062430739403, 0.0004221610724925995, 0.0004372159019112587, 0.0004522707313299179, 0.0004673255607485771, 0.00048238039016723633]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 11.0, 7.0, 5.0, 6.0, 8.0, 7.0, 16.0, 22.0, 14.0, 29.0, 25.0, 26.0, 32.0, 33.0, 33.0, 45.0, 44.0, 41.0, 44.0, 39.0, 39.0, 47.0, 34.0, 45.0, 28.0, 31.0, 36.0, 35.0, 29.0, 41.0, 33.0, 19.0, 14.0, 14.0, 15.0, 10.0, 13.0, 9.0, 3.0, 7.0, 3.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.328125, -3.236297607421875, -3.14447021484375, -3.052642822265625, -2.9608154296875, -2.868988037109375, -2.77716064453125, -2.685333251953125, -2.593505859375, -2.501678466796875, -2.40985107421875, -2.318023681640625, -2.2261962890625, -2.134368896484375, -2.04254150390625, -1.950714111328125, -1.85888671875, -1.767059326171875, -1.67523193359375, -1.583404541015625, -1.4915771484375, -1.399749755859375, -1.30792236328125, -1.216094970703125, -1.124267578125, -1.032440185546875, -0.94061279296875, -0.848785400390625, -0.7569580078125, -0.665130615234375, -0.57330322265625, -0.481475830078125, -0.3896484375, -0.297821044921875, -0.20599365234375, -0.114166259765625, -0.0223388671875, 0.069488525390625, 0.16131591796875, 0.253143310546875, 0.344970703125, 0.436798095703125, 0.52862548828125, 0.620452880859375, 0.7122802734375, 0.804107666015625, 0.89593505859375, 0.987762451171875, 1.07958984375, 1.171417236328125, 1.26324462890625, 1.355072021484375, 1.4468994140625, 1.538726806640625, 1.63055419921875, 1.722381591796875, 1.814208984375, 1.906036376953125, 1.99786376953125, 2.089691162109375, 2.1815185546875, 2.273345947265625, 2.36517333984375, 2.457000732421875, 2.548828125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 2.0, 6.0, 8.0, 11.0, 16.0, 15.0, 16.0, 22.0, 27.0, 30.0, 53.0, 66.0, 68.0, 120.0, 191.0, 376.0, 743.0, 1672.0, 3992.0, 9455.0, 22631.0, 52859.0, 120691.0, 278313.0, 313941.0, 137597.0, 60436.0, 25803.0, 11000.0, 4521.0, 1922.0, 817.0, 394.0, 211.0, 146.0, 80.0, 72.0, 56.0, 41.0, 27.0, 26.0, 25.0, 12.0, 14.0, 12.0, 5.0, 7.0, 4.0, 4.0, 2.0, 1.0, 3.0], "bins": [-3.48046875, -3.384002685546875, -3.28753662109375, -3.191070556640625, -3.0946044921875, -2.998138427734375, -2.90167236328125, -2.805206298828125, -2.708740234375, -2.612274169921875, -2.51580810546875, -2.419342041015625, -2.3228759765625, -2.226409912109375, -2.12994384765625, -2.033477783203125, -1.93701171875, -1.840545654296875, -1.74407958984375, -1.647613525390625, -1.5511474609375, -1.454681396484375, -1.35821533203125, -1.261749267578125, -1.165283203125, -1.068817138671875, -0.97235107421875, -0.875885009765625, -0.7794189453125, -0.682952880859375, -0.58648681640625, -0.490020751953125, -0.3935546875, -0.297088623046875, -0.20062255859375, -0.104156494140625, -0.0076904296875, 0.088775634765625, 0.18524169921875, 0.281707763671875, 0.378173828125, 0.474639892578125, 0.57110595703125, 0.667572021484375, 0.7640380859375, 0.860504150390625, 0.95697021484375, 1.053436279296875, 1.14990234375, 1.246368408203125, 1.34283447265625, 1.439300537109375, 1.5357666015625, 1.632232666015625, 1.72869873046875, 1.825164794921875, 1.921630859375, 2.018096923828125, 2.11456298828125, 2.211029052734375, 2.3074951171875, 2.403961181640625, 2.50042724609375, 2.596893310546875, 2.693359375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 11.0, 8.0, 8.0, 5.0, 12.0, 23.0, 16.0, 14.0, 23.0, 32.0, 37.0, 30.0, 34.0, 39.0, 36.0, 46.0, 58.0, 88.0, 187.0, 1442.0, 306.0, 132.0, 66.0, 43.0, 41.0, 40.0, 35.0, 25.0, 27.0, 24.0, 30.0, 21.0, 18.0, 12.0, 13.0, 10.0, 7.0, 11.0, 11.0, 10.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.796875, -8.520263671875, -8.24365234375, -7.967041015625, -7.6904296875, -7.413818359375, -7.13720703125, -6.860595703125, -6.583984375, -6.307373046875, -6.03076171875, -5.754150390625, -5.4775390625, -5.200927734375, -4.92431640625, -4.647705078125, -4.37109375, -4.094482421875, -3.81787109375, -3.541259765625, -3.2646484375, -2.988037109375, -2.71142578125, -2.434814453125, -2.158203125, -1.881591796875, -1.60498046875, -1.328369140625, -1.0517578125, -0.775146484375, -0.49853515625, -0.221923828125, 0.0546875, 0.331298828125, 0.60791015625, 0.884521484375, 1.1611328125, 1.437744140625, 1.71435546875, 1.990966796875, 2.267578125, 2.544189453125, 2.82080078125, 3.097412109375, 3.3740234375, 3.650634765625, 3.92724609375, 4.203857421875, 4.48046875, 4.757080078125, 5.03369140625, 5.310302734375, 5.5869140625, 5.863525390625, 6.14013671875, 6.416748046875, 6.693359375, 6.969970703125, 7.24658203125, 7.523193359375, 7.7998046875, 8.076416015625, 8.35302734375, 8.629638671875, 8.90625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 7.0, 3.0, 2.0, 1.0, 3.0, 9.0, 8.0, 10.0, 16.0, 15.0, 16.0, 27.0, 33.0, 51.0, 56.0, 93.0, 135.0, 238.0, 514.0, 1176.0, 17447.0, 3116982.0, 6715.0, 1004.0, 434.0, 220.0, 139.0, 90.0, 62.0, 43.0, 32.0, 31.0, 17.0, 24.0, 13.0, 10.0, 4.0, 8.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.09375, -38.85693359375, -37.6201171875, -36.38330078125, -35.146484375, -33.90966796875, -32.6728515625, -31.43603515625, -30.19921875, -28.96240234375, -27.7255859375, -26.48876953125, -25.251953125, -24.01513671875, -22.7783203125, -21.54150390625, -20.3046875, -19.06787109375, -17.8310546875, -16.59423828125, -15.357421875, -14.12060546875, -12.8837890625, -11.64697265625, -10.41015625, -9.17333984375, -7.9365234375, -6.69970703125, -5.462890625, -4.22607421875, -2.9892578125, -1.75244140625, -0.515625, 0.72119140625, 1.9580078125, 3.19482421875, 4.431640625, 5.66845703125, 6.9052734375, 8.14208984375, 9.37890625, 10.61572265625, 11.8525390625, 13.08935546875, 14.326171875, 15.56298828125, 16.7998046875, 18.03662109375, 19.2734375, 20.51025390625, 21.7470703125, 22.98388671875, 24.220703125, 25.45751953125, 26.6943359375, 27.93115234375, 29.16796875, 30.40478515625, 31.6416015625, 32.87841796875, 34.115234375, 35.35205078125, 36.5888671875, 37.82568359375, 39.0625]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 67.0, 357.0, 404.0, 165.0, 18.0, 3.0], "bins": [-90.95111083984375, -89.43952941894531, -87.92794036865234, -86.4163589477539, -84.90476989746094, -83.3931884765625, -81.88160705566406, -80.3700180053711, -78.85843658447266, -77.34685516357422, -75.83526611328125, -74.32368469238281, -72.81209564208984, -71.3005142211914, -69.78892517089844, -68.27734375, -66.76575469970703, -65.2541732788086, -63.742584228515625, -62.23100280761719, -60.719417572021484, -59.20783233642578, -57.69624710083008, -56.184661865234375, -54.67308044433594, -53.161495208740234, -51.64990997314453, -50.138328552246094, -48.62674331665039, -47.11515808105469, -45.603572845458984, -44.09198760986328, -42.58039855957031, -41.06881332397461, -39.557228088378906, -38.04564666748047, -36.534061431884766, -35.02247619628906, -33.51089096069336, -31.999305725097656, -30.487722396850586, -28.976137161254883, -27.464553833007812, -25.95296859741211, -24.441383361816406, -22.929798126220703, -21.418214797973633, -19.90662956237793, -18.39504623413086, -16.883460998535156, -15.37187671661377, -13.860292434692383, -12.34870719909668, -10.837122917175293, -9.325538635253906, -7.813953399658203, -6.302368640899658, -4.790783882141113, -3.2791993618011475, -1.7676148414611816, -0.2560300827026367, 1.2555546760559082, 2.767138957977295, 4.278724193572998, 5.790308475494385]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 3.0, 4.0, 5.0, 8.0, 6.0, 18.0, 18.0, 17.0, 13.0, 32.0, 28.0, 21.0, 24.0, 25.0, 22.0, 33.0, 27.0, 40.0, 33.0, 38.0, 33.0, 48.0, 38.0, 26.0, 31.0, 43.0, 30.0, 30.0, 29.0, 39.0, 33.0, 29.0, 26.0, 15.0, 26.0, 13.0, 12.0, 12.0, 9.0, 14.0, 13.0, 6.0, 7.0, 8.0, 5.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.692134857177734, -19.065324783325195, -18.438514709472656, -17.81170654296875, -17.18489646911621, -16.558086395263672, -15.931276321411133, -15.304466247558594, -14.677657127380371, -14.050847053527832, -13.42403793334961, -12.79722785949707, -12.170417785644531, -11.543608665466309, -10.91679859161377, -10.289989471435547, -9.663179397583008, -9.036369323730469, -8.409560203552246, -7.782750129699707, -7.155940532684326, -6.529130935668945, -5.902320861816406, -5.275511264801025, -4.6487016677856445, -4.021892070770264, -3.3950822353363037, -2.7682723999023438, -2.141462802886963, -1.514653205871582, -0.8878433704376221, -0.2610335350036621, 0.36577796936035156, 0.992587685585022, 1.6193974018096924, 2.2462072372436523, 2.873016834259033, 3.499826431274414, 4.126636505126953, 4.753446102142334, 5.380255699157715, 6.007065296173096, 6.633874893188477, 7.260684967041016, 7.8874945640563965, 8.514304161071777, 9.141114234924316, 9.767923355102539, 10.394733428955078, 11.021543502807617, 11.64835262298584, 12.275162696838379, 12.901971817016602, 13.52878189086914, 14.15559196472168, 14.782402038574219, 15.409211158752441, 16.036020278930664, 16.662830352783203, 17.289640426635742, 17.91645050048828, 18.543258666992188, 19.170068740844727, 19.796878814697266, 20.423688888549805]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 6.0, 8.0, 6.0, 11.0, 9.0, 12.0, 8.0, 27.0, 16.0, 23.0, 34.0, 31.0, 29.0, 40.0, 28.0, 35.0, 43.0, 40.0, 40.0, 43.0, 40.0, 38.0, 56.0, 35.0, 35.0, 45.0, 31.0, 39.0, 26.0, 15.0, 32.0, 21.0, 15.0, 21.0, 10.0, 14.0, 12.0, 4.0, 9.0, 4.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.455078125, -3.350677490234375, -3.24627685546875, -3.141876220703125, -3.0374755859375, -2.933074951171875, -2.82867431640625, -2.724273681640625, -2.619873046875, -2.515472412109375, -2.41107177734375, -2.306671142578125, -2.2022705078125, -2.097869873046875, -1.99346923828125, -1.889068603515625, -1.78466796875, -1.680267333984375, -1.57586669921875, -1.471466064453125, -1.3670654296875, -1.262664794921875, -1.15826416015625, -1.053863525390625, -0.949462890625, -0.845062255859375, -0.74066162109375, -0.636260986328125, -0.5318603515625, -0.427459716796875, -0.32305908203125, -0.218658447265625, -0.1142578125, -0.009857177734375, 0.09454345703125, 0.198944091796875, 0.3033447265625, 0.407745361328125, 0.51214599609375, 0.616546630859375, 0.720947265625, 0.825347900390625, 0.92974853515625, 1.034149169921875, 1.1385498046875, 1.242950439453125, 1.34735107421875, 1.451751708984375, 1.55615234375, 1.660552978515625, 1.76495361328125, 1.869354248046875, 1.9737548828125, 2.078155517578125, 2.18255615234375, 2.286956787109375, 2.391357421875, 2.495758056640625, 2.60015869140625, 2.704559326171875, 2.8089599609375, 2.913360595703125, 3.01776123046875, 3.122161865234375, 3.2265625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 16.0, 9.0, 23.0, 17.0, 24.0, 26.0, 29.0, 53.0, 63.0, 68.0, 95.0, 116.0, 158.0, 344.0, 1104.0, 13575.0, 467158.0, 3162709.0, 530768.0, 15528.0, 1274.0, 398.0, 155.0, 120.0, 70.0, 79.0, 61.0, 50.0, 43.0, 28.0, 26.0, 18.0, 14.0, 13.0, 10.0, 8.0, 11.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.171875, -9.868408203125, -9.56494140625, -9.261474609375, -8.9580078125, -8.654541015625, -8.35107421875, -8.047607421875, -7.744140625, -7.440673828125, -7.13720703125, -6.833740234375, -6.5302734375, -6.226806640625, -5.92333984375, -5.619873046875, -5.31640625, -5.012939453125, -4.70947265625, -4.406005859375, -4.1025390625, -3.799072265625, -3.49560546875, -3.192138671875, -2.888671875, -2.585205078125, -2.28173828125, -1.978271484375, -1.6748046875, -1.371337890625, -1.06787109375, -0.764404296875, -0.4609375, -0.157470703125, 0.14599609375, 0.449462890625, 0.7529296875, 1.056396484375, 1.35986328125, 1.663330078125, 1.966796875, 2.270263671875, 2.57373046875, 2.877197265625, 3.1806640625, 3.484130859375, 3.78759765625, 4.091064453125, 4.39453125, 4.697998046875, 5.00146484375, 5.304931640625, 5.6083984375, 5.911865234375, 6.21533203125, 6.518798828125, 6.822265625, 7.125732421875, 7.42919921875, 7.732666015625, 8.0361328125, 8.339599609375, 8.64306640625, 8.946533203125, 9.25]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 10.0, 2.0, 3.0, 12.0, 10.0, 13.0, 23.0, 30.0, 30.0, 44.0, 58.0, 74.0, 95.0, 135.0, 197.0, 237.0, 339.0, 435.0, 473.0, 447.0, 363.0, 275.0, 196.0, 161.0, 101.0, 74.0, 56.0, 37.0, 41.0, 29.0, 11.0, 19.0, 12.0, 10.0, 2.0, 2.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.37109375, -6.18682861328125, -6.0025634765625, -5.81829833984375, -5.634033203125, -5.44976806640625, -5.2655029296875, -5.08123779296875, -4.89697265625, -4.71270751953125, -4.5284423828125, -4.34417724609375, -4.159912109375, -3.97564697265625, -3.7913818359375, -3.60711669921875, -3.4228515625, -3.23858642578125, -3.0543212890625, -2.87005615234375, -2.685791015625, -2.50152587890625, -2.3172607421875, -2.13299560546875, -1.94873046875, -1.76446533203125, -1.5802001953125, -1.39593505859375, -1.211669921875, -1.02740478515625, -0.8431396484375, -0.65887451171875, -0.474609375, -0.29034423828125, -0.1060791015625, 0.07818603515625, 0.262451171875, 0.44671630859375, 0.6309814453125, 0.81524658203125, 0.99951171875, 1.18377685546875, 1.3680419921875, 1.55230712890625, 1.736572265625, 1.92083740234375, 2.1051025390625, 2.28936767578125, 2.4736328125, 2.65789794921875, 2.8421630859375, 3.02642822265625, 3.210693359375, 3.39495849609375, 3.5792236328125, 3.76348876953125, 3.94775390625, 4.13201904296875, 4.3162841796875, 4.50054931640625, 4.684814453125, 4.86907958984375, 5.0533447265625, 5.23760986328125, 5.421875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 3.0, 3.0, 16.0, 10.0, 17.0, 32.0, 34.0, 36.0, 57.0, 74.0, 103.0, 168.0, 222.0, 388.0, 632.0, 9093.0, 3940261.0, 240539.0, 1177.0, 439.0, 279.0, 191.0, 122.0, 89.0, 83.0, 43.0, 45.0, 26.0, 21.0, 15.0, 13.0, 11.0, 5.0, 5.0, 4.0, 7.0, 2.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.359375, -27.405517578125, -26.45166015625, -25.497802734375, -24.5439453125, -23.590087890625, -22.63623046875, -21.682373046875, -20.728515625, -19.774658203125, -18.82080078125, -17.866943359375, -16.9130859375, -15.959228515625, -15.00537109375, -14.051513671875, -13.09765625, -12.143798828125, -11.18994140625, -10.236083984375, -9.2822265625, -8.328369140625, -7.37451171875, -6.420654296875, -5.466796875, -4.512939453125, -3.55908203125, -2.605224609375, -1.6513671875, -0.697509765625, 0.25634765625, 1.210205078125, 2.1640625, 3.117919921875, 4.07177734375, 5.025634765625, 5.9794921875, 6.933349609375, 7.88720703125, 8.841064453125, 9.794921875, 10.748779296875, 11.70263671875, 12.656494140625, 13.6103515625, 14.564208984375, 15.51806640625, 16.471923828125, 17.42578125, 18.379638671875, 19.33349609375, 20.287353515625, 21.2412109375, 22.195068359375, 23.14892578125, 24.102783203125, 25.056640625, 26.010498046875, 26.96435546875, 27.918212890625, 28.8720703125, 29.825927734375, 30.77978515625, 31.733642578125, 32.6875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 21.0, 75.0, 188.0, 310.0, 240.0, 136.0, 37.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.42640495300293, -12.593167304992676, -10.759929656982422, -8.926691055297852, -7.093453407287598, -5.260215759277344, -3.4269771575927734, -1.5937395095825195, 0.23949813842773438, 2.0727360248565674, 3.9059739112854004, 5.7392120361328125, 7.572449684143066, 9.40568733215332, 11.23892593383789, 13.072163581848145, 14.905401229858398, 16.73863983154297, 18.571876525878906, 20.405115127563477, 22.238353729248047, 24.071590423583984, 25.904829025268555, 27.738067626953125, 29.571304321289062, 31.404542922973633, 33.2377815246582, 35.07101821899414, 36.90425491333008, 38.73749542236328, 40.57073211669922, 42.403968811035156, 44.237205505371094, 46.07044219970703, 47.903682708740234, 49.73691940307617, 51.57015609741211, 53.40339660644531, 55.23663330078125, 57.06986999511719, 58.903106689453125, 60.73634338378906, 62.569583892822266, 64.40281677246094, 66.2360610961914, 68.06929779052734, 69.90253448486328, 71.73577117919922, 73.56901550292969, 75.40225219726562, 77.23548889160156, 79.0687255859375, 80.90196990966797, 82.7352066040039, 84.56844329833984, 86.40167999267578, 88.23491668701172, 90.06815338134766, 91.9013900756836, 93.73463439941406, 95.56787109375, 97.40110778808594, 99.23434448242188, 101.06758117675781, 102.90081787109375]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 5.0, 2.0, 5.0, 8.0, 7.0, 11.0, 11.0, 17.0, 17.0, 16.0, 30.0, 27.0, 29.0, 29.0, 38.0, 41.0, 37.0, 49.0, 57.0, 52.0, 49.0, 41.0, 40.0, 34.0, 51.0, 30.0, 39.0, 36.0, 39.0, 30.0, 17.0, 26.0, 14.0, 12.0, 8.0, 12.0, 11.0, 9.0, 4.0, 7.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.768802642822266, -22.105358123779297, -21.441913604736328, -20.77846908569336, -20.11502456665039, -19.451580047607422, -18.788135528564453, -18.124691009521484, -17.461246490478516, -16.797801971435547, -16.134357452392578, -15.47091293334961, -14.80746841430664, -14.144023895263672, -13.48058032989502, -12.81713581085205, -12.153692245483398, -11.49024772644043, -10.826803207397461, -10.163358688354492, -9.499914169311523, -8.836469650268555, -8.173026084899902, -7.509581565856934, -6.846137046813965, -6.182692527770996, -5.519248008728027, -4.855803966522217, -4.192359447479248, -3.5289149284362793, -2.8654706478118896, -2.2020263671875, -1.5385799407958984, -0.8751355409622192, -0.21169114112854004, 0.45175325870513916, 1.1151976585388184, 1.778642177581787, 2.4420864582061768, 3.1055307388305664, 3.768975257873535, 4.432419776916504, 5.095864295959473, 5.759308338165283, 6.422752857208252, 7.086197376251221, 7.749641418457031, 8.4130859375, 9.076530456542969, 9.739974975585938, 10.403419494628906, 11.066864013671875, 11.730308532714844, 12.393753051757812, 13.057196617126465, 13.720641136169434, 14.384085655212402, 15.047530174255371, 15.71097469329834, 16.374418258666992, 17.03786277770996, 17.70130729675293, 18.3647518157959, 19.028196334838867, 19.691640853881836]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 7.0, 3.0, 10.0, 9.0, 9.0, 8.0, 19.0, 16.0, 22.0, 25.0, 22.0, 27.0, 36.0, 34.0, 36.0, 34.0, 27.0, 37.0, 54.0, 40.0, 37.0, 39.0, 42.0, 42.0, 39.0, 48.0, 40.0, 27.0, 26.0, 30.0, 28.0, 21.0, 11.0, 12.0, 19.0, 12.0, 17.0, 7.0, 9.0, 5.0, 6.0, 7.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.54296875, -3.4454345703125, -3.347900390625, -3.2503662109375, -3.15283203125, -3.0552978515625, -2.957763671875, -2.8602294921875, -2.7626953125, -2.6651611328125, -2.567626953125, -2.4700927734375, -2.37255859375, -2.2750244140625, -2.177490234375, -2.0799560546875, -1.982421875, -1.8848876953125, -1.787353515625, -1.6898193359375, -1.59228515625, -1.4947509765625, -1.397216796875, -1.2996826171875, -1.2021484375, -1.1046142578125, -1.007080078125, -0.9095458984375, -0.81201171875, -0.7144775390625, -0.616943359375, -0.5194091796875, -0.421875, -0.3243408203125, -0.226806640625, -0.1292724609375, -0.03173828125, 0.0657958984375, 0.163330078125, 0.2608642578125, 0.3583984375, 0.4559326171875, 0.553466796875, 0.6510009765625, 0.74853515625, 0.8460693359375, 0.943603515625, 1.0411376953125, 1.138671875, 1.2362060546875, 1.333740234375, 1.4312744140625, 1.52880859375, 1.6263427734375, 1.723876953125, 1.8214111328125, 1.9189453125, 2.0164794921875, 2.114013671875, 2.2115478515625, 2.30908203125, 2.4066162109375, 2.504150390625, 2.6016845703125, 2.69921875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 5.0, 14.0, 16.0, 23.0, 36.0, 75.0, 80.0, 104.0, 143.0, 210.0, 322.0, 444.0, 673.0, 808.0, 1266.0, 1721.0, 2394.0, 3479.0, 4890.0, 6853.0, 9853.0, 14136.0, 21067.0, 31714.0, 47856.0, 74776.0, 117316.0, 176022.0, 180315.0, 121587.0, 77489.0, 49603.0, 32404.0, 21797.0, 14797.0, 10144.0, 7063.0, 4980.0, 3517.0, 2474.0, 1779.0, 1231.0, 899.0, 648.0, 465.0, 322.0, 230.0, 165.0, 112.0, 73.0, 58.0, 42.0, 26.0, 16.0, 12.0, 6.0, 8.0, 2.0, 3.0, 2.0], "bins": [-0.297607421875, -0.2883186340332031, -0.27902984619140625, -0.2697410583496094, -0.2604522705078125, -0.2511634826660156, -0.24187469482421875, -0.23258590698242188, -0.223297119140625, -0.21400833129882812, -0.20471954345703125, -0.19543075561523438, -0.1861419677734375, -0.17685317993164062, -0.16756439208984375, -0.15827560424804688, -0.14898681640625, -0.13969802856445312, -0.13040924072265625, -0.12112045288085938, -0.1118316650390625, -0.10254287719726562, -0.09325408935546875, -0.08396530151367188, -0.074676513671875, -0.06538772583007812, -0.05609893798828125, -0.046810150146484375, -0.0375213623046875, -0.028232574462890625, -0.01894378662109375, -0.009654998779296875, -0.0003662109375, 0.008922576904296875, 0.01821136474609375, 0.027500152587890625, 0.0367889404296875, 0.046077728271484375, 0.05536651611328125, 0.06465530395507812, 0.073944091796875, 0.08323287963867188, 0.09252166748046875, 0.10181045532226562, 0.1110992431640625, 0.12038803100585938, 0.12967681884765625, 0.13896560668945312, 0.14825439453125, 0.15754318237304688, 0.16683197021484375, 0.17612075805664062, 0.1854095458984375, 0.19469833374023438, 0.20398712158203125, 0.21327590942382812, 0.222564697265625, 0.23185348510742188, 0.24114227294921875, 0.2504310607910156, 0.2597198486328125, 0.2690086364746094, 0.27829742431640625, 0.2875862121582031, 0.296875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 7.0, 7.0, 7.0, 8.0, 15.0, 14.0, 13.0, 12.0, 22.0, 26.0, 25.0, 25.0, 23.0, 32.0, 31.0, 34.0, 49.0, 45.0, 44.0, 1060.0, 47.0, 57.0, 49.0, 44.0, 40.0, 36.0, 32.0, 24.0, 23.0, 34.0, 23.0, 22.0, 21.0, 14.0, 18.0, 12.0, 10.0, 5.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2421875, -2.173797607421875, -2.10540771484375, -2.037017822265625, -1.9686279296875, -1.900238037109375, -1.83184814453125, -1.763458251953125, -1.695068359375, -1.626678466796875, -1.55828857421875, -1.489898681640625, -1.4215087890625, -1.353118896484375, -1.28472900390625, -1.216339111328125, -1.14794921875, -1.079559326171875, -1.01116943359375, -0.942779541015625, -0.8743896484375, -0.805999755859375, -0.73760986328125, -0.669219970703125, -0.600830078125, -0.532440185546875, -0.46405029296875, -0.395660400390625, -0.3272705078125, -0.258880615234375, -0.19049072265625, -0.122100830078125, -0.0537109375, 0.014678955078125, 0.08306884765625, 0.151458740234375, 0.2198486328125, 0.288238525390625, 0.35662841796875, 0.425018310546875, 0.493408203125, 0.561798095703125, 0.63018798828125, 0.698577880859375, 0.7669677734375, 0.835357666015625, 0.90374755859375, 0.972137451171875, 1.04052734375, 1.108917236328125, 1.17730712890625, 1.245697021484375, 1.3140869140625, 1.382476806640625, 1.45086669921875, 1.519256591796875, 1.587646484375, 1.656036376953125, 1.72442626953125, 1.792816162109375, 1.8612060546875, 1.929595947265625, 1.99798583984375, 2.066375732421875, 2.134765625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 11.0, 13.0, 16.0, 28.0, 34.0, 56.0, 63.0, 94.0, 165.0, 216.0, 287.0, 425.0, 684.0, 942.0, 1432.0, 2282.0, 3350.0, 5305.0, 8113.0, 12844.0, 20096.0, 32685.0, 53131.0, 88320.0, 148627.0, 1260752.0, 177725.0, 108575.0, 64784.0, 38984.0, 24119.0, 14963.0, 9545.0, 6094.0, 4146.0, 2697.0, 1866.0, 1176.0, 790.0, 567.0, 393.0, 252.0, 162.0, 121.0, 67.0, 52.0, 36.0, 24.0, 8.0, 5.0, 3.0, 6.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.303466796875, -0.2944602966308594, -0.28545379638671875, -0.2764472961425781, -0.2674407958984375, -0.2584342956542969, -0.24942779541015625, -0.24042129516601562, -0.231414794921875, -0.22240829467773438, -0.21340179443359375, -0.20439529418945312, -0.1953887939453125, -0.18638229370117188, -0.17737579345703125, -0.16836929321289062, -0.15936279296875, -0.15035629272460938, -0.14134979248046875, -0.13234329223632812, -0.1233367919921875, -0.11433029174804688, -0.10532379150390625, -0.09631729125976562, -0.087310791015625, -0.07830429077148438, -0.06929779052734375, -0.060291290283203125, -0.0512847900390625, -0.042278289794921875, -0.03327178955078125, -0.024265289306640625, -0.0152587890625, -0.006252288818359375, 0.00275421142578125, 0.011760711669921875, 0.0207672119140625, 0.029773712158203125, 0.03878021240234375, 0.047786712646484375, 0.056793212890625, 0.06579971313476562, 0.07480621337890625, 0.08381271362304688, 0.0928192138671875, 0.10182571411132812, 0.11083221435546875, 0.11983871459960938, 0.12884521484375, 0.13785171508789062, 0.14685821533203125, 0.15586471557617188, 0.1648712158203125, 0.17387771606445312, 0.18288421630859375, 0.19189071655273438, 0.200897216796875, 0.20990371704101562, 0.21891021728515625, 0.22791671752929688, 0.2369232177734375, 0.24592971801757812, 0.25493621826171875, 0.2639427185058594, 0.27294921875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 6.0, 13.0, 14.0, 11.0, 19.0, 11.0, 24.0, 45.0, 38.0, 38.0, 64.0, 65.0, 67.0, 71.0, 71.0, 64.0, 67.0, 49.0, 49.0, 43.0, 35.0, 22.0, 23.0, 18.0, 18.0, 13.0, 11.0, 6.0, 6.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001544952392578125, -0.0015029311180114746, -0.0014609098434448242, -0.0014188885688781738, -0.0013768672943115234, -0.001334846019744873, -0.0012928247451782227, -0.0012508034706115723, -0.0012087821960449219, -0.0011667609214782715, -0.001124739646911621, -0.0010827183723449707, -0.0010406970977783203, -0.00099867582321167, -0.0009566545486450195, -0.0009146332740783691, -0.0008726119995117188, -0.0008305907249450684, -0.000788569450378418, -0.0007465481758117676, -0.0007045269012451172, -0.0006625056266784668, -0.0006204843521118164, -0.000578463077545166, -0.0005364418029785156, -0.0004944205284118652, -0.00045239925384521484, -0.00041037797927856445, -0.00036835670471191406, -0.00032633543014526367, -0.0002843141555786133, -0.0002422928810119629, -0.0002002716064453125, -0.0001582503318786621, -0.00011622905731201172, -7.420778274536133e-05, -3.218650817871094e-05, 9.834766387939453e-06, 5.1856040954589844e-05, 9.387731552124023e-05, 0.00013589859008789062, 0.00017791986465454102, 0.0002199411392211914, 0.0002619624137878418, 0.0003039836883544922, 0.0003460049629211426, 0.00038802623748779297, 0.00043004751205444336, 0.00047206878662109375, 0.0005140900611877441, 0.0005561113357543945, 0.0005981326103210449, 0.0006401538848876953, 0.0006821751594543457, 0.0007241964340209961, 0.0007662177085876465, 0.0008082389831542969, 0.0008502602577209473, 0.0008922815322875977, 0.000934302806854248, 0.0009763240814208984, 0.0010183453559875488, 0.0010603666305541992, 0.0011023879051208496, 0.0011444091796875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 13.0, 13.0, 14.0, 20.0, 22.0, 23.0, 49.0, 63.0, 77.0, 113.0, 149.0, 294.0, 659.0, 7015.0, 1032095.0, 6450.0, 668.0, 297.0, 137.0, 98.0, 76.0, 52.0, 34.0, 31.0, 21.0, 19.0, 12.0, 14.0, 3.0, 4.0, 9.0, 5.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0255889892578125, -0.024690866470336914, -0.023792743682861328, -0.022894620895385742, -0.021996498107910156, -0.02109837532043457, -0.020200252532958984, -0.0193021297454834, -0.018404006958007812, -0.017505884170532227, -0.01660776138305664, -0.015709638595581055, -0.014811515808105469, -0.013913393020629883, -0.013015270233154297, -0.012117147445678711, -0.011219024658203125, -0.010320901870727539, -0.009422779083251953, -0.008524656295776367, -0.007626533508300781, -0.006728410720825195, -0.005830287933349609, -0.0049321651458740234, -0.0040340423583984375, -0.0031359195709228516, -0.0022377967834472656, -0.0013396739959716797, -0.00044155120849609375, 0.0004565715789794922, 0.0013546943664550781, 0.002252817153930664, 0.00315093994140625, 0.004049062728881836, 0.004947185516357422, 0.005845308303833008, 0.006743431091308594, 0.00764155387878418, 0.008539676666259766, 0.009437799453735352, 0.010335922241210938, 0.011234045028686523, 0.01213216781616211, 0.013030290603637695, 0.013928413391113281, 0.014826536178588867, 0.015724658966064453, 0.01662278175354004, 0.017520904541015625, 0.01841902732849121, 0.019317150115966797, 0.020215272903442383, 0.02111339569091797, 0.022011518478393555, 0.02290964126586914, 0.023807764053344727, 0.024705886840820312, 0.0256040096282959, 0.026502132415771484, 0.02740025520324707, 0.028298377990722656, 0.029196500778198242, 0.030094623565673828, 0.030992746353149414, 0.031890869140625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [9.0, 28.0, 216.0, 504.0, 226.0, 32.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00036319735227152705, -0.00025987246772274375, -0.00015654756862204522, -5.322266952134669e-05, 5.0102215027436614e-05, 0.00015342712868005037, 0.0002567520132288337, 0.000360076897777617, 0.0004634017823264003, 0.0005667266668751836, 0.0006700515514239669, 0.0007733764359727502, 0.0008767013205215335, 0.0009800263214856386, 0.001083351206034422, 0.0011866760905832052, 0.0012900009751319885, 0.0013933258596807718, 0.0014966507442295551, 0.0015999756287783384, 0.0017033005133271217, 0.001806625397875905, 0.0019099502824246883, 0.0020132751669734716, 0.002116600051522255, 0.0022199249360710382, 0.0023232498206198215, 0.002426574705168605, 0.002529899589717388, 0.0026332244742661715, 0.0027365493588149548, 0.002839874243363738, 0.002943199360743165, 0.0030465242452919483, 0.0031498491298407316, 0.003253174014389515, 0.0033564988989382982, 0.0034598237834870815, 0.003563148668035865, 0.003666473552584648, 0.0037697984371334314, 0.0038731233216822147, 0.003976448439061642, 0.004079773090779781, 0.004183098208159208, 0.004286422859877348, 0.004389747977256775, 0.0044930726289749146, 0.0045963977463543415, 0.0046997228637337685, 0.004803047515451908, 0.004906372632831335, 0.005009697284549475, 0.005113022401928902, 0.005216347053647041, 0.005319672171026468, 0.005422996822744608, 0.005526321940124035, 0.0056296465918421745, 0.0057329717092216015, 0.005836296360939741, 0.005939621478319168, 0.006042946130037308, 0.006146271247416735, 0.006249595899134874]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 3.0, 5.0, 11.0, 9.0, 11.0, 11.0, 20.0, 17.0, 20.0, 22.0, 29.0, 28.0, 38.0, 29.0, 45.0, 37.0, 38.0, 33.0, 36.0, 30.0, 41.0, 43.0, 47.0, 37.0, 36.0, 29.0, 43.0, 39.0, 20.0, 35.0, 16.0, 18.0, 18.0, 27.0, 13.0, 17.0, 4.0, 5.0, 14.0, 5.0, 6.0, 6.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.000550389289855957, -0.0005315355956554413, -0.0005126819014549255, -0.0004938282072544098, -0.00047497451305389404, -0.0004561208188533783, -0.00043726712465286255, -0.0004184134304523468, -0.00039955973625183105, -0.0003807060420513153, -0.00036185234785079956, -0.0003429986536502838, -0.00032414495944976807, -0.0003052912652492523, -0.00028643757104873657, -0.0002675838768482208, -0.0002487301826477051, -0.00022987648844718933, -0.00021102279424667358, -0.00019216910004615784, -0.0001733154058456421, -0.00015446171164512634, -0.0001356080174446106, -0.00011675432324409485, -9.79006290435791e-05, -7.904693484306335e-05, -6.019324064254761e-05, -4.133954644203186e-05, -2.2485852241516113e-05, -3.632158041000366e-06, 1.5221536159515381e-05, 3.407523036003113e-05, 5.2928924560546875e-05, 7.178261876106262e-05, 9.063631296157837e-05, 0.00010949000716209412, 0.00012834370136260986, 0.0001471973955631256, 0.00016605108976364136, 0.0001849047839641571, 0.00020375847816467285, 0.0002226121723651886, 0.00024146586656570435, 0.0002603195607662201, 0.00027917325496673584, 0.0002980269491672516, 0.00031688064336776733, 0.0003357343375682831, 0.00035458803176879883, 0.0003734417259693146, 0.0003922954201698303, 0.00041114911437034607, 0.0004300028085708618, 0.00044885650277137756, 0.0004677101969718933, 0.00048656389117240906, 0.0005054175853729248, 0.0005242712795734406, 0.0005431249737739563, 0.000561978667974472, 0.0005808323621749878, 0.0005996860563755035, 0.0006185397505760193, 0.000637393444776535, 0.0006562471389770508]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 7.0, 3.0, 10.0, 9.0, 9.0, 8.0, 19.0, 16.0, 22.0, 25.0, 22.0, 27.0, 36.0, 34.0, 36.0, 34.0, 27.0, 37.0, 54.0, 40.0, 37.0, 39.0, 42.0, 42.0, 39.0, 48.0, 40.0, 27.0, 26.0, 30.0, 28.0, 20.0, 12.0, 12.0, 19.0, 12.0, 17.0, 7.0, 9.0, 5.0, 6.0, 7.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.54296875, -3.4454345703125, -3.347900390625, -3.2503662109375, -3.15283203125, -3.0552978515625, -2.957763671875, -2.8602294921875, -2.7626953125, -2.6651611328125, -2.567626953125, -2.4700927734375, -2.37255859375, -2.2750244140625, -2.177490234375, -2.0799560546875, -1.982421875, -1.8848876953125, -1.787353515625, -1.6898193359375, -1.59228515625, -1.4947509765625, -1.397216796875, -1.2996826171875, -1.2021484375, -1.1046142578125, -1.007080078125, -0.9095458984375, -0.81201171875, -0.7144775390625, -0.616943359375, -0.5194091796875, -0.421875, -0.3243408203125, -0.226806640625, -0.1292724609375, -0.03173828125, 0.0657958984375, 0.163330078125, 0.2608642578125, 0.3583984375, 0.4559326171875, 0.553466796875, 0.6510009765625, 0.74853515625, 0.8460693359375, 0.943603515625, 1.0411376953125, 1.138671875, 1.2362060546875, 1.333740234375, 1.4312744140625, 1.52880859375, 1.6263427734375, 1.723876953125, 1.8214111328125, 1.9189453125, 2.0164794921875, 2.114013671875, 2.2115478515625, 2.30908203125, 2.4066162109375, 2.504150390625, 2.6016845703125, 2.69921875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 3.0, 5.0, 7.0, 5.0, 8.0, 13.0, 15.0, 24.0, 25.0, 28.0, 36.0, 48.0, 81.0, 87.0, 133.0, 193.0, 408.0, 874.0, 3352.0, 17362.0, 92546.0, 594576.0, 279768.0, 46741.0, 8817.0, 1861.0, 600.0, 290.0, 182.0, 113.0, 89.0, 61.0, 46.0, 37.0, 30.0, 22.0, 14.0, 9.0, 10.0, 9.0, 13.0, 6.0, 4.0, 6.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-7.671875, -7.46337890625, -7.2548828125, -7.04638671875, -6.837890625, -6.62939453125, -6.4208984375, -6.21240234375, -6.00390625, -5.79541015625, -5.5869140625, -5.37841796875, -5.169921875, -4.96142578125, -4.7529296875, -4.54443359375, -4.3359375, -4.12744140625, -3.9189453125, -3.71044921875, -3.501953125, -3.29345703125, -3.0849609375, -2.87646484375, -2.66796875, -2.45947265625, -2.2509765625, -2.04248046875, -1.833984375, -1.62548828125, -1.4169921875, -1.20849609375, -1.0, -0.79150390625, -0.5830078125, -0.37451171875, -0.166015625, 0.04248046875, 0.2509765625, 0.45947265625, 0.66796875, 0.87646484375, 1.0849609375, 1.29345703125, 1.501953125, 1.71044921875, 1.9189453125, 2.12744140625, 2.3359375, 2.54443359375, 2.7529296875, 2.96142578125, 3.169921875, 3.37841796875, 3.5869140625, 3.79541015625, 4.00390625, 4.21240234375, 4.4208984375, 4.62939453125, 4.837890625, 5.04638671875, 5.2548828125, 5.46337890625, 5.671875]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 10.0, 1.0, 8.0, 12.0, 16.0, 16.0, 11.0, 10.0, 23.0, 20.0, 23.0, 37.0, 31.0, 32.0, 48.0, 53.0, 68.0, 98.0, 222.0, 1563.0, 227.0, 99.0, 60.0, 43.0, 39.0, 37.0, 41.0, 38.0, 26.0, 23.0, 19.0, 20.0, 21.0, 9.0, 9.0, 9.0, 5.0, 8.0, 3.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3828125, -9.0413818359375, -8.699951171875, -8.3585205078125, -8.01708984375, -7.6756591796875, -7.334228515625, -6.9927978515625, -6.6513671875, -6.3099365234375, -5.968505859375, -5.6270751953125, -5.28564453125, -4.9442138671875, -4.602783203125, -4.2613525390625, -3.919921875, -3.5784912109375, -3.237060546875, -2.8956298828125, -2.55419921875, -2.2127685546875, -1.871337890625, -1.5299072265625, -1.1884765625, -0.8470458984375, -0.505615234375, -0.1641845703125, 0.17724609375, 0.5186767578125, 0.860107421875, 1.2015380859375, 1.54296875, 1.8843994140625, 2.225830078125, 2.5672607421875, 2.90869140625, 3.2501220703125, 3.591552734375, 3.9329833984375, 4.2744140625, 4.6158447265625, 4.957275390625, 5.2987060546875, 5.64013671875, 5.9815673828125, 6.322998046875, 6.6644287109375, 7.005859375, 7.3472900390625, 7.688720703125, 8.0301513671875, 8.37158203125, 8.7130126953125, 9.054443359375, 9.3958740234375, 9.7373046875, 10.0787353515625, 10.420166015625, 10.7615966796875, 11.10302734375, 11.4444580078125, 11.785888671875, 12.1273193359375, 12.46875]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 2.0, 6.0, 3.0, 8.0, 7.0, 16.0, 13.0, 9.0, 15.0, 35.0, 29.0, 30.0, 43.0, 68.0, 75.0, 101.0, 123.0, 193.0, 414.0, 976.0, 9924.0, 3097600.0, 33470.0, 1254.0, 481.0, 243.0, 132.0, 91.0, 78.0, 60.0, 40.0, 26.0, 30.0, 21.0, 19.0, 22.0, 18.0, 8.0, 8.0, 6.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.71875, -34.65576171875, -33.5927734375, -32.52978515625, -31.466796875, -30.40380859375, -29.3408203125, -28.27783203125, -27.21484375, -26.15185546875, -25.0888671875, -24.02587890625, -22.962890625, -21.89990234375, -20.8369140625, -19.77392578125, -18.7109375, -17.64794921875, -16.5849609375, -15.52197265625, -14.458984375, -13.39599609375, -12.3330078125, -11.27001953125, -10.20703125, -9.14404296875, -8.0810546875, -7.01806640625, -5.955078125, -4.89208984375, -3.8291015625, -2.76611328125, -1.703125, -0.64013671875, 0.4228515625, 1.48583984375, 2.548828125, 3.61181640625, 4.6748046875, 5.73779296875, 6.80078125, 7.86376953125, 8.9267578125, 9.98974609375, 11.052734375, 12.11572265625, 13.1787109375, 14.24169921875, 15.3046875, 16.36767578125, 17.4306640625, 18.49365234375, 19.556640625, 20.61962890625, 21.6826171875, 22.74560546875, 23.80859375, 24.87158203125, 25.9345703125, 26.99755859375, 28.060546875, 29.12353515625, 30.1865234375, 31.24951171875, 32.3125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 50.0, 317.0, 484.0, 149.0, 13.0, 1.0, 0.0, 1.0], "bins": [-88.41070556640625, -86.89360046386719, -85.37649536132812, -83.8593978881836, -82.34229278564453, -80.82518768310547, -79.3080825805664, -77.79097747802734, -76.27388000488281, -74.75677490234375, -73.23966979980469, -71.72257232666016, -70.2054672241211, -68.68836212158203, -67.17125701904297, -65.6541519165039, -64.13704681396484, -62.61994171142578, -61.102840423583984, -59.58573532104492, -58.068634033203125, -56.55152893066406, -55.034423828125, -53.5173225402832, -52.000221252441406, -50.483116149902344, -48.96601486206055, -47.448909759521484, -45.93180847167969, -44.414703369140625, -42.89759826660156, -41.380496978759766, -39.8633918762207, -38.34628677368164, -36.829185485839844, -35.31208038330078, -33.794979095458984, -32.27787399291992, -30.760770797729492, -29.243667602539062, -27.7265625, -26.20945930480957, -24.69235610961914, -23.175251007080078, -21.65814781188965, -20.14104461669922, -18.62394142150879, -17.10683822631836, -15.58973503112793, -14.0726318359375, -12.555527687072754, -11.038424491882324, -9.521320343017578, -8.004217147827148, -6.487113952636719, -4.970009803771973, -3.452906608581543, -1.9358030557632446, -0.4186995029449463, 1.0984039306640625, 2.6155076026916504, 4.132611274719238, 5.649714469909668, 7.166818618774414, 8.683921813964844]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 2.0, 0.0, 4.0, 4.0, 0.0, 11.0, 8.0, 15.0, 17.0, 18.0, 17.0, 25.0, 34.0, 31.0, 38.0, 38.0, 40.0, 53.0, 48.0, 58.0, 48.0, 55.0, 51.0, 40.0, 54.0, 46.0, 39.0, 32.0, 36.0, 31.0, 20.0, 21.0, 16.0, 21.0, 14.0, 10.0, 8.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.62425231933594, -41.49089813232422, -40.3575439453125, -39.224185943603516, -38.0908317565918, -36.95747756958008, -35.82412338256836, -34.690765380859375, -33.557411193847656, -32.42405700683594, -31.290700912475586, -30.157346725463867, -29.023990631103516, -27.890636444091797, -26.757282257080078, -25.623926162719727, -24.490571975708008, -23.35721778869629, -22.223861694335938, -21.09050750732422, -19.957151412963867, -18.82379722595215, -17.690441131591797, -16.557086944580078, -15.423731803894043, -14.290376663208008, -13.157021522521973, -12.023666381835938, -10.890312194824219, -9.756956100463867, -8.623601913452148, -7.490246772766113, -6.356893539428711, -5.223538398742676, -4.090183258056641, -2.9568285942077637, -1.8234734535217285, -0.6901183128356934, 0.4432363510131836, 1.5765914916992188, 2.709946632385254, 3.843301773071289, 4.976656913757324, 6.110011577606201, 7.243366718292236, 8.37672233581543, 9.510076522827148, 10.643431663513184, 11.776786804199219, 12.910141944885254, 14.043497085571289, 15.176851272583008, 16.31020736694336, 17.443561553955078, 18.576915740966797, 19.71027183532715, 20.8436279296875, 21.97698211669922, 23.11033821105957, 24.24369239807129, 25.37704849243164, 26.51040267944336, 27.643756866455078, 28.77711296081543, 29.91046714782715]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 5.0, 5.0, 10.0, 3.0, 9.0, 14.0, 16.0, 18.0, 16.0, 20.0, 20.0, 31.0, 29.0, 28.0, 28.0, 29.0, 30.0, 29.0, 31.0, 35.0, 46.0, 44.0, 47.0, 44.0, 39.0, 48.0, 37.0, 34.0, 38.0, 17.0, 29.0, 25.0, 17.0, 18.0, 15.0, 19.0, 9.0, 14.0, 7.0, 14.0, 8.0, 3.0, 5.0, 3.0, 5.0, 1.0, 4.0, 1.0, 0.0, 3.0], "bins": [-3.716796875, -3.61163330078125, -3.5064697265625, -3.40130615234375, -3.296142578125, -3.19097900390625, -3.0858154296875, -2.98065185546875, -2.87548828125, -2.77032470703125, -2.6651611328125, -2.55999755859375, -2.454833984375, -2.34967041015625, -2.2445068359375, -2.13934326171875, -2.0341796875, -1.92901611328125, -1.8238525390625, -1.71868896484375, -1.613525390625, -1.50836181640625, -1.4031982421875, -1.29803466796875, -1.19287109375, -1.08770751953125, -0.9825439453125, -0.87738037109375, -0.772216796875, -0.66705322265625, -0.5618896484375, -0.45672607421875, -0.3515625, -0.24639892578125, -0.1412353515625, -0.03607177734375, 0.069091796875, 0.17425537109375, 0.2794189453125, 0.38458251953125, 0.48974609375, 0.59490966796875, 0.7000732421875, 0.80523681640625, 0.910400390625, 1.01556396484375, 1.1207275390625, 1.22589111328125, 1.3310546875, 1.43621826171875, 1.5413818359375, 1.64654541015625, 1.751708984375, 1.85687255859375, 1.9620361328125, 2.06719970703125, 2.17236328125, 2.27752685546875, 2.3826904296875, 2.48785400390625, 2.593017578125, 2.69818115234375, 2.8033447265625, 2.90850830078125, 3.013671875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 10.0, 12.0, 9.0, 10.0, 13.0, 23.0, 30.0, 39.0, 32.0, 62.0, 70.0, 111.0, 179.0, 269.0, 512.0, 1278.0, 3900.0, 17300.0, 86886.0, 394175.0, 1153568.0, 1506988.0, 760682.0, 211423.0, 43433.0, 8993.0, 2336.0, 831.0, 382.0, 227.0, 130.0, 84.0, 57.0, 42.0, 31.0, 43.0, 18.0, 16.0, 14.0, 7.0, 10.0, 9.0, 4.0, 9.0, 5.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0], "bins": [-4.5, -4.36871337890625, -4.2374267578125, -4.10614013671875, -3.974853515625, -3.84356689453125, -3.7122802734375, -3.58099365234375, -3.44970703125, -3.31842041015625, -3.1871337890625, -3.05584716796875, -2.924560546875, -2.79327392578125, -2.6619873046875, -2.53070068359375, -2.3994140625, -2.26812744140625, -2.1368408203125, -2.00555419921875, -1.874267578125, -1.74298095703125, -1.6116943359375, -1.48040771484375, -1.34912109375, -1.21783447265625, -1.0865478515625, -0.95526123046875, -0.823974609375, -0.69268798828125, -0.5614013671875, -0.43011474609375, -0.298828125, -0.16754150390625, -0.0362548828125, 0.09503173828125, 0.226318359375, 0.35760498046875, 0.4888916015625, 0.62017822265625, 0.75146484375, 0.88275146484375, 1.0140380859375, 1.14532470703125, 1.276611328125, 1.40789794921875, 1.5391845703125, 1.67047119140625, 1.8017578125, 1.93304443359375, 2.0643310546875, 2.19561767578125, 2.326904296875, 2.45819091796875, 2.5894775390625, 2.72076416015625, 2.85205078125, 2.98333740234375, 3.1146240234375, 3.24591064453125, 3.377197265625, 3.50848388671875, 3.6397705078125, 3.77105712890625, 3.90234375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 6.0, 8.0, 7.0, 11.0, 16.0, 15.0, 17.0, 29.0, 34.0, 42.0, 62.0, 77.0, 95.0, 122.0, 173.0, 187.0, 245.0, 321.0, 350.0, 406.0, 389.0, 312.0, 253.0, 183.0, 158.0, 145.0, 98.0, 80.0, 44.0, 43.0, 31.0, 22.0, 18.0, 19.0, 13.0, 12.0, 10.0, 6.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4296875, -5.262451171875, -5.09521484375, -4.927978515625, -4.7607421875, -4.593505859375, -4.42626953125, -4.259033203125, -4.091796875, -3.924560546875, -3.75732421875, -3.590087890625, -3.4228515625, -3.255615234375, -3.08837890625, -2.921142578125, -2.75390625, -2.586669921875, -2.41943359375, -2.252197265625, -2.0849609375, -1.917724609375, -1.75048828125, -1.583251953125, -1.416015625, -1.248779296875, -1.08154296875, -0.914306640625, -0.7470703125, -0.579833984375, -0.41259765625, -0.245361328125, -0.078125, 0.089111328125, 0.25634765625, 0.423583984375, 0.5908203125, 0.758056640625, 0.92529296875, 1.092529296875, 1.259765625, 1.427001953125, 1.59423828125, 1.761474609375, 1.9287109375, 2.095947265625, 2.26318359375, 2.430419921875, 2.59765625, 2.764892578125, 2.93212890625, 3.099365234375, 3.2666015625, 3.433837890625, 3.60107421875, 3.768310546875, 3.935546875, 4.102783203125, 4.27001953125, 4.437255859375, 4.6044921875, 4.771728515625, 4.93896484375, 5.106201171875, 5.2734375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 6.0, 16.0, 8.0, 12.0, 19.0, 23.0, 27.0, 55.0, 58.0, 75.0, 155.0, 239.0, 353.0, 602.0, 1338.0, 4855.0, 512171.0, 3641168.0, 28972.0, 1996.0, 839.0, 447.0, 256.0, 177.0, 122.0, 89.0, 56.0, 41.0, 21.0, 20.0, 15.0, 15.0, 8.0, 13.0, 9.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.3125, -17.640380859375, -16.96826171875, -16.296142578125, -15.6240234375, -14.951904296875, -14.27978515625, -13.607666015625, -12.935546875, -12.263427734375, -11.59130859375, -10.919189453125, -10.2470703125, -9.574951171875, -8.90283203125, -8.230712890625, -7.55859375, -6.886474609375, -6.21435546875, -5.542236328125, -4.8701171875, -4.197998046875, -3.52587890625, -2.853759765625, -2.181640625, -1.509521484375, -0.83740234375, -0.165283203125, 0.5068359375, 1.178955078125, 1.85107421875, 2.523193359375, 3.1953125, 3.867431640625, 4.53955078125, 5.211669921875, 5.8837890625, 6.555908203125, 7.22802734375, 7.900146484375, 8.572265625, 9.244384765625, 9.91650390625, 10.588623046875, 11.2607421875, 11.932861328125, 12.60498046875, 13.277099609375, 13.94921875, 14.621337890625, 15.29345703125, 15.965576171875, 16.6376953125, 17.309814453125, 17.98193359375, 18.654052734375, 19.326171875, 19.998291015625, 20.67041015625, 21.342529296875, 22.0146484375, 22.686767578125, 23.35888671875, 24.031005859375, 24.703125]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 14.0, 257.0, 591.0, 148.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.32321166992188, -140.24261474609375, -136.16200256347656, -132.08140563964844, -128.0008087158203, -123.92019653320312, -119.839599609375, -115.75899505615234, -111.67839050292969, -107.59778594970703, -103.5171890258789, -99.43658447265625, -95.3559799194336, -91.27537536621094, -87.19477844238281, -83.11417388916016, -79.03357696533203, -74.95297241210938, -70.87237548828125, -66.7917709350586, -62.71116638183594, -58.63056564331055, -54.549964904785156, -50.4693603515625, -46.38875961303711, -42.30815887451172, -38.22755432128906, -34.14695358276367, -30.06635093688965, -25.985748291015625, -21.905147552490234, -17.82454490661621, -13.743942260742188, -9.663339614868164, -5.582737922668457, -1.50213623046875, 2.5784664154052734, 6.659069061279297, 10.739669799804688, 14.820272445678711, 18.900875091552734, 22.981477737426758, 27.06208038330078, 31.142681121826172, 35.22328186035156, 39.30388641357422, 43.38448715209961, 47.465087890625, 51.545692443847656, 55.62629318237305, 59.7068977355957, 63.787498474121094, 67.86810302734375, 71.94869995117188, 76.02930450439453, 80.10990905761719, 84.19050598144531, 88.27111053466797, 92.3517074584961, 96.43231201171875, 100.5129165649414, 104.59352111816406, 108.67411804199219, 112.75472259521484, 116.8353271484375]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 9.0, 12.0, 10.0, 6.0, 17.0, 13.0, 16.0, 32.0, 23.0, 33.0, 36.0, 28.0, 39.0, 49.0, 40.0, 39.0, 39.0, 31.0, 37.0, 37.0, 43.0, 42.0, 30.0, 44.0, 34.0, 34.0, 38.0, 21.0, 23.0, 27.0, 15.0, 15.0, 10.0, 13.0, 13.0, 10.0, 7.0, 8.0, 7.0, 4.0, 0.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-19.16440200805664, -18.533411026000977, -17.902420043945312, -17.27142906188965, -16.640438079833984, -16.009445190429688, -15.378454208374023, -14.74746322631836, -14.116472244262695, -13.485481262207031, -12.854490280151367, -12.223498344421387, -11.592507362365723, -10.961516380310059, -10.330524444580078, -9.699533462524414, -9.06854248046875, -8.437551498413086, -7.806560039520264, -7.175568580627441, -6.544577598571777, -5.913586616516113, -5.282595157623291, -4.651603698730469, -4.020612716674805, -3.3896214962005615, -2.7586302757263184, -2.127639055252075, -1.496647834777832, -0.8656566143035889, -0.2346653938293457, 0.39632606506347656, 1.0273151397705078, 1.658306360244751, 2.289297580718994, 2.9202888011932373, 3.5512800216674805, 4.1822710037231445, 4.813262462615967, 5.444253921508789, 6.075244903564453, 6.706235885620117, 7.3372273445129395, 7.968218803405762, 8.599209785461426, 9.23020076751709, 9.86119270324707, 10.492183685302734, 11.123174667358398, 11.754165649414062, 12.385156631469727, 13.016148567199707, 13.647139549255371, 14.278130531311035, 14.909122467041016, 15.54011344909668, 16.171104431152344, 16.802095413208008, 17.433086395263672, 18.064077377319336, 18.695068359375, 19.326061248779297, 19.95705223083496, 20.588043212890625, 21.21903419494629]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 6.0, 8.0, 11.0, 10.0, 14.0, 11.0, 21.0, 11.0, 26.0, 26.0, 29.0, 25.0, 27.0, 41.0, 28.0, 45.0, 49.0, 38.0, 59.0, 36.0, 46.0, 38.0, 39.0, 38.0, 34.0, 32.0, 40.0, 38.0, 21.0, 24.0, 8.0, 24.0, 17.0, 20.0, 13.0, 5.0, 11.0, 8.0, 4.0, 6.0, 1.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.587890625, -3.486297607421875, -3.38470458984375, -3.283111572265625, -3.1815185546875, -3.079925537109375, -2.97833251953125, -2.876739501953125, -2.775146484375, -2.673553466796875, -2.57196044921875, -2.470367431640625, -2.3687744140625, -2.267181396484375, -2.16558837890625, -2.063995361328125, -1.96240234375, -1.860809326171875, -1.75921630859375, -1.657623291015625, -1.5560302734375, -1.454437255859375, -1.35284423828125, -1.251251220703125, -1.149658203125, -1.048065185546875, -0.94647216796875, -0.844879150390625, -0.7432861328125, -0.641693115234375, -0.54010009765625, -0.438507080078125, -0.3369140625, -0.235321044921875, -0.13372802734375, -0.032135009765625, 0.0694580078125, 0.171051025390625, 0.27264404296875, 0.374237060546875, 0.475830078125, 0.577423095703125, 0.67901611328125, 0.780609130859375, 0.8822021484375, 0.983795166015625, 1.08538818359375, 1.186981201171875, 1.28857421875, 1.390167236328125, 1.49176025390625, 1.593353271484375, 1.6949462890625, 1.796539306640625, 1.89813232421875, 1.999725341796875, 2.101318359375, 2.202911376953125, 2.30450439453125, 2.406097412109375, 2.5076904296875, 2.609283447265625, 2.71087646484375, 2.812469482421875, 2.9140625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 3.0, 11.0, 13.0, 38.0, 42.0, 64.0, 89.0, 124.0, 179.0, 244.0, 363.0, 539.0, 801.0, 1015.0, 1548.0, 2173.0, 3268.0, 4714.0, 6992.0, 10399.0, 15530.0, 23955.0, 38047.0, 62361.0, 104587.0, 178810.0, 222825.0, 143593.0, 83552.0, 50564.0, 31048.0, 20155.0, 13001.0, 8929.0, 5927.0, 3973.0, 2763.0, 1946.0, 1335.0, 923.0, 607.0, 445.0, 311.0, 238.0, 150.0, 104.0, 79.0, 66.0, 32.0, 22.0, 27.0, 15.0, 11.0, 3.0, 5.0, 0.0, 3.0], "bins": [-0.364990234375, -0.35402679443359375, -0.3430633544921875, -0.33209991455078125, -0.321136474609375, -0.31017303466796875, -0.2992095947265625, -0.28824615478515625, -0.27728271484375, -0.26631927490234375, -0.2553558349609375, -0.24439239501953125, -0.233428955078125, -0.22246551513671875, -0.2115020751953125, -0.20053863525390625, -0.1895751953125, -0.17861175537109375, -0.1676483154296875, -0.15668487548828125, -0.145721435546875, -0.13475799560546875, -0.1237945556640625, -0.11283111572265625, -0.10186767578125, -0.09090423583984375, -0.0799407958984375, -0.06897735595703125, -0.058013916015625, -0.04705047607421875, -0.0360870361328125, -0.02512359619140625, -0.01416015625, -0.00319671630859375, 0.0077667236328125, 0.01873016357421875, 0.029693603515625, 0.04065704345703125, 0.0516204833984375, 0.06258392333984375, 0.07354736328125, 0.08451080322265625, 0.0954742431640625, 0.10643768310546875, 0.117401123046875, 0.12836456298828125, 0.1393280029296875, 0.15029144287109375, 0.1612548828125, 0.17221832275390625, 0.1831817626953125, 0.19414520263671875, 0.205108642578125, 0.21607208251953125, 0.2270355224609375, 0.23799896240234375, 0.24896240234375, 0.25992584228515625, 0.2708892822265625, 0.28185272216796875, 0.292816162109375, 0.30377960205078125, 0.3147430419921875, 0.32570648193359375, 0.336669921875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 4.0, 7.0, 4.0, 6.0, 9.0, 11.0, 12.0, 17.0, 17.0, 23.0, 28.0, 26.0, 33.0, 25.0, 31.0, 25.0, 39.0, 36.0, 34.0, 51.0, 33.0, 1072.0, 37.0, 38.0, 28.0, 36.0, 39.0, 38.0, 26.0, 30.0, 25.0, 26.0, 19.0, 21.0, 23.0, 18.0, 15.0, 12.0, 11.0, 8.0, 9.0, 10.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.9814453125, -1.92205810546875, -1.8626708984375, -1.80328369140625, -1.743896484375, -1.68450927734375, -1.6251220703125, -1.56573486328125, -1.50634765625, -1.44696044921875, -1.3875732421875, -1.32818603515625, -1.268798828125, -1.20941162109375, -1.1500244140625, -1.09063720703125, -1.03125, -0.97186279296875, -0.9124755859375, -0.85308837890625, -0.793701171875, -0.73431396484375, -0.6749267578125, -0.61553955078125, -0.55615234375, -0.49676513671875, -0.4373779296875, -0.37799072265625, -0.318603515625, -0.25921630859375, -0.1998291015625, -0.14044189453125, -0.0810546875, -0.02166748046875, 0.0377197265625, 0.09710693359375, 0.156494140625, 0.21588134765625, 0.2752685546875, 0.33465576171875, 0.39404296875, 0.45343017578125, 0.5128173828125, 0.57220458984375, 0.631591796875, 0.69097900390625, 0.7503662109375, 0.80975341796875, 0.869140625, 0.92852783203125, 0.9879150390625, 1.04730224609375, 1.106689453125, 1.16607666015625, 1.2254638671875, 1.28485107421875, 1.34423828125, 1.40362548828125, 1.4630126953125, 1.52239990234375, 1.581787109375, 1.64117431640625, 1.7005615234375, 1.75994873046875, 1.8193359375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 7.0, 8.0, 14.0, 29.0, 44.0, 54.0, 63.0, 107.0, 141.0, 213.0, 249.0, 399.0, 539.0, 821.0, 1102.0, 1568.0, 2276.0, 3384.0, 5001.0, 7789.0, 11444.0, 17283.0, 26727.0, 41957.0, 67909.0, 114255.0, 185880.0, 1252087.0, 135622.0, 81107.0, 48547.0, 30626.0, 19516.0, 12918.0, 8464.0, 5936.0, 4056.0, 2817.0, 1908.0, 1299.0, 896.0, 668.0, 470.0, 324.0, 214.0, 139.0, 83.0, 67.0, 40.0, 25.0, 18.0, 14.0, 3.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.27490234375, -0.2657890319824219, -0.25667572021484375, -0.24756240844726562, -0.2384490966796875, -0.22933578491210938, -0.22022247314453125, -0.21110916137695312, -0.201995849609375, -0.19288253784179688, -0.18376922607421875, -0.17465591430664062, -0.1655426025390625, -0.15642929077148438, -0.14731597900390625, -0.13820266723632812, -0.12908935546875, -0.11997604370117188, -0.11086273193359375, -0.10174942016601562, -0.0926361083984375, -0.08352279663085938, -0.07440948486328125, -0.06529617309570312, -0.056182861328125, -0.047069549560546875, -0.03795623779296875, -0.028842926025390625, -0.0197296142578125, -0.010616302490234375, -0.00150299072265625, 0.007610321044921875, 0.0167236328125, 0.025836944580078125, 0.03495025634765625, 0.044063568115234375, 0.0531768798828125, 0.062290191650390625, 0.07140350341796875, 0.08051681518554688, 0.089630126953125, 0.09874343872070312, 0.10785675048828125, 0.11697006225585938, 0.1260833740234375, 0.13519668579101562, 0.14430999755859375, 0.15342330932617188, 0.16253662109375, 0.17164993286132812, 0.18076324462890625, 0.18987655639648438, 0.1989898681640625, 0.20810317993164062, 0.21721649169921875, 0.22632980346679688, 0.235443115234375, 0.24455642700195312, 0.25366973876953125, 0.2627830505371094, 0.2718963623046875, 0.2810096740722656, 0.29012298583984375, 0.2992362976074219, 0.308349609375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 7.0, 6.0, 9.0, 23.0, 17.0, 22.0, 35.0, 38.0, 52.0, 40.0, 65.0, 71.0, 69.0, 75.0, 71.0, 64.0, 83.0, 61.0, 44.0, 26.0, 31.0, 14.0, 14.0, 13.0, 15.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0014362335205078125, -0.0013933032751083374, -0.0013503730297088623, -0.0013074427843093872, -0.0012645125389099121, -0.001221582293510437, -0.001178652048110962, -0.0011357218027114868, -0.0010927915573120117, -0.0010498613119125366, -0.0010069310665130615, -0.0009640008211135864, -0.0009210705757141113, -0.0008781403303146362, -0.0008352100849151611, -0.000792279839515686, -0.0007493495941162109, -0.0007064193487167358, -0.0006634891033172607, -0.0006205588579177856, -0.0005776286125183105, -0.0005346983671188354, -0.0004917681217193604, -0.00044883787631988525, -0.00040590763092041016, -0.00036297738552093506, -0.00032004714012145996, -0.00027711689472198486, -0.00023418664932250977, -0.00019125640392303467, -0.00014832615852355957, -0.00010539591312408447, -6.246566772460938e-05, -1.9535422325134277e-05, 2.339482307434082e-05, 6.632506847381592e-05, 0.00010925531387329102, 0.0001521855592727661, 0.0001951158046722412, 0.0002380460500717163, 0.0002809762954711914, 0.0003239065408706665, 0.0003668367862701416, 0.0004097670316696167, 0.0004526972770690918, 0.0004956275224685669, 0.000538557767868042, 0.0005814880132675171, 0.0006244182586669922, 0.0006673485040664673, 0.0007102787494659424, 0.0007532089948654175, 0.0007961392402648926, 0.0008390694856643677, 0.0008819997310638428, 0.0009249299764633179, 0.000967860221862793, 0.001010790467262268, 0.0010537207126617432, 0.0010966509580612183, 0.0011395812034606934, 0.0011825114488601685, 0.0012254416942596436, 0.0012683719396591187, 0.0013113021850585938]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 6.0, 11.0, 10.0, 14.0, 17.0, 28.0, 32.0, 54.0, 59.0, 87.0, 136.0, 250.0, 496.0, 1402.0, 726922.0, 316644.0, 1229.0, 431.0, 208.0, 134.0, 87.0, 85.0, 51.0, 34.0, 32.0, 24.0, 14.0, 9.0, 8.0, 7.0, 5.0, 2.0, 4.0, 3.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02667236328125, -0.02581048011779785, -0.024948596954345703, -0.024086713790893555, -0.023224830627441406, -0.022362947463989258, -0.02150106430053711, -0.02063918113708496, -0.019777297973632812, -0.018915414810180664, -0.018053531646728516, -0.017191648483276367, -0.01632976531982422, -0.01546788215637207, -0.014605998992919922, -0.013744115829467773, -0.012882232666015625, -0.012020349502563477, -0.011158466339111328, -0.01029658317565918, -0.009434700012207031, -0.008572816848754883, -0.007710933685302734, -0.006849050521850586, -0.0059871673583984375, -0.005125284194946289, -0.004263401031494141, -0.003401517868041992, -0.0025396347045898438, -0.0016777515411376953, -0.0008158683776855469, 4.601478576660156e-05, 0.00090789794921875, 0.0017697811126708984, 0.002631664276123047, 0.0034935474395751953, 0.004355430603027344, 0.005217313766479492, 0.006079196929931641, 0.006941080093383789, 0.0078029632568359375, 0.008664846420288086, 0.009526729583740234, 0.010388612747192383, 0.011250495910644531, 0.01211237907409668, 0.012974262237548828, 0.013836145401000977, 0.014698028564453125, 0.015559911727905273, 0.016421794891357422, 0.01728367805480957, 0.01814556121826172, 0.019007444381713867, 0.019869327545166016, 0.020731210708618164, 0.021593093872070312, 0.02245497703552246, 0.02331686019897461, 0.024178743362426758, 0.025040626525878906, 0.025902509689331055, 0.026764392852783203, 0.02762627601623535, 0.0284881591796875]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 108.0, 875.0, 34.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0033679408952593803, -0.003117086598649621, -0.0028662323020398617, -0.002615378238260746, -0.0023645239416509867, -0.0021136696450412273, -0.0018628154648467898, -0.0016119612846523523, -0.001361106988042593, -0.0011102526914328337, -0.0008593985112383962, -0.0006085442728362978, -0.00035769003443419933, -0.00010683573782444, 0.0001440184423699975, 0.000394872622564435, 0.0006457269191741943, 0.0008965811575762928, 0.0011474353959783912, 0.0013982895761728287, 0.001649143872782588, 0.0018999981693923473, 0.002150852233171463, 0.0024017065297812223, 0.0026525608263909817, 0.002903415123000741, 0.0031542694196105003, 0.003405123483389616, 0.0036559777799993753, 0.003906832076609135, 0.00415768614038825, 0.004408540204167366, 0.004659393802285194, 0.00491024786606431, 0.005161102395504713, 0.005411956459283829, 0.005662810988724232, 0.005913665052503347, 0.006164519116282463, 0.006415373645722866, 0.006666227709501982, 0.006917081773281097, 0.0071679363027215, 0.007418790366500616, 0.007669644430279732, 0.007920498959720135, 0.008171353489160538, 0.008422207087278366, 0.008673061616718769, 0.008923916146159172, 0.009174769744277, 0.009425624273717403, 0.009676478803157806, 0.009927332401275635, 0.010178186930716038, 0.01042904146015644, 0.010679895058274269, 0.010930749587714672, 0.0111816031858325, 0.011432457715272903, 0.011683312244713306, 0.01193416677415371, 0.012185020372271538, 0.01243587490171194, 0.012686729431152344]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 4.0, 4.0, 7.0, 5.0, 6.0, 15.0, 8.0, 18.0, 21.0, 27.0, 30.0, 31.0, 34.0, 31.0, 31.0, 29.0, 33.0, 35.0, 27.0, 44.0, 44.0, 39.0, 54.0, 35.0, 48.0, 29.0, 36.0, 33.0, 39.0, 32.0, 29.0, 22.0, 26.0, 14.0, 21.0, 15.0, 11.0, 4.0, 12.0, 4.0, 3.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006464123725891113, -0.0006269291043281555, -0.0006074458360671997, -0.0005879625678062439, -0.0005684792995452881, -0.0005489960312843323, -0.0005295127630233765, -0.0005100294947624207, -0.0004905462265014648, -0.00047106295824050903, -0.0004515796899795532, -0.0004320964217185974, -0.0004126131534576416, -0.0003931298851966858, -0.00037364661693573, -0.00035416334867477417, -0.00033468008041381836, -0.00031519681215286255, -0.00029571354389190674, -0.00027623027563095093, -0.0002567470073699951, -0.0002372637391090393, -0.0002177804708480835, -0.00019829720258712769, -0.00017881393432617188, -0.00015933066606521606, -0.00013984739780426025, -0.00012036412954330444, -0.00010088086128234863, -8.139759302139282e-05, -6.191432476043701e-05, -4.24310564994812e-05, -2.294778823852539e-05, -3.46451997756958e-06, 1.601874828338623e-05, 3.550201654434204e-05, 5.498528480529785e-05, 7.446855306625366e-05, 9.395182132720947e-05, 0.00011343508958816528, 0.0001329183578491211, 0.0001524016261100769, 0.00017188489437103271, 0.00019136816263198853, 0.00021085143089294434, 0.00023033469915390015, 0.00024981796741485596, 0.00026930123567581177, 0.0002887845039367676, 0.0003082677721977234, 0.0003277510404586792, 0.000347234308719635, 0.0003667175769805908, 0.00038620084524154663, 0.00040568411350250244, 0.00042516738176345825, 0.00044465065002441406, 0.0004641339182853699, 0.0004836171865463257, 0.0005031004548072815, 0.0005225837230682373, 0.0005420669913291931, 0.0005615502595901489, 0.0005810335278511047, 0.0006005167961120605]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 6.0, 8.0, 11.0, 10.0, 14.0, 11.0, 21.0, 11.0, 26.0, 26.0, 29.0, 25.0, 27.0, 41.0, 28.0, 45.0, 49.0, 38.0, 59.0, 36.0, 46.0, 38.0, 39.0, 38.0, 34.0, 32.0, 40.0, 38.0, 21.0, 24.0, 8.0, 24.0, 17.0, 20.0, 13.0, 5.0, 11.0, 8.0, 4.0, 6.0, 1.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.587890625, -3.486297607421875, -3.38470458984375, -3.283111572265625, -3.1815185546875, -3.079925537109375, -2.97833251953125, -2.876739501953125, -2.775146484375, -2.673553466796875, -2.57196044921875, -2.470367431640625, -2.3687744140625, -2.267181396484375, -2.16558837890625, -2.063995361328125, -1.96240234375, -1.860809326171875, -1.75921630859375, -1.657623291015625, -1.5560302734375, -1.454437255859375, -1.35284423828125, -1.251251220703125, -1.149658203125, -1.048065185546875, -0.94647216796875, -0.844879150390625, -0.7432861328125, -0.641693115234375, -0.54010009765625, -0.438507080078125, -0.3369140625, -0.235321044921875, -0.13372802734375, -0.032135009765625, 0.0694580078125, 0.171051025390625, 0.27264404296875, 0.374237060546875, 0.475830078125, 0.577423095703125, 0.67901611328125, 0.780609130859375, 0.8822021484375, 0.983795166015625, 1.08538818359375, 1.186981201171875, 1.28857421875, 1.390167236328125, 1.49176025390625, 1.593353271484375, 1.6949462890625, 1.796539306640625, 1.89813232421875, 1.999725341796875, 2.101318359375, 2.202911376953125, 2.30450439453125, 2.406097412109375, 2.5076904296875, 2.609283447265625, 2.71087646484375, 2.812469482421875, 2.9140625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 8.0, 5.0, 12.0, 9.0, 16.0, 24.0, 17.0, 35.0, 53.0, 75.0, 162.0, 321.0, 714.0, 1766.0, 4537.0, 11566.0, 28811.0, 73688.0, 203260.0, 392157.0, 207330.0, 74790.0, 29555.0, 11766.0, 4555.0, 1839.0, 712.0, 329.0, 159.0, 96.0, 40.0, 32.0, 26.0, 24.0, 19.0, 5.0, 9.0, 8.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.13671875, -4.016845703125, -3.89697265625, -3.777099609375, -3.6572265625, -3.537353515625, -3.41748046875, -3.297607421875, -3.177734375, -3.057861328125, -2.93798828125, -2.818115234375, -2.6982421875, -2.578369140625, -2.45849609375, -2.338623046875, -2.21875, -2.098876953125, -1.97900390625, -1.859130859375, -1.7392578125, -1.619384765625, -1.49951171875, -1.379638671875, -1.259765625, -1.139892578125, -1.02001953125, -0.900146484375, -0.7802734375, -0.660400390625, -0.54052734375, -0.420654296875, -0.30078125, -0.180908203125, -0.06103515625, 0.058837890625, 0.1787109375, 0.298583984375, 0.41845703125, 0.538330078125, 0.658203125, 0.778076171875, 0.89794921875, 1.017822265625, 1.1376953125, 1.257568359375, 1.37744140625, 1.497314453125, 1.6171875, 1.737060546875, 1.85693359375, 1.976806640625, 2.0966796875, 2.216552734375, 2.33642578125, 2.456298828125, 2.576171875, 2.696044921875, 2.81591796875, 2.935791015625, 3.0556640625, 3.175537109375, 3.29541015625, 3.415283203125, 3.53515625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 3.0, 7.0, 9.0, 8.0, 8.0, 8.0, 17.0, 11.0, 14.0, 13.0, 27.0, 25.0, 39.0, 38.0, 30.0, 36.0, 50.0, 64.0, 78.0, 152.0, 1404.0, 396.0, 134.0, 88.0, 59.0, 44.0, 46.0, 40.0, 33.0, 28.0, 19.0, 25.0, 20.0, 18.0, 11.0, 12.0, 8.0, 5.0, 7.0, 3.0, 4.0, 3.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.7421875, -10.40576171875, -10.0693359375, -9.73291015625, -9.396484375, -9.06005859375, -8.7236328125, -8.38720703125, -8.05078125, -7.71435546875, -7.3779296875, -7.04150390625, -6.705078125, -6.36865234375, -6.0322265625, -5.69580078125, -5.359375, -5.02294921875, -4.6865234375, -4.35009765625, -4.013671875, -3.67724609375, -3.3408203125, -3.00439453125, -2.66796875, -2.33154296875, -1.9951171875, -1.65869140625, -1.322265625, -0.98583984375, -0.6494140625, -0.31298828125, 0.0234375, 0.35986328125, 0.6962890625, 1.03271484375, 1.369140625, 1.70556640625, 2.0419921875, 2.37841796875, 2.71484375, 3.05126953125, 3.3876953125, 3.72412109375, 4.060546875, 4.39697265625, 4.7333984375, 5.06982421875, 5.40625, 5.74267578125, 6.0791015625, 6.41552734375, 6.751953125, 7.08837890625, 7.4248046875, 7.76123046875, 8.09765625, 8.43408203125, 8.7705078125, 9.10693359375, 9.443359375, 9.77978515625, 10.1162109375, 10.45263671875, 10.7890625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 6.0, 7.0, 5.0, 5.0, 8.0, 24.0, 18.0, 28.0, 27.0, 42.0, 67.0, 96.0, 186.0, 286.0, 489.0, 1233.0, 11955.0, 3036414.0, 91263.0, 1888.0, 667.0, 364.0, 212.0, 121.0, 66.0, 47.0, 50.0, 33.0, 30.0, 18.0, 14.0, 10.0, 8.0, 5.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.625, -23.7353515625, -22.845703125, -21.9560546875, -21.06640625, -20.1767578125, -19.287109375, -18.3974609375, -17.5078125, -16.6181640625, -15.728515625, -14.8388671875, -13.94921875, -13.0595703125, -12.169921875, -11.2802734375, -10.390625, -9.5009765625, -8.611328125, -7.7216796875, -6.83203125, -5.9423828125, -5.052734375, -4.1630859375, -3.2734375, -2.3837890625, -1.494140625, -0.6044921875, 0.28515625, 1.1748046875, 2.064453125, 2.9541015625, 3.84375, 4.7333984375, 5.623046875, 6.5126953125, 7.40234375, 8.2919921875, 9.181640625, 10.0712890625, 10.9609375, 11.8505859375, 12.740234375, 13.6298828125, 14.51953125, 15.4091796875, 16.298828125, 17.1884765625, 18.078125, 18.9677734375, 19.857421875, 20.7470703125, 21.63671875, 22.5263671875, 23.416015625, 24.3056640625, 25.1953125, 26.0849609375, 26.974609375, 27.8642578125, 28.75390625, 29.6435546875, 30.533203125, 31.4228515625, 32.3125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 371.0, 624.0, 16.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-211.21812438964844, -207.449462890625, -203.6807861328125, -199.91212463378906, -196.14346313476562, -192.3748016357422, -188.60614013671875, -184.83746337890625, -181.0688018798828, -177.30014038085938, -173.53146362304688, -169.76280212402344, -165.994140625, -162.22547912597656, -158.45681762695312, -154.68814086914062, -150.9194793701172, -147.15081787109375, -143.38214111328125, -139.6134796142578, -135.84481811523438, -132.07615661621094, -128.3074951171875, -124.538818359375, -120.77015686035156, -117.00149536132812, -113.23282623291016, -109.46415710449219, -105.69549560546875, -101.92683410644531, -98.15816497802734, -94.38949584960938, -90.62084197998047, -86.8521728515625, -83.08351135253906, -79.31484985351562, -75.54618072509766, -71.77751159667969, -68.00885009765625, -64.24018859863281, -60.471519470214844, -56.70285415649414, -52.93418884277344, -49.165523529052734, -45.39685821533203, -41.62819290161133, -37.859527587890625, -34.09086227416992, -30.32219696044922, -26.553531646728516, -22.784866333007812, -19.01620101928711, -15.247535705566406, -11.478870391845703, -7.710205078125, -3.941539764404297, -0.17287445068359375, 3.5957908630371094, 7.3644561767578125, 11.133121490478516, 14.901786804199219, 18.670452117919922, 22.439117431640625, 26.207782745361328, 29.97644805908203]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 8.0, 9.0, 12.0, 11.0, 23.0, 21.0, 30.0, 27.0, 42.0, 32.0, 38.0, 39.0, 43.0, 54.0, 63.0, 52.0, 56.0, 44.0, 44.0, 46.0, 42.0, 55.0, 26.0, 19.0, 28.0, 28.0, 18.0, 20.0, 11.0, 20.0, 10.0, 11.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-30.94858741760254, -30.017314910888672, -29.086042404174805, -28.154769897460938, -27.22349739074707, -26.292224884033203, -25.360952377319336, -24.42967987060547, -23.4984073638916, -22.567134857177734, -21.635862350463867, -20.70458984375, -19.773317337036133, -18.842044830322266, -17.9107723236084, -16.97949981689453, -16.04822540283203, -15.116952896118164, -14.185680389404297, -13.25440788269043, -12.323135375976562, -11.391862869262695, -10.460590362548828, -9.529317855834961, -8.598045349121094, -7.666772842407227, -6.735500335693359, -5.804227828979492, -4.872955322265625, -3.9416823387145996, -3.0104098320007324, -2.0791373252868652, -1.1478652954101562, -0.2165927290916443, 0.7146798372268677, 1.6459524631500244, 2.5772249698638916, 3.508497714996338, 4.439770221710205, 5.371042728424072, 6.3023152351379395, 7.233587741851807, 8.164860725402832, 9.0961332321167, 10.027405738830566, 10.958678245544434, 11.8899507522583, 12.821223258972168, 13.752495765686035, 14.683768272399902, 15.61504077911377, 16.546314239501953, 17.47758674621582, 18.408859252929688, 19.340131759643555, 20.271404266357422, 21.20267677307129, 22.133949279785156, 23.065221786499023, 23.99649429321289, 24.927766799926758, 25.859039306640625, 26.790311813354492, 27.72158432006836, 28.652856826782227]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 6.0, 9.0, 7.0, 14.0, 12.0, 14.0, 23.0, 21.0, 15.0, 27.0, 18.0, 23.0, 47.0, 47.0, 42.0, 37.0, 39.0, 49.0, 58.0, 41.0, 33.0, 43.0, 37.0, 35.0, 42.0, 28.0, 44.0, 29.0, 15.0, 23.0, 17.0, 21.0, 18.0, 14.0, 17.0, 4.0, 10.0, 4.0, 5.0, 3.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8046875, -3.688934326171875, -3.57318115234375, -3.457427978515625, -3.3416748046875, -3.225921630859375, -3.11016845703125, -2.994415283203125, -2.878662109375, -2.762908935546875, -2.64715576171875, -2.531402587890625, -2.4156494140625, -2.299896240234375, -2.18414306640625, -2.068389892578125, -1.95263671875, -1.836883544921875, -1.72113037109375, -1.605377197265625, -1.4896240234375, -1.373870849609375, -1.25811767578125, -1.142364501953125, -1.026611328125, -0.910858154296875, -0.79510498046875, -0.679351806640625, -0.5635986328125, -0.447845458984375, -0.33209228515625, -0.216339111328125, -0.1005859375, 0.015167236328125, 0.13092041015625, 0.246673583984375, 0.3624267578125, 0.478179931640625, 0.59393310546875, 0.709686279296875, 0.825439453125, 0.941192626953125, 1.05694580078125, 1.172698974609375, 1.2884521484375, 1.404205322265625, 1.51995849609375, 1.635711669921875, 1.75146484375, 1.867218017578125, 1.98297119140625, 2.098724365234375, 2.2144775390625, 2.330230712890625, 2.44598388671875, 2.561737060546875, 2.677490234375, 2.793243408203125, 2.90899658203125, 3.024749755859375, 3.1405029296875, 3.256256103515625, 3.37200927734375, 3.487762451171875, 3.603515625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 7.0, 1.0, 5.0, 6.0, 5.0, 11.0, 11.0, 13.0, 13.0, 17.0, 16.0, 23.0, 32.0, 34.0, 62.0, 68.0, 75.0, 138.0, 238.0, 573.0, 6314.0, 267336.0, 3126033.0, 772834.0, 18503.0, 1054.0, 268.0, 124.0, 109.0, 82.0, 51.0, 39.0, 30.0, 30.0, 23.0, 27.0, 13.0, 17.0, 11.0, 11.0, 4.0, 9.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.6875, -10.369873046875, -10.05224609375, -9.734619140625, -9.4169921875, -9.099365234375, -8.78173828125, -8.464111328125, -8.146484375, -7.828857421875, -7.51123046875, -7.193603515625, -6.8759765625, -6.558349609375, -6.24072265625, -5.923095703125, -5.60546875, -5.287841796875, -4.97021484375, -4.652587890625, -4.3349609375, -4.017333984375, -3.69970703125, -3.382080078125, -3.064453125, -2.746826171875, -2.42919921875, -2.111572265625, -1.7939453125, -1.476318359375, -1.15869140625, -0.841064453125, -0.5234375, -0.205810546875, 0.11181640625, 0.429443359375, 0.7470703125, 1.064697265625, 1.38232421875, 1.699951171875, 2.017578125, 2.335205078125, 2.65283203125, 2.970458984375, 3.2880859375, 3.605712890625, 3.92333984375, 4.240966796875, 4.55859375, 4.876220703125, 5.19384765625, 5.511474609375, 5.8291015625, 6.146728515625, 6.46435546875, 6.781982421875, 7.099609375, 7.417236328125, 7.73486328125, 8.052490234375, 8.3701171875, 8.687744140625, 9.00537109375, 9.322998046875, 9.640625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 16.0, 13.0, 20.0, 31.0, 44.0, 70.0, 113.0, 135.0, 236.0, 353.0, 504.0, 610.0, 573.0, 449.0, 328.0, 207.0, 148.0, 66.0, 52.0, 37.0, 25.0, 13.0, 9.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0], "bins": [-11.015625, -10.775390625, -10.53515625, -10.294921875, -10.0546875, -9.814453125, -9.57421875, -9.333984375, -9.09375, -8.853515625, -8.61328125, -8.373046875, -8.1328125, -7.892578125, -7.65234375, -7.412109375, -7.171875, -6.931640625, -6.69140625, -6.451171875, -6.2109375, -5.970703125, -5.73046875, -5.490234375, -5.25, -5.009765625, -4.76953125, -4.529296875, -4.2890625, -4.048828125, -3.80859375, -3.568359375, -3.328125, -3.087890625, -2.84765625, -2.607421875, -2.3671875, -2.126953125, -1.88671875, -1.646484375, -1.40625, -1.166015625, -0.92578125, -0.685546875, -0.4453125, -0.205078125, 0.03515625, 0.275390625, 0.515625, 0.755859375, 0.99609375, 1.236328125, 1.4765625, 1.716796875, 1.95703125, 2.197265625, 2.4375, 2.677734375, 2.91796875, 3.158203125, 3.3984375, 3.638671875, 3.87890625, 4.119140625, 4.359375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 3.0, 2.0, 3.0, 15.0, 14.0, 20.0, 42.0, 64.0, 105.0, 162.0, 267.0, 440.0, 919.0, 5848.0, 1852466.0, 2324820.0, 6982.0, 892.0, 441.0, 279.0, 178.0, 108.0, 78.0, 40.0, 27.0, 21.0, 15.0, 15.0, 8.0, 5.0, 5.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7890625, -14.0115966796875, -13.234130859375, -12.4566650390625, -11.67919921875, -10.9017333984375, -10.124267578125, -9.3468017578125, -8.5693359375, -7.7918701171875, -7.014404296875, -6.2369384765625, -5.45947265625, -4.6820068359375, -3.904541015625, -3.1270751953125, -2.349609375, -1.5721435546875, -0.794677734375, -0.0172119140625, 0.76025390625, 1.5377197265625, 2.315185546875, 3.0926513671875, 3.8701171875, 4.6475830078125, 5.425048828125, 6.2025146484375, 6.97998046875, 7.7574462890625, 8.534912109375, 9.3123779296875, 10.08984375, 10.8673095703125, 11.644775390625, 12.4222412109375, 13.19970703125, 13.9771728515625, 14.754638671875, 15.5321044921875, 16.3095703125, 17.0870361328125, 17.864501953125, 18.6419677734375, 19.41943359375, 20.1968994140625, 20.974365234375, 21.7518310546875, 22.529296875, 23.3067626953125, 24.084228515625, 24.8616943359375, 25.63916015625, 26.4166259765625, 27.194091796875, 27.9715576171875, 28.7490234375, 29.5264892578125, 30.303955078125, 31.0814208984375, 31.85888671875, 32.6363525390625, 33.413818359375, 34.1912841796875, 34.96875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 107.0, 432.0, 384.0, 76.0, 11.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.24429321289062, -108.3926773071289, -105.54106903076172, -102.689453125, -99.83783721923828, -96.9862289428711, -94.13461303710938, -91.28300476074219, -88.43138885498047, -85.57977294921875, -82.72816467285156, -79.87654876708984, -77.02493286132812, -74.17332458496094, -71.32170867919922, -68.4700927734375, -65.61848449707031, -62.76687240600586, -59.91525650024414, -57.06364440917969, -54.212032318115234, -51.36042022705078, -48.50880432128906, -45.65719223022461, -42.805572509765625, -39.95396041870117, -37.10234451293945, -34.250732421875, -31.399120330810547, -28.54750633239746, -25.695892333984375, -22.844280242919922, -19.99266815185547, -17.141054153442383, -14.28944206237793, -11.437828063964844, -8.586215019226074, -5.734601974487305, -2.8829879760742188, -0.031375885009765625, 2.8202381134033203, 5.67185115814209, 8.52346420288086, 11.375078201293945, 14.226691246032715, 17.078304290771484, 19.92991828918457, 22.781530380249023, 25.63314437866211, 28.484758377075195, 31.33637046813965, 34.187984466552734, 37.03959655761719, 39.891212463378906, 42.74282455444336, 45.59443664550781, 48.44605255126953, 51.297664642333984, 54.1492805480957, 57.000892639160156, 59.85250473022461, 62.70411682128906, 65.55573272705078, 68.4073486328125, 71.25895690917969]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 5.0, 1.0, 3.0, 4.0, 4.0, 6.0, 8.0, 10.0, 8.0, 12.0, 16.0, 17.0, 22.0, 19.0, 21.0, 27.0, 37.0, 34.0, 36.0, 33.0, 43.0, 50.0, 39.0, 46.0, 31.0, 30.0, 41.0, 36.0, 45.0, 36.0, 44.0, 28.0, 28.0, 25.0, 22.0, 22.0, 19.0, 11.0, 17.0, 10.0, 10.0, 10.0, 11.0, 9.0, 9.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-19.536033630371094, -18.953569412231445, -18.37110710144043, -17.78864288330078, -17.206178665161133, -16.623716354370117, -16.04125213623047, -15.458788871765137, -14.876325607299805, -14.293862342834473, -13.711398124694824, -13.128934860229492, -12.54647159576416, -11.964008331298828, -11.38154411315918, -10.799080848693848, -10.2166166305542, -9.634153366088867, -9.051689147949219, -8.469225883483887, -7.886762619018555, -7.3042988777160645, -6.721835136413574, -6.139371871948242, -5.556908130645752, -4.974444389343262, -4.39198112487793, -3.8095173835754395, -3.2270538806915283, -2.644590377807617, -2.062126636505127, -1.479663372039795, -0.8971996307373047, -0.3147360682487488, 0.26772749423980713, 0.8501911163330078, 1.432654619216919, 2.01511812210083, 2.5975818634033203, 3.1800451278686523, 3.7625088691711426, 4.344972610473633, 4.927435874938965, 5.509899616241455, 6.092363357543945, 6.674826622009277, 7.257290363311768, 7.8397536277771, 8.42221736907959, 9.004680633544922, 9.58714485168457, 10.169608116149902, 10.752071380615234, 11.334535598754883, 11.916998863220215, 12.499462127685547, 13.081926345825195, 13.664389610290527, 14.246853828430176, 14.829317092895508, 15.41178035736084, 15.994243621826172, 16.57670783996582, 17.15917205810547, 17.741634368896484]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 1.0, 4.0, 6.0, 11.0, 12.0, 8.0, 18.0, 13.0, 19.0, 28.0, 38.0, 27.0, 29.0, 36.0, 46.0, 36.0, 45.0, 51.0, 58.0, 40.0, 46.0, 51.0, 38.0, 41.0, 33.0, 34.0, 30.0, 31.0, 37.0, 18.0, 25.0, 18.0, 11.0, 14.0, 7.0, 8.0, 10.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.4609375, -4.343902587890625, -4.22686767578125, -4.109832763671875, -3.9927978515625, -3.875762939453125, -3.75872802734375, -3.641693115234375, -3.524658203125, -3.407623291015625, -3.29058837890625, -3.173553466796875, -3.0565185546875, -2.939483642578125, -2.82244873046875, -2.705413818359375, -2.58837890625, -2.471343994140625, -2.35430908203125, -2.237274169921875, -2.1202392578125, -2.003204345703125, -1.88616943359375, -1.769134521484375, -1.652099609375, -1.535064697265625, -1.41802978515625, -1.300994873046875, -1.1839599609375, -1.066925048828125, -0.94989013671875, -0.832855224609375, -0.7158203125, -0.598785400390625, -0.48175048828125, -0.364715576171875, -0.2476806640625, -0.130645751953125, -0.01361083984375, 0.103424072265625, 0.220458984375, 0.337493896484375, 0.45452880859375, 0.571563720703125, 0.6885986328125, 0.805633544921875, 0.92266845703125, 1.039703369140625, 1.15673828125, 1.273773193359375, 1.39080810546875, 1.507843017578125, 1.6248779296875, 1.741912841796875, 1.85894775390625, 1.975982666015625, 2.093017578125, 2.210052490234375, 2.32708740234375, 2.444122314453125, 2.5611572265625, 2.678192138671875, 2.79522705078125, 2.912261962890625, 3.029296875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 7.0, 16.0, 22.0, 28.0, 58.0, 72.0, 94.0, 145.0, 225.0, 290.0, 456.0, 691.0, 917.0, 1422.0, 1965.0, 2951.0, 4023.0, 5814.0, 8666.0, 12424.0, 18592.0, 27952.0, 43040.0, 69962.0, 115558.0, 181873.0, 197081.0, 130305.0, 79765.0, 48647.0, 30906.0, 20249.0, 13717.0, 9458.0, 6453.0, 4591.0, 3148.0, 2161.0, 1481.0, 1026.0, 715.0, 527.0, 311.0, 245.0, 141.0, 130.0, 80.0, 46.0, 43.0, 29.0, 18.0, 9.0, 4.0, 5.0, 5.0, 1.0, 2.0], "bins": [-0.34521484375, -0.3347930908203125, -0.324371337890625, -0.3139495849609375, -0.30352783203125, -0.2931060791015625, -0.282684326171875, -0.2722625732421875, -0.2618408203125, -0.2514190673828125, -0.240997314453125, -0.2305755615234375, -0.22015380859375, -0.2097320556640625, -0.199310302734375, -0.1888885498046875, -0.178466796875, -0.1680450439453125, -0.157623291015625, -0.1472015380859375, -0.13677978515625, -0.1263580322265625, -0.115936279296875, -0.1055145263671875, -0.0950927734375, -0.0846710205078125, -0.074249267578125, -0.0638275146484375, -0.05340576171875, -0.0429840087890625, -0.032562255859375, -0.0221405029296875, -0.01171875, -0.0012969970703125, 0.009124755859375, 0.0195465087890625, 0.02996826171875, 0.0403900146484375, 0.050811767578125, 0.0612335205078125, 0.0716552734375, 0.0820770263671875, 0.092498779296875, 0.1029205322265625, 0.11334228515625, 0.1237640380859375, 0.134185791015625, 0.1446075439453125, 0.155029296875, 0.1654510498046875, 0.175872802734375, 0.1862945556640625, 0.19671630859375, 0.2071380615234375, 0.217559814453125, 0.2279815673828125, 0.2384033203125, 0.2488250732421875, 0.259246826171875, 0.2696685791015625, 0.28009033203125, 0.2905120849609375, 0.300933837890625, 0.3113555908203125, 0.32177734375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 4.0, 3.0, 9.0, 7.0, 9.0, 9.0, 13.0, 14.0, 12.0, 17.0, 21.0, 18.0, 21.0, 20.0, 40.0, 31.0, 47.0, 40.0, 34.0, 28.0, 39.0, 43.0, 1059.0, 32.0, 38.0, 30.0, 34.0, 28.0, 29.0, 33.0, 29.0, 31.0, 23.0, 33.0, 20.0, 19.0, 14.0, 13.0, 8.0, 12.0, 15.0, 11.0, 9.0, 5.0, 7.0, 3.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.921875, -1.8609466552734375, -1.800018310546875, -1.7390899658203125, -1.67816162109375, -1.6172332763671875, -1.556304931640625, -1.4953765869140625, -1.4344482421875, -1.3735198974609375, -1.312591552734375, -1.2516632080078125, -1.19073486328125, -1.1298065185546875, -1.068878173828125, -1.0079498291015625, -0.947021484375, -0.8860931396484375, -0.825164794921875, -0.7642364501953125, -0.70330810546875, -0.6423797607421875, -0.581451416015625, -0.5205230712890625, -0.4595947265625, -0.3986663818359375, -0.337738037109375, -0.2768096923828125, -0.21588134765625, -0.1549530029296875, -0.094024658203125, -0.0330963134765625, 0.02783203125, 0.0887603759765625, 0.149688720703125, 0.2106170654296875, 0.27154541015625, 0.3324737548828125, 0.393402099609375, 0.4543304443359375, 0.5152587890625, 0.5761871337890625, 0.637115478515625, 0.6980438232421875, 0.75897216796875, 0.8199005126953125, 0.880828857421875, 0.9417572021484375, 1.002685546875, 1.0636138916015625, 1.124542236328125, 1.1854705810546875, 1.24639892578125, 1.3073272705078125, 1.368255615234375, 1.4291839599609375, 1.4901123046875, 1.5510406494140625, 1.611968994140625, 1.6728973388671875, 1.73382568359375, 1.7947540283203125, 1.855682373046875, 1.9166107177734375, 1.9775390625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 11.0, 22.0, 37.0, 47.0, 80.0, 144.0, 205.0, 324.0, 516.0, 753.0, 1285.0, 1997.0, 3355.0, 5610.0, 9706.0, 16581.0, 30057.0, 54682.0, 103819.0, 202310.0, 1317646.0, 161382.0, 83147.0, 44288.0, 24668.0, 14073.0, 8179.0, 4827.0, 2867.0, 1652.0, 1050.0, 624.0, 433.0, 266.0, 168.0, 107.0, 63.0, 46.0, 27.0, 22.0, 14.0, 13.0, 6.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.41552734375, -0.4034233093261719, -0.39131927490234375, -0.3792152404785156, -0.3671112060546875, -0.3550071716308594, -0.34290313720703125, -0.3307991027832031, -0.318695068359375, -0.3065910339355469, -0.29448699951171875, -0.2823829650878906, -0.2702789306640625, -0.2581748962402344, -0.24607086181640625, -0.23396682739257812, -0.22186279296875, -0.20975875854492188, -0.19765472412109375, -0.18555068969726562, -0.1734466552734375, -0.16134262084960938, -0.14923858642578125, -0.13713455200195312, -0.125030517578125, -0.11292648315429688, -0.10082244873046875, -0.08871841430664062, -0.0766143798828125, -0.06451034545898438, -0.05240631103515625, -0.040302276611328125, -0.0281982421875, -0.016094207763671875, -0.00399017333984375, 0.008113861083984375, 0.0202178955078125, 0.032321929931640625, 0.04442596435546875, 0.056529998779296875, 0.068634033203125, 0.08073806762695312, 0.09284210205078125, 0.10494613647460938, 0.1170501708984375, 0.12915420532226562, 0.14125823974609375, 0.15336227416992188, 0.16546630859375, 0.17757034301757812, 0.18967437744140625, 0.20177841186523438, 0.2138824462890625, 0.22598648071289062, 0.23809051513671875, 0.2501945495605469, 0.262298583984375, 0.2744026184082031, 0.28650665283203125, 0.2986106872558594, 0.3107147216796875, 0.3228187561035156, 0.33492279052734375, 0.3470268249511719, 0.359130859375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 1.0, 4.0, 6.0, 13.0, 15.0, 20.0, 26.0, 40.0, 44.0, 58.0, 68.0, 87.0, 81.0, 84.0, 85.0, 57.0, 59.0, 50.0, 48.0, 34.0, 26.0, 19.0, 12.0, 13.0, 17.0, 6.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.001800537109375, -0.0017509311437606812, -0.0017013251781463623, -0.0016517192125320435, -0.0016021132469177246, -0.0015525072813034058, -0.001502901315689087, -0.001453295350074768, -0.0014036893844604492, -0.0013540834188461304, -0.0013044774532318115, -0.0012548714876174927, -0.0012052655220031738, -0.001155659556388855, -0.0011060535907745361, -0.0010564476251602173, -0.0010068416595458984, -0.0009572356939315796, -0.0009076297283172607, -0.0008580237627029419, -0.000808417797088623, -0.0007588118314743042, -0.0007092058658599854, -0.0006595999002456665, -0.0006099939346313477, -0.0005603879690170288, -0.00051078200340271, -0.0004611760377883911, -0.00041157007217407227, -0.0003619641065597534, -0.00031235814094543457, -0.0002627521753311157, -0.00021314620971679688, -0.00016354024410247803, -0.00011393427848815918, -6.432831287384033e-05, -1.4722347259521484e-05, 3.488361835479736e-05, 8.448958396911621e-05, 0.00013409554958343506, 0.0001837015151977539, 0.00023330748081207275, 0.0002829134464263916, 0.00033251941204071045, 0.0003821253776550293, 0.00043173134326934814, 0.000481337308883667, 0.0005309432744979858, 0.0005805492401123047, 0.0006301552057266235, 0.0006797611713409424, 0.0007293671369552612, 0.0007789731025695801, 0.0008285790681838989, 0.0008781850337982178, 0.0009277909994125366, 0.0009773969650268555, 0.0010270029306411743, 0.0010766088962554932, 0.001126214861869812, 0.0011758208274841309, 0.0012254267930984497, 0.0012750327587127686, 0.0013246387243270874, 0.0013742446899414062]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 1.0, 7.0, 8.0, 6.0, 11.0, 18.0, 23.0, 25.0, 37.0, 43.0, 73.0, 108.0, 156.0, 254.0, 618.0, 5978.0, 1036566.0, 3377.0, 548.0, 263.0, 143.0, 98.0, 55.0, 43.0, 28.0, 23.0, 11.0, 7.0, 3.0, 7.0, 3.0, 2.0, 8.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0294647216796875, -0.028391122817993164, -0.027317523956298828, -0.026243925094604492, -0.025170326232910156, -0.02409672737121582, -0.023023128509521484, -0.02194952964782715, -0.020875930786132812, -0.019802331924438477, -0.01872873306274414, -0.017655134201049805, -0.01658153533935547, -0.015507936477661133, -0.014434337615966797, -0.013360738754272461, -0.012287139892578125, -0.011213541030883789, -0.010139942169189453, -0.009066343307495117, -0.007992744445800781, -0.006919145584106445, -0.005845546722412109, -0.0047719478607177734, -0.0036983489990234375, -0.0026247501373291016, -0.0015511512756347656, -0.0004775524139404297, 0.0005960464477539062, 0.0016696453094482422, 0.002743244171142578, 0.003816843032836914, 0.00489044189453125, 0.005964040756225586, 0.007037639617919922, 0.008111238479614258, 0.009184837341308594, 0.01025843620300293, 0.011332035064697266, 0.012405633926391602, 0.013479232788085938, 0.014552831649780273, 0.01562643051147461, 0.016700029373168945, 0.01777362823486328, 0.018847227096557617, 0.019920825958251953, 0.02099442481994629, 0.022068023681640625, 0.02314162254333496, 0.024215221405029297, 0.025288820266723633, 0.02636241912841797, 0.027436017990112305, 0.02850961685180664, 0.029583215713500977, 0.030656814575195312, 0.03173041343688965, 0.032804012298583984, 0.03387761116027832, 0.034951210021972656, 0.03602480888366699, 0.03709840774536133, 0.038172006607055664, 0.03924560546875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 11.0, 56.0, 274.0, 409.0, 215.0, 44.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004250251222401857, -0.004160590935498476, -0.004070930648595095, -0.003981270361691713, -0.003891610074788332, -0.0038019500207155943, -0.003712289733812213, -0.0036226294469088316, -0.0035329691600054502, -0.003443308873102069, -0.0033536485861986876, -0.003263988299295306, -0.0031743282452225685, -0.003084667958319187, -0.002995007671415806, -0.0029053473845124245, -0.002815687097609043, -0.0027260268107056618, -0.0026363665238022804, -0.002546706236898899, -0.0024570459499955177, -0.00236738589592278, -0.0022777256090193987, -0.0021880653221160173, -0.002098405035212636, -0.0020087447483092546, -0.0019190844614058733, -0.0018294242909178138, -0.0017397640040144324, -0.001650103717111051, -0.0015604435466229916, -0.0014707832597196102, -0.0013811230892315507, -0.0012914628023281693, -0.0012018026318401098, -0.0011121423449367285, -0.0010224820580333471, -0.0009328217711299658, -0.0008431615424342453, -0.0007535013137385249, -0.0006638410268351436, -0.0005741807399317622, -0.0004845205112360418, -0.0003948602534364909, -0.00030519999563694, -0.0002155397378373891, -0.00012587948003783822, -3.6219251342117786e-05, 5.344103556126356e-05, 0.00014310129336081445, 0.00023276155116036534, 0.00032242180895991623, 0.0004120820667594671, 0.0005017423536628485, 0.0005914025823585689, 0.0006810628110542893, 0.0007707230979576707, 0.000860383384861052, 0.0009500436135567725, 0.001039703842252493, 0.0011293641291558743, 0.0012190244160592556, 0.001308684702962637, 0.0013983448734506965, 0.0014880051603540778]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 13.0, 12.0, 21.0, 11.0, 13.0, 22.0, 23.0, 30.0, 29.0, 31.0, 45.0, 39.0, 31.0, 38.0, 55.0, 37.0, 42.0, 42.0, 42.0, 45.0, 45.0, 38.0, 30.0, 40.0, 33.0, 29.0, 30.0, 22.0, 20.0, 15.0, 19.0, 12.0, 8.0, 12.0, 9.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0007501840591430664, -0.0007274607196450233, -0.0007047373801469803, -0.0006820140406489372, -0.0006592907011508942, -0.0006365673616528511, -0.000613844022154808, -0.000591120682656765, -0.0005683973431587219, -0.0005456740036606789, -0.0005229506641626358, -0.0005002273246645927, -0.0004775039851665497, -0.0004547806456685066, -0.00043205730617046356, -0.0004093339666724205, -0.00038661062717437744, -0.0003638872876763344, -0.0003411639481782913, -0.00031844060868024826, -0.0002957172691822052, -0.00027299392968416214, -0.0002502705901861191, -0.00022754725068807602, -0.00020482391119003296, -0.0001821005716919899, -0.00015937723219394684, -0.00013665389269590378, -0.00011393055319786072, -9.120721369981766e-05, -6.84838742017746e-05, -4.576053470373154e-05, -2.3037195205688477e-05, -3.1385570764541626e-07, 2.2409483790397644e-05, 4.5132823288440704e-05, 6.785616278648376e-05, 9.057950228452682e-05, 0.00011330284178256989, 0.00013602618128061295, 0.000158749520778656, 0.00018147286027669907, 0.00020419619977474213, 0.0002269195392727852, 0.00024964287877082825, 0.0002723662182688713, 0.00029508955776691437, 0.00031781289726495743, 0.0003405362367630005, 0.00036325957626104355, 0.0003859829157590866, 0.00040870625525712967, 0.00043142959475517273, 0.0004541529342532158, 0.00047687627375125885, 0.0004995996132493019, 0.000522322952747345, 0.000545046292245388, 0.0005677696317434311, 0.0005904929712414742, 0.0006132163107395172, 0.0006359396502375603, 0.0006586629897356033, 0.0006813863292336464, 0.0007041096687316895]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 1.0, 4.0, 6.0, 11.0, 12.0, 8.0, 18.0, 13.0, 19.0, 28.0, 38.0, 27.0, 29.0, 36.0, 46.0, 36.0, 45.0, 51.0, 58.0, 40.0, 46.0, 51.0, 38.0, 41.0, 33.0, 34.0, 30.0, 31.0, 37.0, 18.0, 25.0, 18.0, 11.0, 14.0, 7.0, 8.0, 10.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.4609375, -4.343902587890625, -4.22686767578125, -4.109832763671875, -3.9927978515625, -3.875762939453125, -3.75872802734375, -3.641693115234375, -3.524658203125, -3.407623291015625, -3.29058837890625, -3.173553466796875, -3.0565185546875, -2.939483642578125, -2.82244873046875, -2.705413818359375, -2.58837890625, -2.471343994140625, -2.35430908203125, -2.237274169921875, -2.1202392578125, -2.003204345703125, -1.88616943359375, -1.769134521484375, -1.652099609375, -1.535064697265625, -1.41802978515625, -1.300994873046875, -1.1839599609375, -1.066925048828125, -0.94989013671875, -0.832855224609375, -0.7158203125, -0.598785400390625, -0.48175048828125, -0.364715576171875, -0.2476806640625, -0.130645751953125, -0.01361083984375, 0.103424072265625, 0.220458984375, 0.337493896484375, 0.45452880859375, 0.571563720703125, 0.6885986328125, 0.805633544921875, 0.92266845703125, 1.039703369140625, 1.15673828125, 1.273773193359375, 1.39080810546875, 1.507843017578125, 1.6248779296875, 1.741912841796875, 1.85894775390625, 1.975982666015625, 2.093017578125, 2.210052490234375, 2.32708740234375, 2.444122314453125, 2.5611572265625, 2.678192138671875, 2.79522705078125, 2.912261962890625, 3.029296875]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 9.0, 10.0, 13.0, 14.0, 14.0, 32.0, 36.0, 37.0, 61.0, 83.0, 110.0, 162.0, 208.0, 307.0, 594.0, 1921.0, 8857.0, 43044.0, 317043.0, 573486.0, 81744.0, 15361.0, 3288.0, 840.0, 393.0, 233.0, 161.0, 125.0, 98.0, 65.0, 54.0, 34.0, 23.0, 16.0, 25.0, 16.0, 6.0, 8.0, 6.0, 7.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-8.0390625, -7.8284912109375, -7.617919921875, -7.4073486328125, -7.19677734375, -6.9862060546875, -6.775634765625, -6.5650634765625, -6.3544921875, -6.1439208984375, -5.933349609375, -5.7227783203125, -5.51220703125, -5.3016357421875, -5.091064453125, -4.8804931640625, -4.669921875, -4.4593505859375, -4.248779296875, -4.0382080078125, -3.82763671875, -3.6170654296875, -3.406494140625, -3.1959228515625, -2.9853515625, -2.7747802734375, -2.564208984375, -2.3536376953125, -2.14306640625, -1.9324951171875, -1.721923828125, -1.5113525390625, -1.30078125, -1.0902099609375, -0.879638671875, -0.6690673828125, -0.45849609375, -0.2479248046875, -0.037353515625, 0.1732177734375, 0.3837890625, 0.5943603515625, 0.804931640625, 1.0155029296875, 1.22607421875, 1.4366455078125, 1.647216796875, 1.8577880859375, 2.068359375, 2.2789306640625, 2.489501953125, 2.7000732421875, 2.91064453125, 3.1212158203125, 3.331787109375, 3.5423583984375, 3.7529296875, 3.9635009765625, 4.174072265625, 4.3846435546875, 4.59521484375, 4.8057861328125, 5.016357421875, 5.2269287109375, 5.4375]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 6.0, 10.0, 12.0, 12.0, 17.0, 17.0, 21.0, 16.0, 32.0, 30.0, 23.0, 23.0, 32.0, 38.0, 41.0, 56.0, 71.0, 182.0, 1515.0, 353.0, 104.0, 64.0, 37.0, 30.0, 41.0, 32.0, 33.0, 30.0, 29.0, 17.0, 21.0, 23.0, 9.0, 5.0, 8.0, 6.0, 10.0, 10.0, 3.0, 8.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0234375, -9.6759033203125, -9.328369140625, -8.9808349609375, -8.63330078125, -8.2857666015625, -7.938232421875, -7.5906982421875, -7.2431640625, -6.8956298828125, -6.548095703125, -6.2005615234375, -5.85302734375, -5.5054931640625, -5.157958984375, -4.8104248046875, -4.462890625, -4.1153564453125, -3.767822265625, -3.4202880859375, -3.07275390625, -2.7252197265625, -2.377685546875, -2.0301513671875, -1.6826171875, -1.3350830078125, -0.987548828125, -0.6400146484375, -0.29248046875, 0.0550537109375, 0.402587890625, 0.7501220703125, 1.09765625, 1.4451904296875, 1.792724609375, 2.1402587890625, 2.48779296875, 2.8353271484375, 3.182861328125, 3.5303955078125, 3.8779296875, 4.2254638671875, 4.572998046875, 4.9205322265625, 5.26806640625, 5.6156005859375, 5.963134765625, 6.3106689453125, 6.658203125, 7.0057373046875, 7.353271484375, 7.7008056640625, 8.04833984375, 8.3958740234375, 8.743408203125, 9.0909423828125, 9.4384765625, 9.7860107421875, 10.133544921875, 10.4810791015625, 10.82861328125, 11.1761474609375, 11.523681640625, 11.8712158203125, 12.21875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 10.0, 5.0, 14.0, 13.0, 10.0, 16.0, 15.0, 24.0, 20.0, 41.0, 48.0, 60.0, 73.0, 118.0, 172.0, 240.0, 476.0, 1417.0, 20831.0, 3072607.0, 46033.0, 1879.0, 592.0, 298.0, 165.0, 112.0, 84.0, 50.0, 56.0, 37.0, 36.0, 33.0, 16.0, 21.0, 15.0, 11.0, 14.0, 8.0, 5.0, 7.0, 4.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.6875, -24.8740234375, -24.060546875, -23.2470703125, -22.43359375, -21.6201171875, -20.806640625, -19.9931640625, -19.1796875, -18.3662109375, -17.552734375, -16.7392578125, -15.92578125, -15.1123046875, -14.298828125, -13.4853515625, -12.671875, -11.8583984375, -11.044921875, -10.2314453125, -9.41796875, -8.6044921875, -7.791015625, -6.9775390625, -6.1640625, -5.3505859375, -4.537109375, -3.7236328125, -2.91015625, -2.0966796875, -1.283203125, -0.4697265625, 0.34375, 1.1572265625, 1.970703125, 2.7841796875, 3.59765625, 4.4111328125, 5.224609375, 6.0380859375, 6.8515625, 7.6650390625, 8.478515625, 9.2919921875, 10.10546875, 10.9189453125, 11.732421875, 12.5458984375, 13.359375, 14.1728515625, 14.986328125, 15.7998046875, 16.61328125, 17.4267578125, 18.240234375, 19.0537109375, 19.8671875, 20.6806640625, 21.494140625, 22.3076171875, 23.12109375, 23.9345703125, 24.748046875, 25.5615234375, 26.375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 9.0, 24.0, 83.0, 177.0, 253.0, 223.0, 157.0, 54.0, 19.0, 9.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.79281234741211, -38.02808380126953, -37.26335525512695, -36.49863052368164, -35.73390197753906, -34.969173431396484, -34.204444885253906, -33.439720153808594, -32.674991607666016, -31.910263061523438, -31.145536422729492, -30.380807876586914, -29.61608123779297, -28.85135269165039, -28.086626052856445, -27.321897506713867, -26.557170867919922, -25.792442321777344, -25.0277156829834, -24.26298713684082, -23.498260498046875, -22.733531951904297, -21.96880531311035, -21.204076766967773, -20.439348220825195, -19.674619674682617, -18.909893035888672, -18.145164489746094, -17.38043785095215, -16.61570930480957, -15.850982666015625, -15.086254119873047, -14.321528434753418, -13.556800842285156, -12.792073249816895, -12.027345657348633, -11.262618064880371, -10.49789047241211, -9.733161926269531, -8.968435287475586, -8.203706741333008, -7.438979148864746, -6.674251556396484, -5.909523963928223, -5.144796371459961, -4.380068778991699, -3.6153407096862793, -2.8506131172180176, -2.085886001586914, -1.3211584091186523, -0.5564306974411011, 0.2082970142364502, 0.9730246067047119, 1.7377521991729736, 2.5024800300598145, 3.267207622528076, 4.031935214996338, 4.7966628074646, 5.561390399932861, 6.326118469238281, 7.090846061706543, 7.855573654174805, 8.620301246643066, 9.385028839111328, 10.14975643157959]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 7.0, 3.0, 3.0, 5.0, 4.0, 11.0, 7.0, 8.0, 9.0, 18.0, 18.0, 20.0, 19.0, 14.0, 22.0, 23.0, 22.0, 32.0, 38.0, 47.0, 26.0, 34.0, 44.0, 49.0, 31.0, 44.0, 45.0, 36.0, 37.0, 37.0, 31.0, 28.0, 31.0, 25.0, 23.0, 20.0, 21.0, 14.0, 24.0, 11.0, 7.0, 9.0, 11.0, 9.0, 10.0, 6.0, 6.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-23.435688018798828, -22.652280807495117, -21.868873596191406, -21.085464477539062, -20.30205726623535, -19.51865005493164, -18.73524284362793, -17.95183563232422, -17.168426513671875, -16.385019302368164, -15.601611137390137, -14.818203926086426, -14.034795761108398, -13.251388549804688, -12.467981338500977, -11.684574127197266, -10.901166915893555, -10.117759704589844, -9.334351539611816, -8.550944328308105, -7.767536640167236, -6.984128952026367, -6.200721740722656, -5.417314052581787, -4.633906364440918, -3.850498676300049, -3.067091226577759, -2.2836837768554688, -1.5002760887145996, -0.7168684005737305, 0.06653881072998047, 0.8499464988708496, 1.6333541870117188, 2.416761875152588, 3.200169324874878, 3.983576774597168, 4.766984462738037, 5.550392150878906, 6.333799362182617, 7.117207050323486, 7.9006147384643555, 8.684021949768066, 9.467430114746094, 10.250837326049805, 11.034244537353516, 11.817652702331543, 12.601059913635254, 13.384468078613281, 14.167875289916992, 14.951282501220703, 15.73469066619873, 16.518096923828125, 17.30150604248047, 18.08491325378418, 18.86832046508789, 19.6517276763916, 20.435134887695312, 21.218542098999023, 22.001949310302734, 22.785358428955078, 23.56876564025879, 24.3521728515625, 25.13558006286621, 25.918987274169922, 26.702396392822266]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 3.0, 4.0, 5.0, 3.0, 9.0, 4.0, 13.0, 15.0, 16.0, 17.0, 18.0, 27.0, 39.0, 24.0, 32.0, 45.0, 49.0, 56.0, 52.0, 46.0, 62.0, 48.0, 49.0, 32.0, 43.0, 39.0, 44.0, 42.0, 38.0, 23.0, 26.0, 16.0, 18.0, 13.0, 11.0, 9.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.07421875, -4.9346923828125, -4.795166015625, -4.6556396484375, -4.51611328125, -4.3765869140625, -4.237060546875, -4.0975341796875, -3.9580078125, -3.8184814453125, -3.678955078125, -3.5394287109375, -3.39990234375, -3.2603759765625, -3.120849609375, -2.9813232421875, -2.841796875, -2.7022705078125, -2.562744140625, -2.4232177734375, -2.28369140625, -2.1441650390625, -2.004638671875, -1.8651123046875, -1.7255859375, -1.5860595703125, -1.446533203125, -1.3070068359375, -1.16748046875, -1.0279541015625, -0.888427734375, -0.7489013671875, -0.609375, -0.4698486328125, -0.330322265625, -0.1907958984375, -0.05126953125, 0.0882568359375, 0.227783203125, 0.3673095703125, 0.5068359375, 0.6463623046875, 0.785888671875, 0.9254150390625, 1.06494140625, 1.2044677734375, 1.343994140625, 1.4835205078125, 1.623046875, 1.7625732421875, 1.902099609375, 2.0416259765625, 2.18115234375, 2.3206787109375, 2.460205078125, 2.5997314453125, 2.7392578125, 2.8787841796875, 3.018310546875, 3.1578369140625, 3.29736328125, 3.4368896484375, 3.576416015625, 3.7159423828125, 3.85546875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 4.0, 2.0, 9.0, 12.0, 16.0, 10.0, 15.0, 34.0, 31.0, 40.0, 49.0, 65.0, 90.0, 147.0, 368.0, 1603.0, 27088.0, 887211.0, 2946450.0, 319641.0, 9772.0, 882.0, 250.0, 122.0, 87.0, 69.0, 45.0, 42.0, 27.0, 19.0, 21.0, 17.0, 13.0, 11.0, 6.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.9921875, -10.689697265625, -10.38720703125, -10.084716796875, -9.7822265625, -9.479736328125, -9.17724609375, -8.874755859375, -8.572265625, -8.269775390625, -7.96728515625, -7.664794921875, -7.3623046875, -7.059814453125, -6.75732421875, -6.454833984375, -6.15234375, -5.849853515625, -5.54736328125, -5.244873046875, -4.9423828125, -4.639892578125, -4.33740234375, -4.034912109375, -3.732421875, -3.429931640625, -3.12744140625, -2.824951171875, -2.5224609375, -2.219970703125, -1.91748046875, -1.614990234375, -1.3125, -1.010009765625, -0.70751953125, -0.405029296875, -0.1025390625, 0.199951171875, 0.50244140625, 0.804931640625, 1.107421875, 1.409912109375, 1.71240234375, 2.014892578125, 2.3173828125, 2.619873046875, 2.92236328125, 3.224853515625, 3.52734375, 3.829833984375, 4.13232421875, 4.434814453125, 4.7373046875, 5.039794921875, 5.34228515625, 5.644775390625, 5.947265625, 6.249755859375, 6.55224609375, 6.854736328125, 7.1572265625, 7.459716796875, 7.76220703125, 8.064697265625, 8.3671875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 12.0, 11.0, 16.0, 19.0, 27.0, 23.0, 49.0, 66.0, 83.0, 118.0, 139.0, 195.0, 272.0, 308.0, 387.0, 429.0, 418.0, 346.0, 302.0, 190.0, 171.0, 114.0, 93.0, 81.0, 40.0, 50.0, 30.0, 18.0, 9.0, 11.0, 9.0, 11.0, 5.0, 3.0, 1.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.3359375, -6.16796875, -6.0, -5.83203125, -5.6640625, -5.49609375, -5.328125, -5.16015625, -4.9921875, -4.82421875, -4.65625, -4.48828125, -4.3203125, -4.15234375, -3.984375, -3.81640625, -3.6484375, -3.48046875, -3.3125, -3.14453125, -2.9765625, -2.80859375, -2.640625, -2.47265625, -2.3046875, -2.13671875, -1.96875, -1.80078125, -1.6328125, -1.46484375, -1.296875, -1.12890625, -0.9609375, -0.79296875, -0.625, -0.45703125, -0.2890625, -0.12109375, 0.046875, 0.21484375, 0.3828125, 0.55078125, 0.71875, 0.88671875, 1.0546875, 1.22265625, 1.390625, 1.55859375, 1.7265625, 1.89453125, 2.0625, 2.23046875, 2.3984375, 2.56640625, 2.734375, 2.90234375, 3.0703125, 3.23828125, 3.40625, 3.57421875, 3.7421875, 3.91015625, 4.078125, 4.24609375, 4.4140625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 4.0, 6.0, 12.0, 15.0, 16.0, 23.0, 30.0, 54.0, 71.0, 89.0, 144.0, 183.0, 273.0, 330.0, 597.0, 1472.0, 7947.0, 133455.0, 2928841.0, 1076976.0, 37774.0, 3305.0, 1003.0, 501.0, 331.0, 237.0, 158.0, 112.0, 87.0, 68.0, 46.0, 31.0, 28.0, 20.0, 11.0, 9.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.765625, -10.3638916015625, -9.962158203125, -9.5604248046875, -9.15869140625, -8.7569580078125, -8.355224609375, -7.9534912109375, -7.5517578125, -7.1500244140625, -6.748291015625, -6.3465576171875, -5.94482421875, -5.5430908203125, -5.141357421875, -4.7396240234375, -4.337890625, -3.9361572265625, -3.534423828125, -3.1326904296875, -2.73095703125, -2.3292236328125, -1.927490234375, -1.5257568359375, -1.1240234375, -0.7222900390625, -0.320556640625, 0.0811767578125, 0.48291015625, 0.8846435546875, 1.286376953125, 1.6881103515625, 2.08984375, 2.4915771484375, 2.893310546875, 3.2950439453125, 3.69677734375, 4.0985107421875, 4.500244140625, 4.9019775390625, 5.3037109375, 5.7054443359375, 6.107177734375, 6.5089111328125, 6.91064453125, 7.3123779296875, 7.714111328125, 8.1158447265625, 8.517578125, 8.9193115234375, 9.321044921875, 9.7227783203125, 10.12451171875, 10.5262451171875, 10.927978515625, 11.3297119140625, 11.7314453125, 12.1331787109375, 12.534912109375, 12.9366455078125, 13.33837890625, 13.7401123046875, 14.141845703125, 14.5435791015625, 14.9453125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 12.0, 37.0, 118.0, 180.0, 223.0, 221.0, 133.0, 57.0, 25.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.236835479736328, -28.908466339111328, -27.580097198486328, -26.251728057861328, -24.923358917236328, -23.594989776611328, -22.266620635986328, -20.938251495361328, -19.609882354736328, -18.281513214111328, -16.953144073486328, -15.624774932861328, -14.296405792236328, -12.968036651611328, -11.639667510986328, -10.311298370361328, -8.982929229736328, -7.654560089111328, -6.326190948486328, -4.997821807861328, -3.669452667236328, -2.341083526611328, -1.0127143859863281, 0.3156547546386719, 1.6440238952636719, 2.972393035888672, 4.300762176513672, 5.629131317138672, 6.957500457763672, 8.285869598388672, 9.614238739013672, 10.942607879638672, 12.270973205566406, 13.599342346191406, 14.927711486816406, 16.256080627441406, 17.584449768066406, 18.912818908691406, 20.241188049316406, 21.569557189941406, 22.897926330566406, 24.226295471191406, 25.554664611816406, 26.883033752441406, 28.211402893066406, 29.539772033691406, 30.868141174316406, 32.196510314941406, 33.524879455566406, 34.853248596191406, 36.181617736816406, 37.509986877441406, 38.838356018066406, 40.166725158691406, 41.495094299316406, 42.823463439941406, 44.151832580566406, 45.480201721191406, 46.808570861816406, 48.136940002441406, 49.465309143066406, 50.793678283691406, 52.122047424316406, 53.450416564941406, 54.778785705566406]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 10.0, 5.0, 14.0, 21.0, 12.0, 17.0, 25.0, 24.0, 27.0, 35.0, 33.0, 32.0, 38.0, 34.0, 49.0, 46.0, 50.0, 48.0, 46.0, 47.0, 42.0, 42.0, 32.0, 23.0, 38.0, 34.0, 40.0, 35.0, 16.0, 20.0, 13.0, 16.0, 10.0, 4.0, 4.0, 6.0, 8.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.979721069335938, -19.31089210510254, -18.64206314086914, -17.973234176635742, -17.304405212402344, -16.635576248168945, -15.966747283935547, -15.297918319702148, -14.62908935546875, -13.960260391235352, -13.291431427001953, -12.622602462768555, -11.953773498535156, -11.284944534301758, -10.61611557006836, -9.947286605834961, -9.278457641601562, -8.609628677368164, -7.940799713134766, -7.271970748901367, -6.603141784667969, -5.93431282043457, -5.265483856201172, -4.596654891967773, -3.927825927734375, -3.2589969635009766, -2.590167999267578, -1.9213390350341797, -1.2525100708007812, -0.5836811065673828, 0.08514785766601562, 0.7539768218994141, 1.4228057861328125, 2.091634750366211, 2.7604637145996094, 3.429292678833008, 4.098121643066406, 4.766950607299805, 5.435779571533203, 6.104608535766602, 6.7734375, 7.442266464233398, 8.111095428466797, 8.779924392700195, 9.448753356933594, 10.117582321166992, 10.78641128540039, 11.455240249633789, 12.124069213867188, 12.792898178100586, 13.461727142333984, 14.130556106567383, 14.799385070800781, 15.46821403503418, 16.137042999267578, 16.805871963500977, 17.474700927734375, 18.143529891967773, 18.812358856201172, 19.48118782043457, 20.15001678466797, 20.818845748901367, 21.487674713134766, 22.156503677368164, 22.825332641601562]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 8.0, 1.0, 9.0, 14.0, 13.0, 13.0, 31.0, 14.0, 24.0, 23.0, 25.0, 41.0, 38.0, 28.0, 36.0, 48.0, 33.0, 42.0, 37.0, 49.0, 38.0, 46.0, 37.0, 36.0, 29.0, 45.0, 34.0, 30.0, 25.0, 22.0, 20.0, 22.0, 19.0, 12.0, 13.0, 12.0, 7.0, 4.0, 10.0, 1.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.958984375, -3.84307861328125, -3.7271728515625, -3.61126708984375, -3.495361328125, -3.37945556640625, -3.2635498046875, -3.14764404296875, -3.03173828125, -2.91583251953125, -2.7999267578125, -2.68402099609375, -2.568115234375, -2.45220947265625, -2.3363037109375, -2.22039794921875, -2.1044921875, -1.98858642578125, -1.8726806640625, -1.75677490234375, -1.640869140625, -1.52496337890625, -1.4090576171875, -1.29315185546875, -1.17724609375, -1.06134033203125, -0.9454345703125, -0.82952880859375, -0.713623046875, -0.59771728515625, -0.4818115234375, -0.36590576171875, -0.25, -0.13409423828125, -0.0181884765625, 0.09771728515625, 0.213623046875, 0.32952880859375, 0.4454345703125, 0.56134033203125, 0.67724609375, 0.79315185546875, 0.9090576171875, 1.02496337890625, 1.140869140625, 1.25677490234375, 1.3726806640625, 1.48858642578125, 1.6044921875, 1.72039794921875, 1.8363037109375, 1.95220947265625, 2.068115234375, 2.18402099609375, 2.2999267578125, 2.41583251953125, 2.53173828125, 2.64764404296875, 2.7635498046875, 2.87945556640625, 2.995361328125, 3.11126708984375, 3.2271728515625, 3.34307861328125, 3.458984375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 8.0, 5.0, 8.0, 25.0, 19.0, 27.0, 70.0, 76.0, 108.0, 175.0, 256.0, 360.0, 506.0, 734.0, 1133.0, 1585.0, 2318.0, 3606.0, 5367.0, 7956.0, 12431.0, 19265.0, 30791.0, 50382.0, 86115.0, 151602.0, 224592.0, 181484.0, 105328.0, 60777.0, 36482.0, 22478.0, 14309.0, 9279.0, 6057.0, 4119.0, 2761.0, 1872.0, 1307.0, 865.0, 617.0, 431.0, 250.0, 185.0, 136.0, 94.0, 57.0, 51.0, 33.0, 18.0, 17.0, 13.0, 7.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.370849609375, -0.3587608337402344, -0.34667205810546875, -0.3345832824707031, -0.3224945068359375, -0.3104057312011719, -0.29831695556640625, -0.2862281799316406, -0.274139404296875, -0.2620506286621094, -0.24996185302734375, -0.23787307739257812, -0.2257843017578125, -0.21369552612304688, -0.20160675048828125, -0.18951797485351562, -0.17742919921875, -0.16534042358398438, -0.15325164794921875, -0.14116287231445312, -0.1290740966796875, -0.11698532104492188, -0.10489654541015625, -0.09280776977539062, -0.080718994140625, -0.06863021850585938, -0.05654144287109375, -0.044452667236328125, -0.0323638916015625, -0.020275115966796875, -0.00818634033203125, 0.003902435302734375, 0.0159912109375, 0.028079986572265625, 0.04016876220703125, 0.052257537841796875, 0.0643463134765625, 0.07643508911132812, 0.08852386474609375, 0.10061264038085938, 0.112701416015625, 0.12479019165039062, 0.13687896728515625, 0.14896774291992188, 0.1610565185546875, 0.17314529418945312, 0.18523406982421875, 0.19732284545898438, 0.20941162109375, 0.22150039672851562, 0.23358917236328125, 0.24567794799804688, 0.2577667236328125, 0.2698554992675781, 0.28194427490234375, 0.2940330505371094, 0.306121826171875, 0.3182106018066406, 0.33029937744140625, 0.3423881530761719, 0.3544769287109375, 0.3665657043457031, 0.37865447998046875, 0.3907432556152344, 0.40283203125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 0.0, 4.0, 5.0, 7.0, 8.0, 8.0, 10.0, 14.0, 19.0, 19.0, 14.0, 23.0, 17.0, 35.0, 28.0, 29.0, 23.0, 42.0, 27.0, 35.0, 39.0, 36.0, 37.0, 1072.0, 40.0, 45.0, 29.0, 32.0, 29.0, 30.0, 30.0, 31.0, 24.0, 35.0, 16.0, 21.0, 20.0, 17.0, 15.0, 9.0, 14.0, 15.0, 4.0, 5.0, 9.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.14453125, -2.07452392578125, -2.0045166015625, -1.93450927734375, -1.864501953125, -1.79449462890625, -1.7244873046875, -1.65447998046875, -1.58447265625, -1.51446533203125, -1.4444580078125, -1.37445068359375, -1.304443359375, -1.23443603515625, -1.1644287109375, -1.09442138671875, -1.0244140625, -0.95440673828125, -0.8843994140625, -0.81439208984375, -0.744384765625, -0.67437744140625, -0.6043701171875, -0.53436279296875, -0.46435546875, -0.39434814453125, -0.3243408203125, -0.25433349609375, -0.184326171875, -0.11431884765625, -0.0443115234375, 0.02569580078125, 0.095703125, 0.16571044921875, 0.2357177734375, 0.30572509765625, 0.375732421875, 0.44573974609375, 0.5157470703125, 0.58575439453125, 0.65576171875, 0.72576904296875, 0.7957763671875, 0.86578369140625, 0.935791015625, 1.00579833984375, 1.0758056640625, 1.14581298828125, 1.2158203125, 1.28582763671875, 1.3558349609375, 1.42584228515625, 1.495849609375, 1.56585693359375, 1.6358642578125, 1.70587158203125, 1.77587890625, 1.84588623046875, 1.9158935546875, 1.98590087890625, 2.055908203125, 2.12591552734375, 2.1959228515625, 2.26593017578125, 2.3359375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 7.0, 7.0, 10.0, 19.0, 20.0, 46.0, 85.0, 89.0, 129.0, 195.0, 325.0, 459.0, 702.0, 1079.0, 1651.0, 2511.0, 3838.0, 6064.0, 9583.0, 15222.0, 25384.0, 43534.0, 76374.0, 139115.0, 1278204.0, 211194.0, 118201.0, 65738.0, 37937.0, 22306.0, 13555.0, 8365.0, 5220.0, 3367.0, 2162.0, 1477.0, 983.0, 626.0, 435.0, 303.0, 210.0, 130.0, 91.0, 53.0, 39.0, 31.0, 21.0, 26.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.376220703125, -0.3651123046875, -0.35400390625, -0.3428955078125, -0.331787109375, -0.3206787109375, -0.3095703125, -0.2984619140625, -0.287353515625, -0.2762451171875, -0.26513671875, -0.2540283203125, -0.242919921875, -0.2318115234375, -0.220703125, -0.2095947265625, -0.198486328125, -0.1873779296875, -0.17626953125, -0.1651611328125, -0.154052734375, -0.1429443359375, -0.1318359375, -0.1207275390625, -0.109619140625, -0.0985107421875, -0.08740234375, -0.0762939453125, -0.065185546875, -0.0540771484375, -0.04296875, -0.0318603515625, -0.020751953125, -0.0096435546875, 0.00146484375, 0.0125732421875, 0.023681640625, 0.0347900390625, 0.0458984375, 0.0570068359375, 0.068115234375, 0.0792236328125, 0.09033203125, 0.1014404296875, 0.112548828125, 0.1236572265625, 0.134765625, 0.1458740234375, 0.156982421875, 0.1680908203125, 0.17919921875, 0.1903076171875, 0.201416015625, 0.2125244140625, 0.2236328125, 0.2347412109375, 0.245849609375, 0.2569580078125, 0.26806640625, 0.2791748046875, 0.290283203125, 0.3013916015625, 0.3125, 0.3236083984375, 0.334716796875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 1.0, 4.0, 2.0, 0.0, 1.0, 5.0, 5.0, 5.0, 7.0, 6.0, 10.0, 11.0, 13.0, 20.0, 18.0, 37.0, 38.0, 47.0, 60.0, 89.0, 84.0, 79.0, 86.0, 71.0, 66.0, 53.0, 43.0, 27.0, 26.0, 18.0, 12.0, 14.0, 14.0, 8.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013608932495117188, -0.0013131499290466309, -0.001265406608581543, -0.001217663288116455, -0.0011699199676513672, -0.0011221766471862793, -0.0010744333267211914, -0.0010266900062561035, -0.0009789466857910156, -0.0009312033653259277, -0.0008834600448608398, -0.000835716724395752, -0.0007879734039306641, -0.0007402300834655762, -0.0006924867630004883, -0.0006447434425354004, -0.0005970001220703125, -0.0005492568016052246, -0.0005015134811401367, -0.00045377016067504883, -0.00040602684020996094, -0.00035828351974487305, -0.00031054019927978516, -0.00026279687881469727, -0.00021505355834960938, -0.00016731023788452148, -0.0001195669174194336, -7.18235969543457e-05, -2.4080276489257812e-05, 2.3663043975830078e-05, 7.140636444091797e-05, 0.00011914968490600586, 0.00016689300537109375, 0.00021463632583618164, 0.00026237964630126953, 0.0003101229667663574, 0.0003578662872314453, 0.0004056096076965332, 0.0004533529281616211, 0.000501096248626709, 0.0005488395690917969, 0.0005965828895568848, 0.0006443262100219727, 0.0006920695304870605, 0.0007398128509521484, 0.0007875561714172363, 0.0008352994918823242, 0.0008830428123474121, 0.0009307861328125, 0.0009785294532775879, 0.0010262727737426758, 0.0010740160942077637, 0.0011217594146728516, 0.0011695027351379395, 0.0012172460556030273, 0.0012649893760681152, 0.0013127326965332031, 0.001360476016998291, 0.001408219337463379, 0.0014559626579284668, 0.0015037059783935547, 0.0015514492988586426, 0.0015991926193237305, 0.0016469359397888184, 0.0016946792602539062]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 12.0, 10.0, 11.0, 15.0, 31.0, 24.0, 51.0, 47.0, 91.0, 122.0, 202.0, 370.0, 821.0, 26696.0, 1016323.0, 2344.0, 538.0, 278.0, 164.0, 111.0, 75.0, 40.0, 28.0, 31.0, 26.0, 11.0, 11.0, 8.0, 11.0, 6.0, 6.0, 8.0, 1.0, 5.0, 4.0, 0.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.034088134765625, -0.03312230110168457, -0.03215646743774414, -0.03119063377380371, -0.03022480010986328, -0.02925896644592285, -0.028293132781982422, -0.027327299118041992, -0.026361465454101562, -0.025395631790161133, -0.024429798126220703, -0.023463964462280273, -0.022498130798339844, -0.021532297134399414, -0.020566463470458984, -0.019600629806518555, -0.018634796142578125, -0.017668962478637695, -0.016703128814697266, -0.015737295150756836, -0.014771461486816406, -0.013805627822875977, -0.012839794158935547, -0.011873960494995117, -0.010908126831054688, -0.009942293167114258, -0.008976459503173828, -0.008010625839233398, -0.007044792175292969, -0.006078958511352539, -0.005113124847412109, -0.00414729118347168, -0.00318145751953125, -0.0022156238555908203, -0.0012497901916503906, -0.00028395652770996094, 0.0006818771362304688, 0.0016477108001708984, 0.002613544464111328, 0.003579378128051758, 0.0045452117919921875, 0.005511045455932617, 0.006476879119873047, 0.0074427127838134766, 0.008408546447753906, 0.009374380111694336, 0.010340213775634766, 0.011306047439575195, 0.012271881103515625, 0.013237714767456055, 0.014203548431396484, 0.015169382095336914, 0.016135215759277344, 0.017101049423217773, 0.018066883087158203, 0.019032716751098633, 0.019998550415039062, 0.020964384078979492, 0.021930217742919922, 0.02289605140686035, 0.02386188507080078, 0.02482771873474121, 0.02579355239868164, 0.02675938606262207, 0.0277252197265625]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 159.0, 706.0, 142.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.00998278521001339, -0.00981210544705391, -0.009641426615417004, -0.009470746852457523, -0.009300067089498043, -0.009129387326538563, -0.008958708494901657, -0.008788028731942177, -0.008617348968982697, -0.008446669206023216, -0.00827599037438631, -0.00810531061142683, -0.00793463084846735, -0.007763951551169157, -0.007593271788209677, -0.007422592490911484, -0.0072519127279520035, -0.0070812334306538105, -0.00691055366769433, -0.006739874370396137, -0.006569194607436657, -0.006398515310138464, -0.006227835547178984, -0.006057156249880791, -0.005886476952582598, -0.005715797655284405, -0.0055451178923249245, -0.0053744385950267315, -0.005203758832067251, -0.005033079534769058, -0.004862399771809578, -0.004691720474511385, -0.004521040245890617, -0.004350360948592424, -0.004179681185632944, -0.004009001888334751, -0.003838322125375271, -0.003667642595246434, -0.0034969630651175976, -0.0033262837678194046, -0.0031556044705212116, -0.002984924940392375, -0.0028142454102635384, -0.0026435658801347017, -0.002472886350005865, -0.0023022068198770285, -0.002131527289748192, -0.001960847992449999, -0.0017901682294905186, -0.001619488699361682, -0.0014488091692328453, -0.0012781296391040087, -0.001107450108975172, -0.0009367706370539963, -0.0007660911651328206, -0.000595411635003984, -0.00042473210487514734, -0.0002540525747463107, -8.337307372130454e-05, 8.730642730370164e-05, 0.00025798595743253827, 0.0004286654875613749, 0.0005993449594825506, 0.0007700244896113873, 0.0009407040197402239]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 5.0, 2.0, 5.0, 4.0, 3.0, 8.0, 8.0, 9.0, 12.0, 11.0, 19.0, 20.0, 23.0, 24.0, 20.0, 23.0, 35.0, 24.0, 42.0, 37.0, 38.0, 38.0, 45.0, 33.0, 48.0, 37.0, 38.0, 49.0, 32.0, 40.0, 35.0, 26.0, 26.0, 29.0, 18.0, 20.0, 18.0, 16.0, 17.0, 15.0, 11.0, 10.0, 12.0, 5.0, 6.0, 3.0, 6.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0006582736968994141, -0.0006378619000315666, -0.0006174501031637192, -0.0005970383062958717, -0.0005766265094280243, -0.0005562147125601768, -0.0005358029156923294, -0.000515391118824482, -0.0004949793219566345, -0.0004745675250887871, -0.00045415572822093964, -0.0004337439313530922, -0.00041333213448524475, -0.0003929203376173973, -0.00037250854074954987, -0.0003520967438817024, -0.000331684947013855, -0.00031127315014600754, -0.0002908613532781601, -0.00027044955641031265, -0.0002500377595424652, -0.00022962596267461777, -0.00020921416580677032, -0.00018880236893892288, -0.00016839057207107544, -0.000147978775203228, -0.00012756697833538055, -0.00010715518146753311, -8.674338459968567e-05, -6.633158773183823e-05, -4.5919790863990784e-05, -2.550799399614334e-05, -5.0961971282958984e-06, 1.5315599739551544e-05, 3.572739660739899e-05, 5.613919347524643e-05, 7.655099034309387e-05, 9.696278721094131e-05, 0.00011737458407878876, 0.0001377863809466362, 0.00015819817781448364, 0.00017860997468233109, 0.00019902177155017853, 0.00021943356841802597, 0.0002398453652858734, 0.00026025716215372086, 0.0002806689590215683, 0.00030108075588941574, 0.0003214925527572632, 0.0003419043496251106, 0.00036231614649295807, 0.0003827279433608055, 0.00040313974022865295, 0.0004235515370965004, 0.00044396333396434784, 0.0004643751308321953, 0.0004847869277000427, 0.0005051987245678902, 0.0005256105214357376, 0.000546022318303585, 0.0005664341151714325, 0.0005868459120392799, 0.0006072577089071274, 0.0006276695057749748, 0.0006480813026428223]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 8.0, 1.0, 9.0, 14.0, 13.0, 13.0, 31.0, 14.0, 24.0, 23.0, 25.0, 41.0, 38.0, 28.0, 36.0, 48.0, 33.0, 42.0, 37.0, 49.0, 38.0, 45.0, 38.0, 36.0, 29.0, 45.0, 34.0, 30.0, 25.0, 22.0, 20.0, 22.0, 19.0, 12.0, 13.0, 12.0, 7.0, 4.0, 10.0, 1.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.958984375, -3.84307861328125, -3.7271728515625, -3.61126708984375, -3.495361328125, -3.37945556640625, -3.2635498046875, -3.14764404296875, -3.03173828125, -2.91583251953125, -2.7999267578125, -2.68402099609375, -2.568115234375, -2.45220947265625, -2.3363037109375, -2.22039794921875, -2.1044921875, -1.98858642578125, -1.8726806640625, -1.75677490234375, -1.640869140625, -1.52496337890625, -1.4090576171875, -1.29315185546875, -1.17724609375, -1.06134033203125, -0.9454345703125, -0.82952880859375, -0.713623046875, -0.59771728515625, -0.4818115234375, -0.36590576171875, -0.25, -0.13409423828125, -0.0181884765625, 0.09771728515625, 0.213623046875, 0.32952880859375, 0.4454345703125, 0.56134033203125, 0.67724609375, 0.79315185546875, 0.9090576171875, 1.02496337890625, 1.140869140625, 1.25677490234375, 1.3726806640625, 1.48858642578125, 1.6044921875, 1.72039794921875, 1.8363037109375, 1.95220947265625, 2.068115234375, 2.18402099609375, 2.2999267578125, 2.41583251953125, 2.53173828125, 2.64764404296875, 2.7635498046875, 2.87945556640625, 2.995361328125, 3.11126708984375, 3.2271728515625, 3.34307861328125, 3.458984375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 6.0, 8.0, 6.0, 10.0, 11.0, 12.0, 18.0, 29.0, 39.0, 65.0, 66.0, 101.0, 118.0, 176.0, 249.0, 344.0, 434.0, 675.0, 1351.0, 4172.0, 20602.0, 155244.0, 764980.0, 80845.0, 12870.0, 2876.0, 1091.0, 584.0, 441.0, 292.0, 233.0, 134.0, 110.0, 93.0, 65.0, 51.0, 46.0, 28.0, 22.0, 18.0, 11.0, 4.0, 11.0, 4.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.0, -9.708984375, -9.41796875, -9.126953125, -8.8359375, -8.544921875, -8.25390625, -7.962890625, -7.671875, -7.380859375, -7.08984375, -6.798828125, -6.5078125, -6.216796875, -5.92578125, -5.634765625, -5.34375, -5.052734375, -4.76171875, -4.470703125, -4.1796875, -3.888671875, -3.59765625, -3.306640625, -3.015625, -2.724609375, -2.43359375, -2.142578125, -1.8515625, -1.560546875, -1.26953125, -0.978515625, -0.6875, -0.396484375, -0.10546875, 0.185546875, 0.4765625, 0.767578125, 1.05859375, 1.349609375, 1.640625, 1.931640625, 2.22265625, 2.513671875, 2.8046875, 3.095703125, 3.38671875, 3.677734375, 3.96875, 4.259765625, 4.55078125, 4.841796875, 5.1328125, 5.423828125, 5.71484375, 6.005859375, 6.296875, 6.587890625, 6.87890625, 7.169921875, 7.4609375, 7.751953125, 8.04296875, 8.333984375, 8.625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 7.0, 3.0, 14.0, 16.0, 15.0, 18.0, 22.0, 16.0, 29.0, 32.0, 32.0, 42.0, 44.0, 50.0, 46.0, 64.0, 129.0, 367.0, 1508.0, 151.0, 79.0, 56.0, 49.0, 47.0, 37.0, 27.0, 31.0, 22.0, 16.0, 18.0, 11.0, 12.0, 10.0, 9.0, 10.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8359375, -12.4364013671875, -12.036865234375, -11.6373291015625, -11.23779296875, -10.8382568359375, -10.438720703125, -10.0391845703125, -9.6396484375, -9.2401123046875, -8.840576171875, -8.4410400390625, -8.04150390625, -7.6419677734375, -7.242431640625, -6.8428955078125, -6.443359375, -6.0438232421875, -5.644287109375, -5.2447509765625, -4.84521484375, -4.4456787109375, -4.046142578125, -3.6466064453125, -3.2470703125, -2.8475341796875, -2.447998046875, -2.0484619140625, -1.64892578125, -1.2493896484375, -0.849853515625, -0.4503173828125, -0.05078125, 0.3487548828125, 0.748291015625, 1.1478271484375, 1.54736328125, 1.9468994140625, 2.346435546875, 2.7459716796875, 3.1455078125, 3.5450439453125, 3.944580078125, 4.3441162109375, 4.74365234375, 5.1431884765625, 5.542724609375, 5.9422607421875, 6.341796875, 6.7413330078125, 7.140869140625, 7.5404052734375, 7.93994140625, 8.3394775390625, 8.739013671875, 9.1385498046875, 9.5380859375, 9.9376220703125, 10.337158203125, 10.7366943359375, 11.13623046875, 11.5357666015625, 11.935302734375, 12.3348388671875, 12.734375]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 10.0, 6.0, 13.0, 11.0, 17.0, 17.0, 17.0, 23.0, 29.0, 43.0, 50.0, 75.0, 106.0, 173.0, 287.0, 588.0, 2416.0, 90797.0, 3039312.0, 9318.0, 1192.0, 406.0, 211.0, 146.0, 100.0, 72.0, 43.0, 42.0, 36.0, 31.0, 20.0, 15.0, 15.0, 20.0, 18.0, 10.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.125, -33.09912109375, -32.0732421875, -31.04736328125, -30.021484375, -28.99560546875, -27.9697265625, -26.94384765625, -25.91796875, -24.89208984375, -23.8662109375, -22.84033203125, -21.814453125, -20.78857421875, -19.7626953125, -18.73681640625, -17.7109375, -16.68505859375, -15.6591796875, -14.63330078125, -13.607421875, -12.58154296875, -11.5556640625, -10.52978515625, -9.50390625, -8.47802734375, -7.4521484375, -6.42626953125, -5.400390625, -4.37451171875, -3.3486328125, -2.32275390625, -1.296875, -0.27099609375, 0.7548828125, 1.78076171875, 2.806640625, 3.83251953125, 4.8583984375, 5.88427734375, 6.91015625, 7.93603515625, 8.9619140625, 9.98779296875, 11.013671875, 12.03955078125, 13.0654296875, 14.09130859375, 15.1171875, 16.14306640625, 17.1689453125, 18.19482421875, 19.220703125, 20.24658203125, 21.2724609375, 22.29833984375, 23.32421875, 24.35009765625, 25.3759765625, 26.40185546875, 27.427734375, 28.45361328125, 29.4794921875, 30.50537109375, 31.53125]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 61.0, 278.0, 421.0, 200.0, 41.0, 7.0], "bins": [-79.4412612915039, -78.12487030029297, -76.80847930908203, -75.4920883178711, -74.17569732666016, -72.85929870605469, -71.54290771484375, -70.22651672363281, -68.91012573242188, -67.59373474121094, -66.27734375, -64.96095275878906, -63.64455795288086, -62.32816696166992, -61.011775970458984, -59.69538497924805, -58.37899398803711, -57.06260299682617, -55.746212005615234, -54.42981719970703, -53.113426208496094, -51.797035217285156, -50.48064422607422, -49.16425323486328, -47.847862243652344, -46.531471252441406, -45.21508026123047, -43.898685455322266, -42.58229446411133, -41.26590347290039, -39.94951248168945, -38.633121490478516, -37.31672668457031, -36.000335693359375, -34.68394470214844, -33.367549896240234, -32.0511589050293, -30.73476791381836, -29.418376922607422, -28.101985931396484, -26.785593032836914, -25.469202041625977, -24.152809143066406, -22.83641815185547, -21.52002716064453, -20.20363426208496, -18.887243270874023, -17.570850372314453, -16.254459381103516, -14.938067436218262, -13.621675491333008, -12.30528450012207, -10.988892555236816, -9.672500610351562, -8.356109619140625, -7.039717674255371, -5.723326206207275, -4.40693473815918, -3.090542793273926, -1.774151086807251, -0.45775938034057617, 0.8586325645446777, 2.1750240325927734, 3.491415500640869, 4.807807445526123]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 8.0, 4.0, 6.0, 9.0, 7.0, 11.0, 11.0, 12.0, 19.0, 18.0, 19.0, 24.0, 29.0, 31.0, 38.0, 40.0, 35.0, 40.0, 40.0, 42.0, 39.0, 39.0, 45.0, 42.0, 35.0, 44.0, 44.0, 30.0, 30.0, 42.0, 28.0, 18.0, 17.0, 19.0, 15.0, 20.0, 14.0, 10.0, 8.0, 11.0, 5.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.759864807128906, -26.878202438354492, -25.996538162231445, -25.11487579345703, -24.233213424682617, -23.351551055908203, -22.469886779785156, -21.588224411010742, -20.706562042236328, -19.824899673461914, -18.943235397338867, -18.061573028564453, -17.17991065979004, -16.298248291015625, -15.416584014892578, -14.534921646118164, -13.653257369995117, -12.771594047546387, -11.889931678771973, -11.008268356323242, -10.126605987548828, -9.244942665100098, -8.363279342651367, -7.481616497039795, -6.599953651428223, -5.71829080581665, -4.836627960205078, -3.9549646377563477, -3.0733017921447754, -2.191638946533203, -1.3099756240844727, -0.4283127784729004, 0.4533500671386719, 1.3350130319595337, 2.2166759967803955, 3.098339080810547, 3.980001926422119, 4.861664772033691, 5.743328094482422, 6.624990940093994, 7.506653785705566, 8.388317108154297, 9.269979476928711, 10.151642799377441, 11.033306121826172, 11.914968490600586, 12.796631813049316, 13.678295135498047, 14.559957504272461, 15.441620826721191, 16.323284149169922, 17.204946517944336, 18.08660888671875, 18.968273162841797, 19.84993553161621, 20.731597900390625, 21.613262176513672, 22.494924545288086, 23.376588821411133, 24.258251190185547, 25.13991355895996, 26.021575927734375, 26.903240203857422, 27.784902572631836, 28.66656494140625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 2.0, 3.0, 2.0, 5.0, 4.0, 11.0, 8.0, 14.0, 12.0, 8.0, 23.0, 28.0, 22.0, 26.0, 30.0, 32.0, 41.0, 39.0, 37.0, 40.0, 35.0, 49.0, 41.0, 43.0, 42.0, 36.0, 49.0, 33.0, 41.0, 31.0, 27.0, 31.0, 28.0, 15.0, 19.0, 19.0, 16.0, 9.0, 10.0, 17.0, 11.0, 6.0, 0.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.876953125, -3.75433349609375, -3.6317138671875, -3.50909423828125, -3.386474609375, -3.26385498046875, -3.1412353515625, -3.01861572265625, -2.89599609375, -2.77337646484375, -2.6507568359375, -2.52813720703125, -2.405517578125, -2.28289794921875, -2.1602783203125, -2.03765869140625, -1.9150390625, -1.79241943359375, -1.6697998046875, -1.54718017578125, -1.424560546875, -1.30194091796875, -1.1793212890625, -1.05670166015625, -0.93408203125, -0.81146240234375, -0.6888427734375, -0.56622314453125, -0.443603515625, -0.32098388671875, -0.1983642578125, -0.07574462890625, 0.046875, 0.16949462890625, 0.2921142578125, 0.41473388671875, 0.537353515625, 0.65997314453125, 0.7825927734375, 0.90521240234375, 1.02783203125, 1.15045166015625, 1.2730712890625, 1.39569091796875, 1.518310546875, 1.64093017578125, 1.7635498046875, 1.88616943359375, 2.0087890625, 2.13140869140625, 2.2540283203125, 2.37664794921875, 2.499267578125, 2.62188720703125, 2.7445068359375, 2.86712646484375, 2.98974609375, 3.11236572265625, 3.2349853515625, 3.35760498046875, 3.480224609375, 3.60284423828125, 3.7254638671875, 3.84808349609375, 3.970703125]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 10.0, 10.0, 6.0, 10.0, 12.0, 19.0, 25.0, 27.0, 35.0, 44.0, 54.0, 75.0, 81.0, 120.0, 186.0, 252.0, 459.0, 1038.0, 5100.0, 53703.0, 606519.0, 2326709.0, 1072038.0, 114698.0, 9853.0, 1568.0, 570.0, 288.0, 182.0, 152.0, 92.0, 64.0, 64.0, 59.0, 42.0, 25.0, 27.0, 20.0, 11.0, 16.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.9921875, -6.77801513671875, -6.5638427734375, -6.34967041015625, -6.135498046875, -5.92132568359375, -5.7071533203125, -5.49298095703125, -5.27880859375, -5.06463623046875, -4.8504638671875, -4.63629150390625, -4.422119140625, -4.20794677734375, -3.9937744140625, -3.77960205078125, -3.5654296875, -3.35125732421875, -3.1370849609375, -2.92291259765625, -2.708740234375, -2.49456787109375, -2.2803955078125, -2.06622314453125, -1.85205078125, -1.63787841796875, -1.4237060546875, -1.20953369140625, -0.995361328125, -0.78118896484375, -0.5670166015625, -0.35284423828125, -0.138671875, 0.07550048828125, 0.2896728515625, 0.50384521484375, 0.718017578125, 0.93218994140625, 1.1463623046875, 1.36053466796875, 1.57470703125, 1.78887939453125, 2.0030517578125, 2.21722412109375, 2.431396484375, 2.64556884765625, 2.8597412109375, 3.07391357421875, 3.2880859375, 3.50225830078125, 3.7164306640625, 3.93060302734375, 4.144775390625, 4.35894775390625, 4.5731201171875, 4.78729248046875, 5.00146484375, 5.21563720703125, 5.4298095703125, 5.64398193359375, 5.858154296875, 6.07232666015625, 6.2864990234375, 6.50067138671875, 6.71484375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 8.0, 14.0, 11.0, 23.0, 22.0, 31.0, 44.0, 69.0, 94.0, 108.0, 175.0, 244.0, 319.0, 372.0, 408.0, 427.0, 385.0, 344.0, 247.0, 211.0, 136.0, 108.0, 78.0, 60.0, 24.0, 23.0, 24.0, 16.0, 13.0, 6.0, 7.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.6953125, -6.5205078125, -6.345703125, -6.1708984375, -5.99609375, -5.8212890625, -5.646484375, -5.4716796875, -5.296875, -5.1220703125, -4.947265625, -4.7724609375, -4.59765625, -4.4228515625, -4.248046875, -4.0732421875, -3.8984375, -3.7236328125, -3.548828125, -3.3740234375, -3.19921875, -3.0244140625, -2.849609375, -2.6748046875, -2.5, -2.3251953125, -2.150390625, -1.9755859375, -1.80078125, -1.6259765625, -1.451171875, -1.2763671875, -1.1015625, -0.9267578125, -0.751953125, -0.5771484375, -0.40234375, -0.2275390625, -0.052734375, 0.1220703125, 0.296875, 0.4716796875, 0.646484375, 0.8212890625, 0.99609375, 1.1708984375, 1.345703125, 1.5205078125, 1.6953125, 1.8701171875, 2.044921875, 2.2197265625, 2.39453125, 2.5693359375, 2.744140625, 2.9189453125, 3.09375, 3.2685546875, 3.443359375, 3.6181640625, 3.79296875, 3.9677734375, 4.142578125, 4.3173828125, 4.4921875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 3.0, 9.0, 17.0, 13.0, 27.0, 35.0, 53.0, 65.0, 119.0, 185.0, 289.0, 499.0, 1047.0, 3012.0, 29619.0, 1121585.0, 2940172.0, 89081.0, 5464.0, 1334.0, 617.0, 373.0, 200.0, 141.0, 106.0, 52.0, 44.0, 40.0, 25.0, 14.0, 12.0, 3.0, 7.0, 6.0, 7.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4609375, -12.0023193359375, -11.543701171875, -11.0850830078125, -10.62646484375, -10.1678466796875, -9.709228515625, -9.2506103515625, -8.7919921875, -8.3333740234375, -7.874755859375, -7.4161376953125, -6.95751953125, -6.4989013671875, -6.040283203125, -5.5816650390625, -5.123046875, -4.6644287109375, -4.205810546875, -3.7471923828125, -3.28857421875, -2.8299560546875, -2.371337890625, -1.9127197265625, -1.4541015625, -0.9954833984375, -0.536865234375, -0.0782470703125, 0.38037109375, 0.8389892578125, 1.297607421875, 1.7562255859375, 2.21484375, 2.6734619140625, 3.132080078125, 3.5906982421875, 4.04931640625, 4.5079345703125, 4.966552734375, 5.4251708984375, 5.8837890625, 6.3424072265625, 6.801025390625, 7.2596435546875, 7.71826171875, 8.1768798828125, 8.635498046875, 9.0941162109375, 9.552734375, 10.0113525390625, 10.469970703125, 10.9285888671875, 11.38720703125, 11.8458251953125, 12.304443359375, 12.7630615234375, 13.2216796875, 13.6802978515625, 14.138916015625, 14.5975341796875, 15.05615234375, 15.5147705078125, 15.973388671875, 16.4320068359375, 16.890625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 70.0, 939.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-425.3030090332031, -416.13153076171875, -406.9600524902344, -397.78857421875, -388.6170959472656, -379.44561767578125, -370.2741394042969, -361.1026611328125, -351.9311828613281, -342.75970458984375, -333.5882263183594, -324.416748046875, -315.2452697753906, -306.07379150390625, -296.9023132324219, -287.7308349609375, -278.5593566894531, -269.38787841796875, -260.2164001464844, -251.044921875, -241.87344360351562, -232.70196533203125, -223.53048706054688, -214.3590087890625, -205.18753051757812, -196.01605224609375, -186.84457397460938, -177.673095703125, -168.50161743164062, -159.33013916015625, -150.15866088867188, -140.9871826171875, -131.815673828125, -122.64419555664062, -113.47271728515625, -104.30123901367188, -95.1297607421875, -85.95828247070312, -76.78680419921875, -67.61532592773438, -58.44384765625, -49.272369384765625, -40.10089111328125, -30.929412841796875, -21.7579345703125, -12.586456298828125, -3.41497802734375, 5.756500244140625, 14.927978515625, 24.099456787109375, 33.27093505859375, 42.442413330078125, 51.6138916015625, 60.785369873046875, 69.95684814453125, 79.12832641601562, 88.2998046875, 97.47128295898438, 106.64276123046875, 115.81423950195312, 124.9857177734375, 134.15719604492188, 143.32867431640625, 152.50015258789062, 161.671630859375]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 11.0, 20.0, 8.0, 20.0, 22.0, 18.0, 32.0, 32.0, 38.0, 38.0, 26.0, 43.0, 41.0, 49.0, 57.0, 49.0, 50.0, 50.0, 58.0, 44.0, 34.0, 35.0, 39.0, 34.0, 25.0, 30.0, 13.0, 21.0, 17.0, 12.0, 7.0, 11.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.179353713989258, -20.442554473876953, -19.70575523376465, -18.968955993652344, -18.23215675354004, -17.495357513427734, -16.75855827331543, -16.021759033203125, -15.28495979309082, -14.548160552978516, -13.811361312866211, -13.074562072753906, -12.337762832641602, -11.600963592529297, -10.864164352416992, -10.127365112304688, -9.390565872192383, -8.653766632080078, -7.916967391967773, -7.180168151855469, -6.443368911743164, -5.706569671630859, -4.969770431518555, -4.23297119140625, -3.4961719512939453, -2.7593727111816406, -2.022573471069336, -1.2857742309570312, -0.5489749908447266, 0.18782424926757812, 0.9246234893798828, 1.6614227294921875, 2.398223876953125, 3.1350231170654297, 3.8718223571777344, 4.608621597290039, 5.345420837402344, 6.082220077514648, 6.819019317626953, 7.555818557739258, 8.292617797851562, 9.029417037963867, 9.766216278076172, 10.503015518188477, 11.239814758300781, 11.976613998413086, 12.71341323852539, 13.450212478637695, 14.18701171875, 14.923810958862305, 15.66061019897461, 16.397409439086914, 17.13420867919922, 17.871007919311523, 18.607807159423828, 19.344606399536133, 20.081405639648438, 20.818204879760742, 21.555004119873047, 22.29180335998535, 23.028602600097656, 23.76540184020996, 24.502201080322266, 25.23900032043457, 25.975799560546875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 4.0, 3.0, 8.0, 7.0, 7.0, 13.0, 16.0, 9.0, 21.0, 20.0, 22.0, 26.0, 38.0, 33.0, 35.0, 31.0, 29.0, 43.0, 32.0, 56.0, 42.0, 45.0, 42.0, 49.0, 38.0, 31.0, 41.0, 27.0, 24.0, 21.0, 33.0, 27.0, 25.0, 28.0, 19.0, 13.0, 8.0, 5.0, 7.0, 6.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.634765625, -3.513580322265625, -3.39239501953125, -3.271209716796875, -3.1500244140625, -3.028839111328125, -2.90765380859375, -2.786468505859375, -2.665283203125, -2.544097900390625, -2.42291259765625, -2.301727294921875, -2.1805419921875, -2.059356689453125, -1.93817138671875, -1.816986083984375, -1.69580078125, -1.574615478515625, -1.45343017578125, -1.332244873046875, -1.2110595703125, -1.089874267578125, -0.96868896484375, -0.847503662109375, -0.726318359375, -0.605133056640625, -0.48394775390625, -0.362762451171875, -0.2415771484375, -0.120391845703125, 0.00079345703125, 0.121978759765625, 0.2431640625, 0.364349365234375, 0.48553466796875, 0.606719970703125, 0.7279052734375, 0.849090576171875, 0.97027587890625, 1.091461181640625, 1.212646484375, 1.333831787109375, 1.45501708984375, 1.576202392578125, 1.6973876953125, 1.818572998046875, 1.93975830078125, 2.060943603515625, 2.18212890625, 2.303314208984375, 2.42449951171875, 2.545684814453125, 2.6668701171875, 2.788055419921875, 2.90924072265625, 3.030426025390625, 3.151611328125, 3.272796630859375, 3.39398193359375, 3.515167236328125, 3.6363525390625, 3.757537841796875, 3.87872314453125, 3.999908447265625, 4.12109375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 9.0, 9.0, 22.0, 23.0, 56.0, 79.0, 81.0, 170.0, 268.0, 384.0, 680.0, 1040.0, 1692.0, 2773.0, 4503.0, 7607.0, 12930.0, 22494.0, 39809.0, 73337.0, 142832.0, 261754.0, 222556.0, 114686.0, 59715.0, 32911.0, 18773.0, 10863.0, 6522.0, 3784.0, 2360.0, 1431.0, 880.0, 569.0, 356.0, 216.0, 130.0, 93.0, 56.0, 42.0, 25.0, 20.0, 9.0, 4.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4775390625, -0.4625396728515625, -0.447540283203125, -0.4325408935546875, -0.41754150390625, -0.4025421142578125, -0.387542724609375, -0.3725433349609375, -0.3575439453125, -0.3425445556640625, -0.327545166015625, -0.3125457763671875, -0.29754638671875, -0.2825469970703125, -0.267547607421875, -0.2525482177734375, -0.237548828125, -0.2225494384765625, -0.207550048828125, -0.1925506591796875, -0.17755126953125, -0.1625518798828125, -0.147552490234375, -0.1325531005859375, -0.1175537109375, -0.1025543212890625, -0.087554931640625, -0.0725555419921875, -0.05755615234375, -0.0425567626953125, -0.027557373046875, -0.0125579833984375, 0.00244140625, 0.0174407958984375, 0.032440185546875, 0.0474395751953125, 0.06243896484375, 0.0774383544921875, 0.092437744140625, 0.1074371337890625, 0.1224365234375, 0.1374359130859375, 0.152435302734375, 0.1674346923828125, 0.18243408203125, 0.1974334716796875, 0.212432861328125, 0.2274322509765625, 0.242431640625, 0.2574310302734375, 0.272430419921875, 0.2874298095703125, 0.30242919921875, 0.3174285888671875, 0.332427978515625, 0.3474273681640625, 0.3624267578125, 0.3774261474609375, 0.392425537109375, 0.4074249267578125, 0.42242431640625, 0.4374237060546875, 0.452423095703125, 0.4674224853515625, 0.482421875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 7.0, 5.0, 4.0, 11.0, 7.0, 16.0, 16.0, 18.0, 24.0, 26.0, 17.0, 24.0, 28.0, 42.0, 34.0, 38.0, 41.0, 40.0, 39.0, 44.0, 1071.0, 27.0, 47.0, 37.0, 43.0, 48.0, 36.0, 40.0, 28.0, 24.0, 32.0, 13.0, 18.0, 16.0, 12.0, 9.0, 6.0, 8.0, 4.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.576171875, -2.498870849609375, -2.42156982421875, -2.344268798828125, -2.2669677734375, -2.189666748046875, -2.11236572265625, -2.035064697265625, -1.957763671875, -1.880462646484375, -1.80316162109375, -1.725860595703125, -1.6485595703125, -1.571258544921875, -1.49395751953125, -1.416656494140625, -1.33935546875, -1.262054443359375, -1.18475341796875, -1.107452392578125, -1.0301513671875, -0.952850341796875, -0.87554931640625, -0.798248291015625, -0.720947265625, -0.643646240234375, -0.56634521484375, -0.489044189453125, -0.4117431640625, -0.334442138671875, -0.25714111328125, -0.179840087890625, -0.1025390625, -0.025238037109375, 0.05206298828125, 0.129364013671875, 0.2066650390625, 0.283966064453125, 0.36126708984375, 0.438568115234375, 0.515869140625, 0.593170166015625, 0.67047119140625, 0.747772216796875, 0.8250732421875, 0.902374267578125, 0.97967529296875, 1.056976318359375, 1.13427734375, 1.211578369140625, 1.28887939453125, 1.366180419921875, 1.4434814453125, 1.520782470703125, 1.59808349609375, 1.675384521484375, 1.752685546875, 1.829986572265625, 1.90728759765625, 1.984588623046875, 2.0618896484375, 2.139190673828125, 2.21649169921875, 2.293792724609375, 2.37109375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 4.0, 5.0, 10.0, 10.0, 14.0, 11.0, 30.0, 49.0, 75.0, 90.0, 134.0, 178.0, 285.0, 445.0, 546.0, 841.0, 1210.0, 1668.0, 2529.0, 3754.0, 5523.0, 8190.0, 12372.0, 19052.0, 29228.0, 45948.0, 74117.0, 121006.0, 237182.0, 1189389.0, 126964.0, 77771.0, 48236.0, 30836.0, 20049.0, 12876.0, 8679.0, 5654.0, 3780.0, 2586.0, 1894.0, 1190.0, 857.0, 573.0, 382.0, 265.0, 185.0, 173.0, 112.0, 68.0, 32.0, 36.0, 16.0, 13.0, 13.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.28173828125, -0.27236175537109375, -0.2629852294921875, -0.25360870361328125, -0.244232177734375, -0.23485565185546875, -0.2254791259765625, -0.21610260009765625, -0.20672607421875, -0.19734954833984375, -0.1879730224609375, -0.17859649658203125, -0.169219970703125, -0.15984344482421875, -0.1504669189453125, -0.14109039306640625, -0.1317138671875, -0.12233734130859375, -0.1129608154296875, -0.10358428955078125, -0.094207763671875, -0.08483123779296875, -0.0754547119140625, -0.06607818603515625, -0.05670166015625, -0.04732513427734375, -0.0379486083984375, -0.02857208251953125, -0.019195556640625, -0.00981903076171875, -0.0004425048828125, 0.00893402099609375, 0.018310546875, 0.02768707275390625, 0.0370635986328125, 0.04644012451171875, 0.055816650390625, 0.06519317626953125, 0.0745697021484375, 0.08394622802734375, 0.09332275390625, 0.10269927978515625, 0.1120758056640625, 0.12145233154296875, 0.130828857421875, 0.14020538330078125, 0.1495819091796875, 0.15895843505859375, 0.1683349609375, 0.17771148681640625, 0.1870880126953125, 0.19646453857421875, 0.205841064453125, 0.21521759033203125, 0.2245941162109375, 0.23397064208984375, 0.24334716796875, 0.25272369384765625, 0.2621002197265625, 0.27147674560546875, 0.280853271484375, 0.29022979736328125, 0.2996063232421875, 0.30898284912109375, 0.318359375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 4.0, 7.0, 9.0, 12.0, 24.0, 30.0, 26.0, 39.0, 54.0, 86.0, 92.0, 84.0, 87.0, 87.0, 68.0, 48.0, 48.0, 39.0, 31.0, 22.0, 16.0, 14.0, 15.0, 10.0, 8.0, 3.0, 5.0, 4.0, 3.0, 2.0, 7.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0019969940185546875, -0.0019449293613433838, -0.00189286470413208, -0.0018408000469207764, -0.0017887353897094727, -0.001736670732498169, -0.0016846060752868652, -0.0016325414180755615, -0.0015804767608642578, -0.001528412103652954, -0.0014763474464416504, -0.0014242827892303467, -0.001372218132019043, -0.0013201534748077393, -0.0012680888175964355, -0.0012160241603851318, -0.0011639595031738281, -0.0011118948459625244, -0.0010598301887512207, -0.001007765531539917, -0.0009557008743286133, -0.0009036362171173096, -0.0008515715599060059, -0.0007995069026947021, -0.0007474422454833984, -0.0006953775882720947, -0.000643312931060791, -0.0005912482738494873, -0.0005391836166381836, -0.0004871189594268799, -0.00043505430221557617, -0.00038298964500427246, -0.00033092498779296875, -0.00027886033058166504, -0.00022679567337036133, -0.00017473101615905762, -0.0001226663589477539, -7.06017017364502e-05, -1.8537044525146484e-05, 3.3527612686157227e-05, 8.559226989746094e-05, 0.00013765692710876465, 0.00018972158432006836, 0.00024178624153137207, 0.0002938508987426758, 0.0003459155559539795, 0.0003979802131652832, 0.0004500448703765869, 0.0005021095275878906, 0.0005541741847991943, 0.000606238842010498, 0.0006583034992218018, 0.0007103681564331055, 0.0007624328136444092, 0.0008144974708557129, 0.0008665621280670166, 0.0009186267852783203, 0.000970691442489624, 0.0010227560997009277, 0.0010748207569122314, 0.0011268854141235352, 0.0011789500713348389, 0.0012310147285461426, 0.0012830793857574463, 0.00133514404296875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 5.0, 6.0, 11.0, 7.0, 9.0, 14.0, 16.0, 20.0, 35.0, 29.0, 53.0, 62.0, 106.0, 143.0, 246.0, 464.0, 1309.0, 636225.0, 407332.0, 1233.0, 478.0, 253.0, 150.0, 89.0, 69.0, 50.0, 39.0, 18.0, 18.0, 16.0, 9.0, 8.0, 6.0, 6.0, 2.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.025115966796875, -0.024148941040039062, -0.023181915283203125, -0.022214889526367188, -0.02124786376953125, -0.020280838012695312, -0.019313812255859375, -0.018346786499023438, -0.0173797607421875, -0.016412734985351562, -0.015445709228515625, -0.014478683471679688, -0.01351165771484375, -0.012544631958007812, -0.011577606201171875, -0.010610580444335938, -0.0096435546875, -0.008676528930664062, -0.007709503173828125, -0.0067424774169921875, -0.00577545166015625, -0.0048084259033203125, -0.003841400146484375, -0.0028743743896484375, -0.0019073486328125, -0.0009403228759765625, 2.6702880859375e-05, 0.0009937286376953125, 0.00196075439453125, 0.0029277801513671875, 0.003894805908203125, 0.0048618316650390625, 0.005828857421875, 0.0067958831787109375, 0.007762908935546875, 0.008729934692382812, 0.00969696044921875, 0.010663986206054688, 0.011631011962890625, 0.012598037719726562, 0.0135650634765625, 0.014532089233398438, 0.015499114990234375, 0.016466140747070312, 0.01743316650390625, 0.018400192260742188, 0.019367218017578125, 0.020334243774414062, 0.02130126953125, 0.022268295288085938, 0.023235321044921875, 0.024202346801757812, 0.02516937255859375, 0.026136398315429688, 0.027103424072265625, 0.028070449829101562, 0.0290374755859375, 0.030004501342773438, 0.030971527099609375, 0.03193855285644531, 0.03290557861328125, 0.03387260437011719, 0.034839630126953125, 0.03580665588378906, 0.036773681640625]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 502.0, 514.0, 1.0, 0.0, 1.0], "bins": [-0.024783875793218613, -0.024370895698666573, -0.023957915604114532, -0.02354493737220764, -0.0231319572776556, -0.02271897718310356, -0.02230599708855152, -0.02189301699399948, -0.02148003876209259, -0.02106705866754055, -0.02065407857298851, -0.02024110034108162, -0.01982812024652958, -0.01941514015197754, -0.0190021600574255, -0.01858917996287346, -0.018176201730966568, -0.017763221636414528, -0.017350241541862488, -0.016937263309955597, -0.016524283215403557, -0.016111303120851517, -0.015698323026299477, -0.015285343863070011, -0.014872362837195396, -0.014459382742643356, -0.01404640357941389, -0.01363342348486185, -0.013220444321632385, -0.012807464227080345, -0.012394484132528305, -0.01198150496929884, -0.011568525806069374, -0.011155545711517334, -0.010742566548287868, -0.010329586453735828, -0.009916607290506363, -0.009503627195954323, -0.009090647101402283, -0.008677667938172817, -0.008264688774943352, -0.007851708680391312, -0.007438729517161846, -0.007025749422609806, -0.006612770259380341, -0.0061997901648283005, -0.005786810535937548, -0.005373830907046795, -0.004960850812494755, -0.004547871183604002, -0.004134891554713249, -0.0037219116929918528, -0.0033089320641011, -0.002895952435210347, -0.0024829725734889507, -0.002069992944598198, -0.0016570135485380888, -0.001244033919647336, -0.0008310541743412614, -0.00041807442903518677, -5.094800144433975e-06, 0.0004078848287463188, 0.0008208646904677153, 0.001233844319358468, 0.0016468239482492208]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 9.0, 14.0, 17.0, 21.0, 27.0, 24.0, 40.0, 36.0, 39.0, 55.0, 60.0, 52.0, 58.0, 58.0, 55.0, 65.0, 50.0, 54.0, 43.0, 44.0, 38.0, 38.0, 16.0, 19.0, 14.0, 14.0, 12.0, 9.0, 8.0, 2.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007422566413879395, -0.0007111327722668648, -0.0006800089031457901, -0.0006488850340247154, -0.0006177611649036407, -0.0005866372957825661, -0.0005555134266614914, -0.0005243895575404167, -0.000493265688419342, -0.00046214181929826736, -0.0004310179501771927, -0.000399894081056118, -0.00036877021193504333, -0.00033764634281396866, -0.000306522473692894, -0.0002753986045718193, -0.00024427473545074463, -0.00021315086632966995, -0.00018202699720859528, -0.0001509031280875206, -0.00011977925896644592, -8.865538984537125e-05, -5.753152072429657e-05, -2.6407651603221893e-05, 4.716217517852783e-06, 3.584008663892746e-05, 6.696395576000214e-05, 9.808782488107681e-05, 0.0001292116940021515, 0.00016033556312322617, 0.00019145943224430084, 0.00022258330136537552, 0.0002537071704864502, 0.00028483103960752487, 0.00031595490872859955, 0.0003470787778496742, 0.0003782026469707489, 0.0004093265160918236, 0.00044045038521289825, 0.00047157425433397293, 0.0005026981234550476, 0.0005338219925761223, 0.000564945861697197, 0.0005960697308182716, 0.0006271935999393463, 0.000658317469060421, 0.0006894413381814957, 0.0007205652073025703, 0.000751689076423645, 0.0007828129455447197, 0.0008139368146657944, 0.000845060683786869, 0.0008761845529079437, 0.0009073084220290184, 0.0009384322911500931, 0.0009695561602711678, 0.0010006800293922424, 0.001031803898513317, 0.0010629277676343918, 0.0010940516367554665, 0.0011251755058765411, 0.0011562993749976158, 0.0011874232441186905, 0.0012185471132397652, 0.0012496709823608398]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 4.0, 3.0, 8.0, 7.0, 7.0, 13.0, 16.0, 9.0, 21.0, 20.0, 23.0, 25.0, 38.0, 33.0, 35.0, 31.0, 29.0, 43.0, 32.0, 56.0, 42.0, 45.0, 42.0, 49.0, 38.0, 31.0, 41.0, 27.0, 24.0, 21.0, 33.0, 27.0, 25.0, 28.0, 19.0, 13.0, 8.0, 5.0, 7.0, 6.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.634765625, -3.513580322265625, -3.39239501953125, -3.271209716796875, -3.1500244140625, -3.028839111328125, -2.90765380859375, -2.786468505859375, -2.665283203125, -2.544097900390625, -2.42291259765625, -2.301727294921875, -2.1805419921875, -2.059356689453125, -1.93817138671875, -1.816986083984375, -1.69580078125, -1.574615478515625, -1.45343017578125, -1.332244873046875, -1.2110595703125, -1.089874267578125, -0.96868896484375, -0.847503662109375, -0.726318359375, -0.605133056640625, -0.48394775390625, -0.362762451171875, -0.2415771484375, -0.120391845703125, 0.00079345703125, 0.121978759765625, 0.2431640625, 0.364349365234375, 0.48553466796875, 0.606719970703125, 0.7279052734375, 0.849090576171875, 0.97027587890625, 1.091461181640625, 1.212646484375, 1.333831787109375, 1.45501708984375, 1.576202392578125, 1.6973876953125, 1.818572998046875, 1.93975830078125, 2.060943603515625, 2.18212890625, 2.303314208984375, 2.42449951171875, 2.545684814453125, 2.6668701171875, 2.788055419921875, 2.90924072265625, 3.030426025390625, 3.151611328125, 3.272796630859375, 3.39398193359375, 3.515167236328125, 3.6363525390625, 3.757537841796875, 3.87872314453125, 3.999908447265625, 4.12109375]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 10.0, 5.0, 19.0, 18.0, 16.0, 32.0, 40.0, 43.0, 53.0, 79.0, 125.0, 155.0, 250.0, 370.0, 654.0, 1318.0, 2651.0, 6146.0, 16214.0, 44478.0, 124309.0, 357191.0, 321648.0, 108313.0, 39231.0, 14285.0, 5495.0, 2393.0, 1169.0, 625.0, 349.0, 250.0, 193.0, 107.0, 87.0, 65.0, 44.0, 27.0, 26.0, 19.0, 11.0, 14.0, 3.0, 9.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.53515625, -4.3836669921875, -4.232177734375, -4.0806884765625, -3.92919921875, -3.7777099609375, -3.626220703125, -3.4747314453125, -3.3232421875, -3.1717529296875, -3.020263671875, -2.8687744140625, -2.71728515625, -2.5657958984375, -2.414306640625, -2.2628173828125, -2.111328125, -1.9598388671875, -1.808349609375, -1.6568603515625, -1.50537109375, -1.3538818359375, -1.202392578125, -1.0509033203125, -0.8994140625, -0.7479248046875, -0.596435546875, -0.4449462890625, -0.29345703125, -0.1419677734375, 0.009521484375, 0.1610107421875, 0.3125, 0.4639892578125, 0.615478515625, 0.7669677734375, 0.91845703125, 1.0699462890625, 1.221435546875, 1.3729248046875, 1.5244140625, 1.6759033203125, 1.827392578125, 1.9788818359375, 2.13037109375, 2.2818603515625, 2.433349609375, 2.5848388671875, 2.736328125, 2.8878173828125, 3.039306640625, 3.1907958984375, 3.34228515625, 3.4937744140625, 3.645263671875, 3.7967529296875, 3.9482421875, 4.0997314453125, 4.251220703125, 4.4027099609375, 4.55419921875, 4.7056884765625, 4.857177734375, 5.0086669921875, 5.16015625]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 11.0, 3.0, 4.0, 14.0, 12.0, 23.0, 25.0, 14.0, 30.0, 26.0, 29.0, 34.0, 35.0, 38.0, 57.0, 60.0, 79.0, 139.0, 325.0, 1380.0, 160.0, 98.0, 84.0, 42.0, 41.0, 32.0, 35.0, 28.0, 30.0, 25.0, 15.0, 13.0, 17.0, 14.0, 14.0, 9.0, 6.0, 6.0, 5.0, 7.0, 7.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-10.953125, -10.6112060546875, -10.269287109375, -9.9273681640625, -9.58544921875, -9.2435302734375, -8.901611328125, -8.5596923828125, -8.2177734375, -7.8758544921875, -7.533935546875, -7.1920166015625, -6.85009765625, -6.5081787109375, -6.166259765625, -5.8243408203125, -5.482421875, -5.1405029296875, -4.798583984375, -4.4566650390625, -4.11474609375, -3.7728271484375, -3.430908203125, -3.0889892578125, -2.7470703125, -2.4051513671875, -2.063232421875, -1.7213134765625, -1.37939453125, -1.0374755859375, -0.695556640625, -0.3536376953125, -0.01171875, 0.3302001953125, 0.672119140625, 1.0140380859375, 1.35595703125, 1.6978759765625, 2.039794921875, 2.3817138671875, 2.7236328125, 3.0655517578125, 3.407470703125, 3.7493896484375, 4.09130859375, 4.4332275390625, 4.775146484375, 5.1170654296875, 5.458984375, 5.8009033203125, 6.142822265625, 6.4847412109375, 6.82666015625, 7.1685791015625, 7.510498046875, 7.8524169921875, 8.1943359375, 8.5362548828125, 8.878173828125, 9.2200927734375, 9.56201171875, 9.9039306640625, 10.245849609375, 10.5877685546875, 10.9296875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 3.0, 8.0, 16.0, 10.0, 14.0, 14.0, 20.0, 32.0, 46.0, 69.0, 100.0, 156.0, 242.0, 343.0, 617.0, 1314.0, 12657.0, 2546385.0, 575466.0, 5600.0, 1070.0, 532.0, 335.0, 204.0, 125.0, 81.0, 67.0, 44.0, 28.0, 20.0, 19.0, 16.0, 9.0, 7.0, 10.0, 9.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.734375, -24.00439453125, -23.2744140625, -22.54443359375, -21.814453125, -21.08447265625, -20.3544921875, -19.62451171875, -18.89453125, -18.16455078125, -17.4345703125, -16.70458984375, -15.974609375, -15.24462890625, -14.5146484375, -13.78466796875, -13.0546875, -12.32470703125, -11.5947265625, -10.86474609375, -10.134765625, -9.40478515625, -8.6748046875, -7.94482421875, -7.21484375, -6.48486328125, -5.7548828125, -5.02490234375, -4.294921875, -3.56494140625, -2.8349609375, -2.10498046875, -1.375, -0.64501953125, 0.0849609375, 0.81494140625, 1.544921875, 2.27490234375, 3.0048828125, 3.73486328125, 4.46484375, 5.19482421875, 5.9248046875, 6.65478515625, 7.384765625, 8.11474609375, 8.8447265625, 9.57470703125, 10.3046875, 11.03466796875, 11.7646484375, 12.49462890625, 13.224609375, 13.95458984375, 14.6845703125, 15.41455078125, 16.14453125, 16.87451171875, 17.6044921875, 18.33447265625, 19.064453125, 19.79443359375, 20.5244140625, 21.25439453125, 21.984375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 866.0, 147.0, 0.0, 1.0], "bins": [-409.0158996582031, -402.2823486328125, -395.548828125, -388.8152770996094, -382.08172607421875, -375.34820556640625, -368.6146545410156, -361.881103515625, -355.1475830078125, -348.4140319824219, -341.6805114746094, -334.94696044921875, -328.2134094238281, -321.4798889160156, -314.746337890625, -308.0127868652344, -301.27923583984375, -294.5456848144531, -287.8121643066406, -281.07861328125, -274.3450622558594, -267.6115417480469, -260.87799072265625, -254.14443969726562, -247.41091918945312, -240.67738342285156, -233.94383239746094, -227.21029663085938, -220.4767608642578, -213.7432098388672, -207.00967407226562, -200.276123046875, -193.5426025390625, -186.80906677246094, -180.0755157470703, -173.34197998046875, -166.6084442138672, -159.87489318847656, -153.141357421875, -146.40780639648438, -139.6742706298828, -132.94073486328125, -126.20719146728516, -119.47364807128906, -112.74010467529297, -106.00656127929688, -99.27302551269531, -92.53948211669922, -85.80593872070312, -79.07239532470703, -72.33885955810547, -65.60531616210938, -58.87177276611328, -52.13823318481445, -45.404693603515625, -38.67115020751953, -31.937610626220703, -25.204069137573242, -18.47052764892578, -11.736988067626953, -5.003446578979492, 1.7300949096679688, 8.463634490966797, 15.19717788696289, 21.93071746826172]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 4.0, 8.0, 6.0, 8.0, 9.0, 17.0, 21.0, 22.0, 16.0, 18.0, 29.0, 34.0, 27.0, 45.0, 52.0, 42.0, 40.0, 36.0, 47.0, 33.0, 35.0, 34.0, 47.0, 49.0, 37.0, 37.0, 31.0, 34.0, 31.0, 24.0, 19.0, 23.0, 9.0, 15.0, 9.0, 13.0, 9.0, 6.0, 7.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.19073486328125, -21.389434814453125, -20.588134765625, -19.786834716796875, -18.98553466796875, -18.184234619140625, -17.3829345703125, -16.581634521484375, -15.78033447265625, -14.979034423828125, -14.177734375, -13.376434326171875, -12.57513427734375, -11.773834228515625, -10.9725341796875, -10.171234130859375, -9.369935035705566, -8.568634986877441, -7.767334938049316, -6.966034889221191, -6.164734840393066, -5.3634352684021, -4.562135219573975, -3.7608351707458496, -2.9595351219177246, -2.1582350730895996, -1.3569351434707642, -0.5556352138519287, 0.2456648349761963, 1.0469646453857422, 1.8482646942138672, 2.649564743041992, 3.450864791870117, 4.252164840698242, 5.053464889526367, 5.854764938354492, 6.656064987182617, 7.457364559173584, 8.258665084838867, 9.059965133666992, 9.861265182495117, 10.662565231323242, 11.463865280151367, 12.265165328979492, 13.066465377807617, 13.867765426635742, 14.669065475463867, 15.470365524291992, 16.271663665771484, 17.07296371459961, 17.874263763427734, 18.67556381225586, 19.476863861083984, 20.27816390991211, 21.079463958740234, 21.88076400756836, 22.682064056396484, 23.48336410522461, 24.284664154052734, 25.08596420288086, 25.887264251708984, 26.68856430053711, 27.489864349365234, 28.29116439819336, 29.092464447021484]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 6.0, 3.0, 2.0, 3.0, 7.0, 9.0, 7.0, 8.0, 17.0, 8.0, 17.0, 22.0, 24.0, 29.0, 32.0, 26.0, 32.0, 31.0, 25.0, 24.0, 32.0, 36.0, 39.0, 38.0, 52.0, 46.0, 39.0, 46.0, 34.0, 37.0, 34.0, 32.0, 25.0, 26.0, 30.0, 20.0, 11.0, 17.0, 12.0, 12.0, 20.0, 8.0, 4.0, 8.0, 2.0, 5.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.6953125, -3.58001708984375, -3.4647216796875, -3.34942626953125, -3.234130859375, -3.11883544921875, -3.0035400390625, -2.88824462890625, -2.77294921875, -2.65765380859375, -2.5423583984375, -2.42706298828125, -2.311767578125, -2.19647216796875, -2.0811767578125, -1.96588134765625, -1.8505859375, -1.73529052734375, -1.6199951171875, -1.50469970703125, -1.389404296875, -1.27410888671875, -1.1588134765625, -1.04351806640625, -0.92822265625, -0.81292724609375, -0.6976318359375, -0.58233642578125, -0.467041015625, -0.35174560546875, -0.2364501953125, -0.12115478515625, -0.005859375, 0.10943603515625, 0.2247314453125, 0.34002685546875, 0.455322265625, 0.57061767578125, 0.6859130859375, 0.80120849609375, 0.91650390625, 1.03179931640625, 1.1470947265625, 1.26239013671875, 1.377685546875, 1.49298095703125, 1.6082763671875, 1.72357177734375, 1.8388671875, 1.95416259765625, 2.0694580078125, 2.18475341796875, 2.300048828125, 2.41534423828125, 2.5306396484375, 2.64593505859375, 2.76123046875, 2.87652587890625, 2.9918212890625, 3.10711669921875, 3.222412109375, 3.33770751953125, 3.4530029296875, 3.56829833984375, 3.68359375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 3.0, 1.0, 5.0, 9.0, 15.0, 17.0, 7.0, 14.0, 19.0, 24.0, 17.0, 46.0, 70.0, 85.0, 111.0, 178.0, 300.0, 540.0, 1125.0, 3056.0, 9378.0, 34499.0, 137553.0, 499112.0, 1257892.0, 1379562.0, 624721.0, 181679.0, 45762.0, 11850.0, 3692.0, 1393.0, 616.0, 313.0, 177.0, 115.0, 86.0, 59.0, 46.0, 37.0, 20.0, 15.0, 12.0, 17.0, 8.0, 11.0, 5.0, 4.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.41796875, -3.29632568359375, -3.1746826171875, -3.05303955078125, -2.931396484375, -2.80975341796875, -2.6881103515625, -2.56646728515625, -2.44482421875, -2.32318115234375, -2.2015380859375, -2.07989501953125, -1.958251953125, -1.83660888671875, -1.7149658203125, -1.59332275390625, -1.4716796875, -1.35003662109375, -1.2283935546875, -1.10675048828125, -0.985107421875, -0.86346435546875, -0.7418212890625, -0.62017822265625, -0.49853515625, -0.37689208984375, -0.2552490234375, -0.13360595703125, -0.011962890625, 0.10968017578125, 0.2313232421875, 0.35296630859375, 0.474609375, 0.59625244140625, 0.7178955078125, 0.83953857421875, 0.961181640625, 1.08282470703125, 1.2044677734375, 1.32611083984375, 1.44775390625, 1.56939697265625, 1.6910400390625, 1.81268310546875, 1.934326171875, 2.05596923828125, 2.1776123046875, 2.29925537109375, 2.4208984375, 2.54254150390625, 2.6641845703125, 2.78582763671875, 2.907470703125, 3.02911376953125, 3.1507568359375, 3.27239990234375, 3.39404296875, 3.51568603515625, 3.6373291015625, 3.75897216796875, 3.880615234375, 4.00225830078125, 4.1239013671875, 4.24554443359375, 4.3671875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 3.0, 11.0, 6.0, 13.0, 23.0, 34.0, 32.0, 48.0, 70.0, 97.0, 154.0, 204.0, 340.0, 399.0, 488.0, 491.0, 445.0, 354.0, 265.0, 157.0, 127.0, 73.0, 69.0, 46.0, 27.0, 23.0, 18.0, 13.0, 8.0, 15.0, 4.0, 2.0, 2.0, 8.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.453125, -5.27239990234375, -5.0916748046875, -4.91094970703125, -4.730224609375, -4.54949951171875, -4.3687744140625, -4.18804931640625, -4.00732421875, -3.82659912109375, -3.6458740234375, -3.46514892578125, -3.284423828125, -3.10369873046875, -2.9229736328125, -2.74224853515625, -2.5615234375, -2.38079833984375, -2.2000732421875, -2.01934814453125, -1.838623046875, -1.65789794921875, -1.4771728515625, -1.29644775390625, -1.11572265625, -0.93499755859375, -0.7542724609375, -0.57354736328125, -0.392822265625, -0.21209716796875, -0.0313720703125, 0.14935302734375, 0.330078125, 0.51080322265625, 0.6915283203125, 0.87225341796875, 1.052978515625, 1.23370361328125, 1.4144287109375, 1.59515380859375, 1.77587890625, 1.95660400390625, 2.1373291015625, 2.31805419921875, 2.498779296875, 2.67950439453125, 2.8602294921875, 3.04095458984375, 3.2216796875, 3.40240478515625, 3.5831298828125, 3.76385498046875, 3.944580078125, 4.12530517578125, 4.3060302734375, 4.48675537109375, 4.66748046875, 4.84820556640625, 5.0289306640625, 5.20965576171875, 5.390380859375, 5.57110595703125, 5.7518310546875, 5.93255615234375, 6.11328125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 5.0, 11.0, 16.0, 11.0, 16.0, 20.0, 32.0, 34.0, 44.0, 75.0, 120.0, 146.0, 243.0, 510.0, 1101.0, 3298.0, 13664.0, 75624.0, 629399.0, 2748834.0, 625096.0, 76205.0, 13946.0, 3560.0, 1030.0, 487.0, 264.0, 144.0, 103.0, 71.0, 55.0, 35.0, 21.0, 14.0, 15.0, 11.0, 6.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.10546875, -6.85614013671875, -6.6068115234375, -6.35748291015625, -6.108154296875, -5.85882568359375, -5.6094970703125, -5.36016845703125, -5.11083984375, -4.86151123046875, -4.6121826171875, -4.36285400390625, -4.113525390625, -3.86419677734375, -3.6148681640625, -3.36553955078125, -3.1162109375, -2.86688232421875, -2.6175537109375, -2.36822509765625, -2.118896484375, -1.86956787109375, -1.6202392578125, -1.37091064453125, -1.12158203125, -0.87225341796875, -0.6229248046875, -0.37359619140625, -0.124267578125, 0.12506103515625, 0.3743896484375, 0.62371826171875, 0.873046875, 1.12237548828125, 1.3717041015625, 1.62103271484375, 1.870361328125, 2.11968994140625, 2.3690185546875, 2.61834716796875, 2.86767578125, 3.11700439453125, 3.3663330078125, 3.61566162109375, 3.864990234375, 4.11431884765625, 4.3636474609375, 4.61297607421875, 4.8623046875, 5.11163330078125, 5.3609619140625, 5.61029052734375, 5.859619140625, 6.10894775390625, 6.3582763671875, 6.60760498046875, 6.85693359375, 7.10626220703125, 7.3555908203125, 7.60491943359375, 7.854248046875, 8.10357666015625, 8.3529052734375, 8.60223388671875, 8.8515625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 17.0, 62.0, 174.0, 331.0, 286.0, 109.0, 25.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.522146224975586, -18.76357650756836, -17.0050048828125, -15.246435165405273, -13.487865447998047, -11.729294776916504, -9.970724105834961, -8.212154388427734, -6.453583717346191, -4.695013523101807, -2.9364430904388428, -1.177872657775879, 0.5806975364685059, 2.3392677307128906, 4.097838401794434, 5.85640811920166, 7.614978790283203, 9.373549461364746, 11.132119178771973, 12.890689849853516, 14.649259567260742, 16.40782928466797, 18.166400909423828, 19.924970626831055, 21.68354034423828, 23.442110061645508, 25.200681686401367, 26.959251403808594, 28.71782112121582, 30.476390838623047, 32.234962463378906, 33.9935302734375, 35.75210189819336, 37.51067352294922, 39.26924133300781, 41.02781295776367, 42.78638458251953, 44.544952392578125, 46.303524017333984, 48.062095642089844, 49.82066345214844, 51.5792350769043, 53.33780288696289, 55.09637451171875, 56.85494613647461, 58.6135139465332, 60.37208557128906, 62.130653381347656, 63.88922882080078, 65.64779663085938, 67.4063720703125, 69.1649398803711, 70.92350769042969, 72.68208312988281, 74.4406509399414, 76.19921875, 77.9577865600586, 79.71635437011719, 81.47492980957031, 83.2334976196289, 84.9920654296875, 86.75064086914062, 88.50920867919922, 90.26777648925781, 92.02635192871094]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 7.0, 4.0, 4.0, 6.0, 6.0, 5.0, 8.0, 12.0, 11.0, 14.0, 13.0, 16.0, 11.0, 25.0, 25.0, 35.0, 30.0, 36.0, 30.0, 35.0, 33.0, 40.0, 32.0, 39.0, 38.0, 43.0, 36.0, 35.0, 41.0, 40.0, 28.0, 26.0, 25.0, 24.0, 20.0, 26.0, 22.0, 18.0, 15.0, 13.0, 10.0, 5.0, 13.0, 13.0, 7.0, 7.0, 4.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-16.554866790771484, -16.042278289794922, -15.529691696166992, -15.01710319519043, -14.504515647888184, -13.991928100585938, -13.479340553283691, -12.966753005981445, -12.454164505004883, -11.941576957702637, -11.42898941040039, -10.916400909423828, -10.403813362121582, -9.891225814819336, -9.37863826751709, -8.866050720214844, -8.353463172912598, -7.840875625610352, -7.328287601470947, -6.815700054168701, -6.303112030029297, -5.790524482727051, -5.277936935424805, -4.765349388122559, -4.252761363983154, -3.740173578262329, -3.227585792541504, -2.714998245239258, -2.2024104595184326, -1.6898226737976074, -1.1772351264953613, -0.6646473407745361, -0.15205955505371094, 0.3605281710624695, 0.8731158971786499, 1.3857035636901855, 1.8982913494110107, 2.410879135131836, 2.923466682434082, 3.4360544681549072, 3.9486422538757324, 4.4612298011779785, 4.973817825317383, 5.486405372619629, 5.998992919921875, 6.511580944061279, 7.024168491363525, 7.53675651550293, 8.049344062805176, 8.561931610107422, 9.074519157409668, 9.587106704711914, 10.099695205688477, 10.612282752990723, 11.124870300292969, 11.637457847595215, 12.150045394897461, 12.662632942199707, 13.175220489501953, 13.687808990478516, 14.200396537780762, 14.712984085083008, 15.225571632385254, 15.7381591796875, 16.250747680664062]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 6.0, 8.0, 2.0, 9.0, 11.0, 10.0, 19.0, 11.0, 19.0, 22.0, 16.0, 18.0, 30.0, 26.0, 32.0, 28.0, 27.0, 49.0, 28.0, 36.0, 48.0, 46.0, 44.0, 41.0, 39.0, 34.0, 46.0, 29.0, 32.0, 26.0, 26.0, 22.0, 24.0, 27.0, 21.0, 25.0, 12.0, 13.0, 10.0, 6.0, 6.0, 5.0, 4.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 4.0], "bins": [-3.931640625, -3.819183349609375, -3.70672607421875, -3.594268798828125, -3.4818115234375, -3.369354248046875, -3.25689697265625, -3.144439697265625, -3.031982421875, -2.919525146484375, -2.80706787109375, -2.694610595703125, -2.5821533203125, -2.469696044921875, -2.35723876953125, -2.244781494140625, -2.13232421875, -2.019866943359375, -1.90740966796875, -1.794952392578125, -1.6824951171875, -1.570037841796875, -1.45758056640625, -1.345123291015625, -1.232666015625, -1.120208740234375, -1.00775146484375, -0.895294189453125, -0.7828369140625, -0.670379638671875, -0.55792236328125, -0.445465087890625, -0.3330078125, -0.220550537109375, -0.10809326171875, 0.004364013671875, 0.1168212890625, 0.229278564453125, 0.34173583984375, 0.454193115234375, 0.566650390625, 0.679107666015625, 0.79156494140625, 0.904022216796875, 1.0164794921875, 1.128936767578125, 1.24139404296875, 1.353851318359375, 1.46630859375, 1.578765869140625, 1.69122314453125, 1.803680419921875, 1.9161376953125, 2.028594970703125, 2.14105224609375, 2.253509521484375, 2.365966796875, 2.478424072265625, 2.59088134765625, 2.703338623046875, 2.8157958984375, 2.928253173828125, 3.04071044921875, 3.153167724609375, 3.265625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 6.0, 9.0, 21.0, 33.0, 33.0, 52.0, 62.0, 85.0, 138.0, 201.0, 282.0, 462.0, 685.0, 996.0, 1428.0, 2222.0, 3274.0, 4930.0, 7561.0, 11269.0, 17392.0, 26774.0, 41979.0, 66920.0, 109831.0, 175003.0, 203299.0, 139047.0, 85698.0, 52881.0, 33208.0, 21415.0, 14000.0, 9116.0, 5970.0, 4026.0, 2638.0, 1816.0, 1206.0, 839.0, 598.0, 330.0, 297.0, 180.0, 110.0, 77.0, 53.0, 30.0, 28.0, 18.0, 17.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 4.0], "bins": [-0.3671875, -0.3558006286621094, -0.34441375732421875, -0.3330268859863281, -0.3216400146484375, -0.3102531433105469, -0.29886627197265625, -0.2874794006347656, -0.276092529296875, -0.2647056579589844, -0.25331878662109375, -0.24193191528320312, -0.2305450439453125, -0.21915817260742188, -0.20777130126953125, -0.19638442993164062, -0.18499755859375, -0.17361068725585938, -0.16222381591796875, -0.15083694458007812, -0.1394500732421875, -0.12806320190429688, -0.11667633056640625, -0.10528945922851562, -0.093902587890625, -0.08251571655273438, -0.07112884521484375, -0.059741973876953125, -0.0483551025390625, -0.036968231201171875, -0.02558135986328125, -0.014194488525390625, -0.0028076171875, 0.008579254150390625, 0.01996612548828125, 0.031352996826171875, 0.0427398681640625, 0.054126739501953125, 0.06551361083984375, 0.07690048217773438, 0.088287353515625, 0.09967422485351562, 0.11106109619140625, 0.12244796752929688, 0.1338348388671875, 0.14522171020507812, 0.15660858154296875, 0.16799545288085938, 0.17938232421875, 0.19076919555664062, 0.20215606689453125, 0.21354293823242188, 0.2249298095703125, 0.23631668090820312, 0.24770355224609375, 0.2590904235839844, 0.270477294921875, 0.2818641662597656, 0.29325103759765625, 0.3046379089355469, 0.3160247802734375, 0.3274116516113281, 0.33879852294921875, 0.3501853942871094, 0.361572265625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 5.0, 2.0, 2.0, 6.0, 2.0, 6.0, 4.0, 3.0, 3.0, 6.0, 7.0, 5.0, 10.0, 13.0, 25.0, 22.0, 16.0, 32.0, 22.0, 18.0, 32.0, 32.0, 24.0, 42.0, 31.0, 43.0, 48.0, 37.0, 1053.0, 41.0, 35.0, 36.0, 32.0, 43.0, 42.0, 28.0, 30.0, 14.0, 23.0, 22.0, 23.0, 14.0, 17.0, 21.0, 14.0, 9.0, 6.0, 11.0, 10.0, 7.0, 2.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.171875, -2.103302001953125, -2.03472900390625, -1.966156005859375, -1.8975830078125, -1.829010009765625, -1.76043701171875, -1.691864013671875, -1.623291015625, -1.554718017578125, -1.48614501953125, -1.417572021484375, -1.3489990234375, -1.280426025390625, -1.21185302734375, -1.143280029296875, -1.07470703125, -1.006134033203125, -0.93756103515625, -0.868988037109375, -0.8004150390625, -0.731842041015625, -0.66326904296875, -0.594696044921875, -0.526123046875, -0.457550048828125, -0.38897705078125, -0.320404052734375, -0.2518310546875, -0.183258056640625, -0.11468505859375, -0.046112060546875, 0.0224609375, 0.091033935546875, 0.15960693359375, 0.228179931640625, 0.2967529296875, 0.365325927734375, 0.43389892578125, 0.502471923828125, 0.571044921875, 0.639617919921875, 0.70819091796875, 0.776763916015625, 0.8453369140625, 0.913909912109375, 0.98248291015625, 1.051055908203125, 1.11962890625, 1.188201904296875, 1.25677490234375, 1.325347900390625, 1.3939208984375, 1.462493896484375, 1.53106689453125, 1.599639892578125, 1.668212890625, 1.736785888671875, 1.80535888671875, 1.873931884765625, 1.9425048828125, 2.011077880859375, 2.07965087890625, 2.148223876953125, 2.216796875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 9.0, 4.0, 16.0, 19.0, 30.0, 36.0, 61.0, 82.0, 152.0, 199.0, 270.0, 404.0, 574.0, 894.0, 1239.0, 1896.0, 2771.0, 3919.0, 5859.0, 8866.0, 13365.0, 20080.0, 30572.0, 47548.0, 76707.0, 127398.0, 1220707.0, 213047.0, 118933.0, 71664.0, 44847.0, 28792.0, 18385.0, 12168.0, 8187.0, 5470.0, 3714.0, 2541.0, 1694.0, 1217.0, 872.0, 590.0, 418.0, 323.0, 189.0, 116.0, 99.0, 64.0, 47.0, 29.0, 19.0, 11.0, 9.0, 9.0, 2.0, 3.0, 1.0, 6.0], "bins": [-0.31591796875, -0.3063240051269531, -0.29673004150390625, -0.2871360778808594, -0.2775421142578125, -0.2679481506347656, -0.25835418701171875, -0.24876022338867188, -0.239166259765625, -0.22957229614257812, -0.21997833251953125, -0.21038436889648438, -0.2007904052734375, -0.19119644165039062, -0.18160247802734375, -0.17200851440429688, -0.16241455078125, -0.15282058715820312, -0.14322662353515625, -0.13363265991210938, -0.1240386962890625, -0.11444473266601562, -0.10485076904296875, -0.09525680541992188, -0.085662841796875, -0.07606887817382812, -0.06647491455078125, -0.056880950927734375, -0.0472869873046875, -0.037693023681640625, -0.02809906005859375, -0.018505096435546875, -0.0089111328125, 0.000682830810546875, 0.01027679443359375, 0.019870758056640625, 0.0294647216796875, 0.039058685302734375, 0.04865264892578125, 0.058246612548828125, 0.067840576171875, 0.07743453979492188, 0.08702850341796875, 0.09662246704101562, 0.1062164306640625, 0.11581039428710938, 0.12540435791015625, 0.13499832153320312, 0.14459228515625, 0.15418624877929688, 0.16378021240234375, 0.17337417602539062, 0.1829681396484375, 0.19256210327148438, 0.20215606689453125, 0.21175003051757812, 0.221343994140625, 0.23093795776367188, 0.24053192138671875, 0.2501258850097656, 0.2597198486328125, 0.2693138122558594, 0.27890777587890625, 0.2885017395019531, 0.298095703125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 8.0, 9.0, 11.0, 14.0, 15.0, 28.0, 20.0, 24.0, 53.0, 51.0, 66.0, 88.0, 99.0, 87.0, 80.0, 86.0, 53.0, 51.0, 29.0, 30.0, 24.0, 17.0, 8.0, 6.0, 4.0, 3.0, 3.0, 1.0, 4.0, 4.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0018062591552734375, -0.0017526894807815552, -0.0016991198062896729, -0.0016455501317977905, -0.0015919804573059082, -0.0015384107828140259, -0.0014848411083221436, -0.0014312714338302612, -0.001377701759338379, -0.0013241320848464966, -0.0012705624103546143, -0.001216992735862732, -0.0011634230613708496, -0.0011098533868789673, -0.001056283712387085, -0.0010027140378952026, -0.0009491443634033203, -0.000895574688911438, -0.0008420050144195557, -0.0007884353399276733, -0.000734865665435791, -0.0006812959909439087, -0.0006277263164520264, -0.000574156641960144, -0.0005205869674682617, -0.0004670172929763794, -0.00041344761848449707, -0.00035987794399261475, -0.0003063082695007324, -0.0002527385950088501, -0.00019916892051696777, -0.00014559924602508545, -9.202957153320312e-05, -3.84598970413208e-05, 1.5109777450561523e-05, 6.867945194244385e-05, 0.00012224912643432617, 0.0001758188009262085, 0.00022938847541809082, 0.00028295814990997314, 0.00033652782440185547, 0.0003900974988937378, 0.0004436671733856201, 0.0004972368478775024, 0.0005508065223693848, 0.0006043761968612671, 0.0006579458713531494, 0.0007115155458450317, 0.0007650852203369141, 0.0008186548948287964, 0.0008722245693206787, 0.000925794243812561, 0.0009793639183044434, 0.0010329335927963257, 0.001086503267288208, 0.0011400729417800903, 0.0011936426162719727, 0.001247212290763855, 0.0013007819652557373, 0.0013543516397476196, 0.001407921314239502, 0.0014614909887313843, 0.0015150606632232666, 0.001568630337715149, 0.0016222000122070312]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 5.0, 9.0, 6.0, 3.0, 9.0, 10.0, 4.0, 12.0, 21.0, 31.0, 46.0, 78.0, 87.0, 123.0, 188.0, 325.0, 622.0, 3442.0, 1014472.0, 27127.0, 862.0, 350.0, 221.0, 139.0, 86.0, 62.0, 48.0, 36.0, 27.0, 29.0, 12.0, 4.0, 9.0, 3.0, 6.0, 8.0, 3.0, 6.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0281524658203125, -0.027170896530151367, -0.026189327239990234, -0.0252077579498291, -0.02422618865966797, -0.023244619369506836, -0.022263050079345703, -0.02128148078918457, -0.020299911499023438, -0.019318342208862305, -0.018336772918701172, -0.01735520362854004, -0.016373634338378906, -0.015392065048217773, -0.01441049575805664, -0.013428926467895508, -0.012447357177734375, -0.011465787887573242, -0.01048421859741211, -0.009502649307250977, -0.008521080017089844, -0.007539510726928711, -0.006557941436767578, -0.005576372146606445, -0.0045948028564453125, -0.0036132335662841797, -0.002631664276123047, -0.001650094985961914, -0.0006685256958007812, 0.00031304359436035156, 0.0012946128845214844, 0.002276182174682617, 0.00325775146484375, 0.004239320755004883, 0.005220890045166016, 0.0062024593353271484, 0.007184028625488281, 0.008165597915649414, 0.009147167205810547, 0.01012873649597168, 0.011110305786132812, 0.012091875076293945, 0.013073444366455078, 0.014055013656616211, 0.015036582946777344, 0.016018152236938477, 0.01699972152709961, 0.017981290817260742, 0.018962860107421875, 0.019944429397583008, 0.02092599868774414, 0.021907567977905273, 0.022889137268066406, 0.02387070655822754, 0.024852275848388672, 0.025833845138549805, 0.026815414428710938, 0.02779698371887207, 0.028778553009033203, 0.029760122299194336, 0.03074169158935547, 0.0317232608795166, 0.032704830169677734, 0.03368639945983887, 0.03466796875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 34.0, 964.0, 20.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.022569013759493828, -0.022176243364810944, -0.02178347110748291, -0.021390700712800026, -0.02099793031811714, -0.02060515806078911, -0.020212387666106224, -0.01981961727142334, -0.019426845014095306, -0.019034074619412422, -0.01864130236208439, -0.018248531967401505, -0.01785576157271862, -0.017462989315390587, -0.017070218920707703, -0.01667744852602482, -0.016284678131341934, -0.01589190773665905, -0.015499136410653591, -0.015106365084648132, -0.014713593758642673, -0.01432082336395979, -0.01392805203795433, -0.013535281643271446, -0.013142509385943413, -0.012749738059937954, -0.01235696766525507, -0.011964196339249611, -0.011571425013244152, -0.011178654618561268, -0.010785883292555809, -0.010393112897872925, -0.010000341571867466, -0.009607570245862007, -0.009214799851179123, -0.008822028525173664, -0.008429257199168205, -0.008036486804485321, -0.007643715478479862, -0.007250944618135691, -0.006858173292130232, -0.00646540243178606, -0.0060726311057806015, -0.00567986024543643, -0.0052870893850922585, -0.0048943180590868, -0.004501547198742628, -0.004108776338398457, -0.0037160052452236414, -0.0033232341520488262, -0.0029304632917046547, -0.0025376921985298395, -0.0021449211053550243, -0.0017521502450108528, -0.0013593791518360376, -0.0009666082914918661, -0.0005738371983170509, -0.00018106619245372713, 0.00021170481340959668, 0.000604475848376751, 0.0009972468251362443, 0.0013900178018957376, 0.0017827888950705528, 0.0021755597554147243, 0.0025683308485895395]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 10.0, 8.0, 9.0, 14.0, 15.0, 18.0, 24.0, 24.0, 27.0, 27.0, 37.0, 47.0, 47.0, 49.0, 61.0, 55.0, 54.0, 55.0, 45.0, 50.0, 46.0, 51.0, 42.0, 36.0, 35.0, 16.0, 19.0, 18.0, 15.0, 13.0, 8.0, 12.0, 2.0, 6.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007165670394897461, -0.0006863139569759369, -0.0006560608744621277, -0.0006258077919483185, -0.0005955547094345093, -0.0005653016269207001, -0.0005350485444068909, -0.0005047954618930817, -0.00047454237937927246, -0.00044428929686546326, -0.00041403621435165405, -0.00038378313183784485, -0.00035353004932403564, -0.00032327696681022644, -0.00029302388429641724, -0.00026277080178260803, -0.00023251771926879883, -0.00020226463675498962, -0.00017201155424118042, -0.00014175847172737122, -0.00011150538921356201, -8.125230669975281e-05, -5.0999224185943604e-05, -2.07461416721344e-05, 9.506940841674805e-06, 3.976002335548401e-05, 7.001310586929321e-05, 0.00010026618838310242, 0.00013051927089691162, 0.00016077235341072083, 0.00019102543592453003, 0.00022127851843833923, 0.00025153160095214844, 0.00028178468346595764, 0.00031203776597976685, 0.00034229084849357605, 0.00037254393100738525, 0.00040279701352119446, 0.00043305009603500366, 0.00046330317854881287, 0.0004935562610626221, 0.0005238093435764313, 0.0005540624260902405, 0.0005843155086040497, 0.0006145685911178589, 0.0006448216736316681, 0.0006750747561454773, 0.0007053278386592865, 0.0007355809211730957, 0.0007658340036869049, 0.0007960870862007141, 0.0008263401687145233, 0.0008565932512283325, 0.0008868463337421417, 0.0009170994162559509, 0.0009473524987697601, 0.0009776055812835693, 0.0010078586637973785, 0.0010381117463111877, 0.001068364828824997, 0.0010986179113388062, 0.0011288709938526154, 0.0011591240763664246, 0.0011893771588802338, 0.001219630241394043]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 6.0, 8.0, 2.0, 9.0, 11.0, 10.0, 19.0, 11.0, 19.0, 22.0, 16.0, 18.0, 30.0, 26.0, 32.0, 28.0, 27.0, 49.0, 28.0, 36.0, 48.0, 46.0, 44.0, 41.0, 39.0, 34.0, 46.0, 29.0, 32.0, 26.0, 26.0, 22.0, 24.0, 27.0, 21.0, 25.0, 12.0, 13.0, 10.0, 6.0, 6.0, 5.0, 4.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 4.0], "bins": [-3.931640625, -3.819183349609375, -3.70672607421875, -3.594268798828125, -3.4818115234375, -3.369354248046875, -3.25689697265625, -3.144439697265625, -3.031982421875, -2.919525146484375, -2.80706787109375, -2.694610595703125, -2.5821533203125, -2.469696044921875, -2.35723876953125, -2.244781494140625, -2.13232421875, -2.019866943359375, -1.90740966796875, -1.794952392578125, -1.6824951171875, -1.570037841796875, -1.45758056640625, -1.345123291015625, -1.232666015625, -1.120208740234375, -1.00775146484375, -0.895294189453125, -0.7828369140625, -0.670379638671875, -0.55792236328125, -0.445465087890625, -0.3330078125, -0.220550537109375, -0.10809326171875, 0.004364013671875, 0.1168212890625, 0.229278564453125, 0.34173583984375, 0.454193115234375, 0.566650390625, 0.679107666015625, 0.79156494140625, 0.904022216796875, 1.0164794921875, 1.128936767578125, 1.24139404296875, 1.353851318359375, 1.46630859375, 1.578765869140625, 1.69122314453125, 1.803680419921875, 1.9161376953125, 2.028594970703125, 2.14105224609375, 2.253509521484375, 2.365966796875, 2.478424072265625, 2.59088134765625, 2.703338623046875, 2.8157958984375, 2.928253173828125, 3.04071044921875, 3.153167724609375, 3.265625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 5.0, 10.0, 4.0, 5.0, 6.0, 8.0, 19.0, 22.0, 30.0, 38.0, 52.0, 91.0, 109.0, 112.0, 198.0, 226.0, 370.0, 602.0, 881.0, 1691.0, 3680.0, 9505.0, 28119.0, 88644.0, 253098.0, 374371.0, 190155.0, 62864.0, 19993.0, 6944.0, 2870.0, 1372.0, 808.0, 480.0, 293.0, 237.0, 169.0, 120.0, 91.0, 68.0, 58.0, 33.0, 27.0, 26.0, 16.0, 16.0, 10.0, 8.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3828125, -4.22821044921875, -4.0736083984375, -3.91900634765625, -3.764404296875, -3.60980224609375, -3.4552001953125, -3.30059814453125, -3.14599609375, -2.99139404296875, -2.8367919921875, -2.68218994140625, -2.527587890625, -2.37298583984375, -2.2183837890625, -2.06378173828125, -1.9091796875, -1.75457763671875, -1.5999755859375, -1.44537353515625, -1.290771484375, -1.13616943359375, -0.9815673828125, -0.82696533203125, -0.67236328125, -0.51776123046875, -0.3631591796875, -0.20855712890625, -0.053955078125, 0.10064697265625, 0.2552490234375, 0.40985107421875, 0.564453125, 0.71905517578125, 0.8736572265625, 1.02825927734375, 1.182861328125, 1.33746337890625, 1.4920654296875, 1.64666748046875, 1.80126953125, 1.95587158203125, 2.1104736328125, 2.26507568359375, 2.419677734375, 2.57427978515625, 2.7288818359375, 2.88348388671875, 3.0380859375, 3.19268798828125, 3.3472900390625, 3.50189208984375, 3.656494140625, 3.81109619140625, 3.9656982421875, 4.12030029296875, 4.27490234375, 4.42950439453125, 4.5841064453125, 4.73870849609375, 4.893310546875, 5.04791259765625, 5.2025146484375, 5.35711669921875, 5.51171875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 5.0, 5.0, 9.0, 17.0, 10.0, 18.0, 11.0, 16.0, 25.0, 27.0, 30.0, 40.0, 50.0, 46.0, 70.0, 91.0, 131.0, 267.0, 1384.0, 223.0, 122.0, 86.0, 55.0, 45.0, 42.0, 35.0, 31.0, 36.0, 18.0, 24.0, 14.0, 15.0, 8.0, 11.0, 8.0, 16.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.1875, -9.85107421875, -9.5146484375, -9.17822265625, -8.841796875, -8.50537109375, -8.1689453125, -7.83251953125, -7.49609375, -7.15966796875, -6.8232421875, -6.48681640625, -6.150390625, -5.81396484375, -5.4775390625, -5.14111328125, -4.8046875, -4.46826171875, -4.1318359375, -3.79541015625, -3.458984375, -3.12255859375, -2.7861328125, -2.44970703125, -2.11328125, -1.77685546875, -1.4404296875, -1.10400390625, -0.767578125, -0.43115234375, -0.0947265625, 0.24169921875, 0.578125, 0.91455078125, 1.2509765625, 1.58740234375, 1.923828125, 2.26025390625, 2.5966796875, 2.93310546875, 3.26953125, 3.60595703125, 3.9423828125, 4.27880859375, 4.615234375, 4.95166015625, 5.2880859375, 5.62451171875, 5.9609375, 6.29736328125, 6.6337890625, 6.97021484375, 7.306640625, 7.64306640625, 7.9794921875, 8.31591796875, 8.65234375, 8.98876953125, 9.3251953125, 9.66162109375, 9.998046875, 10.33447265625, 10.6708984375, 11.00732421875, 11.34375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 4.0, 4.0, 7.0, 12.0, 13.0, 16.0, 16.0, 22.0, 39.0, 43.0, 52.0, 87.0, 93.0, 131.0, 208.0, 307.0, 455.0, 816.0, 1640.0, 14688.0, 2214064.0, 900653.0, 8863.0, 1447.0, 649.0, 395.0, 272.0, 185.0, 129.0, 90.0, 81.0, 57.0, 48.0, 27.0, 29.0, 17.0, 14.0, 9.0, 1.0, 6.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-21.6875, -21.083740234375, -20.47998046875, -19.876220703125, -19.2724609375, -18.668701171875, -18.06494140625, -17.461181640625, -16.857421875, -16.253662109375, -15.64990234375, -15.046142578125, -14.4423828125, -13.838623046875, -13.23486328125, -12.631103515625, -12.02734375, -11.423583984375, -10.81982421875, -10.216064453125, -9.6123046875, -9.008544921875, -8.40478515625, -7.801025390625, -7.197265625, -6.593505859375, -5.98974609375, -5.385986328125, -4.7822265625, -4.178466796875, -3.57470703125, -2.970947265625, -2.3671875, -1.763427734375, -1.15966796875, -0.555908203125, 0.0478515625, 0.651611328125, 1.25537109375, 1.859130859375, 2.462890625, 3.066650390625, 3.67041015625, 4.274169921875, 4.8779296875, 5.481689453125, 6.08544921875, 6.689208984375, 7.29296875, 7.896728515625, 8.50048828125, 9.104248046875, 9.7080078125, 10.311767578125, 10.91552734375, 11.519287109375, 12.123046875, 12.726806640625, 13.33056640625, 13.934326171875, 14.5380859375, 15.141845703125, 15.74560546875, 16.349365234375, 16.953125]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [5.0, 24.0, 87.0, 299.0, 373.0, 176.0, 42.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.076804161071777, -4.662458896636963, -3.2481138706207275, -1.8337688446044922, -0.41942358016967773, 0.9949216842651367, 2.409266471862793, 3.8236122131347656, 5.237957000732422, 6.652302265167236, 8.06664752960205, 9.480992317199707, 10.89533805847168, 12.309682846069336, 13.724027633666992, 15.138373374938965, 16.552719116210938, 17.967063903808594, 19.38140869140625, 20.795753479003906, 22.210100173950195, 23.62444496154785, 25.038789749145508, 26.453136444091797, 27.86747932434082, 29.281824111938477, 30.696168899536133, 32.11051559448242, 33.52486038208008, 34.939205169677734, 36.35354995727539, 37.76789474487305, 39.1822395324707, 40.59658432006836, 42.010929107666016, 43.42527389526367, 44.83961868286133, 46.25396728515625, 47.668312072753906, 49.08265686035156, 50.49700164794922, 51.911346435546875, 53.32569122314453, 54.74003601074219, 56.154380798339844, 57.5687255859375, 58.983070373535156, 60.39741897583008, 61.81175994873047, 63.226104736328125, 64.64044952392578, 66.05479431152344, 67.4691390991211, 68.88348388671875, 70.2978286743164, 71.71217346191406, 73.12652587890625, 74.5408706665039, 75.95521545410156, 77.36956024169922, 78.78390502929688, 80.19824981689453, 81.61259460449219, 83.02693939208984, 84.4412841796875]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 7.0, 6.0, 12.0, 15.0, 11.0, 10.0, 14.0, 24.0, 21.0, 24.0, 26.0, 34.0, 33.0, 32.0, 39.0, 41.0, 48.0, 45.0, 41.0, 51.0, 40.0, 39.0, 39.0, 45.0, 29.0, 30.0, 29.0, 26.0, 32.0, 34.0, 18.0, 21.0, 16.0, 13.0, 13.0, 13.0, 11.0, 6.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.459896087646484, -18.735986709594727, -18.01207733154297, -17.288166046142578, -16.56425666809082, -15.840347290039062, -15.116437911987305, -14.392528533935547, -13.668618202209473, -12.944708824157715, -12.22079849243164, -11.496889114379883, -10.772979736328125, -10.04906940460205, -9.325160026550293, -8.601249694824219, -7.877340316772461, -7.153430461883545, -6.429520606994629, -5.705611228942871, -4.981701374053955, -4.257791519165039, -3.5338821411132812, -2.8099722862243652, -2.086062431335449, -1.3621526956558228, -0.6382429599761963, 0.08566665649414062, 0.8095765113830566, 1.5334863662719727, 2.2573957443237305, 2.9813055992126465, 3.7052154541015625, 4.4291253089904785, 5.1530351638793945, 5.876944541931152, 6.600854396820068, 7.324764251708984, 8.048673629760742, 8.7725830078125, 9.496493339538574, 10.220402717590332, 10.944313049316406, 11.668222427368164, 12.392131805419922, 13.116042137145996, 13.839951515197754, 14.563861846923828, 15.287771224975586, 16.011680603027344, 16.7355899810791, 17.45949935913086, 18.18341064453125, 18.907320022583008, 19.631229400634766, 20.355138778686523, 21.07904815673828, 21.80295753479004, 22.526866912841797, 23.250778198242188, 23.974687576293945, 24.698596954345703, 25.42250633239746, 26.14641571044922, 26.87032699584961]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 6.0, 7.0, 8.0, 9.0, 6.0, 9.0, 12.0, 14.0, 18.0, 24.0, 30.0, 21.0, 22.0, 27.0, 27.0, 26.0, 39.0, 35.0, 47.0, 45.0, 46.0, 40.0, 36.0, 33.0, 41.0, 36.0, 40.0, 30.0, 35.0, 33.0, 34.0, 31.0, 20.0, 18.0, 20.0, 12.0, 7.0, 13.0, 11.0, 8.0, 4.0, 8.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.7734375, -3.66082763671875, -3.5482177734375, -3.43560791015625, -3.322998046875, -3.21038818359375, -3.0977783203125, -2.98516845703125, -2.87255859375, -2.75994873046875, -2.6473388671875, -2.53472900390625, -2.422119140625, -2.30950927734375, -2.1968994140625, -2.08428955078125, -1.9716796875, -1.85906982421875, -1.7464599609375, -1.63385009765625, -1.521240234375, -1.40863037109375, -1.2960205078125, -1.18341064453125, -1.07080078125, -0.95819091796875, -0.8455810546875, -0.73297119140625, -0.620361328125, -0.50775146484375, -0.3951416015625, -0.28253173828125, -0.169921875, -0.05731201171875, 0.0552978515625, 0.16790771484375, 0.280517578125, 0.39312744140625, 0.5057373046875, 0.61834716796875, 0.73095703125, 0.84356689453125, 0.9561767578125, 1.06878662109375, 1.181396484375, 1.29400634765625, 1.4066162109375, 1.51922607421875, 1.6318359375, 1.74444580078125, 1.8570556640625, 1.96966552734375, 2.082275390625, 2.19488525390625, 2.3074951171875, 2.42010498046875, 2.53271484375, 2.64532470703125, 2.7579345703125, 2.87054443359375, 2.983154296875, 3.09576416015625, 3.2083740234375, 3.32098388671875, 3.43359375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 7.0, 14.0, 7.0, 5.0, 10.0, 19.0, 19.0, 23.0, 34.0, 37.0, 34.0, 51.0, 82.0, 110.0, 139.0, 177.0, 257.0, 305.0, 398.0, 2056.0, 3478874.0, 709041.0, 977.0, 353.0, 306.0, 236.0, 141.0, 139.0, 104.0, 65.0, 37.0, 42.0, 48.0, 33.0, 18.0, 17.0, 11.0, 8.0, 8.0, 9.0, 9.0, 7.0, 5.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.203125, -28.155517578125, -27.10791015625, -26.060302734375, -25.0126953125, -23.965087890625, -22.91748046875, -21.869873046875, -20.822265625, -19.774658203125, -18.72705078125, -17.679443359375, -16.6318359375, -15.584228515625, -14.53662109375, -13.489013671875, -12.44140625, -11.393798828125, -10.34619140625, -9.298583984375, -8.2509765625, -7.203369140625, -6.15576171875, -5.108154296875, -4.060546875, -3.012939453125, -1.96533203125, -0.917724609375, 0.1298828125, 1.177490234375, 2.22509765625, 3.272705078125, 4.3203125, 5.367919921875, 6.41552734375, 7.463134765625, 8.5107421875, 9.558349609375, 10.60595703125, 11.653564453125, 12.701171875, 13.748779296875, 14.79638671875, 15.843994140625, 16.8916015625, 17.939208984375, 18.98681640625, 20.034423828125, 21.08203125, 22.129638671875, 23.17724609375, 24.224853515625, 25.2724609375, 26.320068359375, 27.36767578125, 28.415283203125, 29.462890625, 30.510498046875, 31.55810546875, 32.605712890625, 33.6533203125, 34.700927734375, 35.74853515625, 36.796142578125, 37.84375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 5.0, 8.0, 8.0, 7.0, 19.0, 19.0, 31.0, 26.0, 52.0, 64.0, 81.0, 120.0, 183.0, 270.0, 324.0, 451.0, 536.0, 516.0, 343.0, 272.0, 178.0, 152.0, 101.0, 77.0, 61.0, 44.0, 31.0, 13.0, 17.0, 18.0, 13.0, 11.0, 10.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.61328125, -4.4337158203125, -4.254150390625, -4.0745849609375, -3.89501953125, -3.7154541015625, -3.535888671875, -3.3563232421875, -3.1767578125, -2.9971923828125, -2.817626953125, -2.6380615234375, -2.45849609375, -2.2789306640625, -2.099365234375, -1.9197998046875, -1.740234375, -1.5606689453125, -1.381103515625, -1.2015380859375, -1.02197265625, -0.8424072265625, -0.662841796875, -0.4832763671875, -0.3037109375, -0.1241455078125, 0.055419921875, 0.2349853515625, 0.41455078125, 0.5941162109375, 0.773681640625, 0.9532470703125, 1.1328125, 1.3123779296875, 1.491943359375, 1.6715087890625, 1.85107421875, 2.0306396484375, 2.210205078125, 2.3897705078125, 2.5693359375, 2.7489013671875, 2.928466796875, 3.1080322265625, 3.28759765625, 3.4671630859375, 3.646728515625, 3.8262939453125, 4.005859375, 4.1854248046875, 4.364990234375, 4.5445556640625, 4.72412109375, 4.9036865234375, 5.083251953125, 5.2628173828125, 5.4423828125, 5.6219482421875, 5.801513671875, 5.9810791015625, 6.16064453125, 6.3402099609375, 6.519775390625, 6.6993408203125, 6.87890625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 3.0, 6.0, 9.0, 15.0, 20.0, 27.0, 33.0, 49.0, 71.0, 113.0, 224.0, 537.0, 3630.0, 321413.0, 3832417.0, 33664.0, 1268.0, 335.0, 150.0, 68.0, 55.0, 30.0, 37.0, 23.0, 14.0, 20.0, 9.0, 10.0, 7.0, 2.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.71875, -24.968505859375, -24.21826171875, -23.468017578125, -22.7177734375, -21.967529296875, -21.21728515625, -20.467041015625, -19.716796875, -18.966552734375, -18.21630859375, -17.466064453125, -16.7158203125, -15.965576171875, -15.21533203125, -14.465087890625, -13.71484375, -12.964599609375, -12.21435546875, -11.464111328125, -10.7138671875, -9.963623046875, -9.21337890625, -8.463134765625, -7.712890625, -6.962646484375, -6.21240234375, -5.462158203125, -4.7119140625, -3.961669921875, -3.21142578125, -2.461181640625, -1.7109375, -0.960693359375, -0.21044921875, 0.539794921875, 1.2900390625, 2.040283203125, 2.79052734375, 3.540771484375, 4.291015625, 5.041259765625, 5.79150390625, 6.541748046875, 7.2919921875, 8.042236328125, 8.79248046875, 9.542724609375, 10.29296875, 11.043212890625, 11.79345703125, 12.543701171875, 13.2939453125, 14.044189453125, 14.79443359375, 15.544677734375, 16.294921875, 17.045166015625, 17.79541015625, 18.545654296875, 19.2958984375, 20.046142578125, 20.79638671875, 21.546630859375, 22.296875]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 10.0, 77.0, 442.0, 407.0, 75.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-131.29013061523438, -128.30751037597656, -125.32489013671875, -122.34226989746094, -119.35964965820312, -116.37702941894531, -113.3944091796875, -110.41178894042969, -107.42916870117188, -104.44654846191406, -101.46392822265625, -98.48130798339844, -95.49868774414062, -92.51606750488281, -89.533447265625, -86.55082702636719, -83.5682144165039, -80.5855941772461, -77.60297393798828, -74.62035369873047, -71.63773345947266, -68.65511322021484, -65.67250061035156, -62.689876556396484, -59.70725631713867, -56.72463607788086, -53.74201583862305, -50.7593994140625, -47.77677917480469, -44.794158935546875, -41.81153869628906, -38.82891845703125, -35.84629821777344, -32.863677978515625, -29.881057739257812, -26.898439407348633, -23.91581916809082, -20.933198928833008, -17.950580596923828, -14.967960357666016, -11.985340118408203, -9.00271987915039, -6.0201005935668945, -3.0374813079833984, -0.05486106872558594, 2.9277591705322266, 5.910377502441406, 8.892997741699219, 11.875617980957031, 14.858238220214844, 17.840858459472656, 20.823476791381836, 23.80609703063965, 26.78871726989746, 29.77133560180664, 32.75395584106445, 35.736576080322266, 38.71919631958008, 41.70181655883789, 44.68443298339844, 47.66705322265625, 50.64967346191406, 53.632293701171875, 56.61491394042969, 59.5975341796875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 12.0, 10.0, 8.0, 12.0, 7.0, 15.0, 16.0, 22.0, 22.0, 25.0, 29.0, 37.0, 38.0, 43.0, 41.0, 49.0, 48.0, 57.0, 37.0, 44.0, 42.0, 43.0, 51.0, 37.0, 40.0, 31.0, 34.0, 17.0, 18.0, 22.0, 20.0, 20.0, 9.0, 5.0, 10.0, 9.0, 2.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.43429183959961, -19.788476943969727, -19.142662048339844, -18.49684715270996, -17.851032257080078, -17.205215454101562, -16.55940055847168, -15.913585662841797, -15.267770767211914, -14.621955871582031, -13.976140975952148, -13.33032512664795, -12.684510231018066, -12.038695335388184, -11.392879486083984, -10.747064590454102, -10.101249694824219, -9.455434799194336, -8.809619903564453, -8.163804054260254, -7.517989158630371, -6.872174263000488, -6.226358890533447, -5.580543518066406, -4.934728622436523, -4.288913726806641, -3.6430983543395996, -2.9972832202911377, -2.351468086242676, -1.7056529521942139, -1.059837818145752, -0.41402244567871094, 0.2317943572998047, 0.8776094913482666, 1.5234246253967285, 2.1692397594451904, 2.8150548934936523, 3.4608700275421143, 4.106685161590576, 4.752500534057617, 5.3983154296875, 6.044130325317383, 6.689945697784424, 7.335761070251465, 7.981575965881348, 8.62739086151123, 9.27320671081543, 9.919021606445312, 10.564836502075195, 11.210651397705078, 11.856466293334961, 12.50228214263916, 13.148097038269043, 13.793911933898926, 14.439727783203125, 15.085542678833008, 15.73135757446289, 16.377172470092773, 17.022987365722656, 17.66880226135254, 18.314617156982422, 18.960433959960938, 19.60624885559082, 20.252063751220703, 20.897878646850586]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 8.0, 12.0, 9.0, 12.0, 16.0, 25.0, 21.0, 26.0, 28.0, 33.0, 29.0, 34.0, 25.0, 41.0, 40.0, 41.0, 46.0, 44.0, 43.0, 59.0, 40.0, 38.0, 32.0, 42.0, 25.0, 37.0, 39.0, 31.0, 15.0, 7.0, 21.0, 10.0, 15.0, 5.0, 6.0, 5.0, 4.0, 9.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.80859375, -3.695465087890625, -3.58233642578125, -3.469207763671875, -3.3560791015625, -3.242950439453125, -3.12982177734375, -3.016693115234375, -2.903564453125, -2.790435791015625, -2.67730712890625, -2.564178466796875, -2.4510498046875, -2.337921142578125, -2.22479248046875, -2.111663818359375, -1.99853515625, -1.885406494140625, -1.77227783203125, -1.659149169921875, -1.5460205078125, -1.432891845703125, -1.31976318359375, -1.206634521484375, -1.093505859375, -0.980377197265625, -0.86724853515625, -0.754119873046875, -0.6409912109375, -0.527862548828125, -0.41473388671875, -0.301605224609375, -0.1884765625, -0.075347900390625, 0.03778076171875, 0.150909423828125, 0.2640380859375, 0.377166748046875, 0.49029541015625, 0.603424072265625, 0.716552734375, 0.829681396484375, 0.94281005859375, 1.055938720703125, 1.1690673828125, 1.282196044921875, 1.39532470703125, 1.508453369140625, 1.62158203125, 1.734710693359375, 1.84783935546875, 1.960968017578125, 2.0740966796875, 2.187225341796875, 2.30035400390625, 2.413482666015625, 2.526611328125, 2.639739990234375, 2.75286865234375, 2.865997314453125, 2.9791259765625, 3.092254638671875, 3.20538330078125, 3.318511962890625, 3.431640625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 8.0, 10.0, 8.0, 9.0, 30.0, 39.0, 67.0, 88.0, 124.0, 188.0, 295.0, 385.0, 620.0, 817.0, 1237.0, 1815.0, 2569.0, 3780.0, 5494.0, 8141.0, 12232.0, 18936.0, 29631.0, 48111.0, 81166.0, 140437.0, 220015.0, 187181.0, 110483.0, 64327.0, 38628.0, 24286.0, 15310.0, 10251.0, 6876.0, 4626.0, 3180.0, 2167.0, 1513.0, 1044.0, 745.0, 549.0, 336.0, 254.0, 159.0, 140.0, 87.0, 49.0, 40.0, 19.0, 26.0, 16.0, 9.0, 5.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.34716796875, -0.33551025390625, -0.3238525390625, -0.31219482421875, -0.300537109375, -0.28887939453125, -0.2772216796875, -0.26556396484375, -0.25390625, -0.24224853515625, -0.2305908203125, -0.21893310546875, -0.207275390625, -0.19561767578125, -0.1839599609375, -0.17230224609375, -0.16064453125, -0.14898681640625, -0.1373291015625, -0.12567138671875, -0.114013671875, -0.10235595703125, -0.0906982421875, -0.07904052734375, -0.0673828125, -0.05572509765625, -0.0440673828125, -0.03240966796875, -0.020751953125, -0.00909423828125, 0.0025634765625, 0.01422119140625, 0.02587890625, 0.03753662109375, 0.0491943359375, 0.06085205078125, 0.072509765625, 0.08416748046875, 0.0958251953125, 0.10748291015625, 0.119140625, 0.13079833984375, 0.1424560546875, 0.15411376953125, 0.165771484375, 0.17742919921875, 0.1890869140625, 0.20074462890625, 0.21240234375, 0.22406005859375, 0.2357177734375, 0.24737548828125, 0.259033203125, 0.27069091796875, 0.2823486328125, 0.29400634765625, 0.3056640625, 0.31732177734375, 0.3289794921875, 0.34063720703125, 0.352294921875, 0.36395263671875, 0.3756103515625, 0.38726806640625, 0.39892578125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 6.0, 2.0, 4.0, 3.0, 8.0, 10.0, 11.0, 9.0, 18.0, 15.0, 18.0, 30.0, 21.0, 24.0, 36.0, 29.0, 32.0, 34.0, 28.0, 41.0, 60.0, 49.0, 1056.0, 49.0, 37.0, 41.0, 43.0, 21.0, 28.0, 39.0, 33.0, 32.0, 28.0, 7.0, 25.0, 16.0, 15.0, 12.0, 8.0, 17.0, 9.0, 7.0, 3.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.19921875, -2.12896728515625, -2.0587158203125, -1.98846435546875, -1.918212890625, -1.84796142578125, -1.7777099609375, -1.70745849609375, -1.63720703125, -1.56695556640625, -1.4967041015625, -1.42645263671875, -1.356201171875, -1.28594970703125, -1.2156982421875, -1.14544677734375, -1.0751953125, -1.00494384765625, -0.9346923828125, -0.86444091796875, -0.794189453125, -0.72393798828125, -0.6536865234375, -0.58343505859375, -0.51318359375, -0.44293212890625, -0.3726806640625, -0.30242919921875, -0.232177734375, -0.16192626953125, -0.0916748046875, -0.02142333984375, 0.048828125, 0.11907958984375, 0.1893310546875, 0.25958251953125, 0.329833984375, 0.40008544921875, 0.4703369140625, 0.54058837890625, 0.61083984375, 0.68109130859375, 0.7513427734375, 0.82159423828125, 0.891845703125, 0.96209716796875, 1.0323486328125, 1.10260009765625, 1.1728515625, 1.24310302734375, 1.3133544921875, 1.38360595703125, 1.453857421875, 1.52410888671875, 1.5943603515625, 1.66461181640625, 1.73486328125, 1.80511474609375, 1.8753662109375, 1.94561767578125, 2.015869140625, 2.08612060546875, 2.1563720703125, 2.22662353515625, 2.296875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 9.0, 6.0, 12.0, 25.0, 24.0, 45.0, 62.0, 83.0, 125.0, 163.0, 253.0, 339.0, 507.0, 770.0, 1094.0, 1448.0, 2148.0, 3190.0, 4640.0, 6966.0, 10436.0, 15590.0, 24344.0, 38033.0, 61305.0, 99602.0, 160775.0, 1253228.0, 153178.0, 94840.0, 58552.0, 36414.0, 22974.0, 15127.0, 9871.0, 6435.0, 4345.0, 3134.0, 2087.0, 1443.0, 1007.0, 727.0, 537.0, 367.0, 264.0, 181.0, 141.0, 90.0, 76.0, 45.0, 23.0, 16.0, 19.0, 11.0, 8.0, 1.0, 3.0, 3.0, 1.0, 2.0], "bins": [-0.2939453125, -0.28459930419921875, -0.2752532958984375, -0.26590728759765625, -0.256561279296875, -0.24721527099609375, -0.2378692626953125, -0.22852325439453125, -0.21917724609375, -0.20983123779296875, -0.2004852294921875, -0.19113922119140625, -0.181793212890625, -0.17244720458984375, -0.1631011962890625, -0.15375518798828125, -0.1444091796875, -0.13506317138671875, -0.1257171630859375, -0.11637115478515625, -0.107025146484375, -0.09767913818359375, -0.0883331298828125, -0.07898712158203125, -0.06964111328125, -0.06029510498046875, -0.0509490966796875, -0.04160308837890625, -0.032257080078125, -0.02291107177734375, -0.0135650634765625, -0.00421905517578125, 0.005126953125, 0.01447296142578125, 0.0238189697265625, 0.03316497802734375, 0.042510986328125, 0.05185699462890625, 0.0612030029296875, 0.07054901123046875, 0.07989501953125, 0.08924102783203125, 0.0985870361328125, 0.10793304443359375, 0.117279052734375, 0.12662506103515625, 0.1359710693359375, 0.14531707763671875, 0.1546630859375, 0.16400909423828125, 0.1733551025390625, 0.18270111083984375, 0.192047119140625, 0.20139312744140625, 0.2107391357421875, 0.22008514404296875, 0.22943115234375, 0.23877716064453125, 0.2481231689453125, 0.25746917724609375, 0.266815185546875, 0.27616119384765625, 0.2855072021484375, 0.29485321044921875, 0.30419921875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 7.0, 7.0, 6.0, 13.0, 9.0, 9.0, 21.0, 9.0, 30.0, 32.0, 51.0, 57.0, 53.0, 86.0, 110.0, 85.0, 79.0, 96.0, 43.0, 41.0, 30.0, 31.0, 19.0, 16.0, 6.0, 18.0, 10.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020904541015625, -0.0020271241664886475, -0.001963794231414795, -0.0019004642963409424, -0.0018371343612670898, -0.0017738044261932373, -0.0017104744911193848, -0.0016471445560455322, -0.0015838146209716797, -0.0015204846858978271, -0.0014571547508239746, -0.001393824815750122, -0.0013304948806762695, -0.001267164945602417, -0.0012038350105285645, -0.001140505075454712, -0.0010771751403808594, -0.0010138452053070068, -0.0009505152702331543, -0.0008871853351593018, -0.0008238554000854492, -0.0007605254650115967, -0.0006971955299377441, -0.0006338655948638916, -0.0005705356597900391, -0.0005072057247161865, -0.000443875789642334, -0.00038054585456848145, -0.0003172159194946289, -0.00025388598442077637, -0.00019055604934692383, -0.0001272261142730713, -6.389617919921875e-05, -5.662441253662109e-07, 6.276369094848633e-05, 0.00012609362602233887, 0.0001894235610961914, 0.00025275349617004395, 0.0003160834312438965, 0.000379413366317749, 0.00044274330139160156, 0.0005060732364654541, 0.0005694031715393066, 0.0006327331066131592, 0.0006960630416870117, 0.0007593929767608643, 0.0008227229118347168, 0.0008860528469085693, 0.0009493827819824219, 0.0010127127170562744, 0.001076042652130127, 0.0011393725872039795, 0.001202702522277832, 0.0012660324573516846, 0.0013293623924255371, 0.0013926923274993896, 0.0014560222625732422, 0.0015193521976470947, 0.0015826821327209473, 0.0016460120677947998, 0.0017093420028686523, 0.0017726719379425049, 0.0018360018730163574, 0.00189933180809021, 0.0019626617431640625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 12.0, 2.0, 4.0, 3.0, 6.0, 9.0, 11.0, 19.0, 29.0, 31.0, 31.0, 63.0, 74.0, 107.0, 164.0, 270.0, 583.0, 1673.0, 970045.0, 73236.0, 1006.0, 393.0, 258.0, 162.0, 89.0, 71.0, 36.0, 40.0, 30.0, 25.0, 16.0, 9.0, 17.0, 12.0, 6.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.036285400390625, -0.03510856628417969, -0.033931732177734375, -0.03275489807128906, -0.03157806396484375, -0.030401229858398438, -0.029224395751953125, -0.028047561645507812, -0.0268707275390625, -0.025693893432617188, -0.024517059326171875, -0.023340225219726562, -0.02216339111328125, -0.020986557006835938, -0.019809722900390625, -0.018632888793945312, -0.0174560546875, -0.016279220581054688, -0.015102386474609375, -0.013925552368164062, -0.01274871826171875, -0.011571884155273438, -0.010395050048828125, -0.009218215942382812, -0.0080413818359375, -0.0068645477294921875, -0.005687713623046875, -0.0045108795166015625, -0.00333404541015625, -0.0021572113037109375, -0.000980377197265625, 0.0001964569091796875, 0.001373291015625, 0.0025501251220703125, 0.003726959228515625, 0.0049037933349609375, 0.00608062744140625, 0.0072574615478515625, 0.008434295654296875, 0.009611129760742188, 0.0107879638671875, 0.011964797973632812, 0.013141632080078125, 0.014318466186523438, 0.01549530029296875, 0.016672134399414062, 0.017848968505859375, 0.019025802612304688, 0.02020263671875, 0.021379470825195312, 0.022556304931640625, 0.023733139038085938, 0.02490997314453125, 0.026086807250976562, 0.027263641357421875, 0.028440475463867188, 0.0296173095703125, 0.030794143676757812, 0.031970977783203125, 0.03314781188964844, 0.03432464599609375, 0.03550148010253906, 0.036678314208984375, 0.03785514831542969, 0.039031982421875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 15.0, 70.0, 248.0, 370.0, 215.0, 75.0, 11.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031177103519439697, -0.0030344061087816954, -0.002951101865619421, -0.0028677978552877903, -0.002784493612125516, -0.0027011893689632416, -0.002617885125800967, -0.002534580882638693, -0.002451276872307062, -0.002367972629144788, -0.0022846683859825134, -0.0022013643756508827, -0.0021180601324886084, -0.002034755889326334, -0.0019514516461640596, -0.0018681474030017853, -0.001784843159839511, -0.0017015389166772366, -0.001618234789930284, -0.0015349305467680097, -0.0014516264200210571, -0.0013683221768587828, -0.0012850179336965084, -0.001201713690534234, -0.0011184095637872815, -0.0010351053206250072, -0.0009518011938780546, -0.0008684969507157803, -0.0007851927657611668, -0.0007018885808065534, -0.000618584337644279, -0.0005352801526896656, -0.0004519759677350521, -0.00036867178278043866, -0.00028536756872199476, -0.00020206335466355085, -0.0001187591697089374, -3.545498475432396e-05, 4.78492584079504e-05, 0.00013115344336256385, 0.0002144576283171773, 0.00029776181327179074, 0.00038106602733023465, 0.00046437024138867855, 0.000547674426343292, 0.0006309786112979054, 0.0007142828544601798, 0.0007975870394147933, 0.0008808912243694067, 0.0009641954093240201, 0.0010474995942786336, 0.001130803837440908, 0.0012141079641878605, 0.0012974122073501348, 0.0013807164505124092, 0.0014640206936746836, 0.001547324820421636, 0.0016306290635839105, 0.001713933190330863, 0.0017972374334931374, 0.0018805416766554117, 0.001963845919817686, 0.002047149930149317, 0.002130454173311591, 0.0022137584164738655]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 7.0, 6.0, 5.0, 11.0, 11.0, 7.0, 9.0, 14.0, 16.0, 20.0, 26.0, 25.0, 34.0, 28.0, 40.0, 39.0, 43.0, 44.0, 43.0, 44.0, 41.0, 45.0, 43.0, 45.0, 36.0, 34.0, 42.0, 45.0, 35.0, 31.0, 17.0, 22.0, 19.0, 19.0, 14.0, 12.0, 6.0, 5.0, 6.0, 7.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008981227874755859, -0.0008695870637893677, -0.0008410513401031494, -0.0008125156164169312, -0.0007839798927307129, -0.0007554441690444946, -0.0007269084453582764, -0.0006983727216720581, -0.0006698369979858398, -0.0006413012742996216, -0.0006127655506134033, -0.0005842298269271851, -0.0005556941032409668, -0.0005271583795547485, -0.0004986226558685303, -0.000470086932182312, -0.00044155120849609375, -0.0004130154848098755, -0.0003844797611236572, -0.00035594403743743896, -0.0003274083137512207, -0.00029887259006500244, -0.0002703368663787842, -0.00024180114269256592, -0.00021326541900634766, -0.0001847296953201294, -0.00015619397163391113, -0.00012765824794769287, -9.912252426147461e-05, -7.058680057525635e-05, -4.2051076889038086e-05, -1.3515353202819824e-05, 1.5020370483398438e-05, 4.35560941696167e-05, 7.209181785583496e-05, 0.00010062754154205322, 0.00012916326522827148, 0.00015769898891448975, 0.000186234712600708, 0.00021477043628692627, 0.00024330615997314453, 0.0002718418836593628, 0.00030037760734558105, 0.0003289133310317993, 0.0003574490547180176, 0.00038598477840423584, 0.0004145205020904541, 0.00044305622577667236, 0.0004715919494628906, 0.0005001276731491089, 0.0005286633968353271, 0.0005571991205215454, 0.0005857348442077637, 0.0006142705678939819, 0.0006428062915802002, 0.0006713420152664185, 0.0006998777389526367, 0.000728413462638855, 0.0007569491863250732, 0.0007854849100112915, 0.0008140206336975098, 0.000842556357383728, 0.0008710920810699463, 0.0008996278047561646, 0.0009281635284423828]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 8.0, 12.0, 9.0, 12.0, 16.0, 25.0, 21.0, 26.0, 28.0, 33.0, 29.0, 34.0, 25.0, 41.0, 40.0, 41.0, 46.0, 44.0, 43.0, 59.0, 40.0, 38.0, 32.0, 42.0, 25.0, 37.0, 39.0, 31.0, 15.0, 7.0, 21.0, 10.0, 15.0, 5.0, 6.0, 5.0, 4.0, 9.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.80859375, -3.695465087890625, -3.58233642578125, -3.469207763671875, -3.3560791015625, -3.242950439453125, -3.12982177734375, -3.016693115234375, -2.903564453125, -2.790435791015625, -2.67730712890625, -2.564178466796875, -2.4510498046875, -2.337921142578125, -2.22479248046875, -2.111663818359375, -1.99853515625, -1.885406494140625, -1.77227783203125, -1.659149169921875, -1.5460205078125, -1.432891845703125, -1.31976318359375, -1.206634521484375, -1.093505859375, -0.980377197265625, -0.86724853515625, -0.754119873046875, -0.6409912109375, -0.527862548828125, -0.41473388671875, -0.301605224609375, -0.1884765625, -0.075347900390625, 0.03778076171875, 0.150909423828125, 0.2640380859375, 0.377166748046875, 0.49029541015625, 0.603424072265625, 0.716552734375, 0.829681396484375, 0.94281005859375, 1.055938720703125, 1.1690673828125, 1.282196044921875, 1.39532470703125, 1.508453369140625, 1.62158203125, 1.734710693359375, 1.84783935546875, 1.960968017578125, 2.0740966796875, 2.187225341796875, 2.30035400390625, 2.413482666015625, 2.526611328125, 2.639739990234375, 2.75286865234375, 2.865997314453125, 2.9791259765625, 3.092254638671875, 3.20538330078125, 3.318511962890625, 3.431640625]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 7.0, 9.0, 19.0, 29.0, 29.0, 47.0, 44.0, 69.0, 73.0, 102.0, 160.0, 202.0, 270.0, 323.0, 469.0, 643.0, 897.0, 1199.0, 1959.0, 5248.0, 28376.0, 163862.0, 534123.0, 250260.0, 44924.0, 7830.0, 2365.0, 1364.0, 909.0, 658.0, 516.0, 385.0, 298.0, 228.0, 169.0, 124.0, 91.0, 68.0, 55.0, 31.0, 23.0, 25.0, 19.0, 15.0, 8.0, 6.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0], "bins": [-7.01953125, -6.797607421875, -6.57568359375, -6.353759765625, -6.1318359375, -5.909912109375, -5.68798828125, -5.466064453125, -5.244140625, -5.022216796875, -4.80029296875, -4.578369140625, -4.3564453125, -4.134521484375, -3.91259765625, -3.690673828125, -3.46875, -3.246826171875, -3.02490234375, -2.802978515625, -2.5810546875, -2.359130859375, -2.13720703125, -1.915283203125, -1.693359375, -1.471435546875, -1.24951171875, -1.027587890625, -0.8056640625, -0.583740234375, -0.36181640625, -0.139892578125, 0.08203125, 0.303955078125, 0.52587890625, 0.747802734375, 0.9697265625, 1.191650390625, 1.41357421875, 1.635498046875, 1.857421875, 2.079345703125, 2.30126953125, 2.523193359375, 2.7451171875, 2.967041015625, 3.18896484375, 3.410888671875, 3.6328125, 3.854736328125, 4.07666015625, 4.298583984375, 4.5205078125, 4.742431640625, 4.96435546875, 5.186279296875, 5.408203125, 5.630126953125, 5.85205078125, 6.073974609375, 6.2958984375, 6.517822265625, 6.73974609375, 6.961669921875, 7.18359375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 7.0, 4.0, 4.0, 7.0, 10.0, 12.0, 17.0, 21.0, 32.0, 40.0, 35.0, 27.0, 47.0, 65.0, 53.0, 110.0, 186.0, 1353.0, 318.0, 172.0, 93.0, 82.0, 51.0, 37.0, 33.0, 24.0, 35.0, 35.0, 19.0, 26.0, 17.0, 17.0, 15.0, 6.0, 6.0, 13.0, 3.0, 6.0, 4.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.71875, -8.4461669921875, -8.173583984375, -7.9010009765625, -7.62841796875, -7.3558349609375, -7.083251953125, -6.8106689453125, -6.5380859375, -6.2655029296875, -5.992919921875, -5.7203369140625, -5.44775390625, -5.1751708984375, -4.902587890625, -4.6300048828125, -4.357421875, -4.0848388671875, -3.812255859375, -3.5396728515625, -3.26708984375, -2.9945068359375, -2.721923828125, -2.4493408203125, -2.1767578125, -1.9041748046875, -1.631591796875, -1.3590087890625, -1.08642578125, -0.8138427734375, -0.541259765625, -0.2686767578125, 0.00390625, 0.2764892578125, 0.549072265625, 0.8216552734375, 1.09423828125, 1.3668212890625, 1.639404296875, 1.9119873046875, 2.1845703125, 2.4571533203125, 2.729736328125, 3.0023193359375, 3.27490234375, 3.5474853515625, 3.820068359375, 4.0926513671875, 4.365234375, 4.6378173828125, 4.910400390625, 5.1829833984375, 5.45556640625, 5.7281494140625, 6.000732421875, 6.2733154296875, 6.5458984375, 6.8184814453125, 7.091064453125, 7.3636474609375, 7.63623046875, 7.9088134765625, 8.181396484375, 8.4539794921875, 8.7265625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 11.0, 2.0, 14.0, 10.0, 16.0, 19.0, 25.0, 28.0, 47.0, 57.0, 87.0, 107.0, 160.0, 242.0, 366.0, 645.0, 1253.0, 5115.0, 3129565.0, 4941.0, 1232.0, 619.0, 345.0, 229.0, 164.0, 114.0, 68.0, 62.0, 36.0, 30.0, 24.0, 14.0, 12.0, 12.0, 6.0, 7.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.75, -34.4951171875, -33.240234375, -31.9853515625, -30.73046875, -29.4755859375, -28.220703125, -26.9658203125, -25.7109375, -24.4560546875, -23.201171875, -21.9462890625, -20.69140625, -19.4365234375, -18.181640625, -16.9267578125, -15.671875, -14.4169921875, -13.162109375, -11.9072265625, -10.65234375, -9.3974609375, -8.142578125, -6.8876953125, -5.6328125, -4.3779296875, -3.123046875, -1.8681640625, -0.61328125, 0.6416015625, 1.896484375, 3.1513671875, 4.40625, 5.6611328125, 6.916015625, 8.1708984375, 9.42578125, 10.6806640625, 11.935546875, 13.1904296875, 14.4453125, 15.7001953125, 16.955078125, 18.2099609375, 19.46484375, 20.7197265625, 21.974609375, 23.2294921875, 24.484375, 25.7392578125, 26.994140625, 28.2490234375, 29.50390625, 30.7587890625, 32.013671875, 33.2685546875, 34.5234375, 35.7783203125, 37.033203125, 38.2880859375, 39.54296875, 40.7978515625, 42.052734375, 43.3076171875, 44.5625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 120.0, 611.0, 261.0, 20.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-119.82560729980469, -117.14168548583984, -114.45775604248047, -111.77383422851562, -109.08990478515625, -106.4059829711914, -103.72206115722656, -101.03813171386719, -98.35420989990234, -95.6702880859375, -92.98635864257812, -90.30243682861328, -87.61851501464844, -84.93458557128906, -82.25066375732422, -79.56674194335938, -76.8828125, -74.19889068603516, -71.51496124267578, -68.83103942871094, -66.14710998535156, -63.46318817138672, -60.779266357421875, -58.095340728759766, -55.411415100097656, -52.72748947143555, -50.04356384277344, -47.359642028808594, -44.675716400146484, -41.991790771484375, -39.30786895751953, -36.62394332885742, -33.94001007080078, -31.256084442138672, -28.572160720825195, -25.88823699951172, -23.20431137084961, -20.5203857421875, -17.836462020874023, -15.152538299560547, -12.468612670898438, -9.784687995910645, -7.100763320922852, -4.416838645935059, -1.7329139709472656, 0.9510107040405273, 3.6349353790283203, 6.318859100341797, 9.002784729003906, 11.6867094039917, 14.370634078979492, 17.05455780029297, 19.738483428955078, 22.422409057617188, 25.106332778930664, 27.79025650024414, 30.47418212890625, 33.15810775756836, 35.84203338623047, 38.52595520019531, 41.20988082885742, 43.89380645751953, 46.577728271484375, 49.261653900146484, 51.945579528808594]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 12.0, 7.0, 10.0, 12.0, 13.0, 16.0, 16.0, 19.0, 21.0, 23.0, 25.0, 24.0, 31.0, 29.0, 27.0, 35.0, 32.0, 28.0, 42.0, 39.0, 41.0, 49.0, 46.0, 34.0, 40.0, 33.0, 41.0, 32.0, 25.0, 24.0, 21.0, 21.0, 18.0, 15.0, 19.0, 14.0, 21.0, 5.0, 5.0, 8.0, 10.0, 1.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-21.61600112915039, -20.964628219604492, -20.313257217407227, -19.661884307861328, -19.01051139831543, -18.35913848876953, -17.707767486572266, -17.056394577026367, -16.40502166748047, -15.753649711608887, -15.102276802062988, -14.450904846191406, -13.799531936645508, -13.148159980773926, -12.496788024902344, -11.845415115356445, -11.19404411315918, -10.542672157287598, -9.8912992477417, -9.239927291870117, -8.588554382324219, -7.937182426452637, -7.285810470581055, -6.6344380378723145, -5.983065605163574, -5.331693172454834, -4.680320739746094, -4.028948783874512, -3.3775763511657715, -2.7262039184570312, -2.07483172416687, -1.423459529876709, -0.7720870971679688, -0.12071478366851807, 0.5306575298309326, 1.1820298433303833, 1.833402156829834, 2.484774589538574, 3.1361467838287354, 3.7875189781188965, 4.438891410827637, 5.090263843536377, 5.741636276245117, 6.393008232116699, 7.0443806648254395, 7.69575309753418, 8.347125053405762, 8.998497009277344, 9.649869918823242, 10.301241874694824, 10.952614784240723, 11.603986740112305, 12.255359649658203, 12.906731605529785, 13.558103561401367, 14.209476470947266, 14.860848426818848, 15.51222038269043, 16.163593292236328, 16.814966201782227, 17.466337203979492, 18.11771011352539, 18.76908302307129, 19.420454025268555, 20.071826934814453]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 7.0, 7.0, 9.0, 11.0, 11.0, 14.0, 14.0, 16.0, 25.0, 25.0, 20.0, 28.0, 36.0, 29.0, 41.0, 36.0, 41.0, 34.0, 53.0, 45.0, 42.0, 39.0, 33.0, 52.0, 61.0, 30.0, 33.0, 34.0, 18.0, 21.0, 23.0, 22.0, 16.0, 14.0, 10.0, 12.0, 9.0, 3.0, 9.0, 5.0, 4.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.41015625, -3.29620361328125, -3.1822509765625, -3.06829833984375, -2.954345703125, -2.84039306640625, -2.7264404296875, -2.61248779296875, -2.49853515625, -2.38458251953125, -2.2706298828125, -2.15667724609375, -2.042724609375, -1.92877197265625, -1.8148193359375, -1.70086669921875, -1.5869140625, -1.47296142578125, -1.3590087890625, -1.24505615234375, -1.131103515625, -1.01715087890625, -0.9031982421875, -0.78924560546875, -0.67529296875, -0.56134033203125, -0.4473876953125, -0.33343505859375, -0.219482421875, -0.10552978515625, 0.0084228515625, 0.12237548828125, 0.236328125, 0.35028076171875, 0.4642333984375, 0.57818603515625, 0.692138671875, 0.80609130859375, 0.9200439453125, 1.03399658203125, 1.14794921875, 1.26190185546875, 1.3758544921875, 1.48980712890625, 1.603759765625, 1.71771240234375, 1.8316650390625, 1.94561767578125, 2.0595703125, 2.17352294921875, 2.2874755859375, 2.40142822265625, 2.515380859375, 2.62933349609375, 2.7432861328125, 2.85723876953125, 2.97119140625, 3.08514404296875, 3.1990966796875, 3.31304931640625, 3.427001953125, 3.54095458984375, 3.6549072265625, 3.76885986328125, 3.8828125]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 7.0, 10.0, 7.0, 5.0, 14.0, 21.0, 18.0, 31.0, 32.0, 58.0, 95.0, 131.0, 190.0, 338.0, 556.0, 1000.0, 1859.0, 3999.0, 9374.0, 26073.0, 85366.0, 294996.0, 873904.0, 1582842.0, 885385.0, 298695.0, 85412.0, 25974.0, 9562.0, 3951.0, 1934.0, 977.0, 503.0, 317.0, 211.0, 127.0, 72.0, 68.0, 55.0, 27.0, 22.0, 24.0, 15.0, 5.0, 8.0, 12.0, 3.0, 1.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.638671875, -3.506378173828125, -3.37408447265625, -3.241790771484375, -3.1094970703125, -2.977203369140625, -2.84490966796875, -2.712615966796875, -2.580322265625, -2.448028564453125, -2.31573486328125, -2.183441162109375, -2.0511474609375, -1.918853759765625, -1.78656005859375, -1.654266357421875, -1.52197265625, -1.389678955078125, -1.25738525390625, -1.125091552734375, -0.9927978515625, -0.860504150390625, -0.72821044921875, -0.595916748046875, -0.463623046875, -0.331329345703125, -0.19903564453125, -0.066741943359375, 0.0655517578125, 0.197845458984375, 0.33013916015625, 0.462432861328125, 0.5947265625, 0.727020263671875, 0.85931396484375, 0.991607666015625, 1.1239013671875, 1.256195068359375, 1.38848876953125, 1.520782470703125, 1.653076171875, 1.785369873046875, 1.91766357421875, 2.049957275390625, 2.1822509765625, 2.314544677734375, 2.44683837890625, 2.579132080078125, 2.71142578125, 2.843719482421875, 2.97601318359375, 3.108306884765625, 3.2406005859375, 3.372894287109375, 3.50518798828125, 3.637481689453125, 3.769775390625, 3.902069091796875, 4.03436279296875, 4.166656494140625, 4.2989501953125, 4.431243896484375, 4.56353759765625, 4.695831298828125, 4.828125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 9.0, 6.0, 8.0, 14.0, 16.0, 31.0, 29.0, 36.0, 52.0, 71.0, 101.0, 123.0, 183.0, 238.0, 363.0, 463.0, 546.0, 448.0, 342.0, 237.0, 182.0, 139.0, 100.0, 100.0, 51.0, 51.0, 33.0, 31.0, 20.0, 20.0, 7.0, 7.0, 8.0, 6.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.23046875, -7.02032470703125, -6.8101806640625, -6.60003662109375, -6.389892578125, -6.17974853515625, -5.9696044921875, -5.75946044921875, -5.54931640625, -5.33917236328125, -5.1290283203125, -4.91888427734375, -4.708740234375, -4.49859619140625, -4.2884521484375, -4.07830810546875, -3.8681640625, -3.65802001953125, -3.4478759765625, -3.23773193359375, -3.027587890625, -2.81744384765625, -2.6072998046875, -2.39715576171875, -2.18701171875, -1.97686767578125, -1.7667236328125, -1.55657958984375, -1.346435546875, -1.13629150390625, -0.9261474609375, -0.71600341796875, -0.505859375, -0.29571533203125, -0.0855712890625, 0.12457275390625, 0.334716796875, 0.54486083984375, 0.7550048828125, 0.96514892578125, 1.17529296875, 1.38543701171875, 1.5955810546875, 1.80572509765625, 2.015869140625, 2.22601318359375, 2.4361572265625, 2.64630126953125, 2.8564453125, 3.06658935546875, 3.2767333984375, 3.48687744140625, 3.697021484375, 3.90716552734375, 4.1173095703125, 4.32745361328125, 4.53759765625, 4.74774169921875, 4.9578857421875, 5.16802978515625, 5.378173828125, 5.58831787109375, 5.7984619140625, 6.00860595703125, 6.21875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 9.0, 14.0, 29.0, 26.0, 55.0, 117.0, 182.0, 326.0, 595.0, 1473.0, 4966.0, 86031.0, 3227877.0, 847236.0, 20827.0, 2621.0, 919.0, 447.0, 223.0, 128.0, 67.0, 51.0, 22.0, 13.0, 8.0, 8.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-20.71875, -20.234619140625, -19.75048828125, -19.266357421875, -18.7822265625, -18.298095703125, -17.81396484375, -17.329833984375, -16.845703125, -16.361572265625, -15.87744140625, -15.393310546875, -14.9091796875, -14.425048828125, -13.94091796875, -13.456787109375, -12.97265625, -12.488525390625, -12.00439453125, -11.520263671875, -11.0361328125, -10.552001953125, -10.06787109375, -9.583740234375, -9.099609375, -8.615478515625, -8.13134765625, -7.647216796875, -7.1630859375, -6.678955078125, -6.19482421875, -5.710693359375, -5.2265625, -4.742431640625, -4.25830078125, -3.774169921875, -3.2900390625, -2.805908203125, -2.32177734375, -1.837646484375, -1.353515625, -0.869384765625, -0.38525390625, 0.098876953125, 0.5830078125, 1.067138671875, 1.55126953125, 2.035400390625, 2.51953125, 3.003662109375, 3.48779296875, 3.971923828125, 4.4560546875, 4.940185546875, 5.42431640625, 5.908447265625, 6.392578125, 6.876708984375, 7.36083984375, 7.844970703125, 8.3291015625, 8.813232421875, 9.29736328125, 9.781494140625, 10.265625]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 9.0, 122.0, 636.0, 241.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-172.91302490234375, -168.05313110351562, -163.19322204589844, -158.3333282470703, -153.4734344482422, -148.613525390625, -143.75363159179688, -138.89373779296875, -134.03382873535156, -129.17393493652344, -124.31403350830078, -119.45413208007812, -114.59423065185547, -109.73432922363281, -104.87443542480469, -100.01453399658203, -95.1546401977539, -90.29473876953125, -85.43484497070312, -80.57494354248047, -75.71504211425781, -70.85514831542969, -65.99524688720703, -61.135345458984375, -56.275447845458984, -51.415550231933594, -46.55564880371094, -41.69575119018555, -36.835853576660156, -31.9759521484375, -27.11605453491211, -22.256153106689453, -17.396255493164062, -12.536355972290039, -7.676457405090332, -2.816558837890625, 2.0433406829833984, 6.903240203857422, 11.763137817382812, 16.62303924560547, 21.48293685913086, 26.342836380004883, 31.202735900878906, 36.0626335144043, 40.92253112792969, 45.782432556152344, 50.642330169677734, 55.50223159790039, 60.36212921142578, 65.22203063964844, 70.08192443847656, 74.94182586669922, 79.80172729492188, 84.66162109375, 89.52152252197266, 94.38142395019531, 99.24131774902344, 104.1012191772461, 108.96111297607422, 113.82101440429688, 118.68091583251953, 123.54081726074219, 128.4007110595703, 133.2606201171875, 138.12051391601562]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 5.0, 6.0, 8.0, 7.0, 7.0, 8.0, 12.0, 19.0, 25.0, 22.0, 19.0, 20.0, 24.0, 28.0, 36.0, 31.0, 33.0, 42.0, 41.0, 32.0, 36.0, 40.0, 35.0, 38.0, 25.0, 33.0, 44.0, 37.0, 23.0, 29.0, 36.0, 31.0, 25.0, 14.0, 20.0, 19.0, 23.0, 14.0, 9.0, 11.0, 14.0, 4.0, 5.0, 0.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-25.626014709472656, -24.84342384338379, -24.06083106994629, -23.278240203857422, -22.495647430419922, -21.713056564331055, -20.930465698242188, -20.147872924804688, -19.36528205871582, -18.582691192626953, -17.800098419189453, -17.017507553100586, -16.23491668701172, -15.452323913574219, -14.669733047485352, -13.887141227722168, -13.104549407958984, -12.3219575881958, -11.539365768432617, -10.75677490234375, -9.974183082580566, -9.191591262817383, -8.409000396728516, -7.626408576965332, -6.843816757202148, -6.061224937438965, -5.2786335945129395, -4.496042251586914, -3.7134504318237305, -2.930858850479126, -2.1482672691345215, -1.365675926208496, -0.5830821990966797, 0.1995093822479248, 0.9821009635925293, 1.7646925449371338, 2.5472841262817383, 3.3298757076263428, 4.112467288970947, 4.895058631896973, 5.677650451660156, 6.46024227142334, 7.242833614349365, 8.02542495727539, 8.808016777038574, 9.590608596801758, 10.373199462890625, 11.155791282653809, 11.938383102416992, 12.720974922180176, 13.50356674194336, 14.286157608032227, 15.06874942779541, 15.851341247558594, 16.63393211364746, 17.416522979736328, 18.199115753173828, 18.981706619262695, 19.764299392700195, 20.546890258789062, 21.329483032226562, 22.11207389831543, 22.894664764404297, 23.677257537841797, 24.459848403930664]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 4.0, 12.0, 6.0, 9.0, 8.0, 10.0, 26.0, 19.0, 23.0, 18.0, 22.0, 36.0, 35.0, 25.0, 28.0, 49.0, 42.0, 47.0, 41.0, 48.0, 34.0, 42.0, 40.0, 43.0, 37.0, 33.0, 32.0, 25.0, 28.0, 30.0, 31.0, 23.0, 15.0, 8.0, 19.0, 13.0, 12.0, 7.0, 9.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.166015625, -3.070343017578125, -2.97467041015625, -2.878997802734375, -2.7833251953125, -2.687652587890625, -2.59197998046875, -2.496307373046875, -2.400634765625, -2.304962158203125, -2.20928955078125, -2.113616943359375, -2.0179443359375, -1.922271728515625, -1.82659912109375, -1.730926513671875, -1.63525390625, -1.539581298828125, -1.44390869140625, -1.348236083984375, -1.2525634765625, -1.156890869140625, -1.06121826171875, -0.965545654296875, -0.869873046875, -0.774200439453125, -0.67852783203125, -0.582855224609375, -0.4871826171875, -0.391510009765625, -0.29583740234375, -0.200164794921875, -0.1044921875, -0.008819580078125, 0.08685302734375, 0.182525634765625, 0.2781982421875, 0.373870849609375, 0.46954345703125, 0.565216064453125, 0.660888671875, 0.756561279296875, 0.85223388671875, 0.947906494140625, 1.0435791015625, 1.139251708984375, 1.23492431640625, 1.330596923828125, 1.42626953125, 1.521942138671875, 1.61761474609375, 1.713287353515625, 1.8089599609375, 1.904632568359375, 2.00030517578125, 2.095977783203125, 2.191650390625, 2.287322998046875, 2.38299560546875, 2.478668212890625, 2.5743408203125, 2.670013427734375, 2.76568603515625, 2.861358642578125, 2.95703125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 11.0, 12.0, 21.0, 34.0, 35.0, 58.0, 80.0, 124.0, 166.0, 250.0, 387.0, 581.0, 799.0, 1160.0, 1800.0, 2686.0, 4038.0, 5910.0, 9126.0, 14069.0, 21845.0, 34605.0, 57239.0, 99709.0, 177797.0, 233800.0, 156189.0, 87383.0, 50617.0, 31098.0, 19574.0, 12577.0, 8210.0, 5437.0, 3617.0, 2409.0, 1642.0, 1105.0, 741.0, 479.0, 352.0, 251.0, 156.0, 125.0, 86.0, 55.0, 39.0, 31.0, 14.0, 8.0, 9.0, 6.0, 2.0, 2.0, 3.0], "bins": [-0.341796875, -0.33185577392578125, -0.3219146728515625, -0.31197357177734375, -0.302032470703125, -0.29209136962890625, -0.2821502685546875, -0.27220916748046875, -0.26226806640625, -0.25232696533203125, -0.2423858642578125, -0.23244476318359375, -0.222503662109375, -0.21256256103515625, -0.2026214599609375, -0.19268035888671875, -0.1827392578125, -0.17279815673828125, -0.1628570556640625, -0.15291595458984375, -0.142974853515625, -0.13303375244140625, -0.1230926513671875, -0.11315155029296875, -0.10321044921875, -0.09326934814453125, -0.0833282470703125, -0.07338714599609375, -0.063446044921875, -0.05350494384765625, -0.0435638427734375, -0.03362274169921875, -0.023681640625, -0.01374053955078125, -0.0037994384765625, 0.00614166259765625, 0.016082763671875, 0.02602386474609375, 0.0359649658203125, 0.04590606689453125, 0.05584716796875, 0.06578826904296875, 0.0757293701171875, 0.08567047119140625, 0.095611572265625, 0.10555267333984375, 0.1154937744140625, 0.12543487548828125, 0.1353759765625, 0.14531707763671875, 0.1552581787109375, 0.16519927978515625, 0.175140380859375, 0.18508148193359375, 0.1950225830078125, 0.20496368408203125, 0.21490478515625, 0.22484588623046875, 0.2347869873046875, 0.24472808837890625, 0.254669189453125, 0.26461029052734375, 0.2745513916015625, 0.28449249267578125, 0.29443359375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 6.0, 3.0, 4.0, 10.0, 11.0, 10.0, 11.0, 23.0, 18.0, 23.0, 29.0, 24.0, 33.0, 26.0, 23.0, 31.0, 30.0, 43.0, 35.0, 47.0, 41.0, 1059.0, 43.0, 39.0, 41.0, 26.0, 25.0, 44.0, 26.0, 28.0, 30.0, 26.0, 24.0, 23.0, 13.0, 18.0, 11.0, 9.0, 9.0, 16.0, 6.0, 3.0, 5.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-1.8505859375, -1.7937774658203125, -1.736968994140625, -1.6801605224609375, -1.62335205078125, -1.5665435791015625, -1.509735107421875, -1.4529266357421875, -1.3961181640625, -1.3393096923828125, -1.282501220703125, -1.2256927490234375, -1.16888427734375, -1.1120758056640625, -1.055267333984375, -0.9984588623046875, -0.941650390625, -0.8848419189453125, -0.828033447265625, -0.7712249755859375, -0.71441650390625, -0.6576080322265625, -0.600799560546875, -0.5439910888671875, -0.4871826171875, -0.4303741455078125, -0.373565673828125, -0.3167572021484375, -0.25994873046875, -0.2031402587890625, -0.146331787109375, -0.0895233154296875, -0.03271484375, 0.0240936279296875, 0.080902099609375, 0.1377105712890625, 0.19451904296875, 0.2513275146484375, 0.308135986328125, 0.3649444580078125, 0.4217529296875, 0.4785614013671875, 0.535369873046875, 0.5921783447265625, 0.64898681640625, 0.7057952880859375, 0.762603759765625, 0.8194122314453125, 0.876220703125, 0.9330291748046875, 0.989837646484375, 1.0466461181640625, 1.10345458984375, 1.1602630615234375, 1.217071533203125, 1.2738800048828125, 1.3306884765625, 1.3874969482421875, 1.444305419921875, 1.5011138916015625, 1.55792236328125, 1.6147308349609375, 1.671539306640625, 1.7283477783203125, 1.78515625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 6.0, 9.0, 7.0, 23.0, 24.0, 33.0, 52.0, 84.0, 108.0, 147.0, 250.0, 336.0, 421.0, 633.0, 881.0, 1342.0, 1884.0, 2734.0, 4132.0, 5933.0, 8821.0, 13258.0, 19920.0, 31303.0, 49177.0, 80120.0, 133621.0, 1254202.0, 184911.0, 113242.0, 68101.0, 41934.0, 26252.0, 17156.0, 11336.0, 7606.0, 5270.0, 3701.0, 2471.0, 1674.0, 1216.0, 854.0, 655.0, 379.0, 278.0, 178.0, 144.0, 122.0, 62.0, 46.0, 31.0, 26.0, 9.0, 8.0, 8.0, 4.0, 6.0, 1.0], "bins": [-0.26806640625, -0.2601432800292969, -0.25222015380859375, -0.24429702758789062, -0.2363739013671875, -0.22845077514648438, -0.22052764892578125, -0.21260452270507812, -0.204681396484375, -0.19675827026367188, -0.18883514404296875, -0.18091201782226562, -0.1729888916015625, -0.16506576538085938, -0.15714263916015625, -0.14921951293945312, -0.14129638671875, -0.13337326049804688, -0.12545013427734375, -0.11752700805664062, -0.1096038818359375, -0.10168075561523438, -0.09375762939453125, -0.08583450317382812, -0.077911376953125, -0.06998825073242188, -0.06206512451171875, -0.054141998291015625, -0.0462188720703125, -0.038295745849609375, -0.03037261962890625, -0.022449493408203125, -0.0145263671875, -0.006603240966796875, 0.00131988525390625, 0.009243011474609375, 0.0171661376953125, 0.025089263916015625, 0.03301239013671875, 0.040935516357421875, 0.048858642578125, 0.056781768798828125, 0.06470489501953125, 0.07262802124023438, 0.0805511474609375, 0.08847427368164062, 0.09639739990234375, 0.10432052612304688, 0.11224365234375, 0.12016677856445312, 0.12808990478515625, 0.13601303100585938, 0.1439361572265625, 0.15185928344726562, 0.15978240966796875, 0.16770553588867188, 0.175628662109375, 0.18355178833007812, 0.19147491455078125, 0.19939804077148438, 0.2073211669921875, 0.21524429321289062, 0.22316741943359375, 0.23109054565429688, 0.239013671875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 3.0, 7.0, 7.0, 10.0, 12.0, 7.0, 25.0, 22.0, 21.0, 10.0, 22.0, 39.0, 32.0, 41.0, 37.0, 48.0, 55.0, 61.0, 58.0, 58.0, 45.0, 44.0, 52.0, 37.0, 40.0, 43.0, 28.0, 28.0, 17.0, 19.0, 17.0, 8.0, 10.0, 12.0, 3.0, 5.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0006933212280273438, -0.0006702244281768799, -0.000647127628326416, -0.0006240308284759521, -0.0006009340286254883, -0.0005778372287750244, -0.0005547404289245605, -0.0005316436290740967, -0.0005085468292236328, -0.00048545002937316895, -0.0004623532295227051, -0.0004392564296722412, -0.00041615962982177734, -0.0003930628299713135, -0.0003699660301208496, -0.00034686923027038574, -0.0003237724304199219, -0.000300675630569458, -0.00027757883071899414, -0.0002544820308685303, -0.0002313852310180664, -0.00020828843116760254, -0.00018519163131713867, -0.0001620948314666748, -0.00013899803161621094, -0.00011590123176574707, -9.28044319152832e-05, -6.970763206481934e-05, -4.661083221435547e-05, -2.35140323638916e-05, -4.172325134277344e-07, 2.2679567337036133e-05, 4.57763671875e-05, 6.887316703796387e-05, 9.196996688842773e-05, 0.0001150667667388916, 0.00013816356658935547, 0.00016126036643981934, 0.0001843571662902832, 0.00020745396614074707, 0.00023055076599121094, 0.0002536475658416748, 0.00027674436569213867, 0.00029984116554260254, 0.0003229379653930664, 0.0003460347652435303, 0.00036913156509399414, 0.000392228364944458, 0.0004153251647949219, 0.00043842196464538574, 0.0004615187644958496, 0.0004846155643463135, 0.0005077123641967773, 0.0005308091640472412, 0.0005539059638977051, 0.0005770027637481689, 0.0006000995635986328, 0.0006231963634490967, 0.0006462931632995605, 0.0006693899631500244, 0.0006924867630004883, 0.0007155835628509521, 0.000738680362701416, 0.0007617771625518799, 0.0007848739624023438]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 10.0, 3.0, 9.0, 13.0, 14.0, 20.0, 23.0, 34.0, 40.0, 41.0, 62.0, 90.0, 122.0, 171.0, 248.0, 333.0, 628.0, 1511.0, 63391.0, 964120.0, 14856.0, 1074.0, 547.0, 325.0, 221.0, 130.0, 101.0, 84.0, 39.0, 46.0, 48.0, 44.0, 39.0, 21.0, 15.0, 17.0, 14.0, 10.0, 6.0, 7.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0139617919921875, -0.013543248176574707, -0.013124704360961914, -0.012706160545349121, -0.012287616729736328, -0.011869072914123535, -0.011450529098510742, -0.01103198528289795, -0.010613441467285156, -0.010194897651672363, -0.00977635383605957, -0.009357810020446777, -0.008939266204833984, -0.008520722389221191, -0.008102178573608398, -0.0076836347579956055, -0.0072650909423828125, -0.0068465471267700195, -0.0064280033111572266, -0.006009459495544434, -0.005590915679931641, -0.005172371864318848, -0.004753828048706055, -0.004335284233093262, -0.003916740417480469, -0.0034981966018676758, -0.003079652786254883, -0.00266110897064209, -0.002242565155029297, -0.001824021339416504, -0.001405477523803711, -0.000986933708190918, -0.000568389892578125, -0.00014984607696533203, 0.00026869773864746094, 0.0006872415542602539, 0.0011057853698730469, 0.0015243291854858398, 0.0019428730010986328, 0.0023614168167114258, 0.0027799606323242188, 0.0031985044479370117, 0.0036170482635498047, 0.004035592079162598, 0.004454135894775391, 0.004872679710388184, 0.0052912235260009766, 0.0057097673416137695, 0.0061283111572265625, 0.0065468549728393555, 0.0069653987884521484, 0.007383942604064941, 0.007802486419677734, 0.008221030235290527, 0.00863957405090332, 0.009058117866516113, 0.009476661682128906, 0.0098952054977417, 0.010313749313354492, 0.010732293128967285, 0.011150836944580078, 0.011569380760192871, 0.011987924575805664, 0.012406468391418457, 0.01282501220703125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 67.0, 414.0, 439.0, 85.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00449946615844965, -0.004403896629810333, -0.004308327566832304, -0.0042127580381929874, -0.004117188975214958, -0.004021619446575642, -0.003926050383597612, -0.0038304810877889395, -0.0037349117919802666, -0.0036393424961715937, -0.0035437732003629208, -0.003448203904554248, -0.003352634608745575, -0.003257065312936902, -0.003161496017128229, -0.0030659267213195562, -0.0029703574255108833, -0.0028747881297022104, -0.0027792188338935375, -0.0026836495380848646, -0.0025880802422761917, -0.002492510946467519, -0.002396941650658846, -0.002301372354850173, -0.0022058028262108564, -0.0021102335304021835, -0.0020146642345935106, -0.0019190949387848377, -0.0018235256429761648, -0.001727956347167492, -0.001632387051358819, -0.001536817755550146, -0.001441248576156795, -0.0013456792803481221, -0.0012501099845394492, -0.0011545406887307763, -0.0010589713929221034, -0.0009634020971134305, -0.0008678327430970967, -0.0007722634472884238, -0.0006766941514797509, -0.000581124855671078, -0.00048555555986240506, -0.0003899862349499017, -0.0002944169391412288, -0.0001988476433325559, -0.00010327831842005253, -7.709022611379623e-06, 8.786027319729328e-05, 0.0001834295690059662, 0.0002789988648146391, 0.00037456818972714245, 0.00047013748553581536, 0.0005657067522406578, 0.0006612761062569916, 0.0007568454020656645, 0.0008524146978743374, 0.0009479839936830103, 0.0010435533476993442, 0.001139122643508017, 0.00123469193931669, 0.0013302612351253629, 0.0014258305309340358, 0.0015213998267427087, 0.0016169691225513816]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 3.0, 9.0, 9.0, 9.0, 9.0, 20.0, 18.0, 22.0, 27.0, 22.0, 21.0, 30.0, 27.0, 27.0, 27.0, 38.0, 43.0, 37.0, 39.0, 25.0, 22.0, 57.0, 42.0, 35.0, 46.0, 45.0, 38.0, 40.0, 25.0, 27.0, 26.0, 19.0, 18.0, 18.0, 15.0, 13.0, 7.0, 15.0, 11.0, 3.0, 6.0, 4.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00043201446533203125, -0.00041953567415475845, -0.00040705688297748566, -0.00039457809180021286, -0.00038209930062294006, -0.00036962050944566727, -0.00035714171826839447, -0.0003446629270911217, -0.0003321841359138489, -0.0003197053447365761, -0.0003072265535593033, -0.0002947477623820305, -0.0002822689712047577, -0.0002697901800274849, -0.0002573113888502121, -0.0002448325976729393, -0.0002323538064956665, -0.0002198750153183937, -0.0002073962241411209, -0.00019491743296384811, -0.00018243864178657532, -0.00016995985060930252, -0.00015748105943202972, -0.00014500226825475693, -0.00013252347707748413, -0.00012004468590021133, -0.00010756589472293854, -9.508710354566574e-05, -8.260831236839294e-05, -7.012952119112015e-05, -5.765073001384735e-05, -4.5171938836574554e-05, -3.269314765930176e-05, -2.021435648202896e-05, -7.735565304756165e-06, 4.743225872516632e-06, 1.722201704978943e-05, 2.9700808227062225e-05, 4.217959940433502e-05, 5.465839058160782e-05, 6.713718175888062e-05, 7.961597293615341e-05, 9.209476411342621e-05, 0.000104573555290699, 0.0001170523464679718, 0.0001295311376452446, 0.0001420099288225174, 0.0001544887199997902, 0.000166967511177063, 0.00017944630235433578, 0.00019192509353160858, 0.00020440388470888138, 0.00021688267588615417, 0.00022936146706342697, 0.00024184025824069977, 0.00025431904941797256, 0.00026679784059524536, 0.00027927663177251816, 0.00029175542294979095, 0.00030423421412706375, 0.00031671300530433655, 0.00032919179648160934, 0.00034167058765888214, 0.00035414937883615494, 0.00036662817001342773]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 4.0, 12.0, 6.0, 9.0, 8.0, 10.0, 26.0, 19.0, 23.0, 18.0, 22.0, 36.0, 35.0, 25.0, 28.0, 49.0, 42.0, 47.0, 41.0, 48.0, 34.0, 42.0, 39.0, 44.0, 37.0, 33.0, 32.0, 25.0, 28.0, 30.0, 31.0, 23.0, 15.0, 8.0, 19.0, 13.0, 12.0, 7.0, 9.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.166015625, -3.070343017578125, -2.97467041015625, -2.878997802734375, -2.7833251953125, -2.687652587890625, -2.59197998046875, -2.496307373046875, -2.400634765625, -2.304962158203125, -2.20928955078125, -2.113616943359375, -2.0179443359375, -1.922271728515625, -1.82659912109375, -1.730926513671875, -1.63525390625, -1.539581298828125, -1.44390869140625, -1.348236083984375, -1.2525634765625, -1.156890869140625, -1.06121826171875, -0.965545654296875, -0.869873046875, -0.774200439453125, -0.67852783203125, -0.582855224609375, -0.4871826171875, -0.391510009765625, -0.29583740234375, -0.200164794921875, -0.1044921875, -0.008819580078125, 0.08685302734375, 0.182525634765625, 0.2781982421875, 0.373870849609375, 0.46954345703125, 0.565216064453125, 0.660888671875, 0.756561279296875, 0.85223388671875, 0.947906494140625, 1.0435791015625, 1.139251708984375, 1.23492431640625, 1.330596923828125, 1.42626953125, 1.521942138671875, 1.61761474609375, 1.713287353515625, 1.8089599609375, 1.904632568359375, 2.00030517578125, 2.095977783203125, 2.191650390625, 2.287322998046875, 2.38299560546875, 2.478668212890625, 2.5743408203125, 2.670013427734375, 2.76568603515625, 2.861358642578125, 2.95703125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 9.0, 8.0, 15.0, 14.0, 29.0, 43.0, 66.0, 63.0, 92.0, 130.0, 174.0, 212.0, 250.0, 340.0, 483.0, 681.0, 842.0, 1201.0, 1647.0, 2296.0, 3694.0, 8837.0, 45532.0, 387773.0, 508717.0, 61809.0, 10439.0, 4098.0, 2433.0, 1710.0, 1246.0, 933.0, 670.0, 500.0, 400.0, 291.0, 245.0, 165.0, 130.0, 90.0, 80.0, 44.0, 35.0, 26.0, 19.0, 16.0, 8.0, 6.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.00390625, -6.77850341796875, -6.5531005859375, -6.32769775390625, -6.102294921875, -5.87689208984375, -5.6514892578125, -5.42608642578125, -5.20068359375, -4.97528076171875, -4.7498779296875, -4.52447509765625, -4.299072265625, -4.07366943359375, -3.8482666015625, -3.62286376953125, -3.3974609375, -3.17205810546875, -2.9466552734375, -2.72125244140625, -2.495849609375, -2.27044677734375, -2.0450439453125, -1.81964111328125, -1.59423828125, -1.36883544921875, -1.1434326171875, -0.91802978515625, -0.692626953125, -0.46722412109375, -0.2418212890625, -0.01641845703125, 0.208984375, 0.43438720703125, 0.6597900390625, 0.88519287109375, 1.110595703125, 1.33599853515625, 1.5614013671875, 1.78680419921875, 2.01220703125, 2.23760986328125, 2.4630126953125, 2.68841552734375, 2.913818359375, 3.13922119140625, 3.3646240234375, 3.59002685546875, 3.8154296875, 4.04083251953125, 4.2662353515625, 4.49163818359375, 4.717041015625, 4.94244384765625, 5.1678466796875, 5.39324951171875, 5.61865234375, 5.84405517578125, 6.0694580078125, 6.29486083984375, 6.520263671875, 6.74566650390625, 6.9710693359375, 7.19647216796875, 7.421875]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 6.0, 5.0, 4.0, 6.0, 6.0, 11.0, 15.0, 11.0, 14.0, 20.0, 24.0, 38.0, 41.0, 50.0, 51.0, 68.0, 99.0, 238.0, 1587.0, 284.0, 107.0, 52.0, 54.0, 49.0, 40.0, 34.0, 22.0, 19.0, 17.0, 21.0, 14.0, 12.0, 7.0, 9.0, 4.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.375, -9.087158203125, -8.79931640625, -8.511474609375, -8.2236328125, -7.935791015625, -7.64794921875, -7.360107421875, -7.072265625, -6.784423828125, -6.49658203125, -6.208740234375, -5.9208984375, -5.633056640625, -5.34521484375, -5.057373046875, -4.76953125, -4.481689453125, -4.19384765625, -3.906005859375, -3.6181640625, -3.330322265625, -3.04248046875, -2.754638671875, -2.466796875, -2.178955078125, -1.89111328125, -1.603271484375, -1.3154296875, -1.027587890625, -0.73974609375, -0.451904296875, -0.1640625, 0.123779296875, 0.41162109375, 0.699462890625, 0.9873046875, 1.275146484375, 1.56298828125, 1.850830078125, 2.138671875, 2.426513671875, 2.71435546875, 3.002197265625, 3.2900390625, 3.577880859375, 3.86572265625, 4.153564453125, 4.44140625, 4.729248046875, 5.01708984375, 5.304931640625, 5.5927734375, 5.880615234375, 6.16845703125, 6.456298828125, 6.744140625, 7.031982421875, 7.31982421875, 7.607666015625, 7.8955078125, 8.183349609375, 8.47119140625, 8.759033203125, 9.046875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 7.0, 9.0, 7.0, 10.0, 21.0, 15.0, 25.0, 29.0, 31.0, 56.0, 83.0, 138.0, 216.0, 394.0, 754.0, 2031.0, 820805.0, 2317077.0, 2150.0, 781.0, 354.0, 258.0, 139.0, 97.0, 55.0, 48.0, 34.0, 20.0, 22.0, 13.0, 6.0, 3.0, 7.0, 1.0, 1.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.5, -35.2841796875, -34.068359375, -32.8525390625, -31.63671875, -30.4208984375, -29.205078125, -27.9892578125, -26.7734375, -25.5576171875, -24.341796875, -23.1259765625, -21.91015625, -20.6943359375, -19.478515625, -18.2626953125, -17.046875, -15.8310546875, -14.615234375, -13.3994140625, -12.18359375, -10.9677734375, -9.751953125, -8.5361328125, -7.3203125, -6.1044921875, -4.888671875, -3.6728515625, -2.45703125, -1.2412109375, -0.025390625, 1.1904296875, 2.40625, 3.6220703125, 4.837890625, 6.0537109375, 7.26953125, 8.4853515625, 9.701171875, 10.9169921875, 12.1328125, 13.3486328125, 14.564453125, 15.7802734375, 16.99609375, 18.2119140625, 19.427734375, 20.6435546875, 21.859375, 23.0751953125, 24.291015625, 25.5068359375, 26.72265625, 27.9384765625, 29.154296875, 30.3701171875, 31.5859375, 32.8017578125, 34.017578125, 35.2333984375, 36.44921875, 37.6650390625, 38.880859375, 40.0966796875, 41.3125]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 72.0, 305.0, 431.0, 166.0, 27.0, 6.0, 0.0, 0.0, 1.0], "bins": [-120.43241119384766, -118.32765197753906, -116.22289276123047, -114.11813354492188, -112.01338195800781, -109.90862274169922, -107.80386352539062, -105.69910430908203, -103.59434509277344, -101.48958587646484, -99.38482666015625, -97.28006744384766, -95.17530822753906, -93.070556640625, -90.9657974243164, -88.86103820800781, -86.75627899169922, -84.65151977539062, -82.54676055908203, -80.44200134277344, -78.33724975585938, -76.23249053955078, -74.12773132324219, -72.0229721069336, -69.918212890625, -67.8134536743164, -65.70869445800781, -63.603939056396484, -61.49917984008789, -59.3944206237793, -57.28966522216797, -55.184906005859375, -53.08014678955078, -50.97538757324219, -48.870628356933594, -46.765872955322266, -44.66111373901367, -42.55635452270508, -40.45159912109375, -38.346839904785156, -36.24208068847656, -34.13732147216797, -32.032562255859375, -29.927806854248047, -27.823047637939453, -25.71828842163086, -23.6135311126709, -21.508773803710938, -19.404014587402344, -17.29925537109375, -15.194498062133789, -13.089739799499512, -10.984981536865234, -8.880223274230957, -6.77546501159668, -4.670706748962402, -2.565948486328125, -0.46119022369384766, 1.6435680389404297, 3.748326301574707, 5.853084564208984, 7.957842826843262, 10.062601089477539, 12.167359352111816, 14.272117614746094]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 6.0, 8.0, 12.0, 6.0, 9.0, 15.0, 14.0, 22.0, 15.0, 29.0, 33.0, 37.0, 34.0, 33.0, 31.0, 35.0, 46.0, 38.0, 41.0, 40.0, 51.0, 55.0, 44.0, 41.0, 37.0, 39.0, 37.0, 35.0, 29.0, 25.0, 19.0, 14.0, 13.0, 11.0, 10.0, 7.0, 10.0, 10.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-32.10478591918945, -31.19209861755371, -30.27941131591797, -29.366724014282227, -28.454036712646484, -27.541349411010742, -26.628662109375, -25.715974807739258, -24.803287506103516, -23.890600204467773, -22.97791290283203, -22.06522560119629, -21.152538299560547, -20.239850997924805, -19.327163696289062, -18.41447639465332, -17.501789093017578, -16.589101791381836, -15.676414489746094, -14.763727188110352, -13.85103988647461, -12.938352584838867, -12.025665283203125, -11.112977981567383, -10.20029067993164, -9.287603378295898, -8.374916076660156, -7.462228775024414, -6.549541473388672, -5.63685417175293, -4.7241668701171875, -3.8114795684814453, -2.8987903594970703, -1.9861030578613281, -1.073415756225586, -0.16072845458984375, 0.7519588470458984, 1.6646461486816406, 2.577333450317383, 3.490020751953125, 4.402708053588867, 5.315395355224609, 6.228082656860352, 7.140769958496094, 8.053457260131836, 8.966144561767578, 9.87883186340332, 10.791519165039062, 11.704206466674805, 12.616893768310547, 13.529581069946289, 14.442268371582031, 15.354955673217773, 16.267642974853516, 17.180330276489258, 18.093017578125, 19.005704879760742, 19.918392181396484, 20.831079483032227, 21.74376678466797, 22.65645408630371, 23.569141387939453, 24.481828689575195, 25.394515991210938, 26.30720329284668]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 5.0, 3.0, 3.0, 6.0, 13.0, 10.0, 11.0, 11.0, 12.0, 20.0, 23.0, 26.0, 36.0, 29.0, 37.0, 38.0, 30.0, 28.0, 43.0, 41.0, 43.0, 44.0, 40.0, 39.0, 56.0, 38.0, 45.0, 29.0, 33.0, 33.0, 14.0, 22.0, 26.0, 14.0, 23.0, 16.0, 18.0, 10.0, 7.0, 5.0, 7.0, 4.0, 2.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.25390625, -3.153961181640625, -3.05401611328125, -2.954071044921875, -2.8541259765625, -2.754180908203125, -2.65423583984375, -2.554290771484375, -2.454345703125, -2.354400634765625, -2.25445556640625, -2.154510498046875, -2.0545654296875, -1.954620361328125, -1.85467529296875, -1.754730224609375, -1.65478515625, -1.554840087890625, -1.45489501953125, -1.354949951171875, -1.2550048828125, -1.155059814453125, -1.05511474609375, -0.955169677734375, -0.855224609375, -0.755279541015625, -0.65533447265625, -0.555389404296875, -0.4554443359375, -0.355499267578125, -0.25555419921875, -0.155609130859375, -0.0556640625, 0.044281005859375, 0.14422607421875, 0.244171142578125, 0.3441162109375, 0.444061279296875, 0.54400634765625, 0.643951416015625, 0.743896484375, 0.843841552734375, 0.94378662109375, 1.043731689453125, 1.1436767578125, 1.243621826171875, 1.34356689453125, 1.443511962890625, 1.54345703125, 1.643402099609375, 1.74334716796875, 1.843292236328125, 1.9432373046875, 2.043182373046875, 2.14312744140625, 2.243072509765625, 2.343017578125, 2.442962646484375, 2.54290771484375, 2.642852783203125, 2.7427978515625, 2.842742919921875, 2.94268798828125, 3.042633056640625, 3.142578125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 3.0, 12.0, 7.0, 13.0, 15.0, 19.0, 22.0, 31.0, 38.0, 43.0, 61.0, 112.0, 199.0, 438.0, 1078.0, 2922.0, 10808.0, 61792.0, 696221.0, 2644549.0, 698375.0, 61755.0, 10729.0, 2979.0, 1087.0, 389.0, 208.0, 92.0, 69.0, 50.0, 39.0, 28.0, 19.0, 18.0, 16.0, 9.0, 9.0, 6.0, 9.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.21875, -6.00054931640625, -5.7823486328125, -5.56414794921875, -5.345947265625, -5.12774658203125, -4.9095458984375, -4.69134521484375, -4.47314453125, -4.25494384765625, -4.0367431640625, -3.81854248046875, -3.600341796875, -3.38214111328125, -3.1639404296875, -2.94573974609375, -2.7275390625, -2.50933837890625, -2.2911376953125, -2.07293701171875, -1.854736328125, -1.63653564453125, -1.4183349609375, -1.20013427734375, -0.98193359375, -0.76373291015625, -0.5455322265625, -0.32733154296875, -0.109130859375, 0.10906982421875, 0.3272705078125, 0.54547119140625, 0.763671875, 0.98187255859375, 1.2000732421875, 1.41827392578125, 1.636474609375, 1.85467529296875, 2.0728759765625, 2.29107666015625, 2.50927734375, 2.72747802734375, 2.9456787109375, 3.16387939453125, 3.382080078125, 3.60028076171875, 3.8184814453125, 4.03668212890625, 4.2548828125, 4.47308349609375, 4.6912841796875, 4.90948486328125, 5.127685546875, 5.34588623046875, 5.5640869140625, 5.78228759765625, 6.00048828125, 6.21868896484375, 6.4368896484375, 6.65509033203125, 6.873291015625, 7.09149169921875, 7.3096923828125, 7.52789306640625, 7.74609375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 8.0, 12.0, 40.0, 152.0, 729.0, 2027.0, 885.0, 185.0, 41.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.09375, -29.22412109375, -28.3544921875, -27.48486328125, -26.615234375, -25.74560546875, -24.8759765625, -24.00634765625, -23.13671875, -22.26708984375, -21.3974609375, -20.52783203125, -19.658203125, -18.78857421875, -17.9189453125, -17.04931640625, -16.1796875, -15.31005859375, -14.4404296875, -13.57080078125, -12.701171875, -11.83154296875, -10.9619140625, -10.09228515625, -9.22265625, -8.35302734375, -7.4833984375, -6.61376953125, -5.744140625, -4.87451171875, -4.0048828125, -3.13525390625, -2.265625, -1.39599609375, -0.5263671875, 0.34326171875, 1.212890625, 2.08251953125, 2.9521484375, 3.82177734375, 4.69140625, 5.56103515625, 6.4306640625, 7.30029296875, 8.169921875, 9.03955078125, 9.9091796875, 10.77880859375, 11.6484375, 12.51806640625, 13.3876953125, 14.25732421875, 15.126953125, 15.99658203125, 16.8662109375, 17.73583984375, 18.60546875, 19.47509765625, 20.3447265625, 21.21435546875, 22.083984375, 22.95361328125, 23.8232421875, 24.69287109375, 25.5625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 16.0, 75.0, 363.0, 3181.0, 4182570.0, 7304.0, 585.0, 127.0, 33.0, 10.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.90625, -53.05126953125, -51.1962890625, -49.34130859375, -47.486328125, -45.63134765625, -43.7763671875, -41.92138671875, -40.06640625, -38.21142578125, -36.3564453125, -34.50146484375, -32.646484375, -30.79150390625, -28.9365234375, -27.08154296875, -25.2265625, -23.37158203125, -21.5166015625, -19.66162109375, -17.806640625, -15.95166015625, -14.0966796875, -12.24169921875, -10.38671875, -8.53173828125, -6.6767578125, -4.82177734375, -2.966796875, -1.11181640625, 0.7431640625, 2.59814453125, 4.453125, 6.30810546875, 8.1630859375, 10.01806640625, 11.873046875, 13.72802734375, 15.5830078125, 17.43798828125, 19.29296875, 21.14794921875, 23.0029296875, 24.85791015625, 26.712890625, 28.56787109375, 30.4228515625, 32.27783203125, 34.1328125, 35.98779296875, 37.8427734375, 39.69775390625, 41.552734375, 43.40771484375, 45.2626953125, 47.11767578125, 48.97265625, 50.82763671875, 52.6826171875, 54.53759765625, 56.392578125, 58.24755859375, 60.1025390625, 61.95751953125, 63.8125]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 136.0, 744.0, 124.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.8914794921875, -150.60498046875, -145.3184814453125, -140.031982421875, -134.7454833984375, -129.45899963378906, -124.17250061035156, -118.88600158691406, -113.59950256347656, -108.31300354003906, -103.02650451660156, -97.7400131225586, -92.4535140991211, -87.1670150756836, -81.88052368164062, -76.59402465820312, -71.30752563476562, -66.02102661132812, -60.73453140258789, -55.448036193847656, -50.161537170410156, -44.875038146972656, -39.58854293823242, -34.30204772949219, -29.015548706054688, -23.72905158996582, -18.442554473876953, -13.156057357788086, -7.869560241699219, -2.5830631256103516, 2.7034339904785156, 7.98992919921875, 13.27642822265625, 18.562925338745117, 23.849422454833984, 29.13591957092285, 34.42241668701172, 39.70891571044922, 44.99541091918945, 50.28190612792969, 55.56840515136719, 60.85490417480469, 66.14140319824219, 71.42789459228516, 76.71439361572266, 82.00089263916016, 87.28738403320312, 92.57388305664062, 97.86038208007812, 103.14688110351562, 108.43338012695312, 113.7198715209961, 119.0063705444336, 124.2928695678711, 129.57936096191406, 134.86585998535156, 140.15235900878906, 145.43885803222656, 150.72535705566406, 156.01185607910156, 161.29833984375, 166.5848388671875, 171.871337890625, 177.1578369140625, 182.4443359375]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 6.0, 7.0, 4.0, 9.0, 4.0, 14.0, 12.0, 12.0, 15.0, 10.0, 24.0, 26.0, 29.0, 28.0, 33.0, 31.0, 36.0, 37.0, 41.0, 32.0, 35.0, 26.0, 37.0, 44.0, 33.0, 37.0, 31.0, 35.0, 29.0, 36.0, 33.0, 33.0, 29.0, 21.0, 22.0, 19.0, 15.0, 13.0, 14.0, 13.0, 8.0, 6.0, 6.0, 5.0, 3.0, 3.0, 2.0, 4.0, 7.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.217395782470703, -25.44339942932129, -24.669403076171875, -23.89540672302246, -23.121410369873047, -22.347414016723633, -21.57341766357422, -20.799423217773438, -20.02542495727539, -19.251428604125977, -18.477432250976562, -17.70343589782715, -16.929439544677734, -16.15544319152832, -15.381447792053223, -14.607451438903809, -13.833456039428711, -13.059459686279297, -12.285463333129883, -11.511466979980469, -10.737470626831055, -9.96347427368164, -9.189478874206543, -8.415482521057129, -7.641486167907715, -6.867489814758301, -6.093493461608887, -5.319497585296631, -4.545501232147217, -3.7715048789978027, -2.997509002685547, -2.223512649536133, -1.4495162963867188, -0.6755200624465942, 0.09847617149353027, 0.8724722862243652, 1.6464686393737793, 2.4204649925231934, 3.194460868835449, 3.9684572219848633, 4.742453575134277, 5.516449928283691, 6.2904462814331055, 7.064442157745361, 7.838438510894775, 8.612434387207031, 9.386430740356445, 10.16042709350586, 10.934423446655273, 11.708419799804688, 12.482416152954102, 13.256412506103516, 14.03040885925293, 14.804405212402344, 15.578400611877441, 16.352397918701172, 17.126392364501953, 17.900388717651367, 18.67438507080078, 19.448381423950195, 20.22237777709961, 20.996374130249023, 21.770370483398438, 22.54436492919922, 23.318363189697266]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 3.0, 10.0, 7.0, 6.0, 12.0, 12.0, 17.0, 13.0, 12.0, 20.0, 23.0, 28.0, 29.0, 31.0, 29.0, 37.0, 24.0, 33.0, 35.0, 36.0, 38.0, 33.0, 41.0, 46.0, 34.0, 37.0, 39.0, 31.0, 23.0, 21.0, 24.0, 37.0, 34.0, 26.0, 7.0, 18.0, 13.0, 10.0, 12.0, 14.0, 7.0, 12.0, 8.0, 2.0, 2.0, 7.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 3.0], "bins": [-2.34765625, -2.276611328125, -2.20556640625, -2.134521484375, -2.0634765625, -1.992431640625, -1.92138671875, -1.850341796875, -1.779296875, -1.708251953125, -1.63720703125, -1.566162109375, -1.4951171875, -1.424072265625, -1.35302734375, -1.281982421875, -1.2109375, -1.139892578125, -1.06884765625, -0.997802734375, -0.9267578125, -0.855712890625, -0.78466796875, -0.713623046875, -0.642578125, -0.571533203125, -0.50048828125, -0.429443359375, -0.3583984375, -0.287353515625, -0.21630859375, -0.145263671875, -0.07421875, -0.003173828125, 0.06787109375, 0.138916015625, 0.2099609375, 0.281005859375, 0.35205078125, 0.423095703125, 0.494140625, 0.565185546875, 0.63623046875, 0.707275390625, 0.7783203125, 0.849365234375, 0.92041015625, 0.991455078125, 1.0625, 1.133544921875, 1.20458984375, 1.275634765625, 1.3466796875, 1.417724609375, 1.48876953125, 1.559814453125, 1.630859375, 1.701904296875, 1.77294921875, 1.843994140625, 1.9150390625, 1.986083984375, 2.05712890625, 2.128173828125, 2.19921875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 11.0, 15.0, 15.0, 23.0, 22.0, 48.0, 72.0, 108.0, 156.0, 213.0, 278.0, 443.0, 671.0, 1058.0, 1590.0, 2470.0, 3678.0, 6026.0, 9630.0, 15368.0, 25115.0, 42682.0, 73262.0, 134325.0, 233265.0, 214310.0, 119066.0, 65467.0, 38050.0, 22920.0, 14013.0, 8654.0, 5551.0, 3384.0, 2251.0, 1455.0, 933.0, 638.0, 405.0, 276.0, 184.0, 143.0, 103.0, 60.0, 45.0, 32.0, 19.0, 14.0, 15.0, 6.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.275390625, -0.2667579650878906, -0.25812530517578125, -0.24949264526367188, -0.2408599853515625, -0.23222732543945312, -0.22359466552734375, -0.21496200561523438, -0.206329345703125, -0.19769668579101562, -0.18906402587890625, -0.18043136596679688, -0.1717987060546875, -0.16316604614257812, -0.15453338623046875, -0.14590072631835938, -0.13726806640625, -0.12863540649414062, -0.12000274658203125, -0.11137008666992188, -0.1027374267578125, -0.09410476684570312, -0.08547210693359375, -0.07683944702148438, -0.068206787109375, -0.059574127197265625, -0.05094146728515625, -0.042308807373046875, -0.0336761474609375, -0.025043487548828125, -0.01641082763671875, -0.007778167724609375, 0.0008544921875, 0.009487152099609375, 0.01811981201171875, 0.026752471923828125, 0.0353851318359375, 0.044017791748046875, 0.05265045166015625, 0.061283111572265625, 0.069915771484375, 0.07854843139648438, 0.08718109130859375, 0.09581375122070312, 0.1044464111328125, 0.11307907104492188, 0.12171173095703125, 0.13034439086914062, 0.13897705078125, 0.14760971069335938, 0.15624237060546875, 0.16487503051757812, 0.1735076904296875, 0.18214035034179688, 0.19077301025390625, 0.19940567016601562, 0.208038330078125, 0.21667098999023438, 0.22530364990234375, 0.23393630981445312, 0.2425689697265625, 0.2512016296386719, 0.25983428955078125, 0.2684669494628906, 0.277099609375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 7.0, 7.0, 12.0, 10.0, 15.0, 15.0, 17.0, 20.0, 27.0, 40.0, 31.0, 35.0, 36.0, 49.0, 34.0, 39.0, 47.0, 42.0, 1071.0, 36.0, 55.0, 38.0, 31.0, 29.0, 28.0, 26.0, 32.0, 35.0, 23.0, 22.0, 22.0, 16.0, 11.0, 13.0, 11.0, 12.0, 3.0, 4.0, 5.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.5439453125, -1.4933319091796875, -1.442718505859375, -1.3921051025390625, -1.34149169921875, -1.2908782958984375, -1.240264892578125, -1.1896514892578125, -1.1390380859375, -1.0884246826171875, -1.037811279296875, -0.9871978759765625, -0.93658447265625, -0.8859710693359375, -0.835357666015625, -0.7847442626953125, -0.734130859375, -0.6835174560546875, -0.632904052734375, -0.5822906494140625, -0.53167724609375, -0.4810638427734375, -0.430450439453125, -0.3798370361328125, -0.3292236328125, -0.2786102294921875, -0.227996826171875, -0.1773834228515625, -0.12677001953125, -0.0761566162109375, -0.025543212890625, 0.0250701904296875, 0.07568359375, 0.1262969970703125, 0.176910400390625, 0.2275238037109375, 0.27813720703125, 0.3287506103515625, 0.379364013671875, 0.4299774169921875, 0.4805908203125, 0.5312042236328125, 0.581817626953125, 0.6324310302734375, 0.68304443359375, 0.7336578369140625, 0.784271240234375, 0.8348846435546875, 0.885498046875, 0.9361114501953125, 0.986724853515625, 1.0373382568359375, 1.08795166015625, 1.1385650634765625, 1.189178466796875, 1.2397918701171875, 1.2904052734375, 1.3410186767578125, 1.391632080078125, 1.4422454833984375, 1.49285888671875, 1.5434722900390625, 1.594085693359375, 1.6446990966796875, 1.6953125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 13.0, 19.0, 22.0, 37.0, 52.0, 65.0, 83.0, 111.0, 178.0, 231.0, 336.0, 445.0, 617.0, 889.0, 1342.0, 1799.0, 2677.0, 3773.0, 5631.0, 8404.0, 12809.0, 19608.0, 30621.0, 49383.0, 84766.0, 150579.0, 1274441.0, 181292.0, 102946.0, 59463.0, 35974.0, 22865.0, 14825.0, 9784.0, 6523.0, 4431.0, 3082.0, 2096.0, 1432.0, 1010.0, 729.0, 511.0, 345.0, 261.0, 170.0, 136.0, 90.0, 76.0, 59.0, 30.0, 23.0, 17.0, 8.0, 10.0, 9.0, 3.0, 1.0, 1.0], "bins": [-0.2216796875, -0.21489524841308594, -0.20811080932617188, -0.2013263702392578, -0.19454193115234375, -0.1877574920654297, -0.18097305297851562, -0.17418861389160156, -0.1674041748046875, -0.16061973571777344, -0.15383529663085938, -0.1470508575439453, -0.14026641845703125, -0.1334819793701172, -0.12669754028320312, -0.11991310119628906, -0.113128662109375, -0.10634422302246094, -0.09955978393554688, -0.09277534484863281, -0.08599090576171875, -0.07920646667480469, -0.07242202758789062, -0.06563758850097656, -0.0588531494140625, -0.05206871032714844, -0.045284271240234375, -0.03849983215332031, -0.03171539306640625, -0.024930953979492188, -0.018146514892578125, -0.011362075805664062, -0.00457763671875, 0.0022068023681640625, 0.008991241455078125, 0.015775680541992188, 0.02256011962890625, 0.029344558715820312, 0.036128997802734375, 0.04291343688964844, 0.0496978759765625, 0.05648231506347656, 0.06326675415039062, 0.07005119323730469, 0.07683563232421875, 0.08362007141113281, 0.09040451049804688, 0.09718894958496094, 0.103973388671875, 0.11075782775878906, 0.11754226684570312, 0.12432670593261719, 0.13111114501953125, 0.1378955841064453, 0.14468002319335938, 0.15146446228027344, 0.1582489013671875, 0.16503334045410156, 0.17181777954101562, 0.1786022186279297, 0.18538665771484375, 0.1921710968017578, 0.19895553588867188, 0.20573997497558594, 0.2125244140625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 6.0, 10.0, 7.0, 7.0, 5.0, 16.0, 13.0, 22.0, 21.0, 37.0, 33.0, 54.0, 46.0, 68.0, 54.0, 84.0, 77.0, 63.0, 67.0, 58.0, 49.0, 37.0, 33.0, 27.0, 15.0, 14.0, 9.0, 8.0, 16.0, 5.0, 4.0, 5.0, 9.0, 5.0, 8.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.001110076904296875, -0.0010782405734062195, -0.001046404242515564, -0.0010145679116249084, -0.000982731580734253, -0.0009508952498435974, -0.0009190589189529419, -0.0008872225880622864, -0.0008553862571716309, -0.0008235499262809753, -0.0007917135953903198, -0.0007598772644996643, -0.0007280409336090088, -0.0006962046027183533, -0.0006643682718276978, -0.0006325319409370422, -0.0006006956100463867, -0.0005688592791557312, -0.0005370229482650757, -0.0005051866173744202, -0.00047335028648376465, -0.00044151395559310913, -0.0004096776247024536, -0.0003778412938117981, -0.0003460049629211426, -0.00031416863203048706, -0.00028233230113983154, -0.000250495970249176, -0.0002186596393585205, -0.000186823308467865, -0.00015498697757720947, -0.00012315064668655396, -9.131431579589844e-05, -5.947798490524292e-05, -2.7641654014587402e-05, 4.194676876068115e-06, 3.603100776672363e-05, 6.786733865737915e-05, 9.970366954803467e-05, 0.00013154000043869019, 0.0001633763313293457, 0.00019521266222000122, 0.00022704899311065674, 0.00025888532400131226, 0.0002907216548919678, 0.0003225579857826233, 0.0003543943166732788, 0.0003862306475639343, 0.00041806697845458984, 0.00044990330934524536, 0.0004817396402359009, 0.0005135759711265564, 0.0005454123020172119, 0.0005772486329078674, 0.000609084963798523, 0.0006409212946891785, 0.000672757625579834, 0.0007045939564704895, 0.000736430287361145, 0.0007682666182518005, 0.0008001029491424561, 0.0008319392800331116, 0.0008637756109237671, 0.0008956119418144226, 0.0009274482727050781]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 5.0, 6.0, 3.0, 5.0, 6.0, 9.0, 14.0, 19.0, 12.0, 21.0, 18.0, 34.0, 34.0, 52.0, 66.0, 95.0, 157.0, 224.0, 379.0, 622.0, 1378.0, 189381.0, 852457.0, 1673.0, 694.0, 395.0, 231.0, 155.0, 110.0, 69.0, 51.0, 44.0, 29.0, 24.0, 15.0, 14.0, 13.0, 12.0, 7.0, 6.0, 7.0, 2.0, 4.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0165863037109375, -0.016016244888305664, -0.015446186065673828, -0.014876127243041992, -0.014306068420410156, -0.01373600959777832, -0.013165950775146484, -0.012595891952514648, -0.012025833129882812, -0.011455774307250977, -0.01088571548461914, -0.010315656661987305, -0.009745597839355469, -0.009175539016723633, -0.008605480194091797, -0.008035421371459961, -0.007465362548828125, -0.006895303726196289, -0.006325244903564453, -0.005755186080932617, -0.005185127258300781, -0.004615068435668945, -0.004045009613037109, -0.0034749507904052734, -0.0029048919677734375, -0.0023348331451416016, -0.0017647743225097656, -0.0011947154998779297, -0.0006246566772460938, -5.459785461425781e-05, 0.0005154609680175781, 0.001085519790649414, 0.00165557861328125, 0.002225637435913086, 0.002795696258544922, 0.003365755081176758, 0.003935813903808594, 0.00450587272644043, 0.005075931549072266, 0.0056459903717041016, 0.0062160491943359375, 0.0067861080169677734, 0.007356166839599609, 0.007926225662231445, 0.008496284484863281, 0.009066343307495117, 0.009636402130126953, 0.010206460952758789, 0.010776519775390625, 0.011346578598022461, 0.011916637420654297, 0.012486696243286133, 0.013056755065917969, 0.013626813888549805, 0.01419687271118164, 0.014766931533813477, 0.015336990356445312, 0.01590704917907715, 0.016477108001708984, 0.01704716682434082, 0.017617225646972656, 0.018187284469604492, 0.018757343292236328, 0.019327402114868164, 0.0198974609375]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 11.0, 566.0, 432.0, 3.0, 1.0], "bins": [-0.00776103138923645, -0.007633655332028866, -0.007506279740482569, -0.007378903683274984, -0.007251528091728687, -0.007124152034521103, -0.006996776442974806, -0.0068694003857672215, -0.006742024794220924, -0.00661464873701334, -0.006487273145467043, -0.0063598970882594585, -0.0062325214967131615, -0.006105145439505577, -0.00597776984795928, -0.005850393790751696, -0.005723017733544111, -0.005595641676336527, -0.00546826608479023, -0.005340890027582645, -0.005213514436036348, -0.005086138378828764, -0.004958762787282467, -0.0048313867300748825, -0.004704010672867298, -0.004576634615659714, -0.004449259024113417, -0.004321882966905832, -0.004194507375359535, -0.004067131318151951, -0.003939755726605654, -0.0038123796693980694, -0.0036850038450211287, -0.003557628020644188, -0.003430252196267247, -0.0033028763718903065, -0.003175500314682722, -0.003048124723136425, -0.0029207486659288406, -0.0027933728415519, -0.002665997017174959, -0.0025386211927980185, -0.0024112453684210777, -0.002283869544044137, -0.0021564937196671963, -0.002029117662459612, -0.0019017418380826712, -0.0017743660137057304, -0.0016469901893287897, -0.001519614364951849, -0.0013922385405749083, -0.0012648625997826457, -0.001137486775405705, -0.0010101109510287642, -0.0008827350684441626, -0.000755359185859561, -0.0006279833614826202, -0.0005006075371056795, -0.00037323165452107787, -0.0002458558010403067, -0.0001184799475595355, 8.895876817405224e-06, 0.00013627175940200686, 0.0002636476419866085, 0.00039102346636354923]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 5.0, 15.0, 11.0, 11.0, 17.0, 21.0, 20.0, 20.0, 29.0, 36.0, 41.0, 38.0, 44.0, 61.0, 48.0, 44.0, 53.0, 54.0, 51.0, 38.0, 49.0, 34.0, 43.0, 34.0, 29.0, 36.0, 23.0, 12.0, 21.0, 15.0, 13.0, 9.0, 11.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005265474319458008, -0.0005075614899396896, -0.0004885755479335785, -0.00046958960592746735, -0.0004506036639213562, -0.00043161772191524506, -0.0004126317799091339, -0.00039364583790302277, -0.0003746598958969116, -0.0003556739538908005, -0.00033668801188468933, -0.0003177020698785782, -0.00029871612787246704, -0.0002797301858663559, -0.00026074424386024475, -0.0002417583018541336, -0.00022277235984802246, -0.00020378641784191132, -0.00018480047583580017, -0.00016581453382968903, -0.00014682859182357788, -0.00012784264981746674, -0.00010885670781135559, -8.987076580524445e-05, -7.08848237991333e-05, -5.1898881793022156e-05, -3.291293978691101e-05, -1.3926997780799866e-05, 5.058944225311279e-06, 2.4044886231422424e-05, 4.303082823753357e-05, 6.201677024364471e-05, 8.100271224975586e-05, 9.9988654255867e-05, 0.00011897459626197815, 0.0001379605382680893, 0.00015694648027420044, 0.00017593242228031158, 0.00019491836428642273, 0.00021390430629253387, 0.00023289024829864502, 0.00025187619030475616, 0.0002708621323108673, 0.00028984807431697845, 0.0003088340163230896, 0.00032781995832920074, 0.0003468059003353119, 0.00036579184234142303, 0.0003847777843475342, 0.0004037637263536453, 0.00042274966835975647, 0.0004417356103658676, 0.00046072155237197876, 0.0004797074943780899, 0.000498693436384201, 0.0005176793783903122, 0.0005366653203964233, 0.0005556512624025345, 0.0005746372044086456, 0.0005936231464147568, 0.0006126090884208679, 0.0006315950304269791, 0.0006505809724330902, 0.0006695669144392014, 0.0006885528564453125]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 3.0, 10.0, 7.0, 6.0, 12.0, 12.0, 17.0, 13.0, 12.0, 20.0, 23.0, 28.0, 29.0, 31.0, 29.0, 37.0, 24.0, 33.0, 35.0, 36.0, 38.0, 33.0, 41.0, 46.0, 34.0, 37.0, 39.0, 31.0, 23.0, 21.0, 24.0, 37.0, 34.0, 26.0, 7.0, 18.0, 13.0, 10.0, 12.0, 14.0, 7.0, 12.0, 8.0, 2.0, 2.0, 7.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 3.0], "bins": [-2.34765625, -2.276611328125, -2.20556640625, -2.134521484375, -2.0634765625, -1.992431640625, -1.92138671875, -1.850341796875, -1.779296875, -1.708251953125, -1.63720703125, -1.566162109375, -1.4951171875, -1.424072265625, -1.35302734375, -1.281982421875, -1.2109375, -1.139892578125, -1.06884765625, -0.997802734375, -0.9267578125, -0.855712890625, -0.78466796875, -0.713623046875, -0.642578125, -0.571533203125, -0.50048828125, -0.429443359375, -0.3583984375, -0.287353515625, -0.21630859375, -0.145263671875, -0.07421875, -0.003173828125, 0.06787109375, 0.138916015625, 0.2099609375, 0.281005859375, 0.35205078125, 0.423095703125, 0.494140625, 0.565185546875, 0.63623046875, 0.707275390625, 0.7783203125, 0.849365234375, 0.92041015625, 0.991455078125, 1.0625, 1.133544921875, 1.20458984375, 1.275634765625, 1.3466796875, 1.417724609375, 1.48876953125, 1.559814453125, 1.630859375, 1.701904296875, 1.77294921875, 1.843994140625, 1.9150390625, 1.986083984375, 2.05712890625, 2.128173828125, 2.19921875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 1.0, 12.0, 8.0, 14.0, 25.0, 16.0, 30.0, 39.0, 35.0, 65.0, 71.0, 81.0, 109.0, 174.0, 225.0, 271.0, 351.0, 533.0, 788.0, 1217.0, 2162.0, 4254.0, 9867.0, 32235.0, 176459.0, 598119.0, 170229.0, 31165.0, 9658.0, 4152.0, 2126.0, 1174.0, 812.0, 527.0, 382.0, 312.0, 186.0, 154.0, 114.0, 84.0, 71.0, 59.0, 40.0, 38.0, 24.0, 20.0, 22.0, 13.0, 10.0, 6.0, 4.0, 8.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-4.2734375, -4.14190673828125, -4.0103759765625, -3.87884521484375, -3.747314453125, -3.61578369140625, -3.4842529296875, -3.35272216796875, -3.22119140625, -3.08966064453125, -2.9581298828125, -2.82659912109375, -2.695068359375, -2.56353759765625, -2.4320068359375, -2.30047607421875, -2.1689453125, -2.03741455078125, -1.9058837890625, -1.77435302734375, -1.642822265625, -1.51129150390625, -1.3797607421875, -1.24822998046875, -1.11669921875, -0.98516845703125, -0.8536376953125, -0.72210693359375, -0.590576171875, -0.45904541015625, -0.3275146484375, -0.19598388671875, -0.064453125, 0.06707763671875, 0.1986083984375, 0.33013916015625, 0.461669921875, 0.59320068359375, 0.7247314453125, 0.85626220703125, 0.98779296875, 1.11932373046875, 1.2508544921875, 1.38238525390625, 1.513916015625, 1.64544677734375, 1.7769775390625, 1.90850830078125, 2.0400390625, 2.17156982421875, 2.3031005859375, 2.43463134765625, 2.566162109375, 2.69769287109375, 2.8292236328125, 2.96075439453125, 3.09228515625, 3.22381591796875, 3.3553466796875, 3.48687744140625, 3.618408203125, 3.74993896484375, 3.8814697265625, 4.01300048828125, 4.14453125]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 3.0, 2.0, 5.0, 5.0, 3.0, 11.0, 10.0, 10.0, 11.0, 14.0, 20.0, 20.0, 31.0, 33.0, 34.0, 39.0, 54.0, 62.0, 88.0, 192.0, 1546.0, 320.0, 140.0, 77.0, 60.0, 45.0, 43.0, 31.0, 28.0, 25.0, 15.0, 10.0, 16.0, 11.0, 6.0, 8.0, 6.0, 1.0, 5.0, 3.0, 1.0, 4.0, 0.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-9.3828125, -9.113037109375, -8.84326171875, -8.573486328125, -8.3037109375, -8.033935546875, -7.76416015625, -7.494384765625, -7.224609375, -6.954833984375, -6.68505859375, -6.415283203125, -6.1455078125, -5.875732421875, -5.60595703125, -5.336181640625, -5.06640625, -4.796630859375, -4.52685546875, -4.257080078125, -3.9873046875, -3.717529296875, -3.44775390625, -3.177978515625, -2.908203125, -2.638427734375, -2.36865234375, -2.098876953125, -1.8291015625, -1.559326171875, -1.28955078125, -1.019775390625, -0.75, -0.480224609375, -0.21044921875, 0.059326171875, 0.3291015625, 0.598876953125, 0.86865234375, 1.138427734375, 1.408203125, 1.677978515625, 1.94775390625, 2.217529296875, 2.4873046875, 2.757080078125, 3.02685546875, 3.296630859375, 3.56640625, 3.836181640625, 4.10595703125, 4.375732421875, 4.6455078125, 4.915283203125, 5.18505859375, 5.454833984375, 5.724609375, 5.994384765625, 6.26416015625, 6.533935546875, 6.8037109375, 7.073486328125, 7.34326171875, 7.613037109375, 7.8828125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 7.0, 5.0, 9.0, 16.0, 23.0, 42.0, 33.0, 57.0, 73.0, 104.0, 138.0, 194.0, 412.0, 857.0, 3977.0, 3031594.0, 104586.0, 1904.0, 640.0, 340.0, 168.0, 141.0, 94.0, 66.0, 59.0, 32.0, 35.0, 23.0, 20.0, 13.0, 9.0, 2.0, 7.0, 3.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.796875, -17.199951171875, -16.60302734375, -16.006103515625, -15.4091796875, -14.812255859375, -14.21533203125, -13.618408203125, -13.021484375, -12.424560546875, -11.82763671875, -11.230712890625, -10.6337890625, -10.036865234375, -9.43994140625, -8.843017578125, -8.24609375, -7.649169921875, -7.05224609375, -6.455322265625, -5.8583984375, -5.261474609375, -4.66455078125, -4.067626953125, -3.470703125, -2.873779296875, -2.27685546875, -1.679931640625, -1.0830078125, -0.486083984375, 0.11083984375, 0.707763671875, 1.3046875, 1.901611328125, 2.49853515625, 3.095458984375, 3.6923828125, 4.289306640625, 4.88623046875, 5.483154296875, 6.080078125, 6.677001953125, 7.27392578125, 7.870849609375, 8.4677734375, 9.064697265625, 9.66162109375, 10.258544921875, 10.85546875, 11.452392578125, 12.04931640625, 12.646240234375, 13.2431640625, 13.840087890625, 14.43701171875, 15.033935546875, 15.630859375, 16.227783203125, 16.82470703125, 17.421630859375, 18.0185546875, 18.615478515625, 19.21240234375, 19.809326171875, 20.40625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 52.0, 945.0, 15.0, 0.0, 0.0, 0.0, 1.0], "bins": [-262.3836364746094, -257.8918762207031, -253.4001007080078, -248.9083251953125, -244.41656494140625, -239.92478942871094, -235.4330291748047, -230.94125366210938, -226.44949340820312, -221.9577178955078, -217.46595764160156, -212.97418212890625, -208.482421875, -203.9906463623047, -199.49888610839844, -195.00711059570312, -190.5153350830078, -186.0235595703125, -181.53179931640625, -177.04002380371094, -172.5482635498047, -168.05648803710938, -163.56472778320312, -159.0729522705078, -154.5811767578125, -150.0894012451172, -145.59764099121094, -141.10586547851562, -136.61410522460938, -132.12232971191406, -127.63056182861328, -123.1387939453125, -118.64701843261719, -114.1552505493164, -109.66348266601562, -105.17171478271484, -100.67994689941406, -96.18817138671875, -91.69640350341797, -87.20463562011719, -82.7128677368164, -78.22109985351562, -73.72933197021484, -69.23756408691406, -64.74578857421875, -60.254024505615234, -55.76225280761719, -51.270484924316406, -46.778717041015625, -42.286949157714844, -37.79518127441406, -33.303409576416016, -28.811641693115234, -24.319873809814453, -19.82810401916504, -15.336334228515625, -10.844568252563477, -6.352799415588379, -1.8610305786132812, 2.6307382583618164, 7.122507095336914, 11.614274978637695, 16.10604476928711, 20.597814559936523, 25.089582443237305]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 5.0, 2.0, 9.0, 9.0, 9.0, 10.0, 16.0, 9.0, 13.0, 11.0, 16.0, 25.0, 15.0, 21.0, 21.0, 21.0, 40.0, 24.0, 38.0, 42.0, 27.0, 35.0, 26.0, 20.0, 32.0, 43.0, 35.0, 38.0, 35.0, 28.0, 31.0, 18.0, 35.0, 28.0, 22.0, 15.0, 21.0, 17.0, 13.0, 13.0, 13.0, 11.0, 16.0, 8.0, 9.0, 12.0, 13.0, 9.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0], "bins": [-15.109373092651367, -14.654638290405273, -14.199904441833496, -13.745169639587402, -13.290435791015625, -12.835700988769531, -12.380966186523438, -11.92623233795166, -11.471498489379883, -11.016763687133789, -10.562029838562012, -10.107295036315918, -9.65256118774414, -9.197826385498047, -8.743091583251953, -8.288357734680176, -7.833622932434082, -7.3788886070251465, -6.924154281616211, -6.469419479370117, -6.01468563079834, -5.559950828552246, -5.1052165031433105, -4.650482177734375, -4.1957478523254395, -3.741013526916504, -3.2862792015075684, -2.8315446376800537, -2.376810312271118, -1.9220759868621826, -1.467341423034668, -1.0126070976257324, -0.5578718185424805, -0.10313743352890015, 0.3515969514846802, 0.8063313961029053, 1.2610657215118408, 1.7158000469207764, 2.170534610748291, 2.6252689361572266, 3.080003261566162, 3.5347375869750977, 3.989471912384033, 4.444206237792969, 4.8989410400390625, 5.35367488861084, 5.808409690856934, 6.263144016265869, 6.717878341674805, 7.17261266708374, 7.627346992492676, 8.08208179473877, 8.536815643310547, 8.99155044555664, 9.446285247802734, 9.901019096374512, 10.355752944946289, 10.810487747192383, 11.26522159576416, 11.719956398010254, 12.174690246582031, 12.629425048828125, 13.084159851074219, 13.538893699645996, 13.99362850189209]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 2.0, 4.0, 2.0, 7.0, 2.0, 12.0, 4.0, 8.0, 8.0, 9.0, 11.0, 14.0, 22.0, 20.0, 27.0, 27.0, 22.0, 36.0, 31.0, 25.0, 20.0, 29.0, 26.0, 34.0, 58.0, 48.0, 43.0, 37.0, 31.0, 40.0, 30.0, 47.0, 22.0, 23.0, 24.0, 32.0, 18.0, 22.0, 17.0, 25.0, 14.0, 10.0, 19.0, 11.0, 6.0, 8.0, 5.0, 3.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.892578125, -2.80718994140625, -2.7218017578125, -2.63641357421875, -2.551025390625, -2.46563720703125, -2.3802490234375, -2.29486083984375, -2.20947265625, -2.12408447265625, -2.0386962890625, -1.95330810546875, -1.867919921875, -1.78253173828125, -1.6971435546875, -1.61175537109375, -1.5263671875, -1.44097900390625, -1.3555908203125, -1.27020263671875, -1.184814453125, -1.09942626953125, -1.0140380859375, -0.92864990234375, -0.84326171875, -0.75787353515625, -0.6724853515625, -0.58709716796875, -0.501708984375, -0.41632080078125, -0.3309326171875, -0.24554443359375, -0.16015625, -0.07476806640625, 0.0106201171875, 0.09600830078125, 0.181396484375, 0.26678466796875, 0.3521728515625, 0.43756103515625, 0.52294921875, 0.60833740234375, 0.6937255859375, 0.77911376953125, 0.864501953125, 0.94989013671875, 1.0352783203125, 1.12066650390625, 1.2060546875, 1.29144287109375, 1.3768310546875, 1.46221923828125, 1.547607421875, 1.63299560546875, 1.7183837890625, 1.80377197265625, 1.88916015625, 1.97454833984375, 2.0599365234375, 2.14532470703125, 2.230712890625, 2.31610107421875, 2.4014892578125, 2.48687744140625, 2.572265625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 5.0, 5.0, 7.0, 11.0, 10.0, 6.0, 17.0, 24.0, 18.0, 35.0, 43.0, 57.0, 81.0, 111.0, 142.0, 211.0, 300.0, 406.0, 609.0, 927.0, 1789.0, 6940.0, 261439.0, 3675216.0, 234177.0, 6849.0, 1880.0, 891.0, 586.0, 381.0, 295.0, 227.0, 149.0, 104.0, 73.0, 52.0, 47.0, 30.0, 19.0, 28.0, 18.0, 16.0, 10.0, 8.0, 8.0, 9.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-15.125, -14.67333984375, -14.2216796875, -13.77001953125, -13.318359375, -12.86669921875, -12.4150390625, -11.96337890625, -11.51171875, -11.06005859375, -10.6083984375, -10.15673828125, -9.705078125, -9.25341796875, -8.8017578125, -8.35009765625, -7.8984375, -7.44677734375, -6.9951171875, -6.54345703125, -6.091796875, -5.64013671875, -5.1884765625, -4.73681640625, -4.28515625, -3.83349609375, -3.3818359375, -2.93017578125, -2.478515625, -2.02685546875, -1.5751953125, -1.12353515625, -0.671875, -0.22021484375, 0.2314453125, 0.68310546875, 1.134765625, 1.58642578125, 2.0380859375, 2.48974609375, 2.94140625, 3.39306640625, 3.8447265625, 4.29638671875, 4.748046875, 5.19970703125, 5.6513671875, 6.10302734375, 6.5546875, 7.00634765625, 7.4580078125, 7.90966796875, 8.361328125, 8.81298828125, 9.2646484375, 9.71630859375, 10.16796875, 10.61962890625, 11.0712890625, 11.52294921875, 11.974609375, 12.42626953125, 12.8779296875, 13.32958984375, 13.78125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 1.0, 3.0, 7.0, 14.0, 26.0, 33.0, 62.0, 109.0, 231.0, 384.0, 599.0, 789.0, 658.0, 487.0, 304.0, 156.0, 104.0, 44.0, 23.0, 19.0, 8.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.05078125, -6.78778076171875, -6.5247802734375, -6.26177978515625, -5.998779296875, -5.73577880859375, -5.4727783203125, -5.20977783203125, -4.94677734375, -4.68377685546875, -4.4207763671875, -4.15777587890625, -3.894775390625, -3.63177490234375, -3.3687744140625, -3.10577392578125, -2.8427734375, -2.57977294921875, -2.3167724609375, -2.05377197265625, -1.790771484375, -1.52777099609375, -1.2647705078125, -1.00177001953125, -0.73876953125, -0.47576904296875, -0.2127685546875, 0.05023193359375, 0.313232421875, 0.57623291015625, 0.8392333984375, 1.10223388671875, 1.365234375, 1.62823486328125, 1.8912353515625, 2.15423583984375, 2.417236328125, 2.68023681640625, 2.9432373046875, 3.20623779296875, 3.46923828125, 3.73223876953125, 3.9952392578125, 4.25823974609375, 4.521240234375, 4.78424072265625, 5.0472412109375, 5.31024169921875, 5.5732421875, 5.83624267578125, 6.0992431640625, 6.36224365234375, 6.625244140625, 6.88824462890625, 7.1512451171875, 7.41424560546875, 7.67724609375, 7.94024658203125, 8.2032470703125, 8.46624755859375, 8.729248046875, 8.99224853515625, 9.2552490234375, 9.51824951171875, 9.78125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 2.0, 6.0, 18.0, 14.0, 32.0, 52.0, 89.0, 181.0, 363.0, 865.0, 2415.0, 8035.0, 53679.0, 768310.0, 2951649.0, 369696.0, 30122.0, 5603.0, 1768.0, 718.0, 302.0, 147.0, 79.0, 44.0, 30.0, 22.0, 13.0, 5.0, 6.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4375, -6.22552490234375, -6.0135498046875, -5.80157470703125, -5.589599609375, -5.37762451171875, -5.1656494140625, -4.95367431640625, -4.74169921875, -4.52972412109375, -4.3177490234375, -4.10577392578125, -3.893798828125, -3.68182373046875, -3.4698486328125, -3.25787353515625, -3.0458984375, -2.83392333984375, -2.6219482421875, -2.40997314453125, -2.197998046875, -1.98602294921875, -1.7740478515625, -1.56207275390625, -1.35009765625, -1.13812255859375, -0.9261474609375, -0.71417236328125, -0.502197265625, -0.29022216796875, -0.0782470703125, 0.13372802734375, 0.345703125, 0.55767822265625, 0.7696533203125, 0.98162841796875, 1.193603515625, 1.40557861328125, 1.6175537109375, 1.82952880859375, 2.04150390625, 2.25347900390625, 2.4654541015625, 2.67742919921875, 2.889404296875, 3.10137939453125, 3.3133544921875, 3.52532958984375, 3.7373046875, 3.94927978515625, 4.1612548828125, 4.37322998046875, 4.585205078125, 4.79718017578125, 5.0091552734375, 5.22113037109375, 5.43310546875, 5.64508056640625, 5.8570556640625, 6.06903076171875, 6.281005859375, 6.49298095703125, 6.7049560546875, 6.91693115234375, 7.12890625]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 9.0, 7.0, 22.0, 22.0, 37.0, 64.0, 74.0, 107.0, 116.0, 136.0, 113.0, 100.0, 68.0, 50.0, 38.0, 17.0, 8.0, 8.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.768287658691406, -31.316558837890625, -29.864830017089844, -28.41309928894043, -26.96137046813965, -25.509641647338867, -24.057910919189453, -22.606182098388672, -21.15445327758789, -19.70272445678711, -18.250995635986328, -16.799264907836914, -15.347536087036133, -13.895807266235352, -12.444077491760254, -10.992347717285156, -9.540618896484375, -8.088890075683594, -6.637160301208496, -5.185431003570557, -3.733701705932617, -2.2819724082946777, -0.8302431106567383, 0.6214866638183594, 2.0732154846191406, 3.52494478225708, 4.9766740798950195, 6.428403377532959, 7.880132675170898, 9.33186149597168, 10.783591270446777, 12.235321044921875, 13.687049865722656, 15.138778686523438, 16.59050750732422, 18.042238235473633, 19.493967056274414, 20.945695877075195, 22.39742660522461, 23.84915542602539, 25.300884246826172, 26.752613067626953, 28.204341888427734, 29.65607261657715, 31.10780143737793, 32.559532165527344, 34.011260986328125, 35.462989807128906, 36.91471862792969, 38.36644744873047, 39.81817626953125, 41.26990509033203, 42.72163391113281, 44.17336654663086, 45.62509536743164, 47.07682418823242, 48.5285530090332, 49.980281829833984, 51.432010650634766, 52.88373947143555, 54.335472106933594, 55.787200927734375, 57.238929748535156, 58.69065856933594, 60.14238739013672]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 9.0, 11.0, 9.0, 6.0, 13.0, 12.0, 13.0, 13.0, 21.0, 18.0, 23.0, 25.0, 29.0, 27.0, 33.0, 47.0, 29.0, 38.0, 38.0, 53.0, 31.0, 32.0, 41.0, 31.0, 47.0, 39.0, 32.0, 23.0, 32.0, 26.0, 33.0, 23.0, 18.0, 19.0, 14.0, 15.0, 11.0, 14.0, 12.0, 12.0, 6.0, 7.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 1.0, 3.0], "bins": [-20.572280883789062, -19.982149124145508, -19.392017364501953, -18.801883697509766, -18.21175193786621, -17.621620178222656, -17.0314884185791, -16.441356658935547, -15.851223945617676, -15.261092185974121, -14.67095947265625, -14.080827713012695, -13.49069595336914, -12.90056324005127, -12.310431480407715, -11.720298767089844, -11.130167007446289, -10.540035247802734, -9.949902534484863, -9.359770774841309, -8.769638061523438, -8.179506301879883, -7.589374542236328, -6.999242305755615, -6.409110069274902, -5.8189778327941895, -5.228845596313477, -4.638713836669922, -4.048581600189209, -3.458449363708496, -2.8683173656463623, -2.2781853675842285, -1.6880550384521484, -1.097922921180725, -0.5077908039093018, 0.08234131336212158, 0.6724734306335449, 1.2626056671142578, 1.8527376651763916, 2.4428696632385254, 3.0330018997192383, 3.623134136199951, 4.213266372680664, 4.803398132324219, 5.393530368804932, 5.9836626052856445, 6.573794364929199, 7.163926601409912, 7.754058837890625, 8.34419059753418, 8.93432331085205, 9.524455070495605, 10.114587783813477, 10.704719543457031, 11.294851303100586, 11.88498306274414, 12.475115776062012, 13.065247535705566, 13.655380249023438, 14.245512008666992, 14.835643768310547, 15.425776481628418, 16.01590919494629, 16.606040954589844, 17.1961727142334]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 0.0, 2.0, 2.0, 4.0, 10.0, 13.0, 9.0, 14.0, 10.0, 19.0, 17.0, 18.0, 16.0, 32.0, 22.0, 33.0, 38.0, 48.0, 33.0, 40.0, 44.0, 41.0, 42.0, 42.0, 42.0, 43.0, 41.0, 37.0, 35.0, 43.0, 29.0, 22.0, 31.0, 15.0, 17.0, 15.0, 14.0, 16.0, 11.0, 15.0, 5.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-36.46875, -35.35302734375, -34.2373046875, -33.12158203125, -32.005859375, -30.89013671875, -29.7744140625, -28.65869140625, -27.54296875, -26.42724609375, -25.3115234375, -24.19580078125, -23.080078125, -21.96435546875, -20.8486328125, -19.73291015625, -18.6171875, -17.50146484375, -16.3857421875, -15.27001953125, -14.154296875, -13.03857421875, -11.9228515625, -10.80712890625, -9.69140625, -8.57568359375, -7.4599609375, -6.34423828125, -5.228515625, -4.11279296875, -2.9970703125, -1.88134765625, -0.765625, 0.35009765625, 1.4658203125, 2.58154296875, 3.697265625, 4.81298828125, 5.9287109375, 7.04443359375, 8.16015625, 9.27587890625, 10.3916015625, 11.50732421875, 12.623046875, 13.73876953125, 14.8544921875, 15.97021484375, 17.0859375, 18.20166015625, 19.3173828125, 20.43310546875, 21.548828125, 22.66455078125, 23.7802734375, 24.89599609375, 26.01171875, 27.12744140625, 28.2431640625, 29.35888671875, 30.474609375, 31.59033203125, 32.7060546875, 33.82177734375, 34.9375]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 8.0, 16.0, 12.0, 30.0, 45.0, 57.0, 91.0, 158.0, 217.0, 367.0, 556.0, 937.0, 1362.0, 2149.0, 3153.0, 4893.0, 7293.0, 11446.0, 18448.0, 30260.0, 50801.0, 87507.0, 148344.0, 220598.0, 184052.0, 110430.0, 64497.0, 37686.0, 23145.0, 14203.0, 9099.0, 5822.0, 3663.0, 2590.0, 1654.0, 1029.0, 649.0, 445.0, 286.0, 202.0, 133.0, 81.0, 46.0, 26.0, 28.0, 12.0, 14.0, 10.0, 7.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.22265625, -3.121063232421875, -3.01947021484375, -2.917877197265625, -2.8162841796875, -2.714691162109375, -2.61309814453125, -2.511505126953125, -2.409912109375, -2.308319091796875, -2.20672607421875, -2.105133056640625, -2.0035400390625, -1.901947021484375, -1.80035400390625, -1.698760986328125, -1.59716796875, -1.495574951171875, -1.39398193359375, -1.292388916015625, -1.1907958984375, -1.089202880859375, -0.98760986328125, -0.886016845703125, -0.784423828125, -0.682830810546875, -0.58123779296875, -0.479644775390625, -0.3780517578125, -0.276458740234375, -0.17486572265625, -0.073272705078125, 0.0283203125, 0.129913330078125, 0.23150634765625, 0.333099365234375, 0.4346923828125, 0.536285400390625, 0.63787841796875, 0.739471435546875, 0.841064453125, 0.942657470703125, 1.04425048828125, 1.145843505859375, 1.2474365234375, 1.349029541015625, 1.45062255859375, 1.552215576171875, 1.65380859375, 1.755401611328125, 1.85699462890625, 1.958587646484375, 2.0601806640625, 2.161773681640625, 2.26336669921875, 2.364959716796875, 2.466552734375, 2.568145751953125, 2.66973876953125, 2.771331787109375, 2.8729248046875, 2.974517822265625, 3.07611083984375, 3.177703857421875, 3.279296875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 9.0, 6.0, 9.0, 10.0, 9.0, 4.0, 11.0, 16.0, 17.0, 24.0, 27.0, 22.0, 26.0, 26.0, 27.0, 34.0, 28.0, 40.0, 51.0, 30.0, 42.0, 1080.0, 49.0, 43.0, 28.0, 30.0, 33.0, 31.0, 41.0, 21.0, 26.0, 21.0, 19.0, 25.0, 24.0, 12.0, 16.0, 11.0, 12.0, 9.0, 7.0, 8.0, 2.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-21.21875, -20.543701171875, -19.86865234375, -19.193603515625, -18.5185546875, -17.843505859375, -17.16845703125, -16.493408203125, -15.818359375, -15.143310546875, -14.46826171875, -13.793212890625, -13.1181640625, -12.443115234375, -11.76806640625, -11.093017578125, -10.41796875, -9.742919921875, -9.06787109375, -8.392822265625, -7.7177734375, -7.042724609375, -6.36767578125, -5.692626953125, -5.017578125, -4.342529296875, -3.66748046875, -2.992431640625, -2.3173828125, -1.642333984375, -0.96728515625, -0.292236328125, 0.3828125, 1.057861328125, 1.73291015625, 2.407958984375, 3.0830078125, 3.758056640625, 4.43310546875, 5.108154296875, 5.783203125, 6.458251953125, 7.13330078125, 7.808349609375, 8.4833984375, 9.158447265625, 9.83349609375, 10.508544921875, 11.18359375, 11.858642578125, 12.53369140625, 13.208740234375, 13.8837890625, 14.558837890625, 15.23388671875, 15.908935546875, 16.583984375, 17.259033203125, 17.93408203125, 18.609130859375, 19.2841796875, 19.959228515625, 20.63427734375, 21.309326171875, 21.984375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 3.0, 5.0, 1.0, 7.0, 4.0, 13.0, 13.0, 21.0, 27.0, 54.0, 67.0, 80.0, 139.0, 173.0, 264.0, 431.0, 594.0, 949.0, 1425.0, 2070.0, 3095.0, 4980.0, 7709.0, 12210.0, 19813.0, 32195.0, 54355.0, 93589.0, 165394.0, 1286641.0, 170034.0, 96693.0, 55668.0, 33284.0, 20065.0, 12397.0, 7887.0, 5043.0, 3350.0, 2082.0, 1391.0, 938.0, 635.0, 428.0, 316.0, 184.0, 129.0, 95.0, 63.0, 48.0, 34.0, 16.0, 18.0, 11.0, 7.0, 3.0, 1.0, 1.0, 3.0, 2.0], "bins": [-3.609375, -3.501708984375, -3.39404296875, -3.286376953125, -3.1787109375, -3.071044921875, -2.96337890625, -2.855712890625, -2.748046875, -2.640380859375, -2.53271484375, -2.425048828125, -2.3173828125, -2.209716796875, -2.10205078125, -1.994384765625, -1.88671875, -1.779052734375, -1.67138671875, -1.563720703125, -1.4560546875, -1.348388671875, -1.24072265625, -1.133056640625, -1.025390625, -0.917724609375, -0.81005859375, -0.702392578125, -0.5947265625, -0.487060546875, -0.37939453125, -0.271728515625, -0.1640625, -0.056396484375, 0.05126953125, 0.158935546875, 0.2666015625, 0.374267578125, 0.48193359375, 0.589599609375, 0.697265625, 0.804931640625, 0.91259765625, 1.020263671875, 1.1279296875, 1.235595703125, 1.34326171875, 1.450927734375, 1.55859375, 1.666259765625, 1.77392578125, 1.881591796875, 1.9892578125, 2.096923828125, 2.20458984375, 2.312255859375, 2.419921875, 2.527587890625, 2.63525390625, 2.742919921875, 2.8505859375, 2.958251953125, 3.06591796875, 3.173583984375, 3.28125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 7.0, 2.0, 7.0, 2.0, 6.0, 8.0, 8.0, 17.0, 19.0, 27.0, 35.0, 54.0, 63.0, 75.0, 85.0, 96.0, 104.0, 75.0, 68.0, 59.0, 45.0, 31.0, 26.0, 24.0, 15.0, 16.0, 7.0, 6.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0297088623046875, -0.02890181541442871, -0.028094768524169922, -0.027287721633911133, -0.026480674743652344, -0.025673627853393555, -0.024866580963134766, -0.024059534072875977, -0.023252487182617188, -0.0224454402923584, -0.02163839340209961, -0.02083134651184082, -0.02002429962158203, -0.019217252731323242, -0.018410205841064453, -0.017603158950805664, -0.016796112060546875, -0.015989065170288086, -0.015182018280029297, -0.014374971389770508, -0.013567924499511719, -0.01276087760925293, -0.01195383071899414, -0.011146783828735352, -0.010339736938476562, -0.009532690048217773, -0.008725643157958984, -0.007918596267700195, -0.007111549377441406, -0.006304502487182617, -0.005497455596923828, -0.004690408706665039, -0.00388336181640625, -0.003076314926147461, -0.002269268035888672, -0.0014622211456298828, -0.0006551742553710938, 0.0001518726348876953, 0.0009589195251464844, 0.0017659664154052734, 0.0025730133056640625, 0.0033800601959228516, 0.004187107086181641, 0.00499415397644043, 0.005801200866699219, 0.006608247756958008, 0.007415294647216797, 0.008222341537475586, 0.009029388427734375, 0.009836435317993164, 0.010643482208251953, 0.011450529098510742, 0.012257575988769531, 0.01306462287902832, 0.01387166976928711, 0.014678716659545898, 0.015485763549804688, 0.016292810440063477, 0.017099857330322266, 0.017906904220581055, 0.018713951110839844, 0.019520998001098633, 0.020328044891357422, 0.02113509178161621, 0.021942138671875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 16.0, 11.0, 13.0, 13.0, 17.0, 25.0, 36.0, 41.0, 87.0, 118.0, 161.0, 345.0, 535.0, 1211.0, 2645.0, 7297.0, 26403.0, 135597.0, 571884.0, 242475.0, 42432.0, 10501.0, 3558.0, 1442.0, 666.0, 355.0, 218.0, 128.0, 84.0, 61.0, 44.0, 28.0, 21.0, 13.0, 18.0, 12.0, 13.0, 6.0, 10.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1151123046875, -0.11109542846679688, -0.10707855224609375, -0.10306167602539062, -0.0990447998046875, -0.09502792358398438, -0.09101104736328125, -0.08699417114257812, -0.082977294921875, -0.07896041870117188, -0.07494354248046875, -0.07092666625976562, -0.0669097900390625, -0.06289291381835938, -0.05887603759765625, -0.054859161376953125, -0.05084228515625, -0.046825408935546875, -0.04280853271484375, -0.038791656494140625, -0.0347747802734375, -0.030757904052734375, -0.02674102783203125, -0.022724151611328125, -0.018707275390625, -0.014690399169921875, -0.01067352294921875, -0.006656646728515625, -0.0026397705078125, 0.001377105712890625, 0.00539398193359375, 0.009410858154296875, 0.013427734375, 0.017444610595703125, 0.02146148681640625, 0.025478363037109375, 0.0294952392578125, 0.033512115478515625, 0.03752899169921875, 0.041545867919921875, 0.045562744140625, 0.049579620361328125, 0.05359649658203125, 0.057613372802734375, 0.0616302490234375, 0.06564712524414062, 0.06966400146484375, 0.07368087768554688, 0.07769775390625, 0.08171463012695312, 0.08573150634765625, 0.08974838256835938, 0.0937652587890625, 0.09778213500976562, 0.10179901123046875, 0.10581588745117188, 0.109832763671875, 0.11384963989257812, 0.11786651611328125, 0.12188339233398438, 0.1259002685546875, 0.12991714477539062, 0.13393402099609375, 0.13795089721679688, 0.1419677734375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 11.0, 18.0, 37.0, 49.0, 85.0, 118.0, 128.0, 145.0, 126.0, 103.0, 68.0, 36.0, 24.0, 15.0, 12.0, 8.0, 5.0, 5.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017672255635261536, -0.016899771988391876, -0.016127288341522217, -0.015354804694652557, -0.014582321047782898, -0.013809837400913239, -0.013037352822721004, -0.012264869175851345, -0.011492385528981686, -0.010719901882112026, -0.009947418235242367, -0.009174933657050133, -0.008402450010180473, -0.007629966828972101, -0.0068574827164411545, -0.006084999069571495, -0.005312515422701836, -0.004540031775832176, -0.003767547896131873, -0.00299506401643157, -0.0022225803695619106, -0.0014500967226922512, -0.0006776126101613045, 9.487103670835495e-05, 0.0008673546835780144, 0.0016398384468629956, 0.002412322210147977, 0.00318480608984828, 0.003957289736717939, 0.004729773383587599, 0.0055022574961185455, 0.006274741142988205, 0.007047224789857864, 0.007819708436727524, 0.008592192083597183, 0.009364675730466843, 0.010137159377336502, 0.010909643024206161, 0.011682127602398396, 0.012454611249268055, 0.013227094896137714, 0.013999578543007374, 0.014772062189877033, 0.015544546768069267, 0.016317030414938927, 0.017089514061808586, 0.017861997708678246, 0.018634481355547905, 0.019406965002417564, 0.020179448649287224, 0.020951932296156883, 0.021724415943026543, 0.022496899589896202, 0.02326938323676586, 0.02404186874628067, 0.02481435239315033, 0.02558683604001999, 0.02635931968688965, 0.027131803333759308, 0.027904286980628967, 0.028676770627498627, 0.029449254274368286, 0.030221737921237946, 0.030994221568107605, 0.031766705214977264]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 11.0, 4.0, 5.0, 8.0, 7.0, 19.0, 13.0, 14.0, 17.0, 29.0, 16.0, 30.0, 39.0, 37.0, 30.0, 32.0, 41.0, 48.0, 39.0, 44.0, 48.0, 38.0, 40.0, 36.0, 34.0, 26.0, 30.0, 33.0, 40.0, 20.0, 24.0, 24.0, 20.0, 13.0, 18.0, 13.0, 10.0, 12.0, 11.0, 5.0, 3.0, 7.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.012194693088531494, -0.011804303154349327, -0.01141391322016716, -0.011023523285984993, -0.010633133351802826, -0.010242743417620659, -0.009852353483438492, -0.009461963549256325, -0.009071573615074158, -0.00868118368089199, -0.008290793746709824, -0.007900403812527657, -0.0075100138783454895, -0.0071196239441633224, -0.006729234009981155, -0.006338844075798988, -0.005948454141616821, -0.005558064207434654, -0.005167674273252487, -0.00477728433907032, -0.004386894404888153, -0.003996504470705986, -0.003606114536523819, -0.003215724602341652, -0.002825334668159485, -0.002434944733977318, -0.0020445547997951508, -0.0016541648656129837, -0.0012637749314308167, -0.0008733849972486496, -0.00048299506306648254, -9.260512888431549e-05, 0.00029778480529785156, 0.0006881747394800186, 0.0010785646736621857, 0.0014689546078443527, 0.0018593445420265198, 0.002249734476208687, 0.002640124410390854, 0.003030514344573021, 0.003420904278755188, 0.003811294212937355, 0.004201684147119522, 0.004592074081301689, 0.004982464015483856, 0.005372853949666023, 0.00576324388384819, 0.006153633818030357, 0.006544023752212524, 0.0069344136863946915, 0.0073248036205768585, 0.007715193554759026, 0.008105583488941193, 0.00849597342312336, 0.008886363357305527, 0.009276753291487694, 0.00966714322566986, 0.010057533159852028, 0.010447923094034195, 0.010838313028216362, 0.011228702962398529, 0.011619092896580696, 0.012009482830762863, 0.01239987276494503, 0.012790262699127197]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 0.0, 2.0, 2.0, 4.0, 10.0, 12.0, 10.0, 14.0, 10.0, 19.0, 16.0, 17.0, 18.0, 30.0, 24.0, 32.0, 40.0, 47.0, 34.0, 39.0, 44.0, 41.0, 42.0, 40.0, 44.0, 43.0, 40.0, 35.0, 38.0, 41.0, 30.0, 22.0, 30.0, 17.0, 16.0, 16.0, 14.0, 16.0, 11.0, 15.0, 5.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-36.46875, -35.353515625, -34.23828125, -33.123046875, -32.0078125, -30.892578125, -29.77734375, -28.662109375, -27.546875, -26.431640625, -25.31640625, -24.201171875, -23.0859375, -21.970703125, -20.85546875, -19.740234375, -18.625, -17.509765625, -16.39453125, -15.279296875, -14.1640625, -13.048828125, -11.93359375, -10.818359375, -9.703125, -8.587890625, -7.47265625, -6.357421875, -5.2421875, -4.126953125, -3.01171875, -1.896484375, -0.78125, 0.333984375, 1.44921875, 2.564453125, 3.6796875, 4.794921875, 5.91015625, 7.025390625, 8.140625, 9.255859375, 10.37109375, 11.486328125, 12.6015625, 13.716796875, 14.83203125, 15.947265625, 17.0625, 18.177734375, 19.29296875, 20.408203125, 21.5234375, 22.638671875, 23.75390625, 24.869140625, 25.984375, 27.099609375, 28.21484375, 29.330078125, 30.4453125, 31.560546875, 32.67578125, 33.791015625, 34.90625]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 8.0, 12.0, 13.0, 24.0, 22.0, 28.0, 45.0, 59.0, 69.0, 130.0, 205.0, 280.0, 415.0, 702.0, 1302.0, 2632.0, 6144.0, 19401.0, 87160.0, 428469.0, 394164.0, 77727.0, 17916.0, 5933.0, 2465.0, 1251.0, 682.0, 428.0, 267.0, 182.0, 107.0, 100.0, 66.0, 35.0, 30.0, 26.0, 9.0, 14.0, 10.0, 9.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.265625, -7.04522705078125, -6.8248291015625, -6.60443115234375, -6.384033203125, -6.16363525390625, -5.9432373046875, -5.72283935546875, -5.50244140625, -5.28204345703125, -5.0616455078125, -4.84124755859375, -4.620849609375, -4.40045166015625, -4.1800537109375, -3.95965576171875, -3.7392578125, -3.51885986328125, -3.2984619140625, -3.07806396484375, -2.857666015625, -2.63726806640625, -2.4168701171875, -2.19647216796875, -1.97607421875, -1.75567626953125, -1.5352783203125, -1.31488037109375, -1.094482421875, -0.87408447265625, -0.6536865234375, -0.43328857421875, -0.212890625, 0.00750732421875, 0.2279052734375, 0.44830322265625, 0.668701171875, 0.88909912109375, 1.1094970703125, 1.32989501953125, 1.55029296875, 1.77069091796875, 1.9910888671875, 2.21148681640625, 2.431884765625, 2.65228271484375, 2.8726806640625, 3.09307861328125, 3.3134765625, 3.53387451171875, 3.7542724609375, 3.97467041015625, 4.195068359375, 4.41546630859375, 4.6358642578125, 4.85626220703125, 5.07666015625, 5.29705810546875, 5.5174560546875, 5.73785400390625, 5.958251953125, 6.17864990234375, 6.3990478515625, 6.61944580078125, 6.83984375]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 10.0, 18.0, 17.0, 20.0, 36.0, 44.0, 65.0, 98.0, 105.0, 2046.0, 186.0, 89.0, 92.0, 51.0, 35.0, 44.0, 25.0, 22.0, 16.0, 6.0, 6.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.625, -108.330078125, -105.03515625, -101.740234375, -98.4453125, -95.150390625, -91.85546875, -88.560546875, -85.265625, -81.970703125, -78.67578125, -75.380859375, -72.0859375, -68.791015625, -65.49609375, -62.201171875, -58.90625, -55.611328125, -52.31640625, -49.021484375, -45.7265625, -42.431640625, -39.13671875, -35.841796875, -32.546875, -29.251953125, -25.95703125, -22.662109375, -19.3671875, -16.072265625, -12.77734375, -9.482421875, -6.1875, -2.892578125, 0.40234375, 3.697265625, 6.9921875, 10.287109375, 13.58203125, 16.876953125, 20.171875, 23.466796875, 26.76171875, 30.056640625, 33.3515625, 36.646484375, 39.94140625, 43.236328125, 46.53125, 49.826171875, 53.12109375, 56.416015625, 59.7109375, 63.005859375, 66.30078125, 69.595703125, 72.890625, 76.185546875, 79.48046875, 82.775390625, 86.0703125, 89.365234375, 92.66015625, 95.955078125, 99.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 1.0, 5.0, 6.0, 5.0, 7.0, 18.0, 17.0, 25.0, 36.0, 54.0, 69.0, 117.0, 199.0, 305.0, 522.0, 1015.0, 2781.0, 18763.0, 2613267.0, 488678.0, 14929.0, 2587.0, 971.0, 509.0, 272.0, 181.0, 106.0, 80.0, 58.0, 32.0, 24.0, 24.0, 14.0, 10.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.5859375, -14.11474609375, -13.6435546875, -13.17236328125, -12.701171875, -12.22998046875, -11.7587890625, -11.28759765625, -10.81640625, -10.34521484375, -9.8740234375, -9.40283203125, -8.931640625, -8.46044921875, -7.9892578125, -7.51806640625, -7.046875, -6.57568359375, -6.1044921875, -5.63330078125, -5.162109375, -4.69091796875, -4.2197265625, -3.74853515625, -3.27734375, -2.80615234375, -2.3349609375, -1.86376953125, -1.392578125, -0.92138671875, -0.4501953125, 0.02099609375, 0.4921875, 0.96337890625, 1.4345703125, 1.90576171875, 2.376953125, 2.84814453125, 3.3193359375, 3.79052734375, 4.26171875, 4.73291015625, 5.2041015625, 5.67529296875, 6.146484375, 6.61767578125, 7.0888671875, 7.56005859375, 8.03125, 8.50244140625, 8.9736328125, 9.44482421875, 9.916015625, 10.38720703125, 10.8583984375, 11.32958984375, 11.80078125, 12.27197265625, 12.7431640625, 13.21435546875, 13.685546875, 14.15673828125, 14.6279296875, 15.09912109375, 15.5703125]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 6.0, 9.0, 23.0, 91.0, 279.0, 340.0, 168.0, 51.0, 13.0, 16.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.14376831054688, -133.12490844726562, -127.10604858398438, -121.08718872070312, -115.06832885742188, -109.04946899414062, -103.03060150146484, -97.0117416381836, -90.99288177490234, -84.9740219116211, -78.95516204833984, -72.93629455566406, -66.91743469238281, -60.89857864379883, -54.87971496582031, -48.86085510253906, -42.84199523925781, -36.82313537597656, -30.80427360534668, -24.785411834716797, -18.766551971435547, -12.747692108154297, -6.728828430175781, -0.7099685668945312, 5.308891296386719, 11.327752113342285, 17.34661293029785, 23.365474700927734, 29.384334564208984, 35.403194427490234, 41.42205810546875, 47.44091796875, 53.45977783203125, 59.4786376953125, 65.49749755859375, 71.516357421875, 77.53521728515625, 83.5540771484375, 89.57294464111328, 95.59180450439453, 101.61066436767578, 107.62952423095703, 113.64838409423828, 119.66725158691406, 125.68611145019531, 131.70497131347656, 137.7238311767578, 143.74269104003906, 149.7615509033203, 155.78041076660156, 161.7992706298828, 167.81813049316406, 173.8369903564453, 179.85585021972656, 185.87472534179688, 191.89358520507812, 197.91244506835938, 203.93130493164062, 209.95016479492188, 215.96902465820312, 221.98788452148438, 228.00674438476562, 234.02560424804688, 240.04446411132812, 246.06332397460938]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 6.0, 8.0, 8.0, 8.0, 11.0, 16.0, 10.0, 19.0, 33.0, 27.0, 30.0, 21.0, 33.0, 44.0, 49.0, 36.0, 33.0, 38.0, 35.0, 68.0, 51.0, 38.0, 54.0, 37.0, 47.0, 44.0, 30.0, 17.0, 26.0, 28.0, 20.0, 14.0, 10.0, 13.0, 7.0, 9.0, 8.0, 1.0, 5.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-70.78162384033203, -68.49209594726562, -66.20257568359375, -63.913047790527344, -61.62351989746094, -59.3339958190918, -57.044471740722656, -54.75494384765625, -52.46541976928711, -50.17589569091797, -47.88636779785156, -45.59684371948242, -43.30731964111328, -41.017791748046875, -38.728267669677734, -36.438743591308594, -34.14921569824219, -31.859689712524414, -29.57016372680664, -27.2806396484375, -24.991113662719727, -22.701587677001953, -20.412063598632812, -18.12253761291504, -15.833011627197266, -13.543485641479492, -11.253960609436035, -8.964435577392578, -6.674909591674805, -4.385383605957031, -2.095858573913574, 0.1936664581298828, 2.4832000732421875, 4.772725582122803, 7.062251091003418, 9.351776123046875, 11.641302108764648, 13.930828094482422, 16.220352172851562, 18.509878158569336, 20.79940414428711, 23.088930130004883, 25.378456115722656, 27.667980194091797, 29.95750617980957, 32.247032165527344, 34.536556243896484, 36.826080322265625, 39.11560821533203, 41.40513229370117, 43.69466018676758, 45.98418426513672, 48.273712158203125, 50.563236236572266, 52.852760314941406, 55.14228820800781, 57.43181228637695, 59.721336364746094, 62.0108642578125, 64.3003921508789, 66.58991241455078, 68.87944030761719, 71.1689682006836, 73.45848846435547, 75.74801635742188]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 9.0, 9.0, 12.0, 12.0, 20.0, 29.0, 44.0, 60.0, 74.0, 100.0, 159.0, 217.0, 351.0, 520.0, 784.0, 1361.0, 2091.0, 3277.0, 5001.0, 7131.0, 1008935.0, 6348.0, 4238.0, 2786.0, 1785.0, 1105.0, 684.0, 445.0, 301.0, 171.0, 153.0, 90.0, 53.0, 65.0, 36.0, 21.0, 22.0, 15.0, 13.0, 10.0, 3.0, 3.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.990504264831543, -12.56213092803955, -12.133756637573242, -11.70538330078125, -11.277009963989258, -10.84863567352295, -10.420262336730957, -9.991888046264648, -9.563514709472656, -9.135141372680664, -8.706767082214355, -8.278393745422363, -7.850019931793213, -7.4216461181640625, -6.99327278137207, -6.56489896774292, -6.1365251541137695, -5.708151340484619, -5.279777526855469, -4.851404190063477, -4.423030376434326, -3.994656562805176, -3.5662829875946045, -3.137909412384033, -2.709535598754883, -2.2811617851257324, -1.8527882099151611, -1.4244145154953003, -0.9960408210754395, -0.5676670074462891, -0.13929343223571777, 0.2890801429748535, 0.7174530029296875, 1.1458266973495483, 1.5742003917694092, 2.0025739669799805, 2.430947780609131, 2.8593215942382812, 3.2876951694488525, 3.716068744659424, 4.144442558288574, 4.572816371917725, 5.001190185546875, 5.429563522338867, 5.857937335968018, 6.286311149597168, 6.71468448638916, 7.1430583000183105, 7.571432113647461, 7.999805927276611, 8.428179740905762, 8.856553077697754, 9.284927368164062, 9.713300704956055, 10.141674041748047, 10.570047378540039, 10.998421669006348, 11.42679500579834, 11.855169296264648, 12.28354263305664, 12.711915969848633, 13.140290260314941, 13.568663597106934, 13.997037887573242, 14.425411224365234]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 12.0, 8.0, 15.0, 24.0, 54.0, 63.0, 105.0, 229.0, 51460032.0, 2305.0, 123.0, 61.0, 49.0, 29.0, 19.0, 17.0, 10.0, 13.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1726.7813720703125, -1664.7305908203125, -1602.679931640625, -1540.629150390625, -1478.578369140625, -1416.527587890625, -1354.4769287109375, -1292.4261474609375, -1230.37548828125, -1168.32470703125, -1106.2740478515625, -1044.2232666015625, -982.1724853515625, -920.1217651367188, -858.071044921875, -796.020263671875, -733.969482421875, -671.9187622070312, -609.8679809570312, -547.8172607421875, -485.7665100097656, -423.71575927734375, -361.6650390625, -299.6142883300781, -237.56353759765625, -175.51278686523438, -113.46205139160156, -51.41131591796875, 10.639434814453125, 72.690185546875, 134.74090576171875, 196.79165649414062, 258.842529296875, 320.8932800292969, 382.94403076171875, 444.9947509765625, 507.0455017089844, 569.0962524414062, 631.14697265625, 693.19775390625, 755.2484741210938, 817.2991943359375, 879.3499755859375, 941.4006958007812, 1003.451416015625, 1065.502197265625, 1127.552978515625, 1189.6036376953125, 1251.6544189453125, 1313.7052001953125, 1375.755859375, 1437.806640625, 1499.857421875, 1561.908203125, 1623.9588623046875, 1686.0096435546875, 1748.060302734375, 1810.111083984375, 1872.1617431640625, 1934.2125244140625, 1996.2633056640625, 2058.31396484375, 2120.36474609375, 2182.41552734375, 2244.46630859375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 8.0, 7.0, 13.0, 54.0, 58.0, 88.0, 133.0, 234.0, 353.0, 468.0, 732.0, 1058.0, 1563.0, 2307.0, 3186.0, 4498.0, 6742.0, 10039.0, 14401.0, 20988.0, 30929.0, 46046.0, 69706.0, 106224.0, 161133.0, 248740.0, 394054.0, 3052013.0, 1093062.0, 355477.0, 227539.0, 147541.0, 96341.0, 63142.0, 42700.0, 28219.0, 19250.0, 13356.0, 9092.0, 6197.0, 4341.0, 3002.0, 2110.0, 1378.0, 947.0, 691.0, 472.0, 311.0, 181.0, 142.0, 62.0, 64.0, 23.0, 12.0, 9.0, 5.0, 5.0, 5.0], "bins": [-1.091796875, -1.0595855712890625, -1.027374267578125, -0.9951629638671875, -0.96295166015625, -0.9307403564453125, -0.898529052734375, -0.8663177490234375, -0.8341064453125, -0.8018951416015625, -0.769683837890625, -0.7374725341796875, -0.70526123046875, -0.6730499267578125, -0.640838623046875, -0.6086273193359375, -0.576416015625, -0.5442047119140625, -0.511993408203125, -0.4797821044921875, -0.44757080078125, -0.4153594970703125, -0.383148193359375, -0.3509368896484375, -0.3187255859375, -0.2865142822265625, -0.254302978515625, -0.2220916748046875, -0.18988037109375, -0.1576690673828125, -0.125457763671875, -0.0932464599609375, -0.06103515625, -0.0288238525390625, 0.003387451171875, 0.0355987548828125, 0.06781005859375, 0.1000213623046875, 0.132232666015625, 0.1644439697265625, 0.1966552734375, 0.2288665771484375, 0.261077880859375, 0.2932891845703125, 0.32550048828125, 0.3577117919921875, 0.389923095703125, 0.4221343994140625, 0.454345703125, 0.4865570068359375, 0.518768310546875, 0.5509796142578125, 0.58319091796875, 0.6154022216796875, 0.647613525390625, 0.6798248291015625, 0.7120361328125, 0.7442474365234375, 0.776458740234375, 0.8086700439453125, 0.84088134765625, 0.8730926513671875, 0.905303955078125, 0.9375152587890625, 0.9697265625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 14.0, 2.0, 8.0, 14.0, 8.0, 14.0, 14.0, 18.0, 22.0, 23.0, 26.0, 30.0, 32.0, 36.0, 41.0, 37.0, 42.0, 46.0, 51.0, 731.0, 343.0, 54.0, 34.0, 45.0, 30.0, 42.0, 40.0, 34.0, 29.0, 22.0, 16.0, 30.0, 16.0, 15.0, 17.0, 10.0, 10.0, 8.0, 8.0, 1.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.8984375, -7.65032958984375, -7.4022216796875, -7.15411376953125, -6.906005859375, -6.65789794921875, -6.4097900390625, -6.16168212890625, -5.91357421875, -5.66546630859375, -5.4173583984375, -5.16925048828125, -4.921142578125, -4.67303466796875, -4.4249267578125, -4.17681884765625, -3.9287109375, -3.68060302734375, -3.4324951171875, -3.18438720703125, -2.936279296875, -2.68817138671875, -2.4400634765625, -2.19195556640625, -1.94384765625, -1.69573974609375, -1.4476318359375, -1.19952392578125, -0.951416015625, -0.70330810546875, -0.4552001953125, -0.20709228515625, 0.041015625, 0.28912353515625, 0.5372314453125, 0.78533935546875, 1.033447265625, 1.28155517578125, 1.5296630859375, 1.77777099609375, 2.02587890625, 2.27398681640625, 2.5220947265625, 2.77020263671875, 3.018310546875, 3.26641845703125, 3.5145263671875, 3.76263427734375, 4.0107421875, 4.25885009765625, 4.5069580078125, 4.75506591796875, 5.003173828125, 5.25128173828125, 5.4993896484375, 5.74749755859375, 5.99560546875, 6.24371337890625, 6.4918212890625, 6.73992919921875, 6.988037109375, 7.23614501953125, 7.4842529296875, 7.73236083984375, 7.98046875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [7.0, 3.0, 6.0, 7.0, 8.0, 7.0, 10.0, 23.0, 18.0, 36.0, 38.0, 69.0, 102.0, 134.0, 207.0, 290.0, 372.0, 636.0, 887.0, 1349.0, 1977.0, 2887.0, 4530.0, 6635.0, 10320.0, 16065.0, 25570.0, 41831.0, 69907.0, 115802.0, 197367.0, 345831.0, 840729.0, 3528588.0, 458972.0, 248938.0, 146538.0, 85394.0, 51896.0, 32097.0, 19691.0, 12227.0, 7957.0, 5188.0, 3378.0, 2169.0, 1488.0, 1017.0, 755.0, 506.0, 316.0, 230.0, 127.0, 97.0, 68.0, 49.0, 37.0, 28.0, 10.0, 12.0, 8.0, 7.0, 5.0, 3.0], "bins": [-1.51953125, -1.473785400390625, -1.42803955078125, -1.382293701171875, -1.3365478515625, -1.290802001953125, -1.24505615234375, -1.199310302734375, -1.153564453125, -1.107818603515625, -1.06207275390625, -1.016326904296875, -0.9705810546875, -0.924835205078125, -0.87908935546875, -0.833343505859375, -0.78759765625, -0.741851806640625, -0.69610595703125, -0.650360107421875, -0.6046142578125, -0.558868408203125, -0.51312255859375, -0.467376708984375, -0.421630859375, -0.375885009765625, -0.33013916015625, -0.284393310546875, -0.2386474609375, -0.192901611328125, -0.14715576171875, -0.101409912109375, -0.0556640625, -0.009918212890625, 0.03582763671875, 0.081573486328125, 0.1273193359375, 0.173065185546875, 0.21881103515625, 0.264556884765625, 0.310302734375, 0.356048583984375, 0.40179443359375, 0.447540283203125, 0.4932861328125, 0.539031982421875, 0.58477783203125, 0.630523681640625, 0.67626953125, 0.722015380859375, 0.76776123046875, 0.813507080078125, 0.8592529296875, 0.904998779296875, 0.95074462890625, 0.996490478515625, 1.042236328125, 1.087982177734375, 1.13372802734375, 1.179473876953125, 1.2252197265625, 1.270965576171875, 1.31671142578125, 1.362457275390625, 1.408203125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 9.0, 18.0, 15.0, 13.0, 17.0, 17.0, 19.0, 29.0, 21.0, 26.0, 30.0, 36.0, 29.0, 42.0, 53.0, 47.0, 99.0, 831.0, 219.0, 57.0, 45.0, 35.0, 43.0, 30.0, 29.0, 36.0, 23.0, 26.0, 30.0, 19.0, 13.0, 8.0, 12.0, 7.0, 12.0, 9.0, 4.0, 4.0, 6.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.375, -6.19085693359375, -6.0067138671875, -5.82257080078125, -5.638427734375, -5.45428466796875, -5.2701416015625, -5.08599853515625, -4.90185546875, -4.71771240234375, -4.5335693359375, -4.34942626953125, -4.165283203125, -3.98114013671875, -3.7969970703125, -3.61285400390625, -3.4287109375, -3.24456787109375, -3.0604248046875, -2.87628173828125, -2.692138671875, -2.50799560546875, -2.3238525390625, -2.13970947265625, -1.95556640625, -1.77142333984375, -1.5872802734375, -1.40313720703125, -1.218994140625, -1.03485107421875, -0.8507080078125, -0.66656494140625, -0.482421875, -0.29827880859375, -0.1141357421875, 0.07000732421875, 0.254150390625, 0.43829345703125, 0.6224365234375, 0.80657958984375, 0.99072265625, 1.17486572265625, 1.3590087890625, 1.54315185546875, 1.727294921875, 1.91143798828125, 2.0955810546875, 2.27972412109375, 2.4638671875, 2.64801025390625, 2.8321533203125, 3.01629638671875, 3.200439453125, 3.38458251953125, 3.5687255859375, 3.75286865234375, 3.93701171875, 4.12115478515625, 4.3052978515625, 4.48944091796875, 4.673583984375, 4.85772705078125, 5.0418701171875, 5.22601318359375, 5.41015625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 11.0, 21.0, 18.0, 13.0, 24.0, 35.0, 63.0, 95.0, 160.0, 196.0, 262.0, 431.0, 704.0, 1039.0, 1594.0, 2842.0, 5476.0, 12968.0, 40532.0, 222391.0, 5886123.0, 77631.0, 21433.0, 7877.0, 3926.0, 1940.0, 1204.0, 810.0, 516.0, 307.0, 230.0, 171.0, 135.0, 88.0, 55.0, 30.0, 21.0, 10.0, 19.0, 5.0, 9.0, 6.0, 2.0, 0.0, 1.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.16796875, -6.9384765625, -6.708984375, -6.4794921875, -6.25, -6.0205078125, -5.791015625, -5.5615234375, -5.33203125, -5.1025390625, -4.873046875, -4.6435546875, -4.4140625, -4.1845703125, -3.955078125, -3.7255859375, -3.49609375, -3.2666015625, -3.037109375, -2.8076171875, -2.578125, -2.3486328125, -2.119140625, -1.8896484375, -1.66015625, -1.4306640625, -1.201171875, -0.9716796875, -0.7421875, -0.5126953125, -0.283203125, -0.0537109375, 0.17578125, 0.4052734375, 0.634765625, 0.8642578125, 1.09375, 1.3232421875, 1.552734375, 1.7822265625, 2.01171875, 2.2412109375, 2.470703125, 2.7001953125, 2.9296875, 3.1591796875, 3.388671875, 3.6181640625, 3.84765625, 4.0771484375, 4.306640625, 4.5361328125, 4.765625, 4.9951171875, 5.224609375, 5.4541015625, 5.68359375, 5.9130859375, 6.142578125, 6.3720703125, 6.6015625, 6.8310546875, 7.060546875, 7.2900390625, 7.51953125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 6.0, 2.0, 9.0, 14.0, 12.0, 27.0, 19.0, 17.0, 27.0, 28.0, 18.0, 25.0, 29.0, 37.0, 31.0, 54.0, 64.0, 162.0, 712.0, 219.0, 72.0, 50.0, 38.0, 44.0, 35.0, 32.0, 30.0, 32.0, 30.0, 22.0, 17.0, 17.0, 20.0, 17.0, 3.0, 5.0, 8.0, 14.0, 1.0, 9.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.2421875, -4.10760498046875, -3.9730224609375, -3.83843994140625, -3.703857421875, -3.56927490234375, -3.4346923828125, -3.30010986328125, -3.16552734375, -3.03094482421875, -2.8963623046875, -2.76177978515625, -2.627197265625, -2.49261474609375, -2.3580322265625, -2.22344970703125, -2.0888671875, -1.95428466796875, -1.8197021484375, -1.68511962890625, -1.550537109375, -1.41595458984375, -1.2813720703125, -1.14678955078125, -1.01220703125, -0.87762451171875, -0.7430419921875, -0.60845947265625, -0.473876953125, -0.33929443359375, -0.2047119140625, -0.07012939453125, 0.064453125, 0.19903564453125, 0.3336181640625, 0.46820068359375, 0.602783203125, 0.73736572265625, 0.8719482421875, 1.00653076171875, 1.14111328125, 1.27569580078125, 1.4102783203125, 1.54486083984375, 1.679443359375, 1.81402587890625, 1.9486083984375, 2.08319091796875, 2.2177734375, 2.35235595703125, 2.4869384765625, 2.62152099609375, 2.756103515625, 2.89068603515625, 3.0252685546875, 3.15985107421875, 3.29443359375, 3.42901611328125, 3.5635986328125, 3.69818115234375, 3.832763671875, 3.96734619140625, 4.1019287109375, 4.23651123046875, 4.37109375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 6.0, 4.0, 12.0, 27.0, 44.0, 76.0, 159.0, 219.0, 207.0, 124.0, 62.0, 33.0, 15.0, 8.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.960474491119385, -7.5760579109191895, -7.191641330718994, -6.807224750518799, -6.4228081703186035, -6.038391590118408, -5.653975009918213, -5.269558429718018, -4.885141849517822, -4.500725269317627, -4.116308689117432, -3.7318921089172363, -3.347475528717041, -2.9630589485168457, -2.5786423683166504, -2.194225788116455, -1.8098092079162598, -1.4253926277160645, -1.0409760475158691, -0.6565594673156738, -0.2721428871154785, 0.1122736930847168, 0.4966902732849121, 0.8811068534851074, 1.2655234336853027, 1.649940013885498, 2.0343565940856934, 2.4187731742858887, 2.803189754486084, 3.1876063346862793, 3.5720229148864746, 3.95643949508667, 4.340856552124023, 4.725273132324219, 5.109689712524414, 5.494106292724609, 5.878522872924805, 6.262939453125, 6.647356033325195, 7.031772613525391, 7.416189193725586, 7.800605773925781, 8.185022354125977, 8.569438934326172, 8.953855514526367, 9.338272094726562, 9.722688674926758, 10.107105255126953, 10.491521835327148, 10.875938415527344, 11.260354995727539, 11.644771575927734, 12.02918815612793, 12.413604736328125, 12.79802131652832, 13.182437896728516, 13.566854476928711, 13.951271057128906, 14.335687637329102, 14.720104217529297, 15.104520797729492, 15.488937377929688, 15.873353958129883, 16.257770538330078, 16.642187118530273]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 10.0, 6.0, 6.0, 18.0, 21.0, 25.0, 34.0, 37.0, 49.0, 57.0, 53.0, 63.0, 62.0, 54.0, 65.0, 71.0, 52.0, 58.0, 43.0, 44.0, 36.0, 30.0, 35.0, 21.0, 10.0, 11.0, 7.0, 8.0, 7.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.039026260375977, -11.74767017364502, -11.456315040588379, -11.164958953857422, -10.873603820800781, -10.582247734069824, -10.290892601013184, -9.999536514282227, -9.708181381225586, -9.416825294494629, -9.125470161437988, -8.834114074707031, -8.54275894165039, -8.251402854919434, -7.960047245025635, -7.668691635131836, -7.377335548400879, -7.08597993850708, -6.794624328613281, -6.503268718719482, -6.211913108825684, -5.920557022094727, -5.629201412200928, -5.337845802307129, -5.04649019241333, -4.755134582519531, -4.463778972625732, -4.172423362731934, -3.8810675144195557, -3.589711904525757, -3.298356056213379, -3.00700044631958, -2.7156457901000977, -2.424290180206299, -2.1329345703125, -1.841578722000122, -1.5502231121063232, -1.2588675022125244, -0.967511773109436, -0.6761560440063477, -0.38480043411254883, -0.09344476461410522, 0.19791090488433838, 0.489266574382782, 0.7806222438812256, 1.0719778537750244, 1.3633335828781128, 1.6546893119812012, 1.946044921875, 2.237400531768799, 2.5287561416625977, 2.8201119899749756, 3.1114675998687744, 3.4028232097625732, 3.694179058074951, 3.98553466796875, 4.276890277862549, 4.568245887756348, 4.8596014976501465, 5.150957107543945, 5.442313194274902, 5.733668327331543, 6.0250244140625, 6.316380023956299, 6.607735633850098]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 6.0, 7.0, 8.0, 8.0, 9.0, 6.0, 18.0, 16.0, 26.0, 37.0, 23.0, 24.0, 42.0, 57.0, 67.0, 88.0, 125.0, 183.0, 204.0, 279.0, 371.0, 489.0, 657.0, 1003.0, 1518.0, 2441.0, 4003.0, 7497.0, 16496.0, 51137.0, 3815016.0, 244569.0, 26848.0, 9883.0, 4490.0, 2467.0, 1482.0, 910.0, 544.0, 369.0, 267.0, 160.0, 119.0, 93.0, 73.0, 55.0, 31.0, 17.0, 15.0, 13.0, 6.0, 8.0, 7.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.21533203125, -0.209320068359375, -0.20330810546875, -0.197296142578125, -0.1912841796875, -0.185272216796875, -0.17926025390625, -0.173248291015625, -0.167236328125, -0.161224365234375, -0.15521240234375, -0.149200439453125, -0.1431884765625, -0.137176513671875, -0.13116455078125, -0.125152587890625, -0.119140625, -0.113128662109375, -0.10711669921875, -0.101104736328125, -0.0950927734375, -0.089080810546875, -0.08306884765625, -0.077056884765625, -0.071044921875, -0.065032958984375, -0.05902099609375, -0.053009033203125, -0.0469970703125, -0.040985107421875, -0.03497314453125, -0.028961181640625, -0.02294921875, -0.016937255859375, -0.01092529296875, -0.004913330078125, 0.0010986328125, 0.007110595703125, 0.01312255859375, 0.019134521484375, 0.025146484375, 0.031158447265625, 0.03717041015625, 0.043182373046875, 0.0491943359375, 0.055206298828125, 0.06121826171875, 0.067230224609375, 0.0732421875, 0.079254150390625, 0.08526611328125, 0.091278076171875, 0.0972900390625, 0.103302001953125, 0.10931396484375, 0.115325927734375, 0.121337890625, 0.127349853515625, 0.13336181640625, 0.139373779296875, 0.1453857421875, 0.151397705078125, 0.15740966796875, 0.163421630859375, 0.16943359375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 6.0, 2.0, 5.0, 6.0, 9.0, 11.0, 19.0, 25.0, 11.0, 192.0, 578.0, 40.0, 24.0, 11.0, 8.0, 4.0, 4.0, 7.0, 6.0, 6.0, 3.0, 4.0, 2.0, 0.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.047027587890625, -0.04572153091430664, -0.04441547393798828, -0.04310941696166992, -0.04180335998535156, -0.0404973030090332, -0.039191246032714844, -0.037885189056396484, -0.036579132080078125, -0.035273075103759766, -0.033967018127441406, -0.03266096115112305, -0.03135490417480469, -0.030048847198486328, -0.02874279022216797, -0.02743673324584961, -0.02613067626953125, -0.02482461929321289, -0.02351856231689453, -0.022212505340576172, -0.020906448364257812, -0.019600391387939453, -0.018294334411621094, -0.016988277435302734, -0.015682220458984375, -0.014376163482666016, -0.013070106506347656, -0.011764049530029297, -0.010457992553710938, -0.009151935577392578, -0.007845878601074219, -0.006539821624755859, -0.0052337646484375, -0.003927707672119141, -0.0026216506958007812, -0.0013155937194824219, -9.5367431640625e-06, 0.0012965202331542969, 0.0026025772094726562, 0.003908634185791016, 0.005214691162109375, 0.006520748138427734, 0.007826805114746094, 0.009132862091064453, 0.010438919067382812, 0.011744976043701172, 0.013051033020019531, 0.01435708999633789, 0.01566314697265625, 0.01696920394897461, 0.01827526092529297, 0.019581317901611328, 0.020887374877929688, 0.022193431854248047, 0.023499488830566406, 0.024805545806884766, 0.026111602783203125, 0.027417659759521484, 0.028723716735839844, 0.030029773712158203, 0.03133583068847656, 0.03264188766479492, 0.03394794464111328, 0.03525400161743164, 0.03656005859375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 7.0, 12.0, 19.0, 19.0, 28.0, 58.0, 58.0, 131.0, 217.0, 382.0, 735.0, 1591.0, 4370.0, 17279.0, 125155.0, 3731760.0, 271327.0, 29421.0, 7006.0, 2375.0, 1021.0, 531.0, 312.0, 180.0, 103.0, 65.0, 43.0, 24.0, 13.0, 6.0, 8.0, 6.0, 4.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.279541015625, -0.2707023620605469, -0.26186370849609375, -0.2530250549316406, -0.2441864013671875, -0.23534774780273438, -0.22650909423828125, -0.21767044067382812, -0.208831787109375, -0.19999313354492188, -0.19115447998046875, -0.18231582641601562, -0.1734771728515625, -0.16463851928710938, -0.15579986572265625, -0.14696121215820312, -0.13812255859375, -0.12928390502929688, -0.12044525146484375, -0.11160659790039062, -0.1027679443359375, -0.09392929077148438, -0.08509063720703125, -0.07625198364257812, -0.067413330078125, -0.058574676513671875, -0.04973602294921875, -0.040897369384765625, -0.0320587158203125, -0.023220062255859375, -0.01438140869140625, -0.005542755126953125, 0.0032958984375, 0.012134552001953125, 0.02097320556640625, 0.029811859130859375, 0.0386505126953125, 0.047489166259765625, 0.05632781982421875, 0.06516647338867188, 0.074005126953125, 0.08284378051757812, 0.09168243408203125, 0.10052108764648438, 0.1093597412109375, 0.11819839477539062, 0.12703704833984375, 0.13587570190429688, 0.14471435546875, 0.15355300903320312, 0.16239166259765625, 0.17123031616210938, 0.1800689697265625, 0.18890762329101562, 0.19774627685546875, 0.20658493041992188, 0.215423583984375, 0.22426223754882812, 0.23310089111328125, 0.24193954467773438, 0.2507781982421875, 0.2596168518066406, 0.26845550537109375, 0.2772941589355469, 0.2861328125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 6.0, 13.0, 25.0, 24.0, 52.0, 85.0, 152.0, 241.0, 760.0, 1722.0, 411.0, 211.0, 112.0, 92.0, 47.0, 35.0, 28.0, 14.0, 10.0, 7.0, 7.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.078125, -0.07525920867919922, -0.07239341735839844, -0.06952762603759766, -0.06666183471679688, -0.0637960433959961, -0.06093025207519531, -0.05806446075439453, -0.05519866943359375, -0.05233287811279297, -0.04946708679199219, -0.046601295471191406, -0.043735504150390625, -0.040869712829589844, -0.03800392150878906, -0.03513813018798828, -0.0322723388671875, -0.02940654754638672, -0.026540756225585938, -0.023674964904785156, -0.020809173583984375, -0.017943382263183594, -0.015077590942382812, -0.012211799621582031, -0.00934600830078125, -0.006480216979980469, -0.0036144256591796875, -0.0007486343383789062, 0.002117156982421875, 0.004982948303222656, 0.007848739624023438, 0.010714530944824219, 0.013580322265625, 0.01644611358642578, 0.019311904907226562, 0.022177696228027344, 0.025043487548828125, 0.027909278869628906, 0.030775070190429688, 0.03364086151123047, 0.03650665283203125, 0.03937244415283203, 0.04223823547363281, 0.045104026794433594, 0.047969818115234375, 0.050835609436035156, 0.05370140075683594, 0.05656719207763672, 0.0594329833984375, 0.06229877471923828, 0.06516456604003906, 0.06803035736083984, 0.07089614868164062, 0.0737619400024414, 0.07662773132324219, 0.07949352264404297, 0.08235931396484375, 0.08522510528564453, 0.08809089660644531, 0.0909566879272461, 0.09382247924804688, 0.09668827056884766, 0.09955406188964844, 0.10241985321044922, 0.10528564453125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 17.0, 17.0, 35.0, 130.0, 306.0, 268.0, 110.0, 54.0, 27.0, 20.0, 4.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27859652042388916, -0.2547541856765747, -0.23091186583042145, -0.2070695459842682, -0.18322721123695374, -0.15938489139080048, -0.13554257154464722, -0.11170023679733276, -0.0878579169511795, -0.06401558965444565, -0.04017326608300209, -0.016330942511558533, 0.0075113847851753235, 0.03135371208190918, 0.05519603192806244, 0.07903836667537689, 0.10288068652153015, 0.1267230063676834, 0.15056534111499786, 0.17440766096115112, 0.19824999570846558, 0.22209231555461884, 0.2459346354007721, 0.26977697014808655, 0.2936192750930786, 0.31746160984039307, 0.34130391478538513, 0.3651462495326996, 0.38898858428001404, 0.4128308892250061, 0.43667322397232056, 0.460515558719635, 0.48435789346694946, 0.5082002282142639, 0.5320425629615784, 0.555884838104248, 0.5797271728515625, 0.603569507598877, 0.6274118423461914, 0.6512541770935059, 0.6750965118408203, 0.6989388465881348, 0.7227811813354492, 0.7466235160827637, 0.7704657912254333, 0.7943081259727478, 0.8181504607200623, 0.8419927954673767, 0.8658350706100464, 0.8896774053573608, 0.9135197401046753, 0.9373620748519897, 0.9612043499946594, 0.9850466847419739, 1.0088889598846436, 1.032731294631958, 1.056573748588562, 1.0804160833358765, 1.104258418083191, 1.1281007528305054, 1.1519430875778198, 1.1757854223251343, 1.1996276378631592, 1.2234699726104736, 1.247312307357788]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 11.0, 15.0, 25.0, 33.0, 47.0, 45.0, 83.0, 105.0, 92.0, 93.0, 85.0, 95.0, 68.0, 59.0, 48.0, 33.0, 27.0, 9.0, 11.0, 9.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5118328332901001, -0.4925919473171234, -0.47335106134414673, -0.45411017537117004, -0.43486928939819336, -0.41562843322753906, -0.3963875472545624, -0.3771466612815857, -0.357905775308609, -0.3386648893356323, -0.31942400336265564, -0.30018311738967896, -0.28094226121902466, -0.2617013454437256, -0.2424604892730713, -0.2232196033000946, -0.20397871732711792, -0.18473783135414124, -0.16549694538116455, -0.14625607430934906, -0.12701518833637238, -0.10777430236339569, -0.0885334238409996, -0.06929254531860352, -0.05005165934562683, -0.030810777097940445, -0.011569894850254059, 0.007670987397432327, 0.026911869645118713, 0.0461527556180954, 0.06539363414049149, 0.08463451266288757, 0.10387545824050903, 0.12311634421348572, 0.1423572301864624, 0.1615981012582779, 0.18083898723125458, 0.20007987320423126, 0.21932074427604675, 0.23856163024902344, 0.2578025162220001, 0.2770434021949768, 0.2962842881679535, 0.3155251741409302, 0.3347660303115845, 0.35400694608688354, 0.37324780225753784, 0.3924886882305145, 0.4117295742034912, 0.4309704601764679, 0.4502113461494446, 0.46945223212242126, 0.48869311809539795, 0.5079339742660522, 0.5271748900413513, 0.5464157462120056, 0.5656566619873047, 0.584897518157959, 0.6041384339332581, 0.6233792901039124, 0.6426202058792114, 0.6618610620498657, 0.6811019778251648, 0.7003428339958191, 0.7195836901664734]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 2.0, 6.0, 8.0, 14.0, 25.0, 28.0, 44.0, 74.0, 60.0, 101.0, 173.0, 262.0, 400.0, 623.0, 1040.0, 1758.0, 3310.0, 6119.0, 14257.0, 56274.0, 857552.0, 75473.0, 15926.0, 6779.0, 3426.0, 1874.0, 1063.0, 639.0, 408.0, 285.0, 164.0, 106.0, 82.0, 62.0, 37.0, 28.0, 17.0, 13.0, 14.0, 7.0, 6.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.224609375, -0.217010498046875, -0.20941162109375, -0.201812744140625, -0.1942138671875, -0.186614990234375, -0.17901611328125, -0.171417236328125, -0.163818359375, -0.156219482421875, -0.14862060546875, -0.141021728515625, -0.1334228515625, -0.125823974609375, -0.11822509765625, -0.110626220703125, -0.10302734375, -0.095428466796875, -0.08782958984375, -0.080230712890625, -0.0726318359375, -0.065032958984375, -0.05743408203125, -0.049835205078125, -0.042236328125, -0.034637451171875, -0.02703857421875, -0.019439697265625, -0.0118408203125, -0.004241943359375, 0.00335693359375, 0.010955810546875, 0.0185546875, 0.026153564453125, 0.03375244140625, 0.041351318359375, 0.0489501953125, 0.056549072265625, 0.06414794921875, 0.071746826171875, 0.079345703125, 0.086944580078125, 0.09454345703125, 0.102142333984375, 0.1097412109375, 0.117340087890625, 0.12493896484375, 0.132537841796875, 0.14013671875, 0.147735595703125, 0.15533447265625, 0.162933349609375, 0.1705322265625, 0.178131103515625, 0.18572998046875, 0.193328857421875, 0.200927734375, 0.208526611328125, 0.21612548828125, 0.223724365234375, 0.2313232421875, 0.238922119140625, 0.24652099609375, 0.254119873046875, 0.26171875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 4.0, 5.0, 5.0, 4.0, 15.0, 12.0, 21.0, 50.0, 158.0, 332.0, 229.0, 75.0, 30.0, 11.0, 10.0, 5.0, 4.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05517578125, -0.05362272262573242, -0.052069664001464844, -0.050516605377197266, -0.04896354675292969, -0.04741048812866211, -0.04585742950439453, -0.04430437088012695, -0.042751312255859375, -0.0411982536315918, -0.03964519500732422, -0.03809213638305664, -0.03653907775878906, -0.034986019134521484, -0.033432960510253906, -0.03187990188598633, -0.03032684326171875, -0.028773784637451172, -0.027220726013183594, -0.025667667388916016, -0.024114608764648438, -0.02256155014038086, -0.02100849151611328, -0.019455432891845703, -0.017902374267578125, -0.016349315643310547, -0.014796257019042969, -0.01324319839477539, -0.011690139770507812, -0.010137081146240234, -0.008584022521972656, -0.007030963897705078, -0.0054779052734375, -0.003924846649169922, -0.0023717880249023438, -0.0008187294006347656, 0.0007343292236328125, 0.0022873878479003906, 0.0038404464721679688, 0.005393505096435547, 0.006946563720703125, 0.008499622344970703, 0.010052680969238281, 0.01160573959350586, 0.013158798217773438, 0.014711856842041016, 0.016264915466308594, 0.017817974090576172, 0.01937103271484375, 0.020924091339111328, 0.022477149963378906, 0.024030208587646484, 0.025583267211914062, 0.02713632583618164, 0.02868938446044922, 0.030242443084716797, 0.031795501708984375, 0.03334856033325195, 0.03490161895751953, 0.03645467758178711, 0.03800773620605469, 0.039560794830322266, 0.041113853454589844, 0.04266691207885742, 0.044219970703125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 2.0, 7.0, 11.0, 9.0, 12.0, 26.0, 41.0, 59.0, 106.0, 218.0, 540.0, 1660.0, 7799.0, 67616.0, 844158.0, 112145.0, 10761.0, 2151.0, 680.0, 251.0, 117.0, 63.0, 36.0, 26.0, 16.0, 8.0, 4.0, 10.0, 13.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47705078125, -0.4628486633300781, -0.44864654541015625, -0.4344444274902344, -0.4202423095703125, -0.4060401916503906, -0.39183807373046875, -0.3776359558105469, -0.363433837890625, -0.3492317199707031, -0.33502960205078125, -0.3208274841308594, -0.3066253662109375, -0.2924232482910156, -0.27822113037109375, -0.2640190124511719, -0.24981689453125, -0.23561477661132812, -0.22141265869140625, -0.20721054077148438, -0.1930084228515625, -0.17880630493164062, -0.16460418701171875, -0.15040206909179688, -0.136199951171875, -0.12199783325195312, -0.10779571533203125, -0.09359359741210938, -0.0793914794921875, -0.06518936157226562, -0.05098724365234375, -0.036785125732421875, -0.0225830078125, -0.008380889892578125, 0.00582122802734375, 0.020023345947265625, 0.0342254638671875, 0.048427581787109375, 0.06262969970703125, 0.07683181762695312, 0.091033935546875, 0.10523605346679688, 0.11943817138671875, 0.13364028930664062, 0.1478424072265625, 0.16204452514648438, 0.17624664306640625, 0.19044876098632812, 0.20465087890625, 0.21885299682617188, 0.23305511474609375, 0.24725723266601562, 0.2614593505859375, 0.2756614685058594, 0.28986358642578125, 0.3040657043457031, 0.318267822265625, 0.3324699401855469, 0.34667205810546875, 0.3608741760253906, 0.3750762939453125, 0.3892784118652344, 0.40348052978515625, 0.4176826477050781, 0.431884765625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 3.0, 5.0, 4.0, 3.0, 9.0, 10.0, 11.0, 9.0, 20.0, 20.0, 18.0, 27.0, 18.0, 36.0, 27.0, 23.0, 41.0, 35.0, 37.0, 34.0, 45.0, 42.0, 31.0, 33.0, 46.0, 43.0, 44.0, 46.0, 32.0, 33.0, 28.0, 22.0, 34.0, 16.0, 23.0, 23.0, 10.0, 20.0, 13.0, 4.0, 11.0, 2.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1571044921875, -0.15178489685058594, -0.14646530151367188, -0.1411457061767578, -0.13582611083984375, -0.1305065155029297, -0.12518692016601562, -0.11986732482910156, -0.1145477294921875, -0.10922813415527344, -0.10390853881835938, -0.09858894348144531, -0.09326934814453125, -0.08794975280761719, -0.08263015747070312, -0.07731056213378906, -0.071990966796875, -0.06667137145996094, -0.061351776123046875, -0.05603218078613281, -0.05071258544921875, -0.04539299011230469, -0.040073394775390625, -0.03475379943847656, -0.0294342041015625, -0.024114608764648438, -0.018795013427734375, -0.013475418090820312, -0.00815582275390625, -0.0028362274169921875, 0.002483367919921875, 0.0078029632568359375, 0.01312255859375, 0.018442153930664062, 0.023761749267578125, 0.029081344604492188, 0.03440093994140625, 0.03972053527832031, 0.045040130615234375, 0.05035972595214844, 0.0556793212890625, 0.06099891662597656, 0.06631851196289062, 0.07163810729980469, 0.07695770263671875, 0.08227729797363281, 0.08759689331054688, 0.09291648864746094, 0.098236083984375, 0.10355567932128906, 0.10887527465820312, 0.11419486999511719, 0.11951446533203125, 0.12483406066894531, 0.13015365600585938, 0.13547325134277344, 0.1407928466796875, 0.14611244201660156, 0.15143203735351562, 0.1567516326904297, 0.16207122802734375, 0.1673908233642578, 0.17271041870117188, 0.17803001403808594, 0.183349609375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 6.0, 4.0, 7.0, 6.0, 5.0, 13.0, 16.0, 24.0, 32.0, 46.0, 59.0, 72.0, 128.0, 200.0, 366.0, 613.0, 1093.0, 2227.0, 6290.0, 38004.0, 927846.0, 58286.0, 7846.0, 2529.0, 1154.0, 600.0, 369.0, 225.0, 138.0, 109.0, 70.0, 50.0, 28.0, 25.0, 14.0, 8.0, 9.0, 7.0, 7.0, 5.0, 5.0, 6.0, 6.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.37060546875, -0.3601875305175781, -0.34976959228515625, -0.3393516540527344, -0.3289337158203125, -0.3185157775878906, -0.30809783935546875, -0.2976799011230469, -0.287261962890625, -0.2768440246582031, -0.26642608642578125, -0.2560081481933594, -0.2455902099609375, -0.23517227172851562, -0.22475433349609375, -0.21433639526367188, -0.20391845703125, -0.19350051879882812, -0.18308258056640625, -0.17266464233398438, -0.1622467041015625, -0.15182876586914062, -0.14141082763671875, -0.13099288940429688, -0.120574951171875, -0.11015701293945312, -0.09973907470703125, -0.08932113647460938, -0.0789031982421875, -0.06848526000976562, -0.05806732177734375, -0.047649383544921875, -0.0372314453125, -0.026813507080078125, -0.01639556884765625, -0.005977630615234375, 0.0044403076171875, 0.014858245849609375, 0.02527618408203125, 0.035694122314453125, 0.046112060546875, 0.056529998779296875, 0.06694793701171875, 0.07736587524414062, 0.0877838134765625, 0.09820175170898438, 0.10861968994140625, 0.11903762817382812, 0.12945556640625, 0.13987350463867188, 0.15029144287109375, 0.16070938110351562, 0.1711273193359375, 0.18154525756835938, 0.19196319580078125, 0.20238113403320312, 0.212799072265625, 0.22321701049804688, 0.23363494873046875, 0.24405288696289062, 0.2544708251953125, 0.2648887634277344, 0.27530670166015625, 0.2857246398925781, 0.296142578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 8.0, 10.0, 7.0, 22.0, 23.0, 46.0, 72.0, 166.0, 354.0, 95.0, 55.0, 33.0, 32.0, 17.0, 11.0, 6.0, 6.0, 7.0, 4.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027408599853515625, -0.0026322901248931885, -0.0025237202644348145, -0.0024151504039764404, -0.0023065805435180664, -0.0021980106830596924, -0.0020894408226013184, -0.0019808709621429443, -0.0018723011016845703, -0.0017637312412261963, -0.0016551613807678223, -0.0015465915203094482, -0.0014380216598510742, -0.0013294517993927002, -0.0012208819389343262, -0.0011123120784759521, -0.0010037422180175781, -0.0008951723575592041, -0.0007866024971008301, -0.0006780326366424561, -0.000569462776184082, -0.000460892915725708, -0.000352323055267334, -0.00024375319480895996, -0.00013518333435058594, -2.6613473892211914e-05, 8.195638656616211e-05, 0.00019052624702453613, 0.00029909610748291016, 0.0004076659679412842, 0.0005162358283996582, 0.0006248056888580322, 0.0007333755493164062, 0.0008419454097747803, 0.0009505152702331543, 0.0010590851306915283, 0.0011676549911499023, 0.0012762248516082764, 0.0013847947120666504, 0.0014933645725250244, 0.0016019344329833984, 0.0017105042934417725, 0.0018190741539001465, 0.0019276440143585205, 0.0020362138748168945, 0.0021447837352752686, 0.0022533535957336426, 0.0023619234561920166, 0.0024704933166503906, 0.0025790631771087646, 0.0026876330375671387, 0.0027962028980255127, 0.0029047727584838867, 0.0030133426189422607, 0.0031219124794006348, 0.003230482339859009, 0.003339052200317383, 0.003447622060775757, 0.003556191921234131, 0.003664761781692505, 0.003773331642150879, 0.003881901502609253, 0.003990471363067627, 0.004099041223526001, 0.004207611083984375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 8.0, 8.0, 4.0, 14.0, 19.0, 14.0, 24.0, 37.0, 46.0, 65.0, 91.0, 126.0, 209.0, 283.0, 458.0, 713.0, 1216.0, 2078.0, 3726.0, 7742.0, 17547.0, 52170.0, 308153.0, 536997.0, 75093.0, 22438.0, 8983.0, 4202.0, 2293.0, 1324.0, 784.0, 511.0, 342.0, 214.0, 183.0, 118.0, 100.0, 60.0, 32.0, 30.0, 26.0, 15.0, 24.0, 13.0, 4.0, 8.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.136474609375, -0.132354736328125, -0.12823486328125, -0.124114990234375, -0.1199951171875, -0.115875244140625, -0.11175537109375, -0.107635498046875, -0.103515625, -0.099395751953125, -0.09527587890625, -0.091156005859375, -0.0870361328125, -0.082916259765625, -0.07879638671875, -0.074676513671875, -0.070556640625, -0.066436767578125, -0.06231689453125, -0.058197021484375, -0.0540771484375, -0.049957275390625, -0.04583740234375, -0.041717529296875, -0.03759765625, -0.033477783203125, -0.02935791015625, -0.025238037109375, -0.0211181640625, -0.016998291015625, -0.01287841796875, -0.008758544921875, -0.004638671875, -0.000518798828125, 0.00360107421875, 0.007720947265625, 0.0118408203125, 0.015960693359375, 0.02008056640625, 0.024200439453125, 0.0283203125, 0.032440185546875, 0.03656005859375, 0.040679931640625, 0.0447998046875, 0.048919677734375, 0.05303955078125, 0.057159423828125, 0.061279296875, 0.065399169921875, 0.06951904296875, 0.073638916015625, 0.0777587890625, 0.081878662109375, 0.08599853515625, 0.090118408203125, 0.09423828125, 0.098358154296875, 0.10247802734375, 0.106597900390625, 0.1107177734375, 0.114837646484375, 0.11895751953125, 0.123077392578125, 0.127197265625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 7.0, 8.0, 6.0, 6.0, 7.0, 8.0, 10.0, 11.0, 13.0, 17.0, 33.0, 17.0, 33.0, 44.0, 57.0, 94.0, 93.0, 77.0, 88.0, 61.0, 62.0, 46.0, 37.0, 32.0, 32.0, 21.0, 20.0, 18.0, 11.0, 7.0, 4.0, 6.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1636962890625, -0.1591930389404297, -0.15468978881835938, -0.15018653869628906, -0.14568328857421875, -0.14118003845214844, -0.13667678833007812, -0.1321735382080078, -0.1276702880859375, -0.12316703796386719, -0.11866378784179688, -0.11416053771972656, -0.10965728759765625, -0.10515403747558594, -0.10065078735351562, -0.09614753723144531, -0.091644287109375, -0.08714103698730469, -0.08263778686523438, -0.07813453674316406, -0.07363128662109375, -0.06912803649902344, -0.06462478637695312, -0.06012153625488281, -0.0556182861328125, -0.05111503601074219, -0.046611785888671875, -0.04210853576660156, -0.03760528564453125, -0.03310203552246094, -0.028598785400390625, -0.024095535278320312, -0.01959228515625, -0.015089035034179688, -0.010585784912109375, -0.0060825347900390625, -0.00157928466796875, 0.0029239654541015625, 0.007427215576171875, 0.011930465698242188, 0.0164337158203125, 0.020936965942382812, 0.025440216064453125, 0.029943466186523438, 0.03444671630859375, 0.03894996643066406, 0.043453216552734375, 0.04795646667480469, 0.052459716796875, 0.05696296691894531, 0.061466217041015625, 0.06596946716308594, 0.07047271728515625, 0.07497596740722656, 0.07947921752929688, 0.08398246765136719, 0.0884857177734375, 0.09298896789550781, 0.09749221801757812, 0.10199546813964844, 0.10649871826171875, 0.11100196838378906, 0.11550521850585938, 0.12000846862792969, 0.12451171875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 8.0, 35.0, 288.0, 468.0, 122.0, 38.0, 16.0, 14.0, 7.0, 6.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.625552654266357, -5.473827362060547, -5.322101593017578, -5.170376300811768, -5.018650531768799, -4.866925239562988, -4.7151994705200195, -4.563474178314209, -4.411748886108398, -4.260023593902588, -4.108297824859619, -3.9565722942352295, -3.80484676361084, -3.6531214714050293, -3.5013959407806396, -3.34967041015625, -3.1979446411132812, -3.0462191104888916, -2.894493579864502, -2.7427680492401123, -2.5910425186157227, -2.439317226409912, -2.2875916957855225, -2.135866165161133, -1.9841406345367432, -1.8324151039123535, -1.6806895732879639, -1.5289641618728638, -1.3772386312484741, -1.2255131006240845, -1.0737876892089844, -0.9220621585845947, -0.7703366279602051, -0.6186110973358154, -0.46688562631607056, -0.3151601254940033, -0.16343462467193604, -0.011709094047546387, 0.1400163769721985, 0.29174184799194336, 0.443467378616333, 0.5951929092407227, 0.7469183802604675, 0.8986438512802124, 1.050369381904602, 1.2020949125289917, 1.3538203239440918, 1.5055458545684814, 1.657271385192871, 1.8089969158172607, 1.9607224464416504, 2.11244797706604, 2.2641735076904297, 2.4158987998962402, 2.56762433052063, 2.7193498611450195, 2.871075391769409, 3.022800922393799, 3.1745264530181885, 3.326251983642578, 3.4779772758483887, 3.6297030448913574, 3.781428337097168, 3.9331538677215576, 4.084879398345947]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 6.0, 2.0, 6.0, 3.0, 7.0, 13.0, 26.0, 40.0, 63.0, 84.0, 123.0, 141.0, 140.0, 97.0, 90.0, 57.0, 28.0, 22.0, 13.0, 6.0, 2.0, 7.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-3.130622625350952, -3.0262396335601807, -2.9218568801879883, -2.817473888397217, -2.7130911350250244, -2.608708143234253, -2.5043253898620605, -2.399942398071289, -2.2955594062805176, -2.191176414489746, -2.0867936611175537, -1.9824106693267822, -1.8780279159545898, -1.7736449241638184, -1.6692620515823364, -1.5648791790008545, -1.460496425628662, -1.3561135530471802, -1.2517306804656982, -1.1473476886749268, -1.0429649353027344, -0.9385820031166077, -0.834199070930481, -0.729816198348999, -0.6254333257675171, -0.5210504531860352, -0.41666755080223083, -0.3122846484184265, -0.20790177583694458, -0.10351890325546265, 0.0008640289306640625, 0.105246901512146, 0.20962977409362793, 0.31401264667510986, 0.4183955490589142, 0.5227784514427185, 0.6271613240242004, 0.7315441966056824, 0.8359271287918091, 0.940310001373291, 1.044692873954773, 1.1490757465362549, 1.2534586191177368, 1.3578414916992188, 1.4622244834899902, 1.5666072368621826, 1.670990228652954, 1.775373101234436, 1.879755973815918, 1.9841388463974, 2.088521718978882, 2.1929047107696533, 2.2972874641418457, 2.401670455932617, 2.5060534477233887, 2.610436201095581, 2.7148189544677734, 2.819201946258545, 2.9235846996307373, 3.027967691421509, 3.132350444793701, 3.2367334365844727, 3.341116428375244, 3.4454991817474365, 3.549882173538208]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 6.0, 11.0, 10.0, 19.0, 28.0, 69.0, 133.0, 399.0, 1411.0, 8174.0, 3873327.0, 304272.0, 4911.0, 941.0, 321.0, 135.0, 55.0, 30.0, 11.0, 4.0, 12.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.134765625, -2.088287353515625, -2.04180908203125, -1.995330810546875, -1.9488525390625, -1.902374267578125, -1.85589599609375, -1.809417724609375, -1.762939453125, -1.716461181640625, -1.66998291015625, -1.623504638671875, -1.5770263671875, -1.530548095703125, -1.48406982421875, -1.437591552734375, -1.39111328125, -1.344635009765625, -1.29815673828125, -1.251678466796875, -1.2052001953125, -1.158721923828125, -1.11224365234375, -1.065765380859375, -1.019287109375, -0.972808837890625, -0.92633056640625, -0.879852294921875, -0.8333740234375, -0.786895751953125, -0.74041748046875, -0.693939208984375, -0.6474609375, -0.600982666015625, -0.55450439453125, -0.508026123046875, -0.4615478515625, -0.415069580078125, -0.36859130859375, -0.322113037109375, -0.275634765625, -0.229156494140625, -0.18267822265625, -0.136199951171875, -0.0897216796875, -0.043243408203125, 0.00323486328125, 0.049713134765625, 0.09619140625, 0.142669677734375, 0.18914794921875, 0.235626220703125, 0.2821044921875, 0.328582763671875, 0.37506103515625, 0.421539306640625, 0.468017578125, 0.514495849609375, 0.56097412109375, 0.607452392578125, 0.6539306640625, 0.700408935546875, 0.74688720703125, 0.793365478515625, 0.83984375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 3.0, 5.0, 7.0, 13.0, 16.0, 16.0, 22.0, 38.0, 72.0, 113.0, 160.0, 170.0, 127.0, 73.0, 55.0, 32.0, 20.0, 10.0, 7.0, 8.0, 7.0, 2.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034576416015625, -0.033463478088378906, -0.03235054016113281, -0.03123760223388672, -0.030124664306640625, -0.02901172637939453, -0.027898788452148438, -0.026785850524902344, -0.02567291259765625, -0.024559974670410156, -0.023447036743164062, -0.02233409881591797, -0.021221160888671875, -0.02010822296142578, -0.018995285034179688, -0.017882347106933594, -0.0167694091796875, -0.015656471252441406, -0.014543533325195312, -0.013430595397949219, -0.012317657470703125, -0.011204719543457031, -0.010091781616210938, -0.008978843688964844, -0.00786590576171875, -0.006752967834472656, -0.0056400299072265625, -0.004527091979980469, -0.003414154052734375, -0.0023012161254882812, -0.0011882781982421875, -7.534027099609375e-05, 0.00103759765625, 0.0021505355834960938, 0.0032634735107421875, 0.004376411437988281, 0.005489349365234375, 0.006602287292480469, 0.0077152252197265625, 0.008828163146972656, 0.00994110107421875, 0.011054039001464844, 0.012166976928710938, 0.013279914855957031, 0.014392852783203125, 0.015505790710449219, 0.016618728637695312, 0.017731666564941406, 0.0188446044921875, 0.019957542419433594, 0.021070480346679688, 0.02218341827392578, 0.023296356201171875, 0.02440929412841797, 0.025522232055664062, 0.026635169982910156, 0.02774810791015625, 0.028861045837402344, 0.029973983764648438, 0.03108692169189453, 0.032199859619140625, 0.03331279754638672, 0.03442573547363281, 0.035538673400878906, 0.036651611328125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 9.0, 13.0, 17.0, 41.0, 80.0, 142.0, 350.0, 697.0, 1549.0, 4021.0, 11684.0, 53695.0, 3676558.0, 400740.0, 30979.0, 8265.0, 2945.0, 1264.0, 627.0, 313.0, 133.0, 79.0, 39.0, 24.0, 11.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2490234375, -0.2350616455078125, -0.221099853515625, -0.2071380615234375, -0.19317626953125, -0.1792144775390625, -0.165252685546875, -0.1512908935546875, -0.1373291015625, -0.1233673095703125, -0.109405517578125, -0.0954437255859375, -0.08148193359375, -0.0675201416015625, -0.053558349609375, -0.0395965576171875, -0.025634765625, -0.0116729736328125, 0.002288818359375, 0.0162506103515625, 0.03021240234375, 0.0441741943359375, 0.058135986328125, 0.0720977783203125, 0.0860595703125, 0.1000213623046875, 0.113983154296875, 0.1279449462890625, 0.14190673828125, 0.1558685302734375, 0.169830322265625, 0.1837921142578125, 0.19775390625, 0.2117156982421875, 0.225677490234375, 0.2396392822265625, 0.25360107421875, 0.2675628662109375, 0.281524658203125, 0.2954864501953125, 0.3094482421875, 0.3234100341796875, 0.337371826171875, 0.3513336181640625, 0.36529541015625, 0.3792572021484375, 0.393218994140625, 0.4071807861328125, 0.421142578125, 0.4351043701171875, 0.449066162109375, 0.4630279541015625, 0.47698974609375, 0.4909515380859375, 0.504913330078125, 0.5188751220703125, 0.5328369140625, 0.5467987060546875, 0.560760498046875, 0.5747222900390625, 0.58868408203125, 0.6026458740234375, 0.616607666015625, 0.6305694580078125, 0.64453125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 4.0, 6.0, 1.0, 9.0, 9.0, 13.0, 18.0, 34.0, 49.0, 72.0, 126.0, 337.0, 1952.0, 1033.0, 157.0, 79.0, 36.0, 33.0, 18.0, 17.0, 15.0, 14.0, 10.0, 10.0, 3.0, 4.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053497314453125, -0.05150556564331055, -0.049513816833496094, -0.04752206802368164, -0.04553031921386719, -0.043538570404052734, -0.04154682159423828, -0.03955507278442383, -0.037563323974609375, -0.03557157516479492, -0.03357982635498047, -0.031588077545166016, -0.029596328735351562, -0.02760457992553711, -0.025612831115722656, -0.023621082305908203, -0.02162933349609375, -0.019637584686279297, -0.017645835876464844, -0.01565408706665039, -0.013662338256835938, -0.011670589447021484, -0.009678840637207031, -0.007687091827392578, -0.005695343017578125, -0.003703594207763672, -0.0017118453979492188, 0.0002799034118652344, 0.0022716522216796875, 0.004263401031494141, 0.006255149841308594, 0.008246898651123047, 0.0102386474609375, 0.012230396270751953, 0.014222145080566406, 0.01621389389038086, 0.018205642700195312, 0.020197391510009766, 0.02218914031982422, 0.024180889129638672, 0.026172637939453125, 0.028164386749267578, 0.03015613555908203, 0.032147884368896484, 0.03413963317871094, 0.03613138198852539, 0.038123130798339844, 0.0401148796081543, 0.04210662841796875, 0.0440983772277832, 0.046090126037597656, 0.04808187484741211, 0.05007362365722656, 0.052065372467041016, 0.05405712127685547, 0.05604887008666992, 0.058040618896484375, 0.06003236770629883, 0.06202411651611328, 0.06401586532592773, 0.06600761413574219, 0.06799936294555664, 0.0699911117553711, 0.07198286056518555, 0.073974609375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 4.0, 10.0, 25.0, 54.0, 649.0, 237.0, 25.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.913608968257904, -0.8558057546615601, -0.7980024814605713, -0.7401992678642273, -0.6823960542678833, -0.6245927810668945, -0.5667895674705505, -0.5089863538742065, -0.45118311047554016, -0.3933798670768738, -0.3355766534805298, -0.2777734100818634, -0.21997018158435822, -0.16216695308685303, -0.10436370968818665, -0.04656049609184265, 0.01124274730682373, 0.06904597580432892, 0.1268492043018341, 0.1846524477005005, 0.24245567619800568, 0.30025890469551086, 0.35806214809417725, 0.41586536169052124, 0.4736686050891876, 0.531471848487854, 0.589275062084198, 0.647078275680542, 0.7048815488815308, 0.7626847624778748, 0.8204879760742188, 0.8782912492752075, 0.9360944032669067, 0.9938976168632507, 1.0517008304595947, 1.1095041036605835, 1.1673073768615723, 1.2251105308532715, 1.2829138040542603, 1.340717077255249, 1.3985202312469482, 1.456323504447937, 1.5141266584396362, 1.571929931640625, 1.6297332048416138, 1.687536358833313, 1.7453396320343018, 1.803142786026001, 1.8609461784362793, 1.918749451637268, 1.9765526056289673, 2.034355878829956, 2.0921590328216553, 2.1499624252319336, 2.207765579223633, 2.265568733215332, 2.3233718872070312, 2.3811750411987305, 2.438978433609009, 2.496781587600708, 2.5545847415924072, 2.6123881340026855, 2.6701912879943848, 2.727994441986084, 2.7857978343963623]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 6.0, 8.0, 10.0, 18.0, 10.0, 30.0, 38.0, 38.0, 72.0, 71.0, 67.0, 94.0, 98.0, 92.0, 67.0, 77.0, 65.0, 33.0, 28.0, 15.0, 16.0, 14.0, 4.0, 5.0, 5.0, 3.0, 2.0, 5.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.36985695362091064, -0.3587307333946228, -0.34760454297065735, -0.3364783227443695, -0.32535210251808167, -0.3142258822917938, -0.30309969186782837, -0.2919734716415405, -0.2808472514152527, -0.26972103118896484, -0.2585948407649994, -0.24746862053871155, -0.2363424003124237, -0.22521619498729706, -0.2140899896621704, -0.20296376943588257, -0.19183756411075592, -0.18071135878562927, -0.16958513855934143, -0.15845893323421478, -0.14733271300792694, -0.1362065076828003, -0.12508028745651245, -0.1139540821313858, -0.10282786935567856, -0.09170165657997131, -0.08057544380426407, -0.06944923102855682, -0.05832302197813988, -0.04719680920243263, -0.036070600152015686, -0.02494438737630844, -0.013818174600601196, -0.002691962756216526, 0.008434249088168144, 0.01956046000123024, 0.030686672776937485, 0.04181288555264473, 0.052939094603061676, 0.06406530737876892, 0.07519152015447617, 0.08631773293018341, 0.09744394570589066, 0.1085701584815979, 0.11969636380672455, 0.1308225840330124, 0.14194878935813904, 0.15307500958442688, 0.16420121490955353, 0.17532742023468018, 0.18645364046096802, 0.19757984578609467, 0.2087060660123825, 0.21983227133750916, 0.230958491563797, 0.24208469688892365, 0.2532109022140503, 0.26433712244033813, 0.2754633128643036, 0.28658953309059143, 0.2977157533168793, 0.3088419735431671, 0.31996816396713257, 0.3310943841934204, 0.34222060441970825]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 10.0, 9.0, 22.0, 20.0, 32.0, 29.0, 57.0, 87.0, 123.0, 172.0, 275.0, 363.0, 665.0, 980.0, 1647.0, 2619.0, 4718.0, 9049.0, 19721.0, 55210.0, 250457.0, 544867.0, 99547.0, 30051.0, 12597.0, 6331.0, 3467.0, 1931.0, 1251.0, 737.0, 474.0, 326.0, 232.0, 159.0, 94.0, 65.0, 48.0, 32.0, 23.0, 17.0, 15.0, 11.0, 7.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1348876953125, -0.13027191162109375, -0.1256561279296875, -0.12104034423828125, -0.116424560546875, -0.11180877685546875, -0.1071929931640625, -0.10257720947265625, -0.09796142578125, -0.09334564208984375, -0.0887298583984375, -0.08411407470703125, -0.079498291015625, -0.07488250732421875, -0.0702667236328125, -0.06565093994140625, -0.06103515625, -0.05641937255859375, -0.0518035888671875, -0.04718780517578125, -0.042572021484375, -0.03795623779296875, -0.0333404541015625, -0.02872467041015625, -0.02410888671875, -0.01949310302734375, -0.0148773193359375, -0.01026153564453125, -0.005645751953125, -0.00102996826171875, 0.0035858154296875, 0.00820159912109375, 0.0128173828125, 0.01743316650390625, 0.0220489501953125, 0.02666473388671875, 0.031280517578125, 0.03589630126953125, 0.0405120849609375, 0.04512786865234375, 0.04974365234375, 0.05435943603515625, 0.0589752197265625, 0.06359100341796875, 0.068206787109375, 0.07282257080078125, 0.0774383544921875, 0.08205413818359375, 0.086669921875, 0.09128570556640625, 0.0959014892578125, 0.10051727294921875, 0.105133056640625, 0.10974884033203125, 0.1143646240234375, 0.11898040771484375, 0.12359619140625, 0.12821197509765625, 0.1328277587890625, 0.13744354248046875, 0.142059326171875, 0.14667510986328125, 0.1512908935546875, 0.15590667724609375, 0.1605224609375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 4.0, 6.0, 5.0, 1.0, 11.0, 7.0, 19.0, 9.0, 16.0, 18.0, 48.0, 50.0, 79.0, 93.0, 118.0, 118.0, 93.0, 82.0, 62.0, 44.0, 30.0, 19.0, 12.0, 20.0, 6.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0279998779296875, -0.027262449264526367, -0.026525020599365234, -0.0257875919342041, -0.02505016326904297, -0.024312734603881836, -0.023575305938720703, -0.02283787727355957, -0.022100448608398438, -0.021363019943237305, -0.020625591278076172, -0.01988816261291504, -0.019150733947753906, -0.018413305282592773, -0.01767587661743164, -0.016938447952270508, -0.016201019287109375, -0.015463590621948242, -0.01472616195678711, -0.013988733291625977, -0.013251304626464844, -0.012513875961303711, -0.011776447296142578, -0.011039018630981445, -0.010301589965820312, -0.00956416130065918, -0.008826732635498047, -0.008089303970336914, -0.007351875305175781, -0.0066144466400146484, -0.005877017974853516, -0.005139589309692383, -0.00440216064453125, -0.003664731979370117, -0.0029273033142089844, -0.0021898746490478516, -0.0014524459838867188, -0.0007150173187255859, 2.2411346435546875e-05, 0.0007598400115966797, 0.0014972686767578125, 0.0022346973419189453, 0.002972126007080078, 0.003709554672241211, 0.004446983337402344, 0.0051844120025634766, 0.005921840667724609, 0.006659269332885742, 0.007396697998046875, 0.008134126663208008, 0.00887155532836914, 0.009608983993530273, 0.010346412658691406, 0.011083841323852539, 0.011821269989013672, 0.012558698654174805, 0.013296127319335938, 0.01403355598449707, 0.014770984649658203, 0.015508413314819336, 0.01624584197998047, 0.0169832706451416, 0.017720699310302734, 0.018458127975463867, 0.019195556640625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 5.0, 6.0, 5.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 11.0, 21.0, 46.0, 313.0, 2559.0, 34654.0, 831124.0, 170656.0, 8174.0, 763.0, 115.0, 22.0, 12.0, 6.0, 3.0, 7.0, 4.0, 5.0, 2.0, 6.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.44482421875, -0.4303550720214844, -0.41588592529296875, -0.4014167785644531, -0.3869476318359375, -0.3724784851074219, -0.35800933837890625, -0.3435401916503906, -0.329071044921875, -0.3146018981933594, -0.30013275146484375, -0.2856636047363281, -0.2711944580078125, -0.2567253112792969, -0.24225616455078125, -0.22778701782226562, -0.21331787109375, -0.19884872436523438, -0.18437957763671875, -0.16991043090820312, -0.1554412841796875, -0.14097213745117188, -0.12650299072265625, -0.11203384399414062, -0.097564697265625, -0.08309555053710938, -0.06862640380859375, -0.054157257080078125, -0.0396881103515625, -0.025218963623046875, -0.01074981689453125, 0.003719329833984375, 0.0181884765625, 0.032657623291015625, 0.04712677001953125, 0.061595916748046875, 0.0760650634765625, 0.09053421020507812, 0.10500335693359375, 0.11947250366210938, 0.133941650390625, 0.14841079711914062, 0.16287994384765625, 0.17734909057617188, 0.1918182373046875, 0.20628738403320312, 0.22075653076171875, 0.23522567749023438, 0.24969482421875, 0.2641639709472656, 0.27863311767578125, 0.2931022644042969, 0.3075714111328125, 0.3220405578613281, 0.33650970458984375, 0.3509788513183594, 0.365447998046875, 0.3799171447753906, 0.39438629150390625, 0.4088554382324219, 0.4233245849609375, 0.4377937316894531, 0.45226287841796875, 0.4667320251464844, 0.481201171875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 5.0, 2.0, 4.0, 7.0, 12.0, 11.0, 5.0, 10.0, 15.0, 21.0, 23.0, 22.0, 32.0, 26.0, 28.0, 30.0, 40.0, 39.0, 41.0, 42.0, 50.0, 39.0, 38.0, 48.0, 47.0, 41.0, 41.0, 30.0, 31.0, 33.0, 32.0, 30.0, 18.0, 25.0, 19.0, 13.0, 13.0, 7.0, 8.0, 6.0, 4.0, 9.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.09954833984375, -0.0966033935546875, -0.093658447265625, -0.0907135009765625, -0.0877685546875, -0.0848236083984375, -0.081878662109375, -0.0789337158203125, -0.07598876953125, -0.0730438232421875, -0.070098876953125, -0.0671539306640625, -0.064208984375, -0.0612640380859375, -0.058319091796875, -0.0553741455078125, -0.05242919921875, -0.0494842529296875, -0.046539306640625, -0.0435943603515625, -0.0406494140625, -0.0377044677734375, -0.034759521484375, -0.0318145751953125, -0.02886962890625, -0.0259246826171875, -0.022979736328125, -0.0200347900390625, -0.01708984375, -0.0141448974609375, -0.011199951171875, -0.0082550048828125, -0.00531005859375, -0.0023651123046875, 0.000579833984375, 0.0035247802734375, 0.0064697265625, 0.0094146728515625, 0.012359619140625, 0.0153045654296875, 0.01824951171875, 0.0211944580078125, 0.024139404296875, 0.0270843505859375, 0.030029296875, 0.0329742431640625, 0.035919189453125, 0.0388641357421875, 0.04180908203125, 0.0447540283203125, 0.047698974609375, 0.0506439208984375, 0.0535888671875, 0.0565338134765625, 0.059478759765625, 0.0624237060546875, 0.06536865234375, 0.0683135986328125, 0.071258544921875, 0.0742034912109375, 0.0771484375, 0.0800933837890625, 0.083038330078125, 0.0859832763671875, 0.08892822265625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 6.0, 11.0, 18.0, 26.0, 37.0, 285.0, 10549.0, 1036675.0, 778.0, 95.0, 25.0, 11.0, 11.0, 7.0, 5.0, 6.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.697265625, -3.592254638671875, -3.48724365234375, -3.382232666015625, -3.2772216796875, -3.172210693359375, -3.06719970703125, -2.962188720703125, -2.857177734375, -2.752166748046875, -2.64715576171875, -2.542144775390625, -2.4371337890625, -2.332122802734375, -2.22711181640625, -2.122100830078125, -2.01708984375, -1.912078857421875, -1.80706787109375, -1.702056884765625, -1.5970458984375, -1.492034912109375, -1.38702392578125, -1.282012939453125, -1.177001953125, -1.071990966796875, -0.96697998046875, -0.861968994140625, -0.7569580078125, -0.651947021484375, -0.54693603515625, -0.441925048828125, -0.3369140625, -0.231903076171875, -0.12689208984375, -0.021881103515625, 0.0831298828125, 0.188140869140625, 0.29315185546875, 0.398162841796875, 0.503173828125, 0.608184814453125, 0.71319580078125, 0.818206787109375, 0.9232177734375, 1.028228759765625, 1.13323974609375, 1.238250732421875, 1.34326171875, 1.448272705078125, 1.55328369140625, 1.658294677734375, 1.7633056640625, 1.868316650390625, 1.97332763671875, 2.078338623046875, 2.183349609375, 2.288360595703125, 2.39337158203125, 2.498382568359375, 2.6033935546875, 2.708404541015625, 2.81341552734375, 2.918426513671875, 3.0234375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 5.0, 1.0, 2.0, 4.0, 7.0, 15.0, 12.0, 21.0, 22.0, 23.0, 51.0, 101.0, 223.0, 194.0, 135.0, 70.0, 32.0, 20.0, 11.0, 8.0, 9.0, 7.0, 6.0, 6.0, 7.0, 4.0, 0.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007166862487792969, -0.0006956830620765686, -0.0006746798753738403, -0.0006536766886711121, -0.0006326735019683838, -0.0006116703152656555, -0.0005906671285629272, -0.000569663941860199, -0.0005486607551574707, -0.0005276575684547424, -0.0005066543817520142, -0.0004856511950492859, -0.0004646480083465576, -0.00044364482164382935, -0.0004226416349411011, -0.0004016384482383728, -0.00038063526153564453, -0.00035963207483291626, -0.000338628888130188, -0.0003176257014274597, -0.00029662251472473145, -0.0002756193280220032, -0.0002546161413192749, -0.00023361295461654663, -0.00021260976791381836, -0.0001916065812110901, -0.00017060339450836182, -0.00014960020780563354, -0.00012859702110290527, -0.000107593834400177, -8.659064769744873e-05, -6.558746099472046e-05, -4.458427429199219e-05, -2.3581087589263916e-05, -2.5779008865356445e-06, 1.8425285816192627e-05, 3.94284725189209e-05, 6.043165922164917e-05, 8.143484592437744e-05, 0.00010243803262710571, 0.00012344121932983398, 0.00014444440603256226, 0.00016544759273529053, 0.0001864507794380188, 0.00020745396614074707, 0.00022845715284347534, 0.0002494603395462036, 0.0002704635262489319, 0.00029146671295166016, 0.00031246989965438843, 0.0003334730863571167, 0.00035447627305984497, 0.00037547945976257324, 0.0003964826464653015, 0.0004174858331680298, 0.00043848901987075806, 0.00045949220657348633, 0.0004804953932762146, 0.0005014985799789429, 0.0005225017666816711, 0.0005435049533843994, 0.0005645081400871277, 0.000585511326789856, 0.0006065145134925842, 0.0006275177001953125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 10.0, 10.0, 19.0, 17.0, 18.0, 21.0, 22.0, 30.0, 44.0, 50.0, 79.0, 115.0, 212.0, 342.0, 799.0, 2352.0, 9009.0, 83864.0, 894500.0, 46617.0, 7005.0, 1904.0, 681.0, 325.0, 163.0, 93.0, 66.0, 31.0, 31.0, 27.0, 25.0, 15.0, 13.0, 6.0, 6.0, 6.0, 6.0, 6.0, 6.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.37548828125, -0.3657112121582031, -0.35593414306640625, -0.3461570739746094, -0.3363800048828125, -0.3266029357910156, -0.31682586669921875, -0.3070487976074219, -0.297271728515625, -0.2874946594238281, -0.27771759033203125, -0.2679405212402344, -0.2581634521484375, -0.24838638305664062, -0.23860931396484375, -0.22883224487304688, -0.21905517578125, -0.20927810668945312, -0.19950103759765625, -0.18972396850585938, -0.1799468994140625, -0.17016983032226562, -0.16039276123046875, -0.15061569213867188, -0.140838623046875, -0.13106155395507812, -0.12128448486328125, -0.11150741577148438, -0.1017303466796875, -0.09195327758789062, -0.08217620849609375, -0.07239913940429688, -0.0626220703125, -0.052845001220703125, -0.04306793212890625, -0.033290863037109375, -0.0235137939453125, -0.013736724853515625, -0.00395965576171875, 0.005817413330078125, 0.015594482421875, 0.025371551513671875, 0.03514862060546875, 0.044925689697265625, 0.0547027587890625, 0.06447982788085938, 0.07425689697265625, 0.08403396606445312, 0.09381103515625, 0.10358810424804688, 0.11336517333984375, 0.12314224243164062, 0.1329193115234375, 0.14269638061523438, 0.15247344970703125, 0.16225051879882812, 0.172027587890625, 0.18180465698242188, 0.19158172607421875, 0.20135879516601562, 0.2111358642578125, 0.22091293334960938, 0.23069000244140625, 0.24046707153320312, 0.250244140625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 7.0, 3.0, 11.0, 10.0, 21.0, 49.0, 121.0, 240.0, 267.0, 132.0, 74.0, 36.0, 10.0, 8.0, 8.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.378662109375, -0.3704719543457031, -0.36228179931640625, -0.3540916442871094, -0.3459014892578125, -0.3377113342285156, -0.32952117919921875, -0.3213310241699219, -0.313140869140625, -0.3049507141113281, -0.29676055908203125, -0.2885704040527344, -0.2803802490234375, -0.2721900939941406, -0.26399993896484375, -0.2558097839355469, -0.24761962890625, -0.23942947387695312, -0.23123931884765625, -0.22304916381835938, -0.2148590087890625, -0.20666885375976562, -0.19847869873046875, -0.19028854370117188, -0.182098388671875, -0.17390823364257812, -0.16571807861328125, -0.15752792358398438, -0.1493377685546875, -0.14114761352539062, -0.13295745849609375, -0.12476730346679688, -0.1165771484375, -0.10838699340820312, -0.10019683837890625, -0.09200668334960938, -0.0838165283203125, -0.07562637329101562, -0.06743621826171875, -0.059246063232421875, -0.051055908203125, -0.042865753173828125, -0.03467559814453125, -0.026485443115234375, -0.0182952880859375, -0.010105133056640625, -0.00191497802734375, 0.006275177001953125, 0.01446533203125, 0.022655487060546875, 0.03084564208984375, 0.039035797119140625, 0.0472259521484375, 0.055416107177734375, 0.06360626220703125, 0.07179641723632812, 0.079986572265625, 0.08817672729492188, 0.09636688232421875, 0.10455703735351562, 0.1127471923828125, 0.12093734741210938, 0.12912750244140625, 0.13731765747070312, 0.1455078125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 9.0, 7.0, 9.0, 30.0, 46.0, 71.0, 157.0, 282.0, 175.0, 79.0, 57.0, 29.0, 13.0, 9.0, 6.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5559524297714233, -1.50979483127594, -1.463637351989746, -1.4174797534942627, -1.3713221549987793, -1.325164556503296, -1.2790069580078125, -1.2328494787216187, -1.1866918802261353, -1.1405342817306519, -1.094376802444458, -1.0482192039489746, -1.0020616054534912, -0.9559040069580078, -0.9097464680671692, -0.8635889291763306, -0.8174313306808472, -0.7712737321853638, -0.7251161932945251, -0.6789586544036865, -0.6328010559082031, -0.5866434574127197, -0.5404859185218811, -0.4943283498287201, -0.4481707811355591, -0.40201321244239807, -0.35585564374923706, -0.30969807505607605, -0.26354050636291504, -0.21738293766975403, -0.17122536897659302, -0.125067800283432, -0.078910231590271, -0.032752662897109985, 0.013404905796051025, 0.059562474489212036, 0.10572004318237305, 0.15187761187553406, 0.19803518056869507, 0.24419274926185608, 0.2903503179550171, 0.3365078866481781, 0.3826654553413391, 0.4288230240345001, 0.47498059272766113, 0.5211381912231445, 0.5672957301139832, 0.6134532690048218, 0.6596108675003052, 0.7057684659957886, 0.7519260048866272, 0.7980835437774658, 0.8442411422729492, 0.8903987407684326, 0.9365562796592712, 0.9827138185501099, 1.0288714170455933, 1.0750290155410767, 1.1211864948272705, 1.167344093322754, 1.2135016918182373, 1.2596592903137207, 1.305816888809204, 1.351974368095398, 1.3981319665908813]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 9.0, 7.0, 12.0, 10.0, 15.0, 21.0, 22.0, 36.0, 37.0, 55.0, 72.0, 79.0, 81.0, 69.0, 70.0, 63.0, 66.0, 48.0, 41.0, 44.0, 28.0, 29.0, 20.0, 16.0, 8.0, 5.0, 7.0, 5.0, 3.0, 2.0, 5.0, 5.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1837421655654907, -1.1493579149246216, -1.114973783493042, -1.0805895328521729, -1.0462052822113037, -1.0118211507797241, -0.977436900138855, -0.9430527091026306, -0.9086685180664062, -0.8742843270301819, -0.8399001359939575, -0.8055158853530884, -0.771131694316864, -0.7367475032806396, -0.7023632526397705, -0.6679790616035461, -0.6335948705673218, -0.5992106795310974, -0.564826488494873, -0.5304422378540039, -0.49605804681777954, -0.4616738557815552, -0.4272896349430084, -0.39290541410446167, -0.3585212230682373, -0.32413703203201294, -0.2897528111934662, -0.25536859035491943, -0.22098439931869507, -0.1866001933813095, -0.15221598744392395, -0.11783178150653839, -0.08344769477844238, -0.049063488841056824, -0.014679282903671265, 0.019704923033714294, 0.054089128971099854, 0.08847333490848541, 0.12285754084587097, 0.15724174678325653, 0.1916259527206421, 0.22601015865802765, 0.2603943645954132, 0.29477858543395996, 0.3291627764701843, 0.3635469675064087, 0.39793118834495544, 0.4323154091835022, 0.46669960021972656, 0.5010837912559509, 0.5354679822921753, 0.5698522329330444, 0.6042364239692688, 0.6386206150054932, 0.6730048656463623, 0.7073890566825867, 0.741773247718811, 0.7761574387550354, 0.8105416297912598, 0.8449258804321289, 0.8793100714683533, 0.9136942625045776, 0.9480785131454468, 0.9824627041816711, 1.0168468952178955]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 0.0, 2.0, 4.0, 1.0, 7.0, 5.0, 5.0, 22.0, 12.0, 39.0, 30.0, 58.0, 86.0, 161.0, 259.0, 432.0, 785.0, 1573.0, 3886.0, 11689.0, 62749.0, 3950422.0, 136279.0, 16552.0, 4895.0, 1983.0, 948.0, 503.0, 308.0, 192.0, 140.0, 72.0, 50.0, 39.0, 26.0, 23.0, 10.0, 5.0, 11.0, 10.0, 2.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.673828125, -0.6549224853515625, -0.636016845703125, -0.6171112060546875, -0.59820556640625, -0.5792999267578125, -0.560394287109375, -0.5414886474609375, -0.5225830078125, -0.5036773681640625, -0.484771728515625, -0.4658660888671875, -0.44696044921875, -0.4280548095703125, -0.409149169921875, -0.3902435302734375, -0.371337890625, -0.3524322509765625, -0.333526611328125, -0.3146209716796875, -0.29571533203125, -0.2768096923828125, -0.257904052734375, -0.2389984130859375, -0.2200927734375, -0.2011871337890625, -0.182281494140625, -0.1633758544921875, -0.14447021484375, -0.1255645751953125, -0.106658935546875, -0.0877532958984375, -0.06884765625, -0.0499420166015625, -0.031036376953125, -0.0121307373046875, 0.00677490234375, 0.0256805419921875, 0.044586181640625, 0.0634918212890625, 0.0823974609375, 0.1013031005859375, 0.120208740234375, 0.1391143798828125, 0.15802001953125, 0.1769256591796875, 0.195831298828125, 0.2147369384765625, 0.233642578125, 0.2525482177734375, 0.271453857421875, 0.2903594970703125, 0.30926513671875, 0.3281707763671875, 0.347076416015625, 0.3659820556640625, 0.3848876953125, 0.4037933349609375, 0.422698974609375, 0.4416046142578125, 0.46051025390625, 0.4794158935546875, 0.498321533203125, 0.5172271728515625, 0.5361328125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 6.0, 8.0, 3.0, 7.0, 19.0, 17.0, 30.0, 35.0, 46.0, 62.0, 78.0, 77.0, 106.0, 108.0, 99.0, 65.0, 55.0, 48.0, 33.0, 23.0, 15.0, 10.0, 13.0, 4.0, 2.0, 7.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020660400390625, -0.01999044418334961, -0.01932048797607422, -0.018650531768798828, -0.017980575561523438, -0.017310619354248047, -0.016640663146972656, -0.015970706939697266, -0.015300750732421875, -0.014630794525146484, -0.013960838317871094, -0.013290882110595703, -0.012620925903320312, -0.011950969696044922, -0.011281013488769531, -0.01061105728149414, -0.00994110107421875, -0.00927114486694336, -0.008601188659667969, -0.007931232452392578, -0.0072612762451171875, -0.006591320037841797, -0.005921363830566406, -0.005251407623291016, -0.004581451416015625, -0.003911495208740234, -0.0032415390014648438, -0.002571582794189453, -0.0019016265869140625, -0.0012316703796386719, -0.0005617141723632812, 0.00010824203491210938, 0.0007781982421875, 0.0014481544494628906, 0.0021181106567382812, 0.002788066864013672, 0.0034580230712890625, 0.004127979278564453, 0.004797935485839844, 0.005467891693115234, 0.006137847900390625, 0.006807804107666016, 0.007477760314941406, 0.008147716522216797, 0.008817672729492188, 0.009487628936767578, 0.010157585144042969, 0.01082754135131836, 0.01149749755859375, 0.01216745376586914, 0.012837409973144531, 0.013507366180419922, 0.014177322387695312, 0.014847278594970703, 0.015517234802246094, 0.016187191009521484, 0.016857147216796875, 0.017527103424072266, 0.018197059631347656, 0.018867015838623047, 0.019536972045898438, 0.020206928253173828, 0.02087688446044922, 0.02154684066772461, 0.022216796875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 6.0, 11.0, 8.0, 38.0, 47.0, 92.0, 546.0, 17184.0, 4153678.0, 21877.0, 611.0, 82.0, 39.0, 14.0, 7.0, 17.0, 10.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.111328125, -2.0669021606445312, -2.0224761962890625, -1.9780502319335938, -1.933624267578125, -1.8891983032226562, -1.8447723388671875, -1.8003463745117188, -1.75592041015625, -1.7114944458007812, -1.6670684814453125, -1.6226425170898438, -1.578216552734375, -1.5337905883789062, -1.4893646240234375, -1.4449386596679688, -1.4005126953125, -1.3560867309570312, -1.3116607666015625, -1.2672348022460938, -1.222808837890625, -1.1783828735351562, -1.1339569091796875, -1.0895309448242188, -1.04510498046875, -1.0006790161132812, -0.9562530517578125, -0.9118270874023438, -0.867401123046875, -0.8229751586914062, -0.7785491943359375, -0.7341232299804688, -0.689697265625, -0.6452713012695312, -0.6008453369140625, -0.5564193725585938, -0.511993408203125, -0.46756744384765625, -0.4231414794921875, -0.37871551513671875, -0.33428955078125, -0.28986358642578125, -0.2454376220703125, -0.20101165771484375, -0.156585693359375, -0.11215972900390625, -0.0677337646484375, -0.02330780029296875, 0.0211181640625, 0.06554412841796875, 0.1099700927734375, 0.15439605712890625, 0.198822021484375, 0.24324798583984375, 0.2876739501953125, 0.33209991455078125, 0.37652587890625, 0.42095184326171875, 0.4653778076171875, 0.5098037719726562, 0.554229736328125, 0.5986557006835938, 0.6430816650390625, 0.6875076293945312, 0.73193359375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 6.0, 6.0, 10.0, 8.0, 13.0, 12.0, 19.0, 19.0, 44.0, 66.0, 151.0, 174.0, 430.0, 1430.0, 861.0, 296.0, 147.0, 95.0, 64.0, 43.0, 31.0, 25.0, 18.0, 19.0, 16.0, 8.0, 6.0, 7.0, 12.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.042755126953125, -0.04141378402709961, -0.04007244110107422, -0.03873109817504883, -0.03738975524902344, -0.03604841232299805, -0.034707069396972656, -0.033365726470947266, -0.032024383544921875, -0.030683040618896484, -0.029341697692871094, -0.028000354766845703, -0.026659011840820312, -0.025317668914794922, -0.02397632598876953, -0.02263498306274414, -0.02129364013671875, -0.01995229721069336, -0.01861095428466797, -0.017269611358642578, -0.015928268432617188, -0.014586925506591797, -0.013245582580566406, -0.011904239654541016, -0.010562896728515625, -0.009221553802490234, -0.007880210876464844, -0.006538867950439453, -0.0051975250244140625, -0.003856182098388672, -0.0025148391723632812, -0.0011734962463378906, 0.0001678466796875, 0.0015091896057128906, 0.0028505325317382812, 0.004191875457763672, 0.0055332183837890625, 0.006874561309814453, 0.008215904235839844, 0.009557247161865234, 0.010898590087890625, 0.012239933013916016, 0.013581275939941406, 0.014922618865966797, 0.016263961791992188, 0.017605304718017578, 0.01894664764404297, 0.02028799057006836, 0.02162933349609375, 0.02297067642211914, 0.02431201934814453, 0.025653362274169922, 0.026994705200195312, 0.028336048126220703, 0.029677391052246094, 0.031018733978271484, 0.032360076904296875, 0.033701419830322266, 0.035042762756347656, 0.03638410568237305, 0.03772544860839844, 0.03906679153442383, 0.04040813446044922, 0.04174947738647461, 0.0430908203125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 13.0, 409.0, 569.0, 16.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.047494888305664, -4.958988666534424, -4.870481967926025, -4.781975746154785, -4.693469047546387, -4.6049628257751465, -4.516456127166748, -4.427949905395508, -4.339443206787109, -4.250936985015869, -4.162430286407471, -4.0739240646362305, -3.985417366027832, -3.896911144256592, -3.8084046840667725, -3.719898223876953, -3.631392002105713, -3.5428855419158936, -3.454379081726074, -3.365872621536255, -3.2773661613464355, -3.1888599395751953, -3.100353479385376, -3.0118470191955566, -2.9233405590057373, -2.834834098815918, -2.7463276386260986, -2.6578211784362793, -2.569314956665039, -2.4808084964752197, -2.3923020362854004, -2.303795576095581, -2.2152891159057617, -2.1267826557159424, -2.038276195526123, -1.9497698545455933, -1.861263394355774, -1.7727569341659546, -1.6842505931854248, -1.5957441329956055, -1.5072376728057861, -1.4187312126159668, -1.3302247524261475, -1.2417184114456177, -1.1532119512557983, -1.064705491065979, -0.9761990904808044, -0.8876926898956299, -0.7991862893104553, -0.7106798887252808, -0.6221734285354614, -0.5336669683456421, -0.44516056776046753, -0.3566541373729706, -0.26814770698547363, -0.17964130640029907, -0.09113484621047974, -0.002628415822982788, 0.08587801456451416, 0.1743844449520111, 0.26289087533950806, 0.351397305727005, 0.43990373611450195, 0.5284101366996765, 0.6169165968894958]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 8.0, 9.0, 21.0, 23.0, 39.0, 51.0, 83.0, 102.0, 133.0, 126.0, 130.0, 101.0, 73.0, 48.0, 32.0, 13.0, 5.0, 7.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8497622609138489, -0.8315975069999695, -0.8134327530860901, -0.7952679395675659, -0.7771031856536865, -0.7589384317398071, -0.7407736778259277, -0.7226089239120483, -0.704444169998169, -0.6862794160842896, -0.6681146621704102, -0.649949848651886, -0.6317850947380066, -0.6136203408241272, -0.5954555869102478, -0.5772908329963684, -0.5591260194778442, -0.5409612655639648, -0.5227965116500854, -0.5046316981315613, -0.4864669442176819, -0.4683021903038025, -0.4501374363899231, -0.4319726824760437, -0.4138078987598419, -0.3956431448459625, -0.37747836112976074, -0.35931360721588135, -0.34114885330200195, -0.32298406958580017, -0.3048193156719208, -0.286654531955719, -0.2684897780418396, -0.2503250241279602, -0.23216024041175842, -0.21399548649787903, -0.19583071768283844, -0.17766594886779785, -0.15950119495391846, -0.14133642613887787, -0.12317165732383728, -0.10500688850879669, -0.0868421271443367, -0.06867736577987671, -0.05051259696483612, -0.03234782814979553, -0.01418306678533554, 0.003981694579124451, 0.02214646339416504, 0.04031122848391533, 0.05847599357366562, 0.07664075493812561, 0.0948055237531662, 0.11297029256820679, 0.13113504648208618, 0.14929981529712677, 0.16746458411216736, 0.18562935292720795, 0.20379412174224854, 0.22195887565612793, 0.24012364447116852, 0.2582884132862091, 0.2764531672000885, 0.2946179509162903, 0.3127827048301697]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 3.0, 8.0, 16.0, 8.0, 15.0, 21.0, 25.0, 29.0, 34.0, 44.0, 44.0, 44.0, 57.0, 455.0, 56357.0, 988470.0, 2390.0, 138.0, 52.0, 62.0, 59.0, 39.0, 36.0, 27.0, 25.0, 13.0, 16.0, 21.0, 11.0, 10.0, 6.0, 7.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.029296875, -0.9928436279296875, -0.956390380859375, -0.9199371337890625, -0.88348388671875, -0.8470306396484375, -0.810577392578125, -0.7741241455078125, -0.7376708984375, -0.7012176513671875, -0.664764404296875, -0.6283111572265625, -0.59185791015625, -0.5554046630859375, -0.518951416015625, -0.4824981689453125, -0.446044921875, -0.4095916748046875, -0.373138427734375, -0.3366851806640625, -0.30023193359375, -0.2637786865234375, -0.227325439453125, -0.1908721923828125, -0.1544189453125, -0.1179656982421875, -0.081512451171875, -0.0450592041015625, -0.00860595703125, 0.0278472900390625, 0.064300537109375, 0.1007537841796875, 0.13720703125, 0.1736602783203125, 0.210113525390625, 0.2465667724609375, 0.28302001953125, 0.3194732666015625, 0.355926513671875, 0.3923797607421875, 0.4288330078125, 0.4652862548828125, 0.501739501953125, 0.5381927490234375, 0.57464599609375, 0.6110992431640625, 0.647552490234375, 0.6840057373046875, 0.720458984375, 0.7569122314453125, 0.793365478515625, 0.8298187255859375, 0.86627197265625, 0.9027252197265625, 0.939178466796875, 0.9756317138671875, 1.0120849609375, 1.0485382080078125, 1.084991455078125, 1.1214447021484375, 1.15789794921875, 1.1943511962890625, 1.230804443359375, 1.2672576904296875, 1.3037109375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 21.0, 114.0, 304.0, 391.0, 154.0, 27.0, 3.0, 3.0], "bins": [-0.228271484375, -0.22440552711486816, -0.22053956985473633, -0.2166736125946045, -0.21280765533447266, -0.20894169807434082, -0.20507574081420898, -0.20120978355407715, -0.1973438262939453, -0.19347786903381348, -0.18961191177368164, -0.1857459545135498, -0.18187999725341797, -0.17801403999328613, -0.1741480827331543, -0.17028212547302246, -0.16641616821289062, -0.1625502109527588, -0.15868425369262695, -0.15481829643249512, -0.15095233917236328, -0.14708638191223145, -0.1432204246520996, -0.13935446739196777, -0.13548851013183594, -0.1316225528717041, -0.12775659561157227, -0.12389063835144043, -0.1200246810913086, -0.11615872383117676, -0.11229276657104492, -0.10842680931091309, -0.10456085205078125, -0.10069489479064941, -0.09682893753051758, -0.09296298027038574, -0.0890970230102539, -0.08523106575012207, -0.08136510848999023, -0.0774991512298584, -0.07363319396972656, -0.06976723670959473, -0.06590127944946289, -0.062035322189331055, -0.05816936492919922, -0.05430340766906738, -0.05043745040893555, -0.04657149314880371, -0.042705535888671875, -0.03883957862854004, -0.0349736213684082, -0.031107664108276367, -0.02724170684814453, -0.023375749588012695, -0.01950979232788086, -0.015643835067749023, -0.011777877807617188, -0.007911920547485352, -0.004045963287353516, -0.0001800060272216797, 0.0036859512329101562, 0.007551908493041992, 0.011417865753173828, 0.015283823013305664, 0.0191497802734375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 9.0, 8.0, 14.0, 11.0, 13.0, 13.0, 22.0, 32.0, 61.0, 96.0, 171.0, 315.0, 596.0, 1327.0, 2573.0, 5470.0, 12722.0, 31172.0, 90488.0, 327859.0, 397600.0, 113081.0, 37511.0, 14793.0, 6439.0, 3004.0, 1470.0, 725.0, 397.0, 211.0, 149.0, 74.0, 42.0, 29.0, 24.0, 7.0, 10.0, 7.0, 8.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1654052734375, -0.15971946716308594, -0.15403366088867188, -0.1483478546142578, -0.14266204833984375, -0.1369762420654297, -0.13129043579101562, -0.12560462951660156, -0.1199188232421875, -0.11423301696777344, -0.10854721069335938, -0.10286140441894531, -0.09717559814453125, -0.09148979187011719, -0.08580398559570312, -0.08011817932128906, -0.074432373046875, -0.06874656677246094, -0.06306076049804688, -0.05737495422363281, -0.05168914794921875, -0.04600334167480469, -0.040317535400390625, -0.03463172912597656, -0.0289459228515625, -0.023260116577148438, -0.017574310302734375, -0.011888504028320312, -0.00620269775390625, -0.0005168914794921875, 0.005168914794921875, 0.010854721069335938, 0.01654052734375, 0.022226333618164062, 0.027912139892578125, 0.03359794616699219, 0.03928375244140625, 0.04496955871582031, 0.050655364990234375, 0.05634117126464844, 0.0620269775390625, 0.06771278381347656, 0.07339859008789062, 0.07908439636230469, 0.08477020263671875, 0.09045600891113281, 0.09614181518554688, 0.10182762145996094, 0.107513427734375, 0.11319923400878906, 0.11888504028320312, 0.12457084655761719, 0.13025665283203125, 0.1359424591064453, 0.14162826538085938, 0.14731407165527344, 0.1529998779296875, 0.15868568420410156, 0.16437149047851562, 0.1700572967529297, 0.17574310302734375, 0.1814289093017578, 0.18711471557617188, 0.19280052185058594, 0.198486328125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 9.0, 4.0, 6.0, 5.0, 1.0, 11.0, 6.0, 10.0, 14.0, 19.0, 19.0, 21.0, 28.0, 28.0, 31.0, 37.0, 37.0, 35.0, 55.0, 42.0, 55.0, 51.0, 64.0, 57.0, 49.0, 42.0, 32.0, 34.0, 35.0, 30.0, 26.0, 26.0, 13.0, 13.0, 10.0, 13.0, 11.0, 5.0, 6.0, 5.0, 3.0, 6.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.148193359375, -0.1429595947265625, -0.137725830078125, -0.1324920654296875, -0.12725830078125, -0.1220245361328125, -0.116790771484375, -0.1115570068359375, -0.1063232421875, -0.1010894775390625, -0.095855712890625, -0.0906219482421875, -0.08538818359375, -0.0801544189453125, -0.074920654296875, -0.0696868896484375, -0.064453125, -0.0592193603515625, -0.053985595703125, -0.0487518310546875, -0.04351806640625, -0.0382843017578125, -0.033050537109375, -0.0278167724609375, -0.0225830078125, -0.0173492431640625, -0.012115478515625, -0.0068817138671875, -0.00164794921875, 0.0035858154296875, 0.008819580078125, 0.0140533447265625, 0.019287109375, 0.0245208740234375, 0.029754638671875, 0.0349884033203125, 0.04022216796875, 0.0454559326171875, 0.050689697265625, 0.0559234619140625, 0.0611572265625, 0.0663909912109375, 0.071624755859375, 0.0768585205078125, 0.08209228515625, 0.0873260498046875, 0.092559814453125, 0.0977935791015625, 0.10302734375, 0.1082611083984375, 0.113494873046875, 0.1187286376953125, 0.12396240234375, 0.1291961669921875, 0.134429931640625, 0.1396636962890625, 0.1448974609375, 0.1501312255859375, 0.155364990234375, 0.1605987548828125, 0.16583251953125, 0.1710662841796875, 0.176300048828125, 0.1815338134765625, 0.186767578125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 1.0, 3.0, 6.0, 4.0, 2.0, 7.0, 18.0, 17.0, 18.0, 17.0, 32.0, 58.0, 79.0, 170.0, 420.0, 1455.0, 7675.0, 126635.0, 865655.0, 40374.0, 4309.0, 942.0, 296.0, 132.0, 74.0, 41.0, 18.0, 22.0, 15.0, 8.0, 8.0, 6.0, 11.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3232421875, -0.31183624267578125, -0.3004302978515625, -0.28902435302734375, -0.277618408203125, -0.26621246337890625, -0.2548065185546875, -0.24340057373046875, -0.23199462890625, -0.22058868408203125, -0.2091827392578125, -0.19777679443359375, -0.186370849609375, -0.17496490478515625, -0.1635589599609375, -0.15215301513671875, -0.1407470703125, -0.12934112548828125, -0.1179351806640625, -0.10652923583984375, -0.095123291015625, -0.08371734619140625, -0.0723114013671875, -0.06090545654296875, -0.04949951171875, -0.03809356689453125, -0.0266876220703125, -0.01528167724609375, -0.003875732421875, 0.00753021240234375, 0.0189361572265625, 0.03034210205078125, 0.041748046875, 0.05315399169921875, 0.0645599365234375, 0.07596588134765625, 0.087371826171875, 0.09877777099609375, 0.1101837158203125, 0.12158966064453125, 0.13299560546875, 0.14440155029296875, 0.1558074951171875, 0.16721343994140625, 0.178619384765625, 0.19002532958984375, 0.2014312744140625, 0.21283721923828125, 0.2242431640625, 0.23564910888671875, 0.2470550537109375, 0.25846099853515625, 0.269866943359375, 0.28127288818359375, 0.2926788330078125, 0.30408477783203125, 0.31549072265625, 0.32689666748046875, 0.3383026123046875, 0.34970855712890625, 0.361114501953125, 0.37252044677734375, 0.3839263916015625, 0.39533233642578125, 0.40673828125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 5.0, 6.0, 9.0, 12.0, 9.0, 19.0, 16.0, 39.0, 47.0, 50.0, 74.0, 95.0, 140.0, 94.0, 87.0, 63.0, 46.0, 45.0, 32.0, 23.0, 16.0, 21.0, 8.0, 8.0, 4.0, 6.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006394386291503906, -0.0006220713257789612, -0.0006047040224075317, -0.0005873367190361023, -0.0005699694156646729, -0.0005526021122932434, -0.000535234808921814, -0.0005178675055503845, -0.0005005002021789551, -0.00048313289880752563, -0.0004657655954360962, -0.00044839829206466675, -0.0004310309886932373, -0.00041366368532180786, -0.0003962963819503784, -0.000378929078578949, -0.00036156177520751953, -0.0003441944718360901, -0.00032682716846466064, -0.0003094598650932312, -0.00029209256172180176, -0.0002747252583503723, -0.00025735795497894287, -0.00023999065160751343, -0.00022262334823608398, -0.00020525604486465454, -0.0001878887414932251, -0.00017052143812179565, -0.0001531541347503662, -0.00013578683137893677, -0.00011841952800750732, -0.00010105222463607788, -8.368492126464844e-05, -6.6317617893219e-05, -4.895031452178955e-05, -3.158301115036011e-05, -1.4215707778930664e-05, 3.1515955924987793e-06, 2.0518898963928223e-05, 3.7886202335357666e-05, 5.525350570678711e-05, 7.262080907821655e-05, 8.9988112449646e-05, 0.00010735541582107544, 0.00012472271919250488, 0.00014209002256393433, 0.00015945732593536377, 0.0001768246293067932, 0.00019419193267822266, 0.0002115592360496521, 0.00022892653942108154, 0.000246293842792511, 0.00026366114616394043, 0.0002810284495353699, 0.0002983957529067993, 0.00031576305627822876, 0.0003331303596496582, 0.00035049766302108765, 0.0003678649663925171, 0.00038523226976394653, 0.000402599573135376, 0.0004199668765068054, 0.00043733417987823486, 0.0004547014832496643, 0.00047206878662109375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 1.0, 7.0, 2.0, 12.0, 22.0, 31.0, 84.0, 364.0, 1782.0, 16783.0, 865695.0, 156484.0, 6028.0, 853.0, 232.0, 75.0, 34.0, 19.0, 9.0, 5.0, 6.0, 4.0, 2.0, 3.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3720703125, -0.355743408203125, -0.33941650390625, -0.323089599609375, -0.3067626953125, -0.290435791015625, -0.27410888671875, -0.257781982421875, -0.241455078125, -0.225128173828125, -0.20880126953125, -0.192474365234375, -0.1761474609375, -0.159820556640625, -0.14349365234375, -0.127166748046875, -0.11083984375, -0.094512939453125, -0.07818603515625, -0.061859130859375, -0.0455322265625, -0.029205322265625, -0.01287841796875, 0.003448486328125, 0.019775390625, 0.036102294921875, 0.05242919921875, 0.068756103515625, 0.0850830078125, 0.101409912109375, 0.11773681640625, 0.134063720703125, 0.150390625, 0.166717529296875, 0.18304443359375, 0.199371337890625, 0.2156982421875, 0.232025146484375, 0.24835205078125, 0.264678955078125, 0.281005859375, 0.297332763671875, 0.31365966796875, 0.329986572265625, 0.3463134765625, 0.362640380859375, 0.37896728515625, 0.395294189453125, 0.41162109375, 0.427947998046875, 0.44427490234375, 0.460601806640625, 0.4769287109375, 0.493255615234375, 0.50958251953125, 0.525909423828125, 0.542236328125, 0.558563232421875, 0.57489013671875, 0.591217041015625, 0.6075439453125, 0.623870849609375, 0.64019775390625, 0.656524658203125, 0.6728515625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 4.0, 6.0, 7.0, 15.0, 10.0, 26.0, 52.0, 114.0, 228.0, 245.0, 134.0, 58.0, 34.0, 15.0, 7.0, 6.0, 6.0, 10.0, 4.0, 3.0, 8.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16162109375, -0.15393829345703125, -0.1462554931640625, -0.13857269287109375, -0.130889892578125, -0.12320709228515625, -0.1155242919921875, -0.10784149169921875, -0.10015869140625, -0.09247589111328125, -0.0847930908203125, -0.07711029052734375, -0.069427490234375, -0.06174468994140625, -0.0540618896484375, -0.04637908935546875, -0.0386962890625, -0.03101348876953125, -0.0233306884765625, -0.01564788818359375, -0.007965087890625, -0.00028228759765625, 0.0074005126953125, 0.01508331298828125, 0.02276611328125, 0.03044891357421875, 0.0381317138671875, 0.04581451416015625, 0.053497314453125, 0.06118011474609375, 0.0688629150390625, 0.07654571533203125, 0.084228515625, 0.09191131591796875, 0.0995941162109375, 0.10727691650390625, 0.114959716796875, 0.12264251708984375, 0.1303253173828125, 0.13800811767578125, 0.14569091796875, 0.15337371826171875, 0.1610565185546875, 0.16873931884765625, 0.176422119140625, 0.18410491943359375, 0.1917877197265625, 0.19947052001953125, 0.2071533203125, 0.21483612060546875, 0.2225189208984375, 0.23020172119140625, 0.237884521484375, 0.24556732177734375, 0.2532501220703125, 0.26093292236328125, 0.26861572265625, 0.27629852294921875, 0.2839813232421875, 0.29166412353515625, 0.299346923828125, 0.30702972412109375, 0.3147125244140625, 0.32239532470703125, 0.330078125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 716.0, 285.0, 11.0, 2.0], "bins": [-35.85194778442383, -35.262821197509766, -34.67369079589844, -34.084564208984375, -33.49543380737305, -32.906307220458984, -32.317176818847656, -31.728050231933594, -31.1389217376709, -30.549793243408203, -29.960664749145508, -29.371536254882812, -28.782407760620117, -28.193279266357422, -27.60415267944336, -27.015024185180664, -26.42589569091797, -25.836767196655273, -25.247638702392578, -24.658510208129883, -24.069381713867188, -23.480255126953125, -22.891124725341797, -22.301998138427734, -21.712867736816406, -21.12373924255371, -20.534610748291016, -19.94548225402832, -19.356353759765625, -18.767227172851562, -18.178096771240234, -17.588970184326172, -16.999839782714844, -16.41071128845215, -15.821582794189453, -15.232454299926758, -14.643326759338379, -14.054198265075684, -13.465069770812988, -12.87594223022461, -12.286813735961914, -11.697685241699219, -11.108556747436523, -10.519428253173828, -9.93030071258545, -9.341172218322754, -8.752043724060059, -8.16291618347168, -7.573787689208984, -6.984659194946289, -6.395531177520752, -5.806402683258057, -5.2172746658325195, -4.628146171569824, -4.039017677307129, -3.449889659881592, -2.8607611656188965, -2.2716329097747803, -1.6825045347213745, -1.0933761596679688, -0.5042479038238525, 0.08488035202026367, 0.674008846282959, 1.263136863708496, 1.8522653579711914]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 18.0, 21.0, 37.0, 51.0, 80.0, 84.0, 93.0, 92.0, 106.0, 95.0, 88.0, 73.0, 55.0, 42.0, 19.0, 20.0, 6.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.1014342308044434, -3.031130075454712, -2.9608261585235596, -2.890522003173828, -2.8202178478240967, -2.7499136924743652, -2.679609775543213, -2.6093056201934814, -2.53900146484375, -2.4686973094940186, -2.398393392562866, -2.3280892372131348, -2.2577850818634033, -2.187480926513672, -2.1171770095825195, -2.046872854232788, -1.9765689373016357, -1.9062649011611938, -1.8359607458114624, -1.7656567096710205, -1.695352554321289, -1.6250485181808472, -1.5547444820404053, -1.4844403266906738, -1.414136290550232, -1.34383225440979, -1.2735280990600586, -1.2032240629196167, -1.1329200267791748, -1.0626158714294434, -0.9923118352890015, -0.9220077395439148, -0.851703405380249, -0.7813993096351624, -0.7110952138900757, -0.6407911777496338, -0.5704870820045471, -0.5001829862594604, -0.42987892031669617, -0.3595748543739319, -0.2892707586288452, -0.21896667778491974, -0.14866259694099426, -0.07835851609706879, -0.00805443525314331, 0.06224966049194336, 0.13255372643470764, 0.20285779237747192, 0.2731618881225586, 0.34346598386764526, 0.41377004981040955, 0.48407411575317383, 0.5543782114982605, 0.6246823072433472, 0.6949863433837891, 0.7652904391288757, 0.8355945348739624, 0.9058986306190491, 0.9762027263641357, 1.0465067625045776, 1.1168107986450195, 1.187114953994751, 1.2574189901351929, 1.3277230262756348, 1.3980271816253662]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 12.0, 7.0, 22.0, 43.0, 84.0, 131.0, 242.0, 500.0, 281616.0, 3911146.0, 420.0, 54.0, 10.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.203125, -9.029586791992188, -8.856048583984375, -8.682510375976562, -8.50897216796875, -8.335433959960938, -8.161895751953125, -7.9883575439453125, -7.8148193359375, -7.6412811279296875, -7.467742919921875, -7.2942047119140625, -7.12066650390625, -6.9471282958984375, -6.773590087890625, -6.6000518798828125, -6.426513671875, -6.2529754638671875, -6.079437255859375, -5.9058990478515625, -5.73236083984375, -5.5588226318359375, -5.385284423828125, -5.2117462158203125, -5.0382080078125, -4.8646697998046875, -4.691131591796875, -4.5175933837890625, -4.34405517578125, -4.1705169677734375, -3.996978759765625, -3.8234405517578125, -3.64990234375, -3.4763641357421875, -3.302825927734375, -3.1292877197265625, -2.95574951171875, -2.7822113037109375, -2.608673095703125, -2.4351348876953125, -2.2615966796875, -2.0880584716796875, -1.914520263671875, -1.7409820556640625, -1.56744384765625, -1.3939056396484375, -1.220367431640625, -1.0468292236328125, -0.873291015625, -0.6997528076171875, -0.526214599609375, -0.3526763916015625, -0.17913818359375, -0.0055999755859375, 0.167938232421875, 0.3414764404296875, 0.5150146484375, 0.6885528564453125, 0.862091064453125, 1.0356292724609375, 1.20916748046875, 1.3827056884765625, 1.556243896484375, 1.7297821044921875, 1.9033203125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 14.0, 22.0, 109.0, 253.0, 358.0, 181.0, 61.0, 14.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.258544921875, -0.2536892890930176, -0.24883365631103516, -0.24397802352905273, -0.2391223907470703, -0.2342667579650879, -0.22941112518310547, -0.22455549240112305, -0.21969985961914062, -0.2148442268371582, -0.20998859405517578, -0.20513296127319336, -0.20027732849121094, -0.19542169570922852, -0.1905660629272461, -0.18571043014526367, -0.18085479736328125, -0.17599916458129883, -0.1711435317993164, -0.16628789901733398, -0.16143226623535156, -0.15657663345336914, -0.15172100067138672, -0.1468653678894043, -0.14200973510742188, -0.13715410232543945, -0.13229846954345703, -0.1274428367614746, -0.12258720397949219, -0.11773157119750977, -0.11287593841552734, -0.10802030563354492, -0.1031646728515625, -0.09830904006958008, -0.09345340728759766, -0.08859777450561523, -0.08374214172363281, -0.07888650894165039, -0.07403087615966797, -0.06917524337768555, -0.06431961059570312, -0.0594639778137207, -0.05460834503173828, -0.04975271224975586, -0.04489707946777344, -0.040041446685791016, -0.035185813903808594, -0.030330181121826172, -0.02547454833984375, -0.020618915557861328, -0.015763282775878906, -0.010907649993896484, -0.0060520172119140625, -0.0011963844299316406, 0.0036592483520507812, 0.008514881134033203, 0.013370513916015625, 0.018226146697998047, 0.02308177947998047, 0.02793741226196289, 0.03279304504394531, 0.037648677825927734, 0.042504310607910156, 0.04735994338989258, 0.052215576171875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 11.0, 23.0, 48.0, 93.0, 128.0, 163.0, 245.0, 325.0, 4059024.0, 133454.0, 365.0, 184.0, 84.0, 63.0, 33.0, 26.0, 7.0, 7.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8125, -8.6119384765625, -8.411376953125, -8.2108154296875, -8.01025390625, -7.8096923828125, -7.609130859375, -7.4085693359375, -7.2080078125, -7.0074462890625, -6.806884765625, -6.6063232421875, -6.40576171875, -6.2052001953125, -6.004638671875, -5.8040771484375, -5.603515625, -5.4029541015625, -5.202392578125, -5.0018310546875, -4.80126953125, -4.6007080078125, -4.400146484375, -4.1995849609375, -3.9990234375, -3.7984619140625, -3.597900390625, -3.3973388671875, -3.19677734375, -2.9962158203125, -2.795654296875, -2.5950927734375, -2.39453125, -2.1939697265625, -1.993408203125, -1.7928466796875, -1.59228515625, -1.3917236328125, -1.191162109375, -0.9906005859375, -0.7900390625, -0.5894775390625, -0.388916015625, -0.1883544921875, 0.01220703125, 0.2127685546875, 0.413330078125, 0.6138916015625, 0.814453125, 1.0150146484375, 1.215576171875, 1.4161376953125, 1.61669921875, 1.8172607421875, 2.017822265625, 2.2183837890625, 2.4189453125, 2.6195068359375, 2.820068359375, 3.0206298828125, 3.22119140625, 3.4217529296875, 3.622314453125, 3.8228759765625, 4.0234375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 13.0, 834.0, 3081.0, 118.0, 27.0, 12.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.263671875, -1.2394065856933594, -1.2151412963867188, -1.1908760070800781, -1.1666107177734375, -1.1423454284667969, -1.1180801391601562, -1.0938148498535156, -1.069549560546875, -1.0452842712402344, -1.0210189819335938, -0.9967536926269531, -0.9724884033203125, -0.9482231140136719, -0.9239578247070312, -0.8996925354003906, -0.87542724609375, -0.8511619567871094, -0.8268966674804688, -0.8026313781738281, -0.7783660888671875, -0.7541007995605469, -0.7298355102539062, -0.7055702209472656, -0.681304931640625, -0.6570396423339844, -0.6327743530273438, -0.6085090637207031, -0.5842437744140625, -0.5599784851074219, -0.5357131958007812, -0.5114479064941406, -0.4871826171875, -0.4629173278808594, -0.43865203857421875, -0.4143867492675781, -0.3901214599609375, -0.3658561706542969, -0.34159088134765625, -0.3173255920410156, -0.293060302734375, -0.2687950134277344, -0.24452972412109375, -0.22026443481445312, -0.1959991455078125, -0.17173385620117188, -0.14746856689453125, -0.12320327758789062, -0.09893798828125, -0.07467269897460938, -0.05040740966796875, -0.026142120361328125, -0.0018768310546875, 0.022388458251953125, 0.04665374755859375, 0.07091903686523438, 0.095184326171875, 0.11944961547851562, 0.14371490478515625, 0.16798019409179688, 0.1922454833984375, 0.21651077270507812, 0.24077606201171875, 0.2650413513183594, 0.289306640625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 32.0, 189.0, 662.0, 100.0, 21.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.177988052368164, -7.979977130889893, -7.781966686248779, -7.583955764770508, -7.385944843292236, -7.187933921813965, -6.989923477172852, -6.79191255569458, -6.593901634216309, -6.395890712738037, -6.197880268096924, -5.999869346618652, -5.801858425140381, -5.603847503662109, -5.405837059020996, -5.207826137542725, -5.009815216064453, -4.811804294586182, -4.613793849945068, -4.415782928466797, -4.217772006988525, -4.019761085510254, -3.8217506408691406, -3.623739719390869, -3.425729274749756, -3.2277185916900635, -3.029707670211792, -2.8316969871520996, -2.633686065673828, -2.4356753826141357, -2.2376646995544434, -2.039653778076172, -1.8416428565979004, -1.6436320543289185, -1.4456212520599365, -1.2476105690002441, -1.0495996475219727, -0.8515889048576355, -0.6535781621932983, -0.4555673599243164, -0.2575565576553345, -0.05954577028751373, 0.138465017080307, 0.33647578954696655, 0.5344865918159485, 0.7324973940849304, 0.9305081367492676, 1.1285189390182495, 1.3265297412872314, 1.5245405435562134, 1.7225513458251953, 1.9205620288848877, 2.118572950363159, 2.3165836334228516, 2.514594554901123, 2.7126052379608154, 2.910615921020508, 3.1086266040802, 3.3066375255584717, 3.504648208618164, 3.7026591300964355, 3.900669813156128, 4.09868049621582, 4.296691417694092, 4.494702339172363]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 3.0, 17.0, 31.0, 48.0, 69.0, 127.0, 145.0, 154.0, 140.0, 88.0, 82.0, 58.0, 16.0, 16.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9885764122009277, -3.8607213497161865, -3.7328662872314453, -3.605011224746704, -3.477156162261963, -3.349301338195801, -3.2214462757110596, -3.0935912132263184, -2.965736150741577, -2.837881088256836, -2.7100260257720947, -2.5821709632873535, -2.4543161392211914, -2.326460838317871, -2.198606014251709, -2.0707509517669678, -1.9428958892822266, -1.8150408267974854, -1.6871857643127441, -1.5593308210372925, -1.4314757585525513, -1.30362069606781, -1.1757657527923584, -1.0479106903076172, -0.920055627822876, -0.7922005653381348, -0.6643455624580383, -0.5364905595779419, -0.4086354970932007, -0.2807804346084595, -0.15292543172836304, -0.0250704288482666, 0.10278463363647461, 0.23063966631889343, 0.35849469900131226, 0.4863497316837311, 0.6142047643661499, 0.7420598268508911, 0.8699148297309875, 0.997769832611084, 1.1256248950958252, 1.2534799575805664, 1.3813350200653076, 1.5091899633407593, 1.6370450258255005, 1.7649000883102417, 1.8927550315856934, 2.0206100940704346, 2.148465156555176, 2.276320219039917, 2.404175281524658, 2.5320303440093994, 2.6598854064941406, 2.7877402305603027, 2.915595293045044, 3.043450355529785, 3.1713054180145264, 3.2991604804992676, 3.427015542984009, 3.55487060546875, 3.682725429534912, 3.8105807304382324, 3.9384355545043945, 4.066290855407715, 4.194145679473877]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 2.0, 14.0, 12.0, 17.0, 29.0, 36.0, 52.0, 92.0, 134.0, 304.0, 847.0, 3132.0, 26193.0, 876757.0, 131568.0, 6928.0, 1499.0, 452.0, 182.0, 91.0, 72.0, 39.0, 32.0, 18.0, 18.0, 13.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.689453125, -1.6421661376953125, -1.594879150390625, -1.5475921630859375, -1.50030517578125, -1.4530181884765625, -1.405731201171875, -1.3584442138671875, -1.3111572265625, -1.2638702392578125, -1.216583251953125, -1.1692962646484375, -1.12200927734375, -1.0747222900390625, -1.027435302734375, -0.9801483154296875, -0.932861328125, -0.8855743408203125, -0.838287353515625, -0.7910003662109375, -0.74371337890625, -0.6964263916015625, -0.649139404296875, -0.6018524169921875, -0.5545654296875, -0.5072784423828125, -0.459991455078125, -0.4127044677734375, -0.36541748046875, -0.3181304931640625, -0.270843505859375, -0.2235565185546875, -0.17626953125, -0.1289825439453125, -0.081695556640625, -0.0344085693359375, 0.01287841796875, 0.0601654052734375, 0.107452392578125, 0.1547393798828125, 0.2020263671875, 0.2493133544921875, 0.296600341796875, 0.3438873291015625, 0.39117431640625, 0.4384613037109375, 0.485748291015625, 0.5330352783203125, 0.580322265625, 0.6276092529296875, 0.674896240234375, 0.7221832275390625, 0.76947021484375, 0.8167572021484375, 0.864044189453125, 0.9113311767578125, 0.9586181640625, 1.0059051513671875, 1.053192138671875, 1.1004791259765625, 1.14776611328125, 1.1950531005859375, 1.242340087890625, 1.2896270751953125, 1.3369140625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 5.0, 15.0, 31.0, 50.0, 90.0, 153.0, 175.0, 167.0, 127.0, 89.0, 51.0, 29.0, 11.0, 8.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.344482421875, -0.3369712829589844, -0.32946014404296875, -0.3219490051269531, -0.3144378662109375, -0.3069267272949219, -0.29941558837890625, -0.2919044494628906, -0.284393310546875, -0.2768821716308594, -0.26937103271484375, -0.2618598937988281, -0.2543487548828125, -0.24683761596679688, -0.23932647705078125, -0.23181533813476562, -0.22430419921875, -0.21679306030273438, -0.20928192138671875, -0.20177078247070312, -0.1942596435546875, -0.18674850463867188, -0.17923736572265625, -0.17172622680664062, -0.164215087890625, -0.15670394897460938, -0.14919281005859375, -0.14168167114257812, -0.1341705322265625, -0.12665939331054688, -0.11914825439453125, -0.11163711547851562, -0.1041259765625, -0.09661483764648438, -0.08910369873046875, -0.08159255981445312, -0.0740814208984375, -0.06657028198242188, -0.05905914306640625, -0.051548004150390625, -0.044036865234375, -0.036525726318359375, -0.02901458740234375, -0.021503448486328125, -0.0139923095703125, -0.006481170654296875, 0.00102996826171875, 0.008541107177734375, 0.01605224609375, 0.023563385009765625, 0.03107452392578125, 0.038585662841796875, 0.0460968017578125, 0.053607940673828125, 0.06111907958984375, 0.06863021850585938, 0.076141357421875, 0.08365249633789062, 0.09116363525390625, 0.09867477416992188, 0.1061859130859375, 0.11369705200195312, 0.12120819091796875, 0.12871932983398438, 0.13623046875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 8.0, 8.0, 3.0, 6.0, 13.0, 13.0, 13.0, 14.0, 27.0, 39.0, 41.0, 103.0, 200.0, 477.0, 1552.0, 7747.0, 72380.0, 807991.0, 142566.0, 12034.0, 2140.0, 600.0, 247.0, 116.0, 57.0, 34.0, 28.0, 16.0, 15.0, 8.0, 11.0, 9.0, 9.0, 8.0, 5.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64453125, -0.6234817504882812, -0.6024322509765625, -0.5813827514648438, -0.560333251953125, -0.5392837524414062, -0.5182342529296875, -0.49718475341796875, -0.47613525390625, -0.45508575439453125, -0.4340362548828125, -0.41298675537109375, -0.391937255859375, -0.37088775634765625, -0.3498382568359375, -0.32878875732421875, -0.3077392578125, -0.28668975830078125, -0.2656402587890625, -0.24459075927734375, -0.223541259765625, -0.20249176025390625, -0.1814422607421875, -0.16039276123046875, -0.13934326171875, -0.11829376220703125, -0.0972442626953125, -0.07619476318359375, -0.055145263671875, -0.03409576416015625, -0.0130462646484375, 0.00800323486328125, 0.029052734375, 0.05010223388671875, 0.0711517333984375, 0.09220123291015625, 0.113250732421875, 0.13430023193359375, 0.1553497314453125, 0.17639923095703125, 0.19744873046875, 0.21849822998046875, 0.2395477294921875, 0.26059722900390625, 0.281646728515625, 0.30269622802734375, 0.3237457275390625, 0.34479522705078125, 0.3658447265625, 0.38689422607421875, 0.4079437255859375, 0.42899322509765625, 0.450042724609375, 0.47109222412109375, 0.4921417236328125, 0.5131912231445312, 0.53424072265625, 0.5552902221679688, 0.5763397216796875, 0.5973892211914062, 0.618438720703125, 0.6394882202148438, 0.6605377197265625, 0.6815872192382812, 0.70263671875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 9.0, 7.0, 6.0, 8.0, 8.0, 10.0, 17.0, 12.0, 22.0, 31.0, 38.0, 35.0, 42.0, 46.0, 45.0, 63.0, 59.0, 56.0, 48.0, 46.0, 55.0, 50.0, 44.0, 50.0, 35.0, 23.0, 22.0, 24.0, 16.0, 13.0, 8.0, 5.0, 13.0, 4.0, 6.0, 7.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.362548828125, -0.3512382507324219, -0.33992767333984375, -0.3286170959472656, -0.3173065185546875, -0.3059959411621094, -0.29468536376953125, -0.2833747863769531, -0.272064208984375, -0.2607536315917969, -0.24944305419921875, -0.23813247680664062, -0.2268218994140625, -0.21551132202148438, -0.20420074462890625, -0.19289016723632812, -0.18157958984375, -0.17026901245117188, -0.15895843505859375, -0.14764785766601562, -0.1363372802734375, -0.12502670288085938, -0.11371612548828125, -0.10240554809570312, -0.091094970703125, -0.07978439331054688, -0.06847381591796875, -0.057163238525390625, -0.0458526611328125, -0.034542083740234375, -0.02323150634765625, -0.011920928955078125, -0.0006103515625, 0.010700225830078125, 0.02201080322265625, 0.033321380615234375, 0.0446319580078125, 0.055942535400390625, 0.06725311279296875, 0.07856369018554688, 0.089874267578125, 0.10118484497070312, 0.11249542236328125, 0.12380599975585938, 0.1351165771484375, 0.14642715454101562, 0.15773773193359375, 0.16904830932617188, 0.18035888671875, 0.19166946411132812, 0.20298004150390625, 0.21429061889648438, 0.2256011962890625, 0.23691177368164062, 0.24822235107421875, 0.2595329284667969, 0.270843505859375, 0.2821540832519531, 0.29346466064453125, 0.3047752380371094, 0.3160858154296875, 0.3273963928222656, 0.33870697021484375, 0.3500175476074219, 0.361328125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 5.0, 1.0, 9.0, 5.0, 6.0, 23.0, 31.0, 36.0, 73.0, 155.0, 276.0, 786.0, 2824.0, 20945.0, 887824.0, 126701.0, 6471.0, 1425.0, 470.0, 226.0, 111.0, 54.0, 33.0, 27.0, 15.0, 10.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.763671875, -0.742889404296875, -0.72210693359375, -0.701324462890625, -0.6805419921875, -0.659759521484375, -0.63897705078125, -0.618194580078125, -0.597412109375, -0.576629638671875, -0.55584716796875, -0.535064697265625, -0.5142822265625, -0.493499755859375, -0.47271728515625, -0.451934814453125, -0.43115234375, -0.410369873046875, -0.38958740234375, -0.368804931640625, -0.3480224609375, -0.327239990234375, -0.30645751953125, -0.285675048828125, -0.264892578125, -0.244110107421875, -0.22332763671875, -0.202545166015625, -0.1817626953125, -0.160980224609375, -0.14019775390625, -0.119415283203125, -0.0986328125, -0.077850341796875, -0.05706787109375, -0.036285400390625, -0.0155029296875, 0.005279541015625, 0.02606201171875, 0.046844482421875, 0.067626953125, 0.088409423828125, 0.10919189453125, 0.129974365234375, 0.1507568359375, 0.171539306640625, 0.19232177734375, 0.213104248046875, 0.23388671875, 0.254669189453125, 0.27545166015625, 0.296234130859375, 0.3170166015625, 0.337799072265625, 0.35858154296875, 0.379364013671875, 0.400146484375, 0.420928955078125, 0.44171142578125, 0.462493896484375, 0.4832763671875, 0.504058837890625, 0.52484130859375, 0.545623779296875, 0.56640625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 4.0, 9.0, 13.0, 19.0, 31.0, 42.0, 63.0, 87.0, 142.0, 192.0, 123.0, 89.0, 57.0, 40.0, 28.0, 18.0, 19.0, 12.0, 6.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.000949859619140625, -0.0009294338524341583, -0.0009090080857276917, -0.000888582319021225, -0.0008681565523147583, -0.0008477307856082916, -0.000827305018901825, -0.0008068792521953583, -0.0007864534854888916, -0.0007660277187824249, -0.0007456019520759583, -0.0007251761853694916, -0.0007047504186630249, -0.0006843246519565582, -0.0006638988852500916, -0.0006434731185436249, -0.0006230473518371582, -0.0006026215851306915, -0.0005821958184242249, -0.0005617700517177582, -0.0005413442850112915, -0.0005209185183048248, -0.0005004927515983582, -0.0004800669848918915, -0.0004596412181854248, -0.00043921545147895813, -0.00041878968477249146, -0.0003983639180660248, -0.0003779381513595581, -0.00035751238465309143, -0.00033708661794662476, -0.0003166608512401581, -0.0002962350845336914, -0.00027580931782722473, -0.00025538355112075806, -0.00023495778441429138, -0.0002145320177078247, -0.00019410625100135803, -0.00017368048429489136, -0.00015325471758842468, -0.000132828950881958, -0.00011240318417549133, -9.197741746902466e-05, -7.155165076255798e-05, -5.112588405609131e-05, -3.0700117349624634e-05, -1.0274350643157959e-05, 1.0151416063308716e-05, 3.057718276977539e-05, 5.1002949476242065e-05, 7.142871618270874e-05, 9.185448288917542e-05, 0.00011228024959564209, 0.00013270601630210876, 0.00015313178300857544, 0.00017355754971504211, 0.0001939833164215088, 0.00021440908312797546, 0.00023483484983444214, 0.0002552606165409088, 0.0002756863832473755, 0.00029611214995384216, 0.00031653791666030884, 0.0003369636833667755, 0.0003573894500732422]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 9.0, 17.0, 28.0, 43.0, 86.0, 193.0, 369.0, 962.0, 3627.0, 24012.0, 727462.0, 274901.0, 12961.0, 2483.0, 795.0, 283.0, 134.0, 66.0, 36.0, 29.0, 18.0, 7.0, 8.0, 2.0, 6.0, 2.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.595703125, -0.5790901184082031, -0.5624771118164062, -0.5458641052246094, -0.5292510986328125, -0.5126380920410156, -0.49602508544921875, -0.4794120788574219, -0.462799072265625, -0.4461860656738281, -0.42957305908203125, -0.4129600524902344, -0.3963470458984375, -0.3797340393066406, -0.36312103271484375, -0.3465080261230469, -0.32989501953125, -0.3132820129394531, -0.29666900634765625, -0.2800559997558594, -0.2634429931640625, -0.24682998657226562, -0.23021697998046875, -0.21360397338867188, -0.196990966796875, -0.18037796020507812, -0.16376495361328125, -0.14715194702148438, -0.1305389404296875, -0.11392593383789062, -0.09731292724609375, -0.08069992065429688, -0.0640869140625, -0.047473907470703125, -0.03086090087890625, -0.014247894287109375, 0.0023651123046875, 0.018978118896484375, 0.03559112548828125, 0.052204132080078125, 0.068817138671875, 0.08543014526367188, 0.10204315185546875, 0.11865615844726562, 0.1352691650390625, 0.15188217163085938, 0.16849517822265625, 0.18510818481445312, 0.20172119140625, 0.21833419799804688, 0.23494720458984375, 0.2515602111816406, 0.2681732177734375, 0.2847862243652344, 0.30139923095703125, 0.3180122375488281, 0.334625244140625, 0.3512382507324219, 0.36785125732421875, 0.3844642639160156, 0.4010772705078125, 0.4176902770996094, 0.43430328369140625, 0.4509162902832031, 0.467529296875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 4.0, 6.0, 16.0, 16.0, 31.0, 61.0, 114.0, 198.0, 230.0, 141.0, 72.0, 39.0, 23.0, 22.0, 7.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.339599609375, -0.3299293518066406, -0.32025909423828125, -0.3105888366699219, -0.3009185791015625, -0.2912483215332031, -0.28157806396484375, -0.2719078063964844, -0.262237548828125, -0.2525672912597656, -0.24289703369140625, -0.23322677612304688, -0.2235565185546875, -0.21388626098632812, -0.20421600341796875, -0.19454574584960938, -0.18487548828125, -0.17520523071289062, -0.16553497314453125, -0.15586471557617188, -0.1461944580078125, -0.13652420043945312, -0.12685394287109375, -0.11718368530273438, -0.107513427734375, -0.09784317016601562, -0.08817291259765625, -0.07850265502929688, -0.0688323974609375, -0.059162139892578125, -0.04949188232421875, -0.039821624755859375, -0.0301513671875, -0.020481109619140625, -0.01081085205078125, -0.001140594482421875, 0.0085296630859375, 0.018199920654296875, 0.02787017822265625, 0.037540435791015625, 0.047210693359375, 0.056880950927734375, 0.06655120849609375, 0.07622146606445312, 0.0858917236328125, 0.09556198120117188, 0.10523223876953125, 0.11490249633789062, 0.12457275390625, 0.13424301147460938, 0.14391326904296875, 0.15358352661132812, 0.1632537841796875, 0.17292404174804688, 0.18259429931640625, 0.19226455688476562, 0.201934814453125, 0.21160507202148438, 0.22127532958984375, 0.23094558715820312, 0.2406158447265625, 0.2502861022949219, 0.25995635986328125, 0.2696266174316406, 0.279296875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 55.0, 713.0, 216.0, 19.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.172452926635742, -16.811790466308594, -16.451126098632812, -16.09046173095703, -15.729799270629883, -15.369135856628418, -15.008472442626953, -14.647809028625488, -14.287145614624023, -13.926482200622559, -13.565818786621094, -13.205155372619629, -12.844491958618164, -12.4838285446167, -12.123165130615234, -11.76250171661377, -11.401838302612305, -11.04117488861084, -10.680511474609375, -10.31984806060791, -9.959184646606445, -9.59852123260498, -9.237857818603516, -8.87719440460205, -8.516530990600586, -8.155867576599121, -7.795204162597656, -7.434540748596191, -7.073877334594727, -6.713213920593262, -6.352550506591797, -5.991887092590332, -5.631224632263184, -5.270561218261719, -4.909897804260254, -4.549234390258789, -4.188570976257324, -3.8279075622558594, -3.4672441482543945, -3.1065807342529297, -2.745917320251465, -2.38525390625, -2.024590492248535, -1.6639270782470703, -1.3032636642456055, -0.9426002502441406, -0.5819368362426758, -0.22127342224121094, 0.1393899917602539, 0.5000534057617188, 0.8607168197631836, 1.2213802337646484, 1.5820436477661133, 1.9427070617675781, 2.303370475769043, 2.664033889770508, 3.0246973037719727, 3.3853607177734375, 3.7460241317749023, 4.106687545776367, 4.467350959777832, 4.828014373779297, 5.188677787780762, 5.549341201782227, 5.910004615783691]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 6.0, 3.0, 9.0, 15.0, 15.0, 10.0, 18.0, 35.0, 32.0, 38.0, 48.0, 50.0, 63.0, 53.0, 61.0, 44.0, 69.0, 66.0, 46.0, 57.0, 49.0, 41.0, 37.0, 23.0, 20.0, 22.0, 17.0, 15.0, 10.0, 5.0, 7.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3792190551757812, -2.297229528427124, -2.215240001678467, -2.1332504749298096, -2.0512609481811523, -1.9692714214324951, -1.887281894683838, -1.8052923679351807, -1.7233028411865234, -1.6413133144378662, -1.559323787689209, -1.4773342609405518, -1.3953447341918945, -1.3133552074432373, -1.23136568069458, -1.1493761539459229, -1.0673866271972656, -0.9853971004486084, -0.9034075736999512, -0.821418046951294, -0.7394285202026367, -0.6574389934539795, -0.5754494667053223, -0.49345993995666504, -0.4114704132080078, -0.3294808864593506, -0.24749135971069336, -0.16550183296203613, -0.0835123062133789, -0.0015227794647216797, 0.08046674728393555, 0.16245627403259277, 0.24444580078125, 0.3264353275299072, 0.40842485427856445, 0.4904143810272217, 0.5724039077758789, 0.6543934345245361, 0.7363829612731934, 0.8183724880218506, 0.9003620147705078, 0.982351541519165, 1.0643410682678223, 1.1463305950164795, 1.2283201217651367, 1.310309648513794, 1.3922991752624512, 1.4742887020111084, 1.5562782287597656, 1.6382677555084229, 1.72025728225708, 1.8022468090057373, 1.8842363357543945, 1.9662258625030518, 2.048215389251709, 2.130204916000366, 2.2121944427490234, 2.2941839694976807, 2.376173496246338, 2.458163022994995, 2.5401525497436523, 2.6221420764923096, 2.704131603240967, 2.786121129989624, 2.8681106567382812]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 4.0, 2.0, 7.0, 7.0, 13.0, 6.0, 24.0, 13.0, 25.0, 31.0, 32.0, 44.0, 56.0, 84.0, 112.0, 149.0, 243.0, 470.0, 1061.0, 3158.0, 16811.0, 304873.0, 3817401.0, 41708.0, 5820.0, 1401.0, 448.0, 149.0, 72.0, 33.0, 11.0, 7.0, 4.0, 2.0, 1.0, 1.0], "bins": [-2.439453125, -2.3908462524414062, -2.3422393798828125, -2.2936325073242188, -2.245025634765625, -2.1964187622070312, -2.1478118896484375, -2.0992050170898438, -2.05059814453125, -2.0019912719726562, -1.9533843994140625, -1.9047775268554688, -1.856170654296875, -1.8075637817382812, -1.7589569091796875, -1.7103500366210938, -1.6617431640625, -1.6131362915039062, -1.5645294189453125, -1.5159225463867188, -1.467315673828125, -1.4187088012695312, -1.3701019287109375, -1.3214950561523438, -1.27288818359375, -1.2242813110351562, -1.1756744384765625, -1.1270675659179688, -1.078460693359375, -1.0298538208007812, -0.9812469482421875, -0.9326400756835938, -0.884033203125, -0.8354263305664062, -0.7868194580078125, -0.7382125854492188, -0.689605712890625, -0.6409988403320312, -0.5923919677734375, -0.5437850952148438, -0.49517822265625, -0.44657135009765625, -0.3979644775390625, -0.34935760498046875, -0.300750732421875, -0.25214385986328125, -0.2035369873046875, -0.15493011474609375, -0.1063232421875, -0.05771636962890625, -0.0091094970703125, 0.03949737548828125, 0.088104248046875, 0.13671112060546875, 0.1853179931640625, 0.23392486572265625, 0.28253173828125, 0.33113861083984375, 0.3797454833984375, 0.42835235595703125, 0.476959228515625, 0.5255661010742188, 0.5741729736328125, 0.6227798461914062, 0.67138671875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 11.0, 12.0, 30.0, 56.0, 86.0, 109.0, 138.0, 172.0, 135.0, 104.0, 52.0, 42.0, 26.0, 22.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.352783203125, -0.3457651138305664, -0.3387470245361328, -0.3317289352416992, -0.3247108459472656, -0.31769275665283203, -0.31067466735839844, -0.30365657806396484, -0.29663848876953125, -0.28962039947509766, -0.28260231018066406, -0.27558422088623047, -0.2685661315917969, -0.2615480422973633, -0.2545299530029297, -0.2475118637084961, -0.2404937744140625, -0.2334756851196289, -0.2264575958251953, -0.21943950653076172, -0.21242141723632812, -0.20540332794189453, -0.19838523864746094, -0.19136714935302734, -0.18434906005859375, -0.17733097076416016, -0.17031288146972656, -0.16329479217529297, -0.15627670288085938, -0.14925861358642578, -0.1422405242919922, -0.1352224349975586, -0.128204345703125, -0.1211862564086914, -0.11416816711425781, -0.10715007781982422, -0.10013198852539062, -0.09311389923095703, -0.08609580993652344, -0.07907772064208984, -0.07205963134765625, -0.06504154205322266, -0.05802345275878906, -0.05100536346435547, -0.043987274169921875, -0.03696918487548828, -0.029951095581054688, -0.022933006286621094, -0.0159149169921875, -0.008896827697753906, -0.0018787384033203125, 0.005139350891113281, 0.012157440185546875, 0.01917552947998047, 0.026193618774414062, 0.033211708068847656, 0.04022979736328125, 0.047247886657714844, 0.05426597595214844, 0.06128406524658203, 0.06830215454101562, 0.07532024383544922, 0.08233833312988281, 0.0893564224243164, 0.09637451171875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 10.0, 12.0, 31.0, 79.0, 123.0, 321.0, 1191.0, 84105.0, 4106574.0, 1421.0, 250.0, 83.0, 45.0, 27.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3515625, -7.201904296875, -7.05224609375, -6.902587890625, -6.7529296875, -6.603271484375, -6.45361328125, -6.303955078125, -6.154296875, -6.004638671875, -5.85498046875, -5.705322265625, -5.5556640625, -5.406005859375, -5.25634765625, -5.106689453125, -4.95703125, -4.807373046875, -4.65771484375, -4.508056640625, -4.3583984375, -4.208740234375, -4.05908203125, -3.909423828125, -3.759765625, -3.610107421875, -3.46044921875, -3.310791015625, -3.1611328125, -3.011474609375, -2.86181640625, -2.712158203125, -2.5625, -2.412841796875, -2.26318359375, -2.113525390625, -1.9638671875, -1.814208984375, -1.66455078125, -1.514892578125, -1.365234375, -1.215576171875, -1.06591796875, -0.916259765625, -0.7666015625, -0.616943359375, -0.46728515625, -0.317626953125, -0.16796875, -0.018310546875, 0.13134765625, 0.281005859375, 0.4306640625, 0.580322265625, 0.72998046875, 0.879638671875, 1.029296875, 1.178955078125, 1.32861328125, 1.478271484375, 1.6279296875, 1.777587890625, 1.92724609375, 2.076904296875, 2.2265625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 12.0, 42.0, 94.0, 508.0, 3076.0, 232.0, 53.0, 26.0, 13.0, 9.0, 4.0, 1.0, 2.0, 3.0], "bins": [-0.8466796875, -0.8310966491699219, -0.8155136108398438, -0.7999305725097656, -0.7843475341796875, -0.7687644958496094, -0.7531814575195312, -0.7375984191894531, -0.722015380859375, -0.7064323425292969, -0.6908493041992188, -0.6752662658691406, -0.6596832275390625, -0.6441001892089844, -0.6285171508789062, -0.6129341125488281, -0.59735107421875, -0.5817680358886719, -0.5661849975585938, -0.5506019592285156, -0.5350189208984375, -0.5194358825683594, -0.5038528442382812, -0.4882698059082031, -0.472686767578125, -0.4571037292480469, -0.44152069091796875, -0.4259376525878906, -0.4103546142578125, -0.3947715759277344, -0.37918853759765625, -0.3636054992675781, -0.3480224609375, -0.3324394226074219, -0.31685638427734375, -0.3012733459472656, -0.2856903076171875, -0.2701072692871094, -0.25452423095703125, -0.23894119262695312, -0.223358154296875, -0.20777511596679688, -0.19219207763671875, -0.17660903930664062, -0.1610260009765625, -0.14544296264648438, -0.12985992431640625, -0.11427688598632812, -0.09869384765625, -0.08311080932617188, -0.06752777099609375, -0.051944732666015625, -0.0363616943359375, -0.020778656005859375, -0.00519561767578125, 0.010387420654296875, 0.025970458984375, 0.041553497314453125, 0.05713653564453125, 0.07271957397460938, 0.0883026123046875, 0.10388565063476562, 0.11946868896484375, 0.13505172729492188, 0.150634765625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 4.0, 3.0, 8.0, 15.0, 63.0, 303.0, 457.0, 116.0, 21.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8174827098846436, -3.7092814445495605, -3.6010801792144775, -3.4928789138793945, -3.3846778869628906, -3.2764766216278076, -3.1682753562927246, -3.0600740909576416, -2.9518728256225586, -2.8436715602874756, -2.7354702949523926, -2.6272692680358887, -2.5190680027008057, -2.4108667373657227, -2.3026654720306396, -2.1944642066955566, -2.0862631797790527, -1.9780619144439697, -1.8698607683181763, -1.7616595029830933, -1.6534582376480103, -1.5452570915222168, -1.4370558261871338, -1.3288545608520508, -1.2206532955169678, -1.1124520301818848, -1.0042508840560913, -0.8960496187210083, -0.7878483533859253, -0.6796471476554871, -0.5714459419250488, -0.4632446765899658, -0.3550434112548828, -0.2468421757221222, -0.13864095509052277, -0.03043973445892334, 0.07776150107383728, 0.1859627366065979, 0.29416394233703613, 0.40236520767211914, 0.5105664134025574, 0.6187676191329956, 0.7269688844680786, 0.8351700901985168, 0.9433712959289551, 1.051572561264038, 1.159773826599121, 1.267975091934204, 1.3761762380599976, 1.4843775033950806, 1.592578649520874, 1.700779914855957, 1.80898118019104, 1.917182445526123, 2.025383472442627, 2.133584976196289, 2.241786003112793, 2.349987268447876, 2.458188533782959, 2.566389560699463, 2.674590826034546, 2.782792091369629, 2.890993356704712, 2.999194622039795, 3.107395887374878]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 12.0, 29.0, 44.0, 58.0, 79.0, 81.0, 98.0, 142.0, 113.0, 78.0, 91.0, 57.0, 43.0, 37.0, 15.0, 9.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1972384452819824, -2.1311795711517334, -2.0651204586029053, -1.9990615844726562, -1.9330027103424072, -1.8669437170028687, -1.80088472366333, -1.734825849533081, -1.668766975402832, -1.6027079820632935, -1.5366491079330444, -1.4705901145935059, -1.4045312404632568, -1.3384722471237183, -1.2724132537841797, -1.2063543796539307, -1.140295386314392, -1.0742363929748535, -1.0081775188446045, -0.9421185255050659, -0.8760596513748169, -0.8100006580352783, -0.7439417243003845, -0.6778827905654907, -0.6118238568305969, -0.5457649230957031, -0.4797059893608093, -0.41364702582359314, -0.34758809208869934, -0.28152915835380554, -0.21547019481658936, -0.14941126108169556, -0.08335232734680176, -0.017293386161327362, 0.048765555024147034, 0.11482450366020203, 0.18088343739509583, 0.24694237112998962, 0.3130013346672058, 0.3790602684020996, 0.4451192021369934, 0.5111781358718872, 0.577237069606781, 0.6432960033416748, 0.7093549966812134, 0.7754138708114624, 0.841472864151001, 0.9075317978858948, 0.9735907316207886, 1.0396497249603271, 1.1057085990905762, 1.1717675924301147, 1.2378264665603638, 1.3038854598999023, 1.3699443340301514, 1.43600332736969, 1.5020623207092285, 1.568121314048767, 1.6341801881790161, 1.7002391815185547, 1.7662980556488037, 1.8323570489883423, 1.8984160423278809, 1.9644749164581299, 2.030533790588379]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 2.0, 6.0, 11.0, 16.0, 9.0, 19.0, 36.0, 33.0, 51.0, 81.0, 106.0, 189.0, 359.0, 583.0, 1276.0, 3682.0, 14768.0, 102571.0, 758103.0, 140754.0, 18553.0, 4271.0, 1469.0, 653.0, 332.0, 213.0, 120.0, 75.0, 55.0, 37.0, 31.0, 28.0, 10.0, 16.0, 8.0, 5.0, 7.0, 8.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.85546875, -0.830718994140625, -0.80596923828125, -0.781219482421875, -0.7564697265625, -0.731719970703125, -0.70697021484375, -0.682220458984375, -0.657470703125, -0.632720947265625, -0.60797119140625, -0.583221435546875, -0.5584716796875, -0.533721923828125, -0.50897216796875, -0.484222412109375, -0.45947265625, -0.434722900390625, -0.40997314453125, -0.385223388671875, -0.3604736328125, -0.335723876953125, -0.31097412109375, -0.286224365234375, -0.261474609375, -0.236724853515625, -0.21197509765625, -0.187225341796875, -0.1624755859375, -0.137725830078125, -0.11297607421875, -0.088226318359375, -0.0634765625, -0.038726806640625, -0.01397705078125, 0.010772705078125, 0.0355224609375, 0.060272216796875, 0.08502197265625, 0.109771728515625, 0.134521484375, 0.159271240234375, 0.18402099609375, 0.208770751953125, 0.2335205078125, 0.258270263671875, 0.28302001953125, 0.307769775390625, 0.33251953125, 0.357269287109375, 0.38201904296875, 0.406768798828125, 0.4315185546875, 0.456268310546875, 0.48101806640625, 0.505767822265625, 0.530517578125, 0.555267333984375, 0.58001708984375, 0.604766845703125, 0.6295166015625, 0.654266357421875, 0.67901611328125, 0.703765869140625, 0.728515625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 8.0, 9.0, 15.0, 28.0, 58.0, 73.0, 90.0, 103.0, 129.0, 125.0, 99.0, 98.0, 62.0, 44.0, 24.0, 16.0, 9.0, 4.0, 0.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.358154296875, -0.35033416748046875, -0.3425140380859375, -0.33469390869140625, -0.326873779296875, -0.31905364990234375, -0.3112335205078125, -0.30341339111328125, -0.29559326171875, -0.28777313232421875, -0.2799530029296875, -0.27213287353515625, -0.264312744140625, -0.25649261474609375, -0.2486724853515625, -0.24085235595703125, -0.2330322265625, -0.22521209716796875, -0.2173919677734375, -0.20957183837890625, -0.201751708984375, -0.19393157958984375, -0.1861114501953125, -0.17829132080078125, -0.17047119140625, -0.16265106201171875, -0.1548309326171875, -0.14701080322265625, -0.139190673828125, -0.13137054443359375, -0.1235504150390625, -0.11573028564453125, -0.10791015625, -0.10009002685546875, -0.0922698974609375, -0.08444976806640625, -0.076629638671875, -0.06880950927734375, -0.0609893798828125, -0.05316925048828125, -0.04534912109375, -0.03752899169921875, -0.0297088623046875, -0.02188873291015625, -0.014068603515625, -0.00624847412109375, 0.0015716552734375, 0.00939178466796875, 0.0172119140625, 0.02503204345703125, 0.0328521728515625, 0.04067230224609375, 0.048492431640625, 0.05631256103515625, 0.0641326904296875, 0.07195281982421875, 0.07977294921875, 0.08759307861328125, 0.0954132080078125, 0.10323333740234375, 0.111053466796875, 0.11887359619140625, 0.1266937255859375, 0.13451385498046875, 0.142333984375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 8.0, 8.0, 7.0, 8.0, 14.0, 27.0, 25.0, 47.0, 101.0, 158.0, 336.0, 795.0, 2299.0, 7868.0, 38259.0, 407027.0, 529414.0, 48386.0, 9239.0, 2754.0, 928.0, 390.0, 175.0, 99.0, 51.0, 27.0, 20.0, 17.0, 17.0, 7.0, 3.0, 8.0, 8.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5732421875, -0.5547866821289062, -0.5363311767578125, -0.5178756713867188, -0.499420166015625, -0.48096466064453125, -0.4625091552734375, -0.44405364990234375, -0.42559814453125, -0.40714263916015625, -0.3886871337890625, -0.37023162841796875, -0.351776123046875, -0.33332061767578125, -0.3148651123046875, -0.29640960693359375, -0.2779541015625, -0.25949859619140625, -0.2410430908203125, -0.22258758544921875, -0.204132080078125, -0.18567657470703125, -0.1672210693359375, -0.14876556396484375, -0.13031005859375, -0.11185455322265625, -0.0933990478515625, -0.07494354248046875, -0.056488037109375, -0.03803253173828125, -0.0195770263671875, -0.00112152099609375, 0.017333984375, 0.03578948974609375, 0.0542449951171875, 0.07270050048828125, 0.091156005859375, 0.10961151123046875, 0.1280670166015625, 0.14652252197265625, 0.16497802734375, 0.18343353271484375, 0.2018890380859375, 0.22034454345703125, 0.238800048828125, 0.25725555419921875, 0.2757110595703125, 0.29416656494140625, 0.3126220703125, 0.33107757568359375, 0.3495330810546875, 0.36798858642578125, 0.386444091796875, 0.40489959716796875, 0.4233551025390625, 0.44181060791015625, 0.46026611328125, 0.47872161865234375, 0.4971771240234375, 0.5156326293945312, 0.534088134765625, 0.5525436401367188, 0.5709991455078125, 0.5894546508789062, 0.60791015625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 10.0, 4.0, 9.0, 9.0, 12.0, 7.0, 22.0, 18.0, 34.0, 29.0, 44.0, 46.0, 52.0, 51.0, 54.0, 44.0, 71.0, 57.0, 74.0, 60.0, 47.0, 30.0, 37.0, 34.0, 25.0, 18.0, 20.0, 7.0, 13.0, 14.0, 5.0, 5.0, 5.0, 9.0, 7.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.5009765625, -0.48497772216796875, -0.4689788818359375, -0.45298004150390625, -0.436981201171875, -0.42098236083984375, -0.4049835205078125, -0.38898468017578125, -0.37298583984375, -0.35698699951171875, -0.3409881591796875, -0.32498931884765625, -0.308990478515625, -0.29299163818359375, -0.2769927978515625, -0.26099395751953125, -0.2449951171875, -0.22899627685546875, -0.2129974365234375, -0.19699859619140625, -0.180999755859375, -0.16500091552734375, -0.1490020751953125, -0.13300323486328125, -0.11700439453125, -0.10100555419921875, -0.0850067138671875, -0.06900787353515625, -0.053009033203125, -0.03701019287109375, -0.0210113525390625, -0.00501251220703125, 0.010986328125, 0.02698516845703125, 0.0429840087890625, 0.05898284912109375, 0.074981689453125, 0.09098052978515625, 0.1069793701171875, 0.12297821044921875, 0.13897705078125, 0.15497589111328125, 0.1709747314453125, 0.18697357177734375, 0.202972412109375, 0.21897125244140625, 0.2349700927734375, 0.25096893310546875, 0.2669677734375, 0.28296661376953125, 0.2989654541015625, 0.31496429443359375, 0.330963134765625, 0.34696197509765625, 0.3629608154296875, 0.37895965576171875, 0.39495849609375, 0.41095733642578125, 0.4269561767578125, 0.44295501708984375, 0.458953857421875, 0.47495269775390625, 0.4909515380859375, 0.5069503784179688, 0.52294921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 2.0, 4.0, 6.0, 3.0, 3.0, 6.0, 3.0, 12.0, 8.0, 17.0, 24.0, 47.0, 62.0, 94.0, 207.0, 412.0, 967.0, 2486.0, 7692.0, 39571.0, 739279.0, 232314.0, 17601.0, 4726.0, 1629.0, 685.0, 293.0, 159.0, 84.0, 43.0, 29.0, 20.0, 11.0, 13.0, 7.0, 9.0, 2.0, 9.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.337158203125, -0.3265533447265625, -0.315948486328125, -0.3053436279296875, -0.29473876953125, -0.2841339111328125, -0.273529052734375, -0.2629241943359375, -0.2523193359375, -0.2417144775390625, -0.231109619140625, -0.2205047607421875, -0.20989990234375, -0.1992950439453125, -0.188690185546875, -0.1780853271484375, -0.16748046875, -0.1568756103515625, -0.146270751953125, -0.1356658935546875, -0.12506103515625, -0.1144561767578125, -0.103851318359375, -0.0932464599609375, -0.0826416015625, -0.0720367431640625, -0.061431884765625, -0.0508270263671875, -0.04022216796875, -0.0296173095703125, -0.019012451171875, -0.0084075927734375, 0.002197265625, 0.0128021240234375, 0.023406982421875, 0.0340118408203125, 0.04461669921875, 0.0552215576171875, 0.065826416015625, 0.0764312744140625, 0.0870361328125, 0.0976409912109375, 0.108245849609375, 0.1188507080078125, 0.12945556640625, 0.1400604248046875, 0.150665283203125, 0.1612701416015625, 0.171875, 0.1824798583984375, 0.193084716796875, 0.2036895751953125, 0.21429443359375, 0.2248992919921875, 0.235504150390625, 0.2461090087890625, 0.2567138671875, 0.2673187255859375, 0.277923583984375, 0.2885284423828125, 0.29913330078125, 0.3097381591796875, 0.320343017578125, 0.3309478759765625, 0.341552734375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 7.0, 5.0, 9.0, 9.0, 23.0, 27.0, 28.0, 39.0, 52.0, 60.0, 81.0, 100.0, 102.0, 121.0, 80.0, 52.0, 43.0, 45.0, 19.0, 17.0, 20.0, 17.0, 13.0, 6.0, 5.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020074844360351562, -0.00019417330622673035, -0.00018759816884994507, -0.0001810230314731598, -0.0001744478940963745, -0.00016787275671958923, -0.00016129761934280396, -0.00015472248196601868, -0.0001481473445892334, -0.00014157220721244812, -0.00013499706983566284, -0.00012842193245887756, -0.00012184679508209229, -0.00011527165770530701, -0.00010869652032852173, -0.00010212138295173645, -9.554624557495117e-05, -8.89711081981659e-05, -8.239597082138062e-05, -7.582083344459534e-05, -6.924569606781006e-05, -6.267055869102478e-05, -5.60954213142395e-05, -4.9520283937454224e-05, -4.2945146560668945e-05, -3.637000918388367e-05, -2.979487180709839e-05, -2.321973443031311e-05, -1.6644597053527832e-05, -1.0069459676742554e-05, -3.4943222999572754e-06, 3.080815076828003e-06, 9.655952453613281e-06, 1.623108983039856e-05, 2.2806227207183838e-05, 2.9381364583969116e-05, 3.5956501960754395e-05, 4.253163933753967e-05, 4.910677671432495e-05, 5.568191409111023e-05, 6.225705146789551e-05, 6.883218884468079e-05, 7.540732622146606e-05, 8.198246359825134e-05, 8.855760097503662e-05, 9.51327383518219e-05, 0.00010170787572860718, 0.00010828301310539246, 0.00011485815048217773, 0.00012143328785896301, 0.0001280084252357483, 0.00013458356261253357, 0.00014115869998931885, 0.00014773383736610413, 0.0001543089747428894, 0.00016088411211967468, 0.00016745924949645996, 0.00017403438687324524, 0.00018060952425003052, 0.0001871846616268158, 0.00019375979900360107, 0.00020033493638038635, 0.00020691007375717163, 0.0002134852111339569, 0.0002200603485107422]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 8.0, 2.0, 9.0, 10.0, 7.0, 5.0, 20.0, 27.0, 29.0, 64.0, 62.0, 93.0, 157.0, 233.0, 363.0, 681.0, 1137.0, 2168.0, 4105.0, 8915.0, 29630.0, 224974.0, 659007.0, 86581.0, 16838.0, 6391.0, 3094.0, 1643.0, 871.0, 515.0, 319.0, 190.0, 105.0, 81.0, 47.0, 36.0, 23.0, 33.0, 27.0, 12.0, 13.0, 6.0, 7.0, 8.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2147216796875, -0.20827293395996094, -0.20182418823242188, -0.1953754425048828, -0.18892669677734375, -0.1824779510498047, -0.17602920532226562, -0.16958045959472656, -0.1631317138671875, -0.15668296813964844, -0.15023422241210938, -0.1437854766845703, -0.13733673095703125, -0.1308879852294922, -0.12443923950195312, -0.11799049377441406, -0.111541748046875, -0.10509300231933594, -0.09864425659179688, -0.09219551086425781, -0.08574676513671875, -0.07929801940917969, -0.07284927368164062, -0.06640052795410156, -0.0599517822265625, -0.05350303649902344, -0.047054290771484375, -0.04060554504394531, -0.03415679931640625, -0.027708053588867188, -0.021259307861328125, -0.014810562133789062, -0.00836181640625, -0.0019130706787109375, 0.004535675048828125, 0.010984420776367188, 0.01743316650390625, 0.023881912231445312, 0.030330657958984375, 0.03677940368652344, 0.0432281494140625, 0.04967689514160156, 0.056125640869140625, 0.06257438659667969, 0.06902313232421875, 0.07547187805175781, 0.08192062377929688, 0.08836936950683594, 0.094818115234375, 0.10126686096191406, 0.10771560668945312, 0.11416435241699219, 0.12061309814453125, 0.1270618438720703, 0.13351058959960938, 0.13995933532714844, 0.1464080810546875, 0.15285682678222656, 0.15930557250976562, 0.1657543182373047, 0.17220306396484375, 0.1786518096923828, 0.18510055541992188, 0.19154930114746094, 0.197998046875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 2.0, 2.0, 8.0, 10.0, 10.0, 23.0, 44.0, 63.0, 89.0, 142.0, 180.0, 149.0, 99.0, 57.0, 38.0, 25.0, 15.0, 10.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2044677734375, -0.19840049743652344, -0.19233322143554688, -0.1862659454345703, -0.18019866943359375, -0.1741313934326172, -0.16806411743164062, -0.16199684143066406, -0.1559295654296875, -0.14986228942871094, -0.14379501342773438, -0.1377277374267578, -0.13166046142578125, -0.1255931854248047, -0.11952590942382812, -0.11345863342285156, -0.107391357421875, -0.10132408142089844, -0.09525680541992188, -0.08918952941894531, -0.08312225341796875, -0.07705497741699219, -0.07098770141601562, -0.06492042541503906, -0.0588531494140625, -0.05278587341308594, -0.046718597412109375, -0.04065132141113281, -0.03458404541015625, -0.028516769409179688, -0.022449493408203125, -0.016382217407226562, -0.01031494140625, -0.0042476654052734375, 0.001819610595703125, 0.007886886596679688, 0.01395416259765625, 0.020021438598632812, 0.026088714599609375, 0.03215599060058594, 0.0382232666015625, 0.04429054260253906, 0.050357818603515625, 0.05642509460449219, 0.06249237060546875, 0.06855964660644531, 0.07462692260742188, 0.08069419860839844, 0.086761474609375, 0.09282875061035156, 0.09889602661132812, 0.10496330261230469, 0.11103057861328125, 0.11709785461425781, 0.12316513061523438, 0.12923240661621094, 0.1352996826171875, 0.14136695861816406, 0.14743423461914062, 0.1535015106201172, 0.15956878662109375, 0.1656360626220703, 0.17170333862304688, 0.17777061462402344, 0.183837890625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 7.0, 8.0, 27.0, 52.0, 88.0, 158.0, 219.0, 190.0, 107.0, 57.0, 30.0, 12.0, 14.0, 4.0, 9.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4275474548339844, -3.336244821548462, -3.2449419498443604, -3.153639316558838, -3.0623364448547363, -2.971033811569214, -2.8797311782836914, -2.78842830657959, -2.6971256732940674, -2.605823040008545, -2.5145201683044434, -2.423217535018921, -2.3319146633148193, -2.240612030029297, -2.1493091583251953, -2.058006525039673, -1.9667037725448608, -1.8754010200500488, -1.7840982675552368, -1.6927955150604248, -1.6014928817749023, -1.5101901292800903, -1.4188873767852783, -1.3275847434997559, -1.2362818717956543, -1.1449791193008423, -1.0536763668060303, -0.962373673915863, -0.8710709810256958, -0.7797682285308838, -0.6884654760360718, -0.5971627831459045, -0.5058600902557373, -0.4145573675632477, -0.32325464487075806, -0.23195189237594604, -0.14064916968345642, -0.0493464469909668, 0.041956305503845215, 0.13325899839401245, 0.22456175088882446, 0.3158644735813141, 0.4071671962738037, 0.4984699487686157, 0.5897727012634277, 0.681075394153595, 0.772378146648407, 0.8636808395385742, 0.9549835920333862, 1.0462863445281982, 1.1375890970230103, 1.2288918495178223, 1.3201944828033447, 1.4114972352981567, 1.5027999877929688, 1.5941026210784912, 1.6854054927825928, 1.7767082452774048, 1.8680109977722168, 1.9593136310577393, 2.050616502761841, 2.1419191360473633, 2.233222007751465, 2.3245246410369873, 2.4158272743225098]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 8.0, 3.0, 2.0, 10.0, 6.0, 7.0, 15.0, 21.0, 15.0, 19.0, 26.0, 27.0, 29.0, 34.0, 43.0, 33.0, 38.0, 43.0, 47.0, 38.0, 47.0, 42.0, 44.0, 42.0, 37.0, 43.0, 51.0, 33.0, 28.0, 20.0, 29.0, 23.0, 12.0, 16.0, 12.0, 12.0, 7.0, 12.0, 7.0, 10.0, 5.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.403439521789551, -2.3265132904052734, -2.249587059020996, -2.1726608276367188, -2.0957345962524414, -2.018808364868164, -1.9418822526931763, -1.864956021308899, -1.7880297899246216, -1.7111035585403442, -1.634177327156067, -1.5572510957717896, -1.4803249835968018, -1.4033987522125244, -1.326472520828247, -1.2495462894439697, -1.1726200580596924, -1.095693826675415, -1.0187675952911377, -0.9418414235115051, -0.8649151921272278, -0.7879889607429504, -0.7110627889633179, -0.6341365575790405, -0.5572103261947632, -0.48028409481048584, -0.4033578932285309, -0.3264316916465759, -0.24950546026229858, -0.17257922887802124, -0.09565302729606628, -0.018726825714111328, 0.058199405670166016, 0.13512562215328217, 0.21205183863639832, 0.28897804021835327, 0.3659042716026306, 0.44283050298690796, 0.5197566747665405, 0.5966829061508179, 0.6736091375350952, 0.7505353689193726, 0.8274616003036499, 0.9043877720832825, 0.9813140034675598, 1.0582401752471924, 1.1351664066314697, 1.212092638015747, 1.2890188694000244, 1.3659451007843018, 1.442871332168579, 1.5197975635528564, 1.5967237949371338, 1.6736500263214111, 1.750576138496399, 1.8275023698806763, 1.9044286012649536, 1.981354832649231, 2.0582809448242188, 2.135207176208496, 2.2121334075927734, 2.289059638977051, 2.365985870361328, 2.4429121017456055, 2.519838333129883]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 2.0, 6.0, 8.0, 5.0, 13.0, 10.0, 18.0, 18.0, 37.0, 37.0, 55.0, 65.0, 96.0, 131.0, 195.0, 282.0, 522.0, 1033.0, 2577.0, 8856.0, 54036.0, 3771524.0, 322194.0, 24179.0, 5139.0, 1719.0, 724.0, 363.0, 195.0, 97.0, 57.0, 29.0, 20.0, 18.0, 8.0, 5.0, 1.0, 0.0, 5.0, 2.0], "bins": [-1.498046875, -1.46533203125, -1.4326171875, -1.39990234375, -1.3671875, -1.33447265625, -1.3017578125, -1.26904296875, -1.236328125, -1.20361328125, -1.1708984375, -1.13818359375, -1.10546875, -1.07275390625, -1.0400390625, -1.00732421875, -0.974609375, -0.94189453125, -0.9091796875, -0.87646484375, -0.84375, -0.81103515625, -0.7783203125, -0.74560546875, -0.712890625, -0.68017578125, -0.6474609375, -0.61474609375, -0.58203125, -0.54931640625, -0.5166015625, -0.48388671875, -0.451171875, -0.41845703125, -0.3857421875, -0.35302734375, -0.3203125, -0.28759765625, -0.2548828125, -0.22216796875, -0.189453125, -0.15673828125, -0.1240234375, -0.09130859375, -0.05859375, -0.02587890625, 0.0068359375, 0.03955078125, 0.072265625, 0.10498046875, 0.1376953125, 0.17041015625, 0.203125, 0.23583984375, 0.2685546875, 0.30126953125, 0.333984375, 0.36669921875, 0.3994140625, 0.43212890625, 0.46484375, 0.49755859375, 0.5302734375, 0.56298828125, 0.595703125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 16.0, 11.0, 29.0, 42.0, 76.0, 99.0, 96.0, 107.0, 126.0, 100.0, 82.0, 89.0, 47.0, 25.0, 22.0, 9.0, 8.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.364990234375, -0.3570709228515625, -0.349151611328125, -0.3412322998046875, -0.33331298828125, -0.3253936767578125, -0.317474365234375, -0.3095550537109375, -0.3016357421875, -0.2937164306640625, -0.285797119140625, -0.2778778076171875, -0.26995849609375, -0.2620391845703125, -0.254119873046875, -0.2462005615234375, -0.23828125, -0.2303619384765625, -0.222442626953125, -0.2145233154296875, -0.20660400390625, -0.1986846923828125, -0.190765380859375, -0.1828460693359375, -0.1749267578125, -0.1670074462890625, -0.159088134765625, -0.1511688232421875, -0.14324951171875, -0.1353302001953125, -0.127410888671875, -0.1194915771484375, -0.111572265625, -0.1036529541015625, -0.095733642578125, -0.0878143310546875, -0.07989501953125, -0.0719757080078125, -0.064056396484375, -0.0561370849609375, -0.0482177734375, -0.0402984619140625, -0.032379150390625, -0.0244598388671875, -0.01654052734375, -0.0086212158203125, -0.000701904296875, 0.0072174072265625, 0.01513671875, 0.0230560302734375, 0.030975341796875, 0.0388946533203125, 0.04681396484375, 0.0547332763671875, 0.062652587890625, 0.0705718994140625, 0.0784912109375, 0.0864105224609375, 0.094329833984375, 0.1022491455078125, 0.11016845703125, 0.1180877685546875, 0.126007080078125, 0.1339263916015625, 0.141845703125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 10.0, 42.0, 46.0, 136.0, 245.0, 549.0, 2116.0, 30431.0, 4116669.0, 40785.0, 2206.0, 603.0, 267.0, 94.0, 39.0, 18.0, 11.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.46484375, -1.41839599609375, -1.3719482421875, -1.32550048828125, -1.279052734375, -1.23260498046875, -1.1861572265625, -1.13970947265625, -1.09326171875, -1.04681396484375, -1.0003662109375, -0.95391845703125, -0.907470703125, -0.86102294921875, -0.8145751953125, -0.76812744140625, -0.7216796875, -0.67523193359375, -0.6287841796875, -0.58233642578125, -0.535888671875, -0.48944091796875, -0.4429931640625, -0.39654541015625, -0.35009765625, -0.30364990234375, -0.2572021484375, -0.21075439453125, -0.164306640625, -0.11785888671875, -0.0714111328125, -0.02496337890625, 0.021484375, 0.06793212890625, 0.1143798828125, 0.16082763671875, 0.207275390625, 0.25372314453125, 0.3001708984375, 0.34661865234375, 0.39306640625, 0.43951416015625, 0.4859619140625, 0.53240966796875, 0.578857421875, 0.62530517578125, 0.6717529296875, 0.71820068359375, 0.7646484375, 0.81109619140625, 0.8575439453125, 0.90399169921875, 0.950439453125, 0.99688720703125, 1.0433349609375, 1.08978271484375, 1.13623046875, 1.18267822265625, 1.2291259765625, 1.27557373046875, 1.322021484375, 1.36846923828125, 1.4149169921875, 1.46136474609375, 1.5078125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 9.0, 7.0, 5.0, 13.0, 21.0, 43.0, 111.0, 347.0, 2571.0, 686.0, 146.0, 62.0, 28.0, 5.0, 14.0, 12.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.256103515625, -0.24776077270507812, -0.23941802978515625, -0.23107528686523438, -0.2227325439453125, -0.21438980102539062, -0.20604705810546875, -0.19770431518554688, -0.189361572265625, -0.18101882934570312, -0.17267608642578125, -0.16433334350585938, -0.1559906005859375, -0.14764785766601562, -0.13930511474609375, -0.13096237182617188, -0.12261962890625, -0.11427688598632812, -0.10593414306640625, -0.09759140014648438, -0.0892486572265625, -0.08090591430664062, -0.07256317138671875, -0.06422042846679688, -0.055877685546875, -0.047534942626953125, -0.03919219970703125, -0.030849456787109375, -0.0225067138671875, -0.014163970947265625, -0.00582122802734375, 0.002521514892578125, 0.0108642578125, 0.019207000732421875, 0.02754974365234375, 0.035892486572265625, 0.0442352294921875, 0.052577972412109375, 0.06092071533203125, 0.06926345825195312, 0.077606201171875, 0.08594894409179688, 0.09429168701171875, 0.10263442993164062, 0.1109771728515625, 0.11931991577148438, 0.12766265869140625, 0.13600540161132812, 0.14434814453125, 0.15269088745117188, 0.16103363037109375, 0.16937637329101562, 0.1777191162109375, 0.18606185913085938, 0.19440460205078125, 0.20274734497070312, 0.211090087890625, 0.21943283081054688, 0.22777557373046875, 0.23611831665039062, 0.2444610595703125, 0.2528038024902344, 0.26114654541015625, 0.2694892883300781, 0.27783203125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 10.0, 14.0, 90.0, 527.0, 329.0, 28.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.754229545593262, -4.660699844360352, -4.5671706199646, -4.4736409187316895, -4.3801116943359375, -4.286581993103027, -4.193052768707275, -4.099523067474365, -4.005993843078613, -3.9124643802642822, -3.818934917449951, -3.72540545463562, -3.631875991821289, -3.538346529006958, -3.444817066192627, -3.351287603378296, -3.257758140563965, -3.164228677749634, -3.0706992149353027, -2.9771697521209717, -2.8836402893066406, -2.7901108264923096, -2.6965813636779785, -2.6030519008636475, -2.5095221996307373, -2.4159927368164062, -2.322463274002075, -2.228933811187744, -2.135404348373413, -2.041874885559082, -1.948345422744751, -1.85481595993042, -1.7612864971160889, -1.6677570343017578, -1.5742275714874268, -1.4806981086730957, -1.3871686458587646, -1.2936391830444336, -1.2001097202301025, -1.1065802574157715, -1.0130507946014404, -0.9195213317871094, -0.8259918689727783, -0.7324624061584473, -0.6389329433441162, -0.5454034805297852, -0.4518739581108093, -0.35834449529647827, -0.26481497287750244, -0.1712855100631714, -0.07775603234767914, 0.01577344536781311, 0.10930290818214417, 0.20283237099647522, 0.29636186361312866, 0.3898913264274597, 0.48342078924179077, 0.5769502520561218, 0.6704797148704529, 0.7640092372894287, 0.8575387001037598, 0.9510681629180908, 1.0445976257324219, 1.138127088546753, 1.231656551361084]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 12.0, 6.0, 15.0, 18.0, 14.0, 24.0, 29.0, 25.0, 25.0, 45.0, 47.0, 63.0, 62.0, 52.0, 64.0, 53.0, 60.0, 59.0, 37.0, 51.0, 32.0, 36.0, 35.0, 36.0, 20.0, 15.0, 14.0, 9.0, 3.0, 10.0, 7.0, 8.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5759319067001343, -0.5590312480926514, -0.5421305298805237, -0.5252298712730408, -0.5083291530609131, -0.4914284944534302, -0.4745278060436249, -0.4576271176338196, -0.4407264292240143, -0.423825740814209, -0.4069250524044037, -0.3900243639945984, -0.3731237053871155, -0.3562229871749878, -0.3393223285675049, -0.3224216401576996, -0.3055209517478943, -0.288620263338089, -0.2717195749282837, -0.2548188865184784, -0.2379182130098343, -0.221017524600029, -0.2041168510913849, -0.1872161626815796, -0.1703154742717743, -0.153414785861969, -0.1365140974521637, -0.11961342394351959, -0.1027127355337143, -0.085812047123909, -0.0689113661646843, -0.052010685205459595, -0.0351099967956543, -0.018209312111139297, -0.001308627426624298, 0.015592057257890701, 0.0324927419424057, 0.049393430352211, 0.0662941113114357, 0.0831947922706604, 0.1000954806804657, 0.116996169090271, 0.1338968575000763, 0.1507975310087204, 0.1676982194185257, 0.184598907828331, 0.2014995813369751, 0.2184002697467804, 0.2353009581565857, 0.252201646566391, 0.2691023349761963, 0.2860030233860016, 0.3029037117958069, 0.3198043704032898, 0.3367050588130951, 0.3536057472229004, 0.3705064356327057, 0.387407124042511, 0.4043078124523163, 0.4212085008621216, 0.4381091594696045, 0.4550098776817322, 0.4719105362892151, 0.4888112246990204, 0.5057119131088257]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 4.0, 8.0, 8.0, 8.0, 16.0, 24.0, 33.0, 45.0, 64.0, 109.0, 182.0, 326.0, 728.0, 1666.0, 5611.0, 30722.0, 406472.0, 551782.0, 40587.0, 6510.0, 1963.0, 802.0, 361.0, 202.0, 108.0, 60.0, 55.0, 35.0, 24.0, 12.0, 14.0, 6.0, 10.0, 4.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9697265625, -0.9420700073242188, -0.9144134521484375, -0.8867568969726562, -0.859100341796875, -0.8314437866210938, -0.8037872314453125, -0.7761306762695312, -0.74847412109375, -0.7208175659179688, -0.6931610107421875, -0.6655044555664062, -0.637847900390625, -0.6101913452148438, -0.5825347900390625, -0.5548782348632812, -0.5272216796875, -0.49956512451171875, -0.4719085693359375, -0.44425201416015625, -0.416595458984375, -0.38893890380859375, -0.3612823486328125, -0.33362579345703125, -0.30596923828125, -0.27831268310546875, -0.2506561279296875, -0.22299957275390625, -0.195343017578125, -0.16768646240234375, -0.1400299072265625, -0.11237335205078125, -0.084716796875, -0.05706024169921875, -0.0294036865234375, -0.00174713134765625, 0.025909423828125, 0.05356597900390625, 0.0812225341796875, 0.10887908935546875, 0.13653564453125, 0.16419219970703125, 0.1918487548828125, 0.21950531005859375, 0.247161865234375, 0.27481842041015625, 0.3024749755859375, 0.33013153076171875, 0.3577880859375, 0.38544464111328125, 0.4131011962890625, 0.44075775146484375, 0.468414306640625, 0.49607086181640625, 0.5237274169921875, 0.5513839721679688, 0.57904052734375, 0.6066970825195312, 0.6343536376953125, 0.6620101928710938, 0.689666748046875, 0.7173233032226562, 0.7449798583984375, 0.7726364135742188, 0.80029296875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 11.0, 19.0, 39.0, 54.0, 77.0, 83.0, 114.0, 113.0, 106.0, 101.0, 72.0, 77.0, 44.0, 33.0, 20.0, 9.0, 5.0, 3.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.3544921875, -0.346588134765625, -0.33868408203125, -0.330780029296875, -0.3228759765625, -0.314971923828125, -0.30706787109375, -0.299163818359375, -0.291259765625, -0.283355712890625, -0.27545166015625, -0.267547607421875, -0.2596435546875, -0.251739501953125, -0.24383544921875, -0.235931396484375, -0.22802734375, -0.220123291015625, -0.21221923828125, -0.204315185546875, -0.1964111328125, -0.188507080078125, -0.18060302734375, -0.172698974609375, -0.164794921875, -0.156890869140625, -0.14898681640625, -0.141082763671875, -0.1331787109375, -0.125274658203125, -0.11737060546875, -0.109466552734375, -0.1015625, -0.093658447265625, -0.08575439453125, -0.077850341796875, -0.0699462890625, -0.062042236328125, -0.05413818359375, -0.046234130859375, -0.038330078125, -0.030426025390625, -0.02252197265625, -0.014617919921875, -0.0067138671875, 0.001190185546875, 0.00909423828125, 0.016998291015625, 0.02490234375, 0.032806396484375, 0.04071044921875, 0.048614501953125, 0.0565185546875, 0.064422607421875, 0.07232666015625, 0.080230712890625, 0.088134765625, 0.096038818359375, 0.10394287109375, 0.111846923828125, 0.1197509765625, 0.127655029296875, 0.13555908203125, 0.143463134765625, 0.1513671875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 8.0, 8.0, 13.0, 20.0, 30.0, 51.0, 82.0, 163.0, 358.0, 861.0, 2932.0, 14276.0, 166386.0, 790330.0, 62244.0, 7750.0, 1852.0, 636.0, 246.0, 127.0, 62.0, 39.0, 21.0, 13.0, 10.0, 9.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.021484375, -0.9948348999023438, -0.9681854248046875, -0.9415359497070312, -0.914886474609375, -0.8882369995117188, -0.8615875244140625, -0.8349380493164062, -0.80828857421875, -0.7816390991210938, -0.7549896240234375, -0.7283401489257812, -0.701690673828125, -0.6750411987304688, -0.6483917236328125, -0.6217422485351562, -0.5950927734375, -0.5684432983398438, -0.5417938232421875, -0.5151443481445312, -0.488494873046875, -0.46184539794921875, -0.4351959228515625, -0.40854644775390625, -0.38189697265625, -0.35524749755859375, -0.3285980224609375, -0.30194854736328125, -0.275299072265625, -0.24864959716796875, -0.2220001220703125, -0.19535064697265625, -0.168701171875, -0.14205169677734375, -0.1154022216796875, -0.08875274658203125, -0.062103271484375, -0.03545379638671875, -0.0088043212890625, 0.01784515380859375, 0.04449462890625, 0.07114410400390625, 0.0977935791015625, 0.12444305419921875, 0.151092529296875, 0.17774200439453125, 0.2043914794921875, 0.23104095458984375, 0.2576904296875, 0.28433990478515625, 0.3109893798828125, 0.33763885498046875, 0.364288330078125, 0.39093780517578125, 0.4175872802734375, 0.44423675537109375, 0.47088623046875, 0.49753570556640625, 0.5241851806640625, 0.5508346557617188, 0.577484130859375, 0.6041336059570312, 0.6307830810546875, 0.6574325561523438, 0.68408203125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 5.0, 4.0, 8.0, 7.0, 18.0, 15.0, 22.0, 33.0, 34.0, 61.0, 51.0, 63.0, 72.0, 78.0, 75.0, 94.0, 87.0, 50.0, 52.0, 41.0, 38.0, 21.0, 25.0, 10.0, 10.0, 7.0, 8.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.99755859375, -0.9715118408203125, -0.945465087890625, -0.9194183349609375, -0.89337158203125, -0.8673248291015625, -0.841278076171875, -0.8152313232421875, -0.7891845703125, -0.7631378173828125, -0.737091064453125, -0.7110443115234375, -0.68499755859375, -0.6589508056640625, -0.632904052734375, -0.6068572998046875, -0.580810546875, -0.5547637939453125, -0.528717041015625, -0.5026702880859375, -0.47662353515625, -0.4505767822265625, -0.424530029296875, -0.3984832763671875, -0.3724365234375, -0.3463897705078125, -0.320343017578125, -0.2942962646484375, -0.26824951171875, -0.2422027587890625, -0.216156005859375, -0.1901092529296875, -0.1640625, -0.1380157470703125, -0.111968994140625, -0.0859222412109375, -0.05987548828125, -0.0338287353515625, -0.007781982421875, 0.0182647705078125, 0.0443115234375, 0.0703582763671875, 0.096405029296875, 0.1224517822265625, 0.14849853515625, 0.1745452880859375, 0.200592041015625, 0.2266387939453125, 0.252685546875, 0.2787322998046875, 0.304779052734375, 0.3308258056640625, 0.35687255859375, 0.3829193115234375, 0.408966064453125, 0.4350128173828125, 0.4610595703125, 0.4871063232421875, 0.513153076171875, 0.5391998291015625, 0.56524658203125, 0.5912933349609375, 0.617340087890625, 0.6433868408203125, 0.66943359375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 10.0, 13.0, 14.0, 45.0, 59.0, 155.0, 327.0, 830.0, 3206.0, 24965.0, 657966.0, 343261.0, 14333.0, 2206.0, 636.0, 248.0, 119.0, 64.0, 36.0, 23.0, 8.0, 8.0, 7.0, 5.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.474853515625, -0.46378135681152344, -0.4527091979980469, -0.4416370391845703, -0.43056488037109375, -0.4194927215576172, -0.4084205627441406, -0.39734840393066406, -0.3862762451171875, -0.37520408630371094, -0.3641319274902344, -0.3530597686767578, -0.34198760986328125, -0.3309154510498047, -0.3198432922363281, -0.30877113342285156, -0.297698974609375, -0.28662681579589844, -0.2755546569824219, -0.2644824981689453, -0.25341033935546875, -0.2423381805419922, -0.23126602172851562, -0.22019386291503906, -0.2091217041015625, -0.19804954528808594, -0.18697738647460938, -0.1759052276611328, -0.16483306884765625, -0.1537609100341797, -0.14268875122070312, -0.13161659240722656, -0.12054443359375, -0.10947227478027344, -0.09840011596679688, -0.08732795715332031, -0.07625579833984375, -0.06518363952636719, -0.054111480712890625, -0.04303932189941406, -0.0319671630859375, -0.020895004272460938, -0.009822845458984375, 0.0012493133544921875, 0.01232147216796875, 0.023393630981445312, 0.034465789794921875, 0.04553794860839844, 0.056610107421875, 0.06768226623535156, 0.07875442504882812, 0.08982658386230469, 0.10089874267578125, 0.11197090148925781, 0.12304306030273438, 0.13411521911621094, 0.1451873779296875, 0.15625953674316406, 0.16733169555664062, 0.1784038543701172, 0.18947601318359375, 0.2005481719970703, 0.21162033081054688, 0.22269248962402344, 0.2337646484375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 9.0, 21.0, 11.0, 24.0, 37.0, 47.0, 63.0, 93.0, 117.0, 144.0, 125.0, 94.0, 72.0, 43.0, 37.0, 24.0, 12.0, 10.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002193450927734375, -0.00021189451217651367, -0.00020444393157958984, -0.00019699335098266602, -0.0001895427703857422, -0.00018209218978881836, -0.00017464160919189453, -0.0001671910285949707, -0.00015974044799804688, -0.00015228986740112305, -0.00014483928680419922, -0.0001373887062072754, -0.00012993812561035156, -0.00012248754501342773, -0.0001150369644165039, -0.00010758638381958008, -0.00010013580322265625, -9.268522262573242e-05, -8.52346420288086e-05, -7.778406143188477e-05, -7.033348083496094e-05, -6.288290023803711e-05, -5.543231964111328e-05, -4.798173904418945e-05, -4.0531158447265625e-05, -3.30805778503418e-05, -2.562999725341797e-05, -1.817941665649414e-05, -1.0728836059570312e-05, -3.2782554626464844e-06, 4.172325134277344e-06, 1.1622905731201172e-05, 1.9073486328125e-05, 2.6524066925048828e-05, 3.3974647521972656e-05, 4.1425228118896484e-05, 4.887580871582031e-05, 5.632638931274414e-05, 6.377696990966797e-05, 7.12275505065918e-05, 7.867813110351562e-05, 8.612871170043945e-05, 9.357929229736328e-05, 0.00010102987289428711, 0.00010848045349121094, 0.00011593103408813477, 0.0001233816146850586, 0.00013083219528198242, 0.00013828277587890625, 0.00014573335647583008, 0.0001531839370727539, 0.00016063451766967773, 0.00016808509826660156, 0.0001755356788635254, 0.00018298625946044922, 0.00019043684005737305, 0.00019788742065429688, 0.0002053380012512207, 0.00021278858184814453, 0.00022023916244506836, 0.0002276897430419922, 0.00023514032363891602, 0.00024259090423583984, 0.00025004148483276367, 0.0002574920654296875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 9.0, 15.0, 21.0, 29.0, 45.0, 81.0, 160.0, 292.0, 636.0, 1443.0, 3893.0, 15761.0, 128755.0, 724536.0, 148430.0, 17272.0, 4249.0, 1508.0, 644.0, 347.0, 165.0, 91.0, 51.0, 44.0, 25.0, 11.0, 13.0, 7.0, 6.0, 3.0, 0.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.209228515625, -0.20214271545410156, -0.19505691528320312, -0.1879711151123047, -0.18088531494140625, -0.1737995147705078, -0.16671371459960938, -0.15962791442871094, -0.1525421142578125, -0.14545631408691406, -0.13837051391601562, -0.1312847137451172, -0.12419891357421875, -0.11711311340332031, -0.11002731323242188, -0.10294151306152344, -0.095855712890625, -0.08876991271972656, -0.08168411254882812, -0.07459831237792969, -0.06751251220703125, -0.06042671203613281, -0.053340911865234375, -0.04625511169433594, -0.0391693115234375, -0.03208351135253906, -0.024997711181640625, -0.017911911010742188, -0.01082611083984375, -0.0037403106689453125, 0.003345489501953125, 0.010431289672851562, 0.01751708984375, 0.024602890014648438, 0.031688690185546875, 0.03877449035644531, 0.04586029052734375, 0.05294609069824219, 0.060031890869140625, 0.06711769104003906, 0.0742034912109375, 0.08128929138183594, 0.08837509155273438, 0.09546089172363281, 0.10254669189453125, 0.10963249206542969, 0.11671829223632812, 0.12380409240722656, 0.130889892578125, 0.13797569274902344, 0.14506149291992188, 0.1521472930908203, 0.15923309326171875, 0.1663188934326172, 0.17340469360351562, 0.18049049377441406, 0.1875762939453125, 0.19466209411621094, 0.20174789428710938, 0.2088336944580078, 0.21591949462890625, 0.2230052947998047, 0.23009109497070312, 0.23717689514160156, 0.2442626953125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 9.0, 11.0, 28.0, 35.0, 60.0, 119.0, 146.0, 136.0, 142.0, 121.0, 72.0, 40.0, 23.0, 17.0, 11.0, 11.0, 3.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2012939453125, -0.19450759887695312, -0.18772125244140625, -0.18093490600585938, -0.1741485595703125, -0.16736221313476562, -0.16057586669921875, -0.15378952026367188, -0.147003173828125, -0.14021682739257812, -0.13343048095703125, -0.12664413452148438, -0.1198577880859375, -0.11307144165039062, -0.10628509521484375, -0.09949874877929688, -0.09271240234375, -0.08592605590820312, -0.07913970947265625, -0.07235336303710938, -0.0655670166015625, -0.058780670166015625, -0.05199432373046875, -0.045207977294921875, -0.038421630859375, -0.031635284423828125, -0.02484893798828125, -0.018062591552734375, -0.0112762451171875, -0.004489898681640625, 0.00229644775390625, 0.009082794189453125, 0.015869140625, 0.022655487060546875, 0.02944183349609375, 0.036228179931640625, 0.0430145263671875, 0.049800872802734375, 0.05658721923828125, 0.06337356567382812, 0.070159912109375, 0.07694625854492188, 0.08373260498046875, 0.09051895141601562, 0.0973052978515625, 0.10409164428710938, 0.11087799072265625, 0.11766433715820312, 0.12445068359375, 0.13123703002929688, 0.13802337646484375, 0.14480972290039062, 0.1515960693359375, 0.15838241577148438, 0.16516876220703125, 0.17195510864257812, 0.178741455078125, 0.18552780151367188, 0.19231414794921875, 0.19910049438476562, 0.2058868408203125, 0.21267318725585938, 0.21945953369140625, 0.22624588012695312, 0.2330322265625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 9.0, 24.0, 113.0, 350.0, 324.0, 122.0, 47.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-11.79746150970459, -11.58298110961914, -11.368501663208008, -11.154021263122559, -10.93954086303711, -10.72506046295166, -10.510580062866211, -10.296100616455078, -10.081620216369629, -9.86713981628418, -9.652660369873047, -9.438179969787598, -9.223699569702148, -9.0092191696167, -8.79473876953125, -8.580259323120117, -8.365778923034668, -8.151298522949219, -7.936818599700928, -7.722338676452637, -7.5078582763671875, -7.293377876281738, -7.078897953033447, -6.864418029785156, -6.649937629699707, -6.435457229614258, -6.220977306365967, -6.006497383117676, -5.792016983032227, -5.577536582946777, -5.363056659698486, -5.148576736450195, -4.934096336364746, -4.719615936279297, -4.505136013031006, -4.290656089782715, -4.076175689697266, -3.8616955280303955, -3.6472153663635254, -3.4327352046966553, -3.2182552814483643, -3.003775119781494, -2.789294958114624, -2.574814796447754, -2.360334634780884, -2.1458544731140137, -1.9313743114471436, -1.7168941497802734, -1.5024139881134033, -1.2879338264465332, -1.073453664779663, -0.858973503112793, -0.6444933414459229, -0.43001317977905273, -0.21553301811218262, -0.0010528564453125, 0.21342730522155762, 0.42790746688842773, 0.6423876285552979, 0.856867790222168, 1.071347951889038, 1.2858281135559082, 1.5003082752227783, 1.7147884368896484, 1.9292685985565186]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 8.0, 4.0, 3.0, 9.0, 16.0, 13.0, 19.0, 21.0, 19.0, 21.0, 24.0, 29.0, 34.0, 39.0, 54.0, 48.0, 47.0, 42.0, 53.0, 53.0, 44.0, 47.0, 56.0, 43.0, 45.0, 37.0, 38.0, 26.0, 20.0, 12.0, 18.0, 10.0, 10.0, 6.0, 11.0, 6.0, 3.0, 2.0, 7.0, 0.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6948161125183105, -2.5970306396484375, -2.4992451667785645, -2.4014594554901123, -2.3036739826202393, -2.205888509750366, -2.108102798461914, -2.010317325592041, -1.912531852722168, -1.814746379852295, -1.7169607877731323, -1.6191751956939697, -1.5213897228240967, -1.4236042499542236, -1.325818657875061, -1.2280330657958984, -1.1302475929260254, -1.0324621200561523, -0.9346765279769897, -0.8368909955024719, -0.7391054630279541, -0.6413199305534363, -0.5435343980789185, -0.44574886560440063, -0.3479633331298828, -0.250177800655365, -0.15239226818084717, -0.054606735706329346, 0.04317879676818848, 0.1409643292427063, 0.23874986171722412, 0.33653539419174194, 0.43432092666625977, 0.5321064591407776, 0.6298919916152954, 0.7276775240898132, 0.825463056564331, 0.9232485890388489, 1.0210341215133667, 1.1188197135925293, 1.2166051864624023, 1.3143906593322754, 1.412176251411438, 1.5099618434906006, 1.6077473163604736, 1.7055327892303467, 1.8033183813095093, 1.9011039733886719, 1.998889446258545, 2.096674919128418, 2.194460391998291, 2.292246103286743, 2.390031576156616, 2.4878170490264893, 2.5856027603149414, 2.6833882331848145, 2.7811737060546875, 2.8789591789245605, 2.9767446517944336, 3.0745303630828857, 3.172315835952759, 3.270101308822632, 3.367887020111084, 3.465672492980957, 3.56345796585083]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 9.0, 10.0, 12.0, 9.0, 8.0, 12.0, 25.0, 31.0, 47.0, 57.0, 90.0, 104.0, 166.0, 299.0, 520.0, 1062.0, 2196.0, 6392.0, 31391.0, 762183.0, 3329656.0, 46896.0, 8400.0, 2612.0, 1083.0, 482.0, 228.0, 115.0, 63.0, 44.0, 29.0, 15.0, 8.0, 11.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-1.7333984375, -1.6940765380859375, -1.654754638671875, -1.6154327392578125, -1.57611083984375, -1.5367889404296875, -1.497467041015625, -1.4581451416015625, -1.4188232421875, -1.3795013427734375, -1.340179443359375, -1.3008575439453125, -1.26153564453125, -1.2222137451171875, -1.182891845703125, -1.1435699462890625, -1.104248046875, -1.0649261474609375, -1.025604248046875, -0.9862823486328125, -0.94696044921875, -0.9076385498046875, -0.868316650390625, -0.8289947509765625, -0.7896728515625, -0.7503509521484375, -0.711029052734375, -0.6717071533203125, -0.63238525390625, -0.5930633544921875, -0.553741455078125, -0.5144195556640625, -0.47509765625, -0.4357757568359375, -0.396453857421875, -0.3571319580078125, -0.31781005859375, -0.2784881591796875, -0.239166259765625, -0.1998443603515625, -0.1605224609375, -0.1212005615234375, -0.081878662109375, -0.0425567626953125, -0.00323486328125, 0.0360870361328125, 0.075408935546875, 0.1147308349609375, 0.154052734375, 0.1933746337890625, 0.232696533203125, 0.2720184326171875, 0.31134033203125, 0.3506622314453125, 0.389984130859375, 0.4293060302734375, 0.4686279296875, 0.5079498291015625, 0.547271728515625, 0.5865936279296875, 0.62591552734375, 0.6652374267578125, 0.704559326171875, 0.7438812255859375, 0.783203125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 13.0, 18.0, 29.0, 49.0, 57.0, 94.0, 96.0, 121.0, 112.0, 102.0, 81.0, 71.0, 54.0, 47.0, 21.0, 15.0, 11.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36376953125, -0.3553581237792969, -0.34694671630859375, -0.3385353088378906, -0.3301239013671875, -0.3217124938964844, -0.31330108642578125, -0.3048896789550781, -0.296478271484375, -0.2880668640136719, -0.27965545654296875, -0.2712440490722656, -0.2628326416015625, -0.2544212341308594, -0.24600982666015625, -0.23759841918945312, -0.22918701171875, -0.22077560424804688, -0.21236419677734375, -0.20395278930664062, -0.1955413818359375, -0.18712997436523438, -0.17871856689453125, -0.17030715942382812, -0.161895751953125, -0.15348434448242188, -0.14507293701171875, -0.13666152954101562, -0.1282501220703125, -0.11983871459960938, -0.11142730712890625, -0.10301589965820312, -0.0946044921875, -0.08619308471679688, -0.07778167724609375, -0.06937026977539062, -0.0609588623046875, -0.052547454833984375, -0.04413604736328125, -0.035724639892578125, -0.027313232421875, -0.018901824951171875, -0.01049041748046875, -0.002079010009765625, 0.0063323974609375, 0.014743804931640625, 0.02315521240234375, 0.031566619873046875, 0.03997802734375, 0.048389434814453125, 0.05680084228515625, 0.06521224975585938, 0.0736236572265625, 0.08203506469726562, 0.09044647216796875, 0.09885787963867188, 0.107269287109375, 0.11568069458007812, 0.12409210205078125, 0.13250350952148438, 0.1409149169921875, 0.14932632446289062, 0.15773773193359375, 0.16614913940429688, 0.174560546875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 17.0, 14.0, 29.0, 31.0, 38.0, 92.0, 176.0, 367.0, 888.0, 2922.0, 18616.0, 4103116.0, 62271.0, 4185.0, 951.0, 305.0, 118.0, 56.0, 36.0, 20.0, 8.0, 5.0, 8.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.986328125, -2.9110565185546875, -2.835784912109375, -2.7605133056640625, -2.68524169921875, -2.6099700927734375, -2.534698486328125, -2.4594268798828125, -2.3841552734375, -2.3088836669921875, -2.233612060546875, -2.1583404541015625, -2.08306884765625, -2.0077972412109375, -1.932525634765625, -1.8572540283203125, -1.781982421875, -1.7067108154296875, -1.631439208984375, -1.5561676025390625, -1.48089599609375, -1.4056243896484375, -1.330352783203125, -1.2550811767578125, -1.1798095703125, -1.1045379638671875, -1.029266357421875, -0.9539947509765625, -0.87872314453125, -0.8034515380859375, -0.728179931640625, -0.6529083251953125, -0.57763671875, -0.5023651123046875, -0.427093505859375, -0.3518218994140625, -0.27655029296875, -0.2012786865234375, -0.126007080078125, -0.0507354736328125, 0.0245361328125, 0.0998077392578125, 0.175079345703125, 0.2503509521484375, 0.32562255859375, 0.4008941650390625, 0.476165771484375, 0.5514373779296875, 0.626708984375, 0.7019805908203125, 0.777252197265625, 0.8525238037109375, 0.92779541015625, 1.0030670166015625, 1.078338623046875, 1.1536102294921875, 1.2288818359375, 1.3041534423828125, 1.379425048828125, 1.4546966552734375, 1.52996826171875, 1.6052398681640625, 1.680511474609375, 1.7557830810546875, 1.8310546875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 2.0, 6.0, 7.0, 25.0, 32.0, 93.0, 421.0, 3057.0, 317.0, 63.0, 26.0, 4.0, 5.0, 4.0, 1.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.4033203125, -1.37548828125, -1.34765625, -1.31982421875, -1.2919921875, -1.26416015625, -1.236328125, -1.20849609375, -1.1806640625, -1.15283203125, -1.125, -1.09716796875, -1.0693359375, -1.04150390625, -1.013671875, -0.98583984375, -0.9580078125, -0.93017578125, -0.90234375, -0.87451171875, -0.8466796875, -0.81884765625, -0.791015625, -0.76318359375, -0.7353515625, -0.70751953125, -0.6796875, -0.65185546875, -0.6240234375, -0.59619140625, -0.568359375, -0.54052734375, -0.5126953125, -0.48486328125, -0.45703125, -0.42919921875, -0.4013671875, -0.37353515625, -0.345703125, -0.31787109375, -0.2900390625, -0.26220703125, -0.234375, -0.20654296875, -0.1787109375, -0.15087890625, -0.123046875, -0.09521484375, -0.0673828125, -0.03955078125, -0.01171875, 0.01611328125, 0.0439453125, 0.07177734375, 0.099609375, 0.12744140625, 0.1552734375, 0.18310546875, 0.2109375, 0.23876953125, 0.2666015625, 0.29443359375, 0.322265625, 0.35009765625, 0.3779296875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 15.0, 40.0, 102.0, 289.0, 297.0, 159.0, 49.0, 18.0, 8.0, 3.0, 8.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7295894622802734, -3.623584032058716, -3.517578601837158, -3.4115729331970215, -3.305567502975464, -3.1995620727539062, -3.0935564041137695, -2.987550973892212, -2.8815455436706543, -2.7755401134490967, -2.669534683227539, -2.5635290145874023, -2.4575235843658447, -2.351518154144287, -2.2455124855041504, -2.1395070552825928, -2.033501625061035, -1.9274961948394775, -1.8214906454086304, -1.7154850959777832, -1.6094796657562256, -1.503474235534668, -1.3974686861038208, -1.2914631366729736, -1.185457706451416, -1.0794522762298584, -0.9734467267990112, -0.8674412369728088, -0.7614357471466064, -0.655430257320404, -0.5494247674942017, -0.44341927766799927, -0.3374135494232178, -0.23140805959701538, -0.125402569770813, -0.019397079944610596, 0.0866084098815918, 0.1926138997077942, 0.2986193895339966, 0.404624879360199, 0.5106303691864014, 0.6166358590126038, 0.7226413488388062, 0.8286468386650085, 0.9346523284912109, 1.0406577587127686, 1.1466633081436157, 1.252668857574463, 1.3586742877960205, 1.4646797180175781, 1.5706852674484253, 1.6766908168792725, 1.78269624710083, 1.8887016773223877, 1.9947072267532349, 2.100712776184082, 2.2067182064056396, 2.3127236366271973, 2.418729305267334, 2.5247347354888916, 2.630740165710449, 2.736745595932007, 2.8427510261535645, 2.948756694793701, 3.054762125015259]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 15.0, 20.0, 40.0, 72.0, 108.0, 139.0, 155.0, 168.0, 129.0, 79.0, 42.0, 22.0, 6.0, 9.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.620720863342285, -4.48499870300293, -4.349277019500732, -4.213555335998535, -4.07783317565918, -3.9421112537384033, -3.806389331817627, -3.6706674098968506, -3.534945487976074, -3.399223566055298, -3.2635016441345215, -3.127779722213745, -2.9920578002929688, -2.8563358783721924, -2.720613956451416, -2.5848920345306396, -2.4491701126098633, -2.313448190689087, -2.1777262687683105, -2.042004346847534, -1.9062824249267578, -1.7705605030059814, -1.634838581085205, -1.4991166591644287, -1.3633947372436523, -1.227672815322876, -1.0919508934020996, -0.9562289714813232, -0.8205070495605469, -0.6847851276397705, -0.5490632057189941, -0.4133412837982178, -0.2776193618774414, -0.14189743995666504, -0.006175518035888672, 0.1295464038848877, 0.26526832580566406, 0.40099024772644043, 0.5367121696472168, 0.6724340915679932, 0.8081560134887695, 0.9438779354095459, 1.0795998573303223, 1.2153217792510986, 1.351043701171875, 1.4867656230926514, 1.6224875450134277, 1.758209466934204, 1.8939313888549805, 2.029653310775757, 2.165375232696533, 2.3010971546173096, 2.436819076538086, 2.5725409984588623, 2.7082629203796387, 2.843984842300415, 2.9797067642211914, 3.1154286861419678, 3.251150608062744, 3.3868725299835205, 3.522594451904297, 3.6583163738250732, 3.7940382957458496, 3.929760217666626, 4.065482139587402]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 10.0, 10.0, 11.0, 21.0, 33.0, 29.0, 80.0, 106.0, 150.0, 216.0, 377.0, 699.0, 1444.0, 4138.0, 19291.0, 191988.0, 731609.0, 82082.0, 10860.0, 2765.0, 1125.0, 600.0, 301.0, 196.0, 127.0, 80.0, 59.0, 32.0, 24.0, 22.0, 18.0, 7.0, 6.0, 11.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.94384765625, -0.9171371459960938, -0.8904266357421875, -0.8637161254882812, -0.837005615234375, -0.8102951049804688, -0.7835845947265625, -0.7568740844726562, -0.73016357421875, -0.7034530639648438, -0.6767425537109375, -0.6500320434570312, -0.623321533203125, -0.5966110229492188, -0.5699005126953125, -0.5431900024414062, -0.5164794921875, -0.48976898193359375, -0.4630584716796875, -0.43634796142578125, -0.409637451171875, -0.38292694091796875, -0.3562164306640625, -0.32950592041015625, -0.30279541015625, -0.27608489990234375, -0.2493743896484375, -0.22266387939453125, -0.195953369140625, -0.16924285888671875, -0.1425323486328125, -0.11582183837890625, -0.089111328125, -0.06240081787109375, -0.0356903076171875, -0.00897979736328125, 0.017730712890625, 0.04444122314453125, 0.0711517333984375, 0.09786224365234375, 0.12457275390625, 0.15128326416015625, 0.1779937744140625, 0.20470428466796875, 0.231414794921875, 0.25812530517578125, 0.2848358154296875, 0.31154632568359375, 0.3382568359375, 0.36496734619140625, 0.3916778564453125, 0.41838836669921875, 0.445098876953125, 0.47180938720703125, 0.4985198974609375, 0.5252304077148438, 0.55194091796875, 0.5786514282226562, 0.6053619384765625, 0.6320724487304688, 0.658782958984375, 0.6854934692382812, 0.7122039794921875, 0.7389144897460938, 0.765625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 14.0, 34.0, 64.0, 100.0, 118.0, 124.0, 135.0, 122.0, 108.0, 81.0, 42.0, 27.0, 11.0, 11.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4404296875, -0.4297676086425781, -0.41910552978515625, -0.4084434509277344, -0.3977813720703125, -0.3871192932128906, -0.37645721435546875, -0.3657951354980469, -0.355133056640625, -0.3444709777832031, -0.33380889892578125, -0.3231468200683594, -0.3124847412109375, -0.3018226623535156, -0.29116058349609375, -0.2804985046386719, -0.26983642578125, -0.2591743469238281, -0.24851226806640625, -0.23785018920898438, -0.2271881103515625, -0.21652603149414062, -0.20586395263671875, -0.19520187377929688, -0.184539794921875, -0.17387771606445312, -0.16321563720703125, -0.15255355834960938, -0.1418914794921875, -0.13122940063476562, -0.12056732177734375, -0.10990524291992188, -0.0992431640625, -0.08858108520507812, -0.07791900634765625, -0.06725692749023438, -0.0565948486328125, -0.045932769775390625, -0.03527069091796875, -0.024608612060546875, -0.013946533203125, -0.003284454345703125, 0.00737762451171875, 0.018039703369140625, 0.0287017822265625, 0.039363861083984375, 0.05002593994140625, 0.060688018798828125, 0.07135009765625, 0.08201217651367188, 0.09267425537109375, 0.10333633422851562, 0.1139984130859375, 0.12466049194335938, 0.13532257080078125, 0.14598464965820312, 0.156646728515625, 0.16730880737304688, 0.17797088623046875, 0.18863296508789062, 0.1992950439453125, 0.20995712280273438, 0.22061920166015625, 0.23128128051757812, 0.241943359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 8.0, 7.0, 9.0, 10.0, 19.0, 23.0, 31.0, 39.0, 50.0, 102.0, 126.0, 244.0, 338.0, 651.0, 1249.0, 2422.0, 5140.0, 11745.0, 29731.0, 85057.0, 274067.0, 407830.0, 148878.0, 48188.0, 18120.0, 7442.0, 3299.0, 1628.0, 821.0, 494.0, 274.0, 158.0, 90.0, 68.0, 49.0, 41.0, 24.0, 21.0, 13.0, 11.0, 7.0, 7.0, 3.0, 6.0, 7.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.278076171875, -0.2694511413574219, -0.26082611083984375, -0.2522010803222656, -0.2435760498046875, -0.23495101928710938, -0.22632598876953125, -0.21770095825195312, -0.209075927734375, -0.20045089721679688, -0.19182586669921875, -0.18320083618164062, -0.1745758056640625, -0.16595077514648438, -0.15732574462890625, -0.14870071411132812, -0.14007568359375, -0.13145065307617188, -0.12282562255859375, -0.11420059204101562, -0.1055755615234375, -0.09695053100585938, -0.08832550048828125, -0.07970046997070312, -0.071075439453125, -0.062450408935546875, -0.05382537841796875, -0.045200347900390625, -0.0365753173828125, -0.027950286865234375, -0.01932525634765625, -0.010700225830078125, -0.0020751953125, 0.006549835205078125, 0.01517486572265625, 0.023799896240234375, 0.0324249267578125, 0.041049957275390625, 0.04967498779296875, 0.058300018310546875, 0.066925048828125, 0.07555007934570312, 0.08417510986328125, 0.09280014038085938, 0.1014251708984375, 0.11005020141601562, 0.11867523193359375, 0.12730026245117188, 0.13592529296875, 0.14455032348632812, 0.15317535400390625, 0.16180038452148438, 0.1704254150390625, 0.17905044555664062, 0.18767547607421875, 0.19630050659179688, 0.204925537109375, 0.21355056762695312, 0.22217559814453125, 0.23080062866210938, 0.2394256591796875, 0.24805068969726562, 0.25667572021484375, 0.2653007507324219, 0.27392578125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 0.0, 6.0, 14.0, 9.0, 11.0, 16.0, 13.0, 18.0, 23.0, 15.0, 26.0, 30.0, 32.0, 48.0, 27.0, 37.0, 53.0, 43.0, 53.0, 50.0, 47.0, 31.0, 34.0, 34.0, 51.0, 32.0, 33.0, 35.0, 24.0, 23.0, 27.0, 21.0, 15.0, 11.0, 8.0, 5.0, 10.0, 8.0, 4.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 6.0, 0.0, 0.0, 3.0], "bins": [-0.483154296875, -0.4691314697265625, -0.455108642578125, -0.4410858154296875, -0.42706298828125, -0.4130401611328125, -0.399017333984375, -0.3849945068359375, -0.3709716796875, -0.3569488525390625, -0.342926025390625, -0.3289031982421875, -0.31488037109375, -0.3008575439453125, -0.286834716796875, -0.2728118896484375, -0.2587890625, -0.2447662353515625, -0.230743408203125, -0.2167205810546875, -0.20269775390625, -0.1886749267578125, -0.174652099609375, -0.1606292724609375, -0.1466064453125, -0.1325836181640625, -0.118560791015625, -0.1045379638671875, -0.09051513671875, -0.0764923095703125, -0.062469482421875, -0.0484466552734375, -0.034423828125, -0.0204010009765625, -0.006378173828125, 0.0076446533203125, 0.02166748046875, 0.0356903076171875, 0.049713134765625, 0.0637359619140625, 0.0777587890625, 0.0917816162109375, 0.105804443359375, 0.1198272705078125, 0.13385009765625, 0.1478729248046875, 0.161895751953125, 0.1759185791015625, 0.18994140625, 0.2039642333984375, 0.217987060546875, 0.2320098876953125, 0.24603271484375, 0.2600555419921875, 0.274078369140625, 0.2881011962890625, 0.3021240234375, 0.3161468505859375, 0.330169677734375, 0.3441925048828125, 0.35821533203125, 0.3722381591796875, 0.386260986328125, 0.4002838134765625, 0.414306640625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 5.0, 10.0, 21.0, 20.0, 28.0, 38.0, 56.0, 112.0, 161.0, 298.0, 625.0, 1429.0, 4028.0, 15148.0, 79477.0, 474381.0, 393613.0, 61034.0, 12310.0, 3314.0, 1244.0, 543.0, 250.0, 150.0, 92.0, 64.0, 26.0, 20.0, 14.0, 9.0, 5.0, 3.0, 9.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1937255859375, -0.18833351135253906, -0.18294143676757812, -0.1775493621826172, -0.17215728759765625, -0.1667652130126953, -0.16137313842773438, -0.15598106384277344, -0.1505889892578125, -0.14519691467285156, -0.13980484008789062, -0.1344127655029297, -0.12902069091796875, -0.12362861633300781, -0.11823654174804688, -0.11284446716308594, -0.107452392578125, -0.10206031799316406, -0.09666824340820312, -0.09127616882324219, -0.08588409423828125, -0.08049201965332031, -0.07509994506835938, -0.06970787048339844, -0.0643157958984375, -0.05892372131347656, -0.053531646728515625, -0.04813957214355469, -0.04274749755859375, -0.03735542297363281, -0.031963348388671875, -0.026571273803710938, -0.02117919921875, -0.015787124633789062, -0.010395050048828125, -0.0050029754638671875, 0.00038909912109375, 0.0057811737060546875, 0.011173248291015625, 0.016565322875976562, 0.0219573974609375, 0.027349472045898438, 0.032741546630859375, 0.03813362121582031, 0.04352569580078125, 0.04891777038574219, 0.054309844970703125, 0.05970191955566406, 0.065093994140625, 0.07048606872558594, 0.07587814331054688, 0.08127021789550781, 0.08666229248046875, 0.09205436706542969, 0.09744644165039062, 0.10283851623535156, 0.1082305908203125, 0.11362266540527344, 0.11901473999023438, 0.12440681457519531, 0.12979888916015625, 0.1351909637451172, 0.14058303833007812, 0.14597511291503906, 0.1513671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 6.0, 5.0, 12.0, 7.0, 12.0, 13.0, 30.0, 22.0, 50.0, 44.0, 69.0, 71.0, 104.0, 116.0, 103.0, 78.0, 69.0, 49.0, 38.0, 22.0, 17.0, 21.0, 7.0, 9.0, 7.0, 6.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001614093780517578, -0.0001561492681503296, -0.00015088915824890137, -0.00014562904834747314, -0.00014036893844604492, -0.0001351088285446167, -0.00012984871864318848, -0.00012458860874176025, -0.00011932849884033203, -0.00011406838893890381, -0.00010880827903747559, -0.00010354816913604736, -9.828805923461914e-05, -9.302794933319092e-05, -8.77678394317627e-05, -8.250772953033447e-05, -7.724761962890625e-05, -7.198750972747803e-05, -6.67273998260498e-05, -6.146728992462158e-05, -5.620718002319336e-05, -5.094707012176514e-05, -4.5686960220336914e-05, -4.042685031890869e-05, -3.516674041748047e-05, -2.9906630516052246e-05, -2.4646520614624023e-05, -1.93864107131958e-05, -1.4126300811767578e-05, -8.866190910339355e-06, -3.606081008911133e-06, 1.6540288925170898e-06, 6.9141387939453125e-06, 1.2174248695373535e-05, 1.7434358596801758e-05, 2.269446849822998e-05, 2.7954578399658203e-05, 3.3214688301086426e-05, 3.847479820251465e-05, 4.373490810394287e-05, 4.8995018005371094e-05, 5.4255127906799316e-05, 5.951523780822754e-05, 6.477534770965576e-05, 7.003545761108398e-05, 7.529556751251221e-05, 8.055567741394043e-05, 8.581578731536865e-05, 9.107589721679688e-05, 9.63360071182251e-05, 0.00010159611701965332, 0.00010685622692108154, 0.00011211633682250977, 0.00011737644672393799, 0.0001226365566253662, 0.00012789666652679443, 0.00013315677642822266, 0.00013841688632965088, 0.0001436769962310791, 0.00014893710613250732, 0.00015419721603393555, 0.00015945732593536377, 0.000164717435836792, 0.00016997754573822021, 0.00017523765563964844]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0, 10.0, 11.0, 9.0, 21.0, 26.0, 41.0, 44.0, 56.0, 104.0, 163.0, 246.0, 377.0, 789.0, 1296.0, 2456.0, 5540.0, 14503.0, 47602.0, 205329.0, 494967.0, 202286.0, 47179.0, 14448.0, 5588.0, 2415.0, 1229.0, 654.0, 406.0, 257.0, 142.0, 109.0, 82.0, 48.0, 34.0, 27.0, 14.0, 10.0, 8.0, 6.0, 11.0, 5.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1253662109375, -0.12138557434082031, -0.11740493774414062, -0.11342430114746094, -0.10944366455078125, -0.10546302795410156, -0.10148239135742188, -0.09750175476074219, -0.0935211181640625, -0.08954048156738281, -0.08555984497070312, -0.08157920837402344, -0.07759857177734375, -0.07361793518066406, -0.06963729858398438, -0.06565666198730469, -0.061676025390625, -0.05769538879394531, -0.053714752197265625, -0.04973411560058594, -0.04575347900390625, -0.04177284240722656, -0.037792205810546875, -0.03381156921386719, -0.0298309326171875, -0.025850296020507812, -0.021869659423828125, -0.017889022827148438, -0.01390838623046875, -0.009927749633789062, -0.005947113037109375, -0.0019664764404296875, 0.00201416015625, 0.0059947967529296875, 0.009975433349609375, 0.013956069946289062, 0.01793670654296875, 0.021917343139648438, 0.025897979736328125, 0.029878616333007812, 0.0338592529296875, 0.03783988952636719, 0.041820526123046875, 0.04580116271972656, 0.04978179931640625, 0.05376243591308594, 0.057743072509765625, 0.06172370910644531, 0.065704345703125, 0.06968498229980469, 0.07366561889648438, 0.07764625549316406, 0.08162689208984375, 0.08560752868652344, 0.08958816528320312, 0.09356880187988281, 0.0975494384765625, 0.10153007507324219, 0.10551071166992188, 0.10949134826660156, 0.11347198486328125, 0.11745262145996094, 0.12143325805664062, 0.1254138946533203, 0.12939453125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 4.0, 6.0, 8.0, 10.0, 15.0, 11.0, 18.0, 41.0, 44.0, 66.0, 70.0, 90.0, 113.0, 140.0, 80.0, 80.0, 47.0, 37.0, 35.0, 26.0, 16.0, 14.0, 12.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.123291015625, -0.11836624145507812, -0.11344146728515625, -0.10851669311523438, -0.1035919189453125, -0.09866714477539062, -0.09374237060546875, -0.08881759643554688, -0.083892822265625, -0.07896804809570312, -0.07404327392578125, -0.06911849975585938, -0.0641937255859375, -0.059268951416015625, -0.05434417724609375, -0.049419403076171875, -0.04449462890625, -0.039569854736328125, -0.03464508056640625, -0.029720306396484375, -0.0247955322265625, -0.019870758056640625, -0.01494598388671875, -0.010021209716796875, -0.005096435546875, -0.000171661376953125, 0.00475311279296875, 0.009677886962890625, 0.0146026611328125, 0.019527435302734375, 0.02445220947265625, 0.029376983642578125, 0.0343017578125, 0.039226531982421875, 0.04415130615234375, 0.049076080322265625, 0.0540008544921875, 0.058925628662109375, 0.06385040283203125, 0.06877517700195312, 0.073699951171875, 0.07862472534179688, 0.08354949951171875, 0.08847427368164062, 0.0933990478515625, 0.09832382202148438, 0.10324859619140625, 0.10817337036132812, 0.11309814453125, 0.11802291870117188, 0.12294769287109375, 0.12787246704101562, 0.1327972412109375, 0.13772201538085938, 0.14264678955078125, 0.14757156372070312, 0.152496337890625, 0.15742111206054688, 0.16234588623046875, 0.16727066040039062, 0.1721954345703125, 0.17712020874023438, 0.18204498291015625, 0.18696975708007812, 0.19189453125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 31.0, 101.0, 358.0, 320.0, 117.0, 40.0, 17.0, 11.0, 2.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8362627029418945, -4.6495041847229, -4.462745666503906, -4.275987148284912, -4.089228630065918, -3.902470111846924, -3.7157113552093506, -3.5289528369903564, -3.3421943187713623, -3.155435800552368, -2.968677282333374, -2.781918525695801, -2.5951600074768066, -2.4084014892578125, -2.2216429710388184, -2.034884452819824, -1.84812593460083, -1.661367416381836, -1.4746088981628418, -1.287850260734558, -1.101091742515564, -0.9143332242965698, -0.7275745868682861, -0.540816068649292, -0.35405755043029785, -0.16729900240898132, 0.019459545612335205, 0.20621812343597412, 0.39297664165496826, 0.5797351598739624, 0.7664937973022461, 0.9532523155212402, 1.1400108337402344, 1.3267693519592285, 1.5135278701782227, 1.7002865076065063, 1.8870450258255005, 2.073803424835205, 2.2605621814727783, 2.4473206996917725, 2.6340792179107666, 2.8208377361297607, 3.007596254348755, 3.194355010986328, 3.3811135292053223, 3.5678720474243164, 3.7546305656433105, 3.9413890838623047, 4.128147602081299, 4.314906120300293, 4.501664638519287, 4.688423156738281, 4.875181674957275, 5.0619401931762695, 5.248699188232422, 5.435457229614258, 5.62221622467041, 5.808974742889404, 5.995733261108398, 6.182491779327393, 6.369250297546387, 6.556008815765381, 6.742767333984375, 6.929526329040527, 7.116284370422363]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 5.0, 10.0, 7.0, 12.0, 14.0, 25.0, 24.0, 29.0, 37.0, 35.0, 40.0, 51.0, 54.0, 63.0, 50.0, 68.0, 62.0, 59.0, 49.0, 44.0, 56.0, 38.0, 37.0, 24.0, 30.0, 27.0, 11.0, 12.0, 7.0, 7.0, 5.0, 2.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.413717269897461, -3.3074533939361572, -3.2011895179748535, -3.09492564201355, -2.988661766052246, -2.8823978900909424, -2.7761340141296387, -2.669869899749756, -2.5636062622070312, -2.4573423862457275, -2.351078510284424, -2.24481463432312, -2.1385507583618164, -2.0322868824005127, -1.9260228872299194, -1.8197590112686157, -1.7134950160980225, -1.6072311401367188, -1.500967264175415, -1.3947033882141113, -1.2884395122528076, -1.182175636291504, -1.0759116411209106, -0.9696477651596069, -0.8633838891983032, -0.7571200132369995, -0.6508561372756958, -0.5445922017097473, -0.4383283257484436, -0.3320644497871399, -0.2258005142211914, -0.1195366382598877, -0.013273000717163086, 0.09299089014530182, 0.19925478100776672, 0.3055186867713928, 0.41178256273269653, 0.5180464386940002, 0.6243103742599487, 0.7305742502212524, 0.8368381261825562, 0.9431020021438599, 1.0493658781051636, 1.1556298732757568, 1.2618937492370605, 1.3681576251983643, 1.474421501159668, 1.5806853771209717, 1.6869492530822754, 1.793213129043579, 1.8994770050048828, 2.0057408809661865, 2.1120047569274902, 2.218268632888794, 2.3245325088500977, 2.4307966232299805, 2.537060260772705, 2.643324136734009, 2.7495880126953125, 2.855851888656616, 2.96211576461792, 3.0683796405792236, 3.1746435165405273, 3.28090763092041, 3.387171506881714]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 11.0, 10.0, 16.0, 14.0, 26.0, 45.0, 81.0, 144.0, 248.0, 605.0, 1633.0, 9947.0, 3670741.0, 501257.0, 7440.0, 1253.0, 427.0, 184.0, 103.0, 46.0, 19.0, 14.0, 12.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.03125, -1.9803924560546875, -1.929534912109375, -1.8786773681640625, -1.82781982421875, -1.7769622802734375, -1.726104736328125, -1.6752471923828125, -1.6243896484375, -1.5735321044921875, -1.522674560546875, -1.4718170166015625, -1.42095947265625, -1.3701019287109375, -1.319244384765625, -1.2683868408203125, -1.217529296875, -1.1666717529296875, -1.115814208984375, -1.0649566650390625, -1.01409912109375, -0.9632415771484375, -0.912384033203125, -0.8615264892578125, -0.8106689453125, -0.7598114013671875, -0.708953857421875, -0.6580963134765625, -0.60723876953125, -0.5563812255859375, -0.505523681640625, -0.4546661376953125, -0.40380859375, -0.3529510498046875, -0.302093505859375, -0.2512359619140625, -0.20037841796875, -0.1495208740234375, -0.098663330078125, -0.0478057861328125, 0.0030517578125, 0.0539093017578125, 0.104766845703125, 0.1556243896484375, 0.20648193359375, 0.2573394775390625, 0.308197021484375, 0.3590545654296875, 0.409912109375, 0.4607696533203125, 0.511627197265625, 0.5624847412109375, 0.61334228515625, 0.6641998291015625, 0.715057373046875, 0.7659149169921875, 0.8167724609375, 0.8676300048828125, 0.918487548828125, 0.9693450927734375, 1.02020263671875, 1.0710601806640625, 1.121917724609375, 1.1727752685546875, 1.2236328125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 0.0, 4.0, 13.0, 31.0, 47.0, 80.0, 75.0, 116.0, 136.0, 138.0, 107.0, 85.0, 73.0, 53.0, 23.0, 10.0, 6.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.452392578125, -0.4413566589355469, -0.43032073974609375, -0.4192848205566406, -0.4082489013671875, -0.3972129821777344, -0.38617706298828125, -0.3751411437988281, -0.364105224609375, -0.3530693054199219, -0.34203338623046875, -0.3309974670410156, -0.3199615478515625, -0.3089256286621094, -0.29788970947265625, -0.2868537902832031, -0.27581787109375, -0.2647819519042969, -0.25374603271484375, -0.24271011352539062, -0.2316741943359375, -0.22063827514648438, -0.20960235595703125, -0.19856643676757812, -0.187530517578125, -0.17649459838867188, -0.16545867919921875, -0.15442276000976562, -0.1433868408203125, -0.13235092163085938, -0.12131500244140625, -0.11027908325195312, -0.0992431640625, -0.08820724487304688, -0.07717132568359375, -0.06613540649414062, -0.0550994873046875, -0.044063568115234375, -0.03302764892578125, -0.021991729736328125, -0.010955810546875, 8.0108642578125e-05, 0.01111602783203125, 0.022151947021484375, 0.0331878662109375, 0.044223785400390625, 0.05525970458984375, 0.06629562377929688, 0.07733154296875, 0.08836746215820312, 0.09940338134765625, 0.11043930053710938, 0.1214752197265625, 0.13251113891601562, 0.14354705810546875, 0.15458297729492188, 0.165618896484375, 0.17665481567382812, 0.18769073486328125, 0.19872665405273438, 0.2097625732421875, 0.22079849243164062, 0.23183441162109375, 0.24287033081054688, 0.25390625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 4.0, 9.0, 14.0, 16.0, 32.0, 46.0, 68.0, 129.0, 208.0, 389.0, 841.0, 1830.0, 4684.0, 14722.0, 75574.0, 3310519.0, 717788.0, 48770.0, 11340.0, 3948.0, 1573.0, 769.0, 402.0, 231.0, 139.0, 77.0, 57.0, 35.0, 26.0, 13.0, 12.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3994140625, -0.38558197021484375, -0.3717498779296875, -0.35791778564453125, -0.344085693359375, -0.33025360107421875, -0.3164215087890625, -0.30258941650390625, -0.28875732421875, -0.27492523193359375, -0.2610931396484375, -0.24726104736328125, -0.233428955078125, -0.21959686279296875, -0.2057647705078125, -0.19193267822265625, -0.1781005859375, -0.16426849365234375, -0.1504364013671875, -0.13660430908203125, -0.122772216796875, -0.10894012451171875, -0.0951080322265625, -0.08127593994140625, -0.06744384765625, -0.05361175537109375, -0.0397796630859375, -0.02594757080078125, -0.012115478515625, 0.00171661376953125, 0.0155487060546875, 0.02938079833984375, 0.043212890625, 0.05704498291015625, 0.0708770751953125, 0.08470916748046875, 0.098541259765625, 0.11237335205078125, 0.1262054443359375, 0.14003753662109375, 0.15386962890625, 0.16770172119140625, 0.1815338134765625, 0.19536590576171875, 0.209197998046875, 0.22303009033203125, 0.2368621826171875, 0.25069427490234375, 0.2645263671875, 0.27835845947265625, 0.2921905517578125, 0.30602264404296875, 0.319854736328125, 0.33368682861328125, 0.3475189208984375, 0.36135101318359375, 0.37518310546875, 0.38901519775390625, 0.4028472900390625, 0.41667938232421875, 0.430511474609375, 0.44434356689453125, 0.4581756591796875, 0.47200775146484375, 0.48583984375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 6.0, 5.0, 8.0, 24.0, 34.0, 64.0, 102.0, 324.0, 2099.0, 906.0, 220.0, 108.0, 52.0, 39.0, 25.0, 10.0, 15.0, 6.0, 11.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.152099609375, -0.1454315185546875, -0.138763427734375, -0.1320953369140625, -0.12542724609375, -0.1187591552734375, -0.112091064453125, -0.1054229736328125, -0.0987548828125, -0.0920867919921875, -0.085418701171875, -0.0787506103515625, -0.07208251953125, -0.0654144287109375, -0.058746337890625, -0.0520782470703125, -0.04541015625, -0.0387420654296875, -0.032073974609375, -0.0254058837890625, -0.01873779296875, -0.0120697021484375, -0.005401611328125, 0.0012664794921875, 0.0079345703125, 0.0146026611328125, 0.021270751953125, 0.0279388427734375, 0.03460693359375, 0.0412750244140625, 0.047943115234375, 0.0546112060546875, 0.061279296875, 0.0679473876953125, 0.074615478515625, 0.0812835693359375, 0.08795166015625, 0.0946197509765625, 0.101287841796875, 0.1079559326171875, 0.1146240234375, 0.1212921142578125, 0.127960205078125, 0.1346282958984375, 0.14129638671875, 0.1479644775390625, 0.154632568359375, 0.1613006591796875, 0.16796875, 0.1746368408203125, 0.181304931640625, 0.1879730224609375, 0.19464111328125, 0.2013092041015625, 0.207977294921875, 0.2146453857421875, 0.2213134765625, 0.2279815673828125, 0.234649658203125, 0.2413177490234375, 0.24798583984375, 0.2546539306640625, 0.261322021484375, 0.2679901123046875, 0.274658203125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 10.0, 15.0, 33.0, 169.0, 364.0, 248.0, 112.0, 36.0, 11.0, 8.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5575941801071167, -0.4986702799797058, -0.4397464096546173, -0.3808225393295288, -0.3218986392021179, -0.26297473907470703, -0.20405086874961853, -0.14512699842453003, -0.08620309829711914, -0.027279213070869446, 0.03164467215538025, 0.09056855738162994, 0.14949244260787964, 0.20841634273529053, 0.26734021306037903, 0.32626408338546753, 0.3851879835128784, 0.4441118836402893, 0.5030357837677002, 0.5619596242904663, 0.6208835244178772, 0.6798074245452881, 0.7387312650680542, 0.7976551651954651, 0.856579065322876, 0.9155029654502869, 0.9744268655776978, 1.0333507061004639, 1.0922746658325195, 1.1511985063552856, 1.2101223468780518, 1.2690463066101074, 1.327970266342163, 1.3868941068649292, 1.4458180665969849, 1.504741907119751, 1.5636658668518066, 1.6225897073745728, 1.6815135478973389, 1.7404375076293945, 1.7993613481521606, 1.8582851886749268, 1.9172091484069824, 1.9761329889297485, 2.0350568294525146, 2.0939807891845703, 2.152904748916626, 2.2118284702301025, 2.270752429962158, 2.329676389694214, 2.3886001110076904, 2.447524070739746, 2.5064480304718018, 2.5653719902038574, 2.624295711517334, 2.6832196712493896, 2.7421436309814453, 2.801067590713501, 2.8599913120269775, 2.918915271759033, 2.977839231491089, 3.0367631912231445, 3.095686912536621, 3.1546108722686768, 3.2135345935821533]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 2.0, 6.0, 6.0, 10.0, 12.0, 22.0, 22.0, 20.0, 33.0, 33.0, 48.0, 43.0, 44.0, 45.0, 54.0, 40.0, 54.0, 45.0, 65.0, 66.0, 50.0, 40.0, 35.0, 32.0, 37.0, 33.0, 21.0, 19.0, 18.0, 16.0, 9.0, 3.0, 9.0, 3.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4308505058288574, -0.41090407967567444, -0.39095762372016907, -0.3710111975669861, -0.3510647714138031, -0.3311183452606201, -0.31117188930511475, -0.29122546315193176, -0.2712790369987488, -0.2513326108455658, -0.23138616979122162, -0.21143972873687744, -0.19149330258369446, -0.17154686152935028, -0.1516004204750061, -0.13165399432182312, -0.11170753836631775, -0.09176110476255417, -0.07181467115879059, -0.05186823010444641, -0.03192179650068283, -0.01197536289691925, 0.007971078157424927, 0.02791750431060791, 0.04786394536495209, 0.06781037896871567, 0.08775681257247925, 0.10770325362682343, 0.1276496946811676, 0.14759612083435059, 0.16754256188869476, 0.18748898804187775, 0.20743542909622192, 0.2273818701505661, 0.24732829630374908, 0.26727473735809326, 0.28722116351127625, 0.30716758966445923, 0.3271140456199646, 0.3470604717731476, 0.36700689792633057, 0.38695332407951355, 0.4068997800350189, 0.4268462061882019, 0.4467926323413849, 0.46673905849456787, 0.48668551445007324, 0.5066319704055786, 0.526578426361084, 0.5465248823165894, 0.56647127866745, 0.5864177346229553, 0.6063641905784607, 0.6263105869293213, 0.6462570428848267, 0.666203498840332, 0.6861498951911926, 0.706096351146698, 0.7260427474975586, 0.745989203453064, 0.7659356594085693, 0.7858820557594299, 0.8058285117149353, 0.8257749080657959, 0.8457213640213013]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 7.0, 13.0, 14.0, 17.0, 25.0, 50.0, 50.0, 85.0, 127.0, 208.0, 338.0, 632.0, 1293.0, 3692.0, 16874.0, 131496.0, 713623.0, 153844.0, 19066.0, 4106.0, 1410.0, 665.0, 327.0, 197.0, 137.0, 74.0, 47.0, 37.0, 24.0, 22.0, 15.0, 8.0, 6.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75732421875, -0.733306884765625, -0.70928955078125, -0.685272216796875, -0.6612548828125, -0.637237548828125, -0.61322021484375, -0.589202880859375, -0.565185546875, -0.541168212890625, -0.51715087890625, -0.493133544921875, -0.4691162109375, -0.445098876953125, -0.42108154296875, -0.397064208984375, -0.373046875, -0.349029541015625, -0.32501220703125, -0.300994873046875, -0.2769775390625, -0.252960205078125, -0.22894287109375, -0.204925537109375, -0.180908203125, -0.156890869140625, -0.13287353515625, -0.108856201171875, -0.0848388671875, -0.060821533203125, -0.03680419921875, -0.012786865234375, 0.01123046875, 0.035247802734375, 0.05926513671875, 0.083282470703125, 0.1072998046875, 0.131317138671875, 0.15533447265625, 0.179351806640625, 0.203369140625, 0.227386474609375, 0.25140380859375, 0.275421142578125, 0.2994384765625, 0.323455810546875, 0.34747314453125, 0.371490478515625, 0.3955078125, 0.419525146484375, 0.44354248046875, 0.467559814453125, 0.4915771484375, 0.515594482421875, 0.53961181640625, 0.563629150390625, 0.587646484375, 0.611663818359375, 0.63568115234375, 0.659698486328125, 0.6837158203125, 0.707733154296875, 0.73175048828125, 0.755767822265625, 0.77978515625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 0.0, 2.0, 4.0, 23.0, 30.0, 49.0, 75.0, 88.0, 130.0, 126.0, 134.0, 102.0, 85.0, 66.0, 47.0, 21.0, 9.0, 3.0, 9.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.420654296875, -0.4100799560546875, -0.399505615234375, -0.3889312744140625, -0.37835693359375, -0.3677825927734375, -0.357208251953125, -0.3466339111328125, -0.3360595703125, -0.3254852294921875, -0.314910888671875, -0.3043365478515625, -0.29376220703125, -0.2831878662109375, -0.272613525390625, -0.2620391845703125, -0.25146484375, -0.2408905029296875, -0.230316162109375, -0.2197418212890625, -0.20916748046875, -0.1985931396484375, -0.188018798828125, -0.1774444580078125, -0.1668701171875, -0.1562957763671875, -0.145721435546875, -0.1351470947265625, -0.12457275390625, -0.1139984130859375, -0.103424072265625, -0.0928497314453125, -0.082275390625, -0.0717010498046875, -0.061126708984375, -0.0505523681640625, -0.03997802734375, -0.0294036865234375, -0.018829345703125, -0.0082550048828125, 0.0023193359375, 0.0128936767578125, 0.023468017578125, 0.0340423583984375, 0.04461669921875, 0.0551910400390625, 0.065765380859375, 0.0763397216796875, 0.0869140625, 0.0974884033203125, 0.108062744140625, 0.1186370849609375, 0.12921142578125, 0.1397857666015625, 0.150360107421875, 0.1609344482421875, 0.1715087890625, 0.1820831298828125, 0.192657470703125, 0.2032318115234375, 0.21380615234375, 0.2243804931640625, 0.234954833984375, 0.2455291748046875, 0.256103515625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 11.0, 10.0, 17.0, 24.0, 29.0, 39.0, 57.0, 81.0, 132.0, 182.0, 303.0, 454.0, 661.0, 1180.0, 2073.0, 3965.0, 8000.0, 17180.0, 39089.0, 99579.0, 277468.0, 358159.0, 142243.0, 53462.0, 22550.0, 10247.0, 5019.0, 2620.0, 1466.0, 788.0, 511.0, 290.0, 188.0, 152.0, 111.0, 60.0, 46.0, 26.0, 25.0, 22.0, 8.0, 11.0, 6.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0], "bins": [-0.2724609375, -0.2642478942871094, -0.25603485107421875, -0.24782180786132812, -0.2396087646484375, -0.23139572143554688, -0.22318267822265625, -0.21496963500976562, -0.206756591796875, -0.19854354858398438, -0.19033050537109375, -0.18211746215820312, -0.1739044189453125, -0.16569137573242188, -0.15747833251953125, -0.14926528930664062, -0.14105224609375, -0.13283920288085938, -0.12462615966796875, -0.11641311645507812, -0.1082000732421875, -0.09998703002929688, -0.09177398681640625, -0.08356094360351562, -0.075347900390625, -0.06713485717773438, -0.05892181396484375, -0.050708770751953125, -0.0424957275390625, -0.034282684326171875, -0.02606964111328125, -0.017856597900390625, -0.0096435546875, -0.001430511474609375, 0.00678253173828125, 0.014995574951171875, 0.0232086181640625, 0.031421661376953125, 0.03963470458984375, 0.047847747802734375, 0.056060791015625, 0.06427383422851562, 0.07248687744140625, 0.08069992065429688, 0.0889129638671875, 0.09712600708007812, 0.10533905029296875, 0.11355209350585938, 0.12176513671875, 0.12997817993164062, 0.13819122314453125, 0.14640426635742188, 0.1546173095703125, 0.16283035278320312, 0.17104339599609375, 0.17925643920898438, 0.187469482421875, 0.19568252563476562, 0.20389556884765625, 0.21210861206054688, 0.2203216552734375, 0.22853469848632812, 0.23674774169921875, 0.24496078491210938, 0.253173828125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 8.0, 3.0, 9.0, 11.0, 10.0, 18.0, 8.0, 13.0, 19.0, 14.0, 23.0, 35.0, 33.0, 46.0, 35.0, 41.0, 52.0, 49.0, 47.0, 39.0, 45.0, 41.0, 42.0, 39.0, 30.0, 30.0, 36.0, 34.0, 25.0, 24.0, 28.0, 25.0, 17.0, 19.0, 9.0, 13.0, 6.0, 5.0, 6.0, 5.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.521484375, -0.5048751831054688, -0.4882659912109375, -0.47165679931640625, -0.455047607421875, -0.43843841552734375, -0.4218292236328125, -0.40522003173828125, -0.38861083984375, -0.37200164794921875, -0.3553924560546875, -0.33878326416015625, -0.322174072265625, -0.30556488037109375, -0.2889556884765625, -0.27234649658203125, -0.2557373046875, -0.23912811279296875, -0.2225189208984375, -0.20590972900390625, -0.189300537109375, -0.17269134521484375, -0.1560821533203125, -0.13947296142578125, -0.12286376953125, -0.10625457763671875, -0.0896453857421875, -0.07303619384765625, -0.056427001953125, -0.03981781005859375, -0.0232086181640625, -0.00659942626953125, 0.010009765625, 0.02661895751953125, 0.0432281494140625, 0.05983734130859375, 0.076446533203125, 0.09305572509765625, 0.1096649169921875, 0.12627410888671875, 0.14288330078125, 0.15949249267578125, 0.1761016845703125, 0.19271087646484375, 0.209320068359375, 0.22592926025390625, 0.2425384521484375, 0.25914764404296875, 0.2757568359375, 0.29236602783203125, 0.3089752197265625, 0.32558441162109375, 0.342193603515625, 0.35880279541015625, 0.3754119873046875, 0.39202117919921875, 0.40863037109375, 0.42523956298828125, 0.4418487548828125, 0.45845794677734375, 0.475067138671875, 0.49167633056640625, 0.5082855224609375, 0.5248947143554688, 0.54150390625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 6.0, 8.0, 12.0, 23.0, 37.0, 83.0, 185.0, 500.0, 1630.0, 8541.0, 148824.0, 816337.0, 64992.0, 5475.0, 1229.0, 358.0, 150.0, 68.0, 41.0, 16.0, 12.0, 6.0, 6.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.31298828125, -0.3041419982910156, -0.29529571533203125, -0.2864494323730469, -0.2776031494140625, -0.2687568664550781, -0.25991058349609375, -0.2510643005371094, -0.242218017578125, -0.23337173461914062, -0.22452545166015625, -0.21567916870117188, -0.2068328857421875, -0.19798660278320312, -0.18914031982421875, -0.18029403686523438, -0.17144775390625, -0.16260147094726562, -0.15375518798828125, -0.14490890502929688, -0.1360626220703125, -0.12721633911132812, -0.11837005615234375, -0.10952377319335938, -0.100677490234375, -0.09183120727539062, -0.08298492431640625, -0.07413864135742188, -0.0652923583984375, -0.056446075439453125, -0.04759979248046875, -0.038753509521484375, -0.0299072265625, -0.021060943603515625, -0.01221466064453125, -0.003368377685546875, 0.0054779052734375, 0.014324188232421875, 0.02317047119140625, 0.032016754150390625, 0.040863037109375, 0.049709320068359375, 0.05855560302734375, 0.06740188598632812, 0.0762481689453125, 0.08509445190429688, 0.09394073486328125, 0.10278701782226562, 0.11163330078125, 0.12047958374023438, 0.12932586669921875, 0.13817214965820312, 0.1470184326171875, 0.15586471557617188, 0.16471099853515625, 0.17355728149414062, 0.182403564453125, 0.19124984741210938, 0.20009613037109375, 0.20894241333007812, 0.2177886962890625, 0.22663497924804688, 0.23548126220703125, 0.24432754516601562, 0.253173828125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 3.0, 2.0, 5.0, 11.0, 5.0, 11.0, 9.0, 16.0, 16.0, 13.0, 29.0, 27.0, 40.0, 40.0, 62.0, 91.0, 80.0, 102.0, 98.0, 63.0, 57.0, 39.0, 25.0, 32.0, 23.0, 20.0, 21.0, 14.0, 10.0, 8.0, 7.0, 7.0, 3.0, 4.0, 3.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001633167266845703, -0.00015808828175067902, -0.00015285983681678772, -0.00014763139188289642, -0.00014240294694900513, -0.00013717450201511383, -0.00013194605708122253, -0.00012671761214733124, -0.00012148916721343994, -0.00011626072227954865, -0.00011103227734565735, -0.00010580383241176605, -0.00010057538747787476, -9.534694254398346e-05, -9.011849761009216e-05, -8.489005267620087e-05, -7.966160774230957e-05, -7.443316280841827e-05, -6.920471787452698e-05, -6.397627294063568e-05, -5.8747828006744385e-05, -5.351938307285309e-05, -4.829093813896179e-05, -4.3062493205070496e-05, -3.78340482711792e-05, -3.26056033372879e-05, -2.7377158403396606e-05, -2.214871346950531e-05, -1.6920268535614014e-05, -1.1691823601722717e-05, -6.463378667831421e-06, -1.2349337339401245e-06, 3.993511199951172e-06, 9.221956133842468e-06, 1.4450401067733765e-05, 1.967884600162506e-05, 2.4907290935516357e-05, 3.0135735869407654e-05, 3.536418080329895e-05, 4.0592625737190247e-05, 4.582107067108154e-05, 5.104951560497284e-05, 5.6277960538864136e-05, 6.150640547275543e-05, 6.673485040664673e-05, 7.196329534053802e-05, 7.719174027442932e-05, 8.242018520832062e-05, 8.764863014221191e-05, 9.287707507610321e-05, 9.810552000999451e-05, 0.0001033339649438858, 0.0001085624098777771, 0.0001137908548116684, 0.00011901929974555969, 0.000124247744679451, 0.00012947618961334229, 0.00013470463454723358, 0.00013993307948112488, 0.00014516152441501617, 0.00015038996934890747, 0.00015561841428279877, 0.00016084685921669006, 0.00016607530415058136, 0.00017130374908447266]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 4.0, 9.0, 9.0, 15.0, 16.0, 38.0, 66.0, 97.0, 157.0, 335.0, 620.0, 1280.0, 2850.0, 7101.0, 23549.0, 118359.0, 485917.0, 324171.0, 60573.0, 14382.0, 4917.0, 2064.0, 941.0, 450.0, 274.0, 136.0, 85.0, 44.0, 32.0, 15.0, 18.0, 8.0, 9.0, 5.0, 3.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1473388671875, -0.14298057556152344, -0.13862228393554688, -0.1342639923095703, -0.12990570068359375, -0.1255474090576172, -0.12118911743164062, -0.11683082580566406, -0.1124725341796875, -0.10811424255371094, -0.10375595092773438, -0.09939765930175781, -0.09503936767578125, -0.09068107604980469, -0.08632278442382812, -0.08196449279785156, -0.077606201171875, -0.07324790954589844, -0.06888961791992188, -0.06453132629394531, -0.06017303466796875, -0.05581474304199219, -0.051456451416015625, -0.04709815979003906, -0.0427398681640625, -0.03838157653808594, -0.034023284912109375, -0.029664993286132812, -0.02530670166015625, -0.020948410034179688, -0.016590118408203125, -0.012231826782226562, -0.00787353515625, -0.0035152435302734375, 0.000843048095703125, 0.0052013397216796875, 0.00955963134765625, 0.013917922973632812, 0.018276214599609375, 0.022634506225585938, 0.0269927978515625, 0.03135108947753906, 0.035709381103515625, 0.04006767272949219, 0.04442596435546875, 0.04878425598144531, 0.053142547607421875, 0.05750083923339844, 0.061859130859375, 0.06621742248535156, 0.07057571411132812, 0.07493400573730469, 0.07929229736328125, 0.08365058898925781, 0.08800888061523438, 0.09236717224121094, 0.0967254638671875, 0.10108375549316406, 0.10544204711914062, 0.10980033874511719, 0.11415863037109375, 0.11851692199707031, 0.12287521362304688, 0.12723350524902344, 0.131591796875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 6.0, 6.0, 12.0, 12.0, 25.0, 30.0, 44.0, 50.0, 70.0, 72.0, 92.0, 103.0, 90.0, 88.0, 83.0, 50.0, 40.0, 33.0, 31.0, 20.0, 15.0, 6.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1859130859375, -0.18097305297851562, -0.17603302001953125, -0.17109298706054688, -0.1661529541015625, -0.16121292114257812, -0.15627288818359375, -0.15133285522460938, -0.146392822265625, -0.14145278930664062, -0.13651275634765625, -0.13157272338867188, -0.1266326904296875, -0.12169265747070312, -0.11675262451171875, -0.11181259155273438, -0.10687255859375, -0.10193252563476562, -0.09699249267578125, -0.09205245971679688, -0.0871124267578125, -0.08217239379882812, -0.07723236083984375, -0.07229232788085938, -0.067352294921875, -0.062412261962890625, -0.05747222900390625, -0.052532196044921875, -0.0475921630859375, -0.042652130126953125, -0.03771209716796875, -0.032772064208984375, -0.02783203125, -0.022891998291015625, -0.01795196533203125, -0.013011932373046875, -0.0080718994140625, -0.003131866455078125, 0.00180816650390625, 0.006748199462890625, 0.011688232421875, 0.016628265380859375, 0.02156829833984375, 0.026508331298828125, 0.0314483642578125, 0.036388397216796875, 0.04132843017578125, 0.046268463134765625, 0.05120849609375, 0.056148529052734375, 0.06108856201171875, 0.06602859497070312, 0.0709686279296875, 0.07590866088867188, 0.08084869384765625, 0.08578872680664062, 0.090728759765625, 0.09566879272460938, 0.10060882568359375, 0.10554885864257812, 0.1104888916015625, 0.11542892456054688, 0.12036895751953125, 0.12530899047851562, 0.1302490234375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 38.0, 182.0, 546.0, 177.0, 36.0, 19.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.51819610595703, -16.19015884399414, -15.862123489379883, -15.534086227416992, -15.206049919128418, -14.878013610839844, -14.549976348876953, -14.221940040588379, -13.893903732299805, -13.56586742401123, -13.237831115722656, -12.909793853759766, -12.581757545471191, -12.253721237182617, -11.925683975219727, -11.597647666931152, -11.269611358642578, -10.941575050354004, -10.61353874206543, -10.285501480102539, -9.957465171813965, -9.62942886352539, -9.3013916015625, -8.973355293273926, -8.645318984985352, -8.317282676696777, -7.989245891571045, -7.6612091064453125, -7.333172798156738, -7.005136489868164, -6.677099704742432, -6.349062919616699, -6.021025657653809, -5.692989349365234, -5.364952564239502, -5.0369157791137695, -4.708879470825195, -4.380843162536621, -4.052806377410889, -3.7247698307037354, -3.396733283996582, -3.0686967372894287, -2.7406601905822754, -2.412623643875122, -2.0845870971679688, -1.7565505504608154, -1.428514003753662, -1.1004774570465088, -0.7724409103393555, -0.44440436363220215, -0.11636781692504883, 0.2116687297821045, 0.5397052764892578, 0.8677418231964111, 1.1957783699035645, 1.5238149166107178, 1.851851463317871, 2.1798880100250244, 2.5079245567321777, 2.835961103439331, 3.1639976501464844, 3.4920341968536377, 3.820070743560791, 4.148107528686523, 4.476143836975098]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 6.0, 4.0, 7.0, 5.0, 7.0, 5.0, 7.0, 7.0, 16.0, 11.0, 18.0, 22.0, 19.0, 29.0, 23.0, 32.0, 27.0, 41.0, 29.0, 35.0, 48.0, 46.0, 39.0, 37.0, 33.0, 43.0, 36.0, 35.0, 31.0, 39.0, 34.0, 34.0, 22.0, 24.0, 24.0, 12.0, 27.0, 13.0, 14.0, 17.0, 11.0, 6.0, 4.0, 11.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.781054973602295, -2.69256591796875, -2.604076862335205, -2.51558780670166, -2.4270989894866943, -2.3386099338531494, -2.2501208782196045, -2.1616318225860596, -2.0731427669525146, -1.9846537113189697, -1.8961647748947144, -1.8076757192611694, -1.7191866636276245, -1.6306977272033691, -1.5422086715698242, -1.4537196159362793, -1.365230679512024, -1.276741623878479, -1.1882526874542236, -1.0997636318206787, -1.0112745761871338, -0.9227855801582336, -0.8342965841293335, -0.7458075284957886, -0.6573185324668884, -0.5688295364379883, -0.48034048080444336, -0.3918514847755432, -0.3033624589443207, -0.21487343311309814, -0.126384437084198, -0.037895381450653076, 0.05059361457824707, 0.1390826404094696, 0.22757165133953094, 0.3160606622695923, 0.4045496881008148, 0.49303871393203735, 0.5815277099609375, 0.6700167655944824, 0.7585057616233826, 0.8469947576522827, 0.9354838132858276, 1.023972749710083, 1.112461805343628, 1.2009508609771729, 1.2894399166107178, 1.3779289722442627, 1.466417908668518, 1.554906964302063, 1.6433959007263184, 1.7318849563598633, 1.8203740119934082, 1.9088630676269531, 1.9973520040512085, 2.085841178894043, 2.174329996109009, 2.2628190517425537, 2.3513081073760986, 2.4397969245910645, 2.5282859802246094, 2.6167750358581543, 2.705264091491699, 2.793753147125244, 2.882242202758789]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 7.0, 7.0, 13.0, 10.0, 25.0, 47.0, 82.0, 153.0, 352.0, 974.0, 4399.0, 97005.0, 4074987.0, 13397.0, 1883.0, 516.0, 213.0, 110.0, 45.0, 21.0, 13.0, 9.0, 8.0, 5.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.267578125, -2.2013702392578125, -2.135162353515625, -2.0689544677734375, -2.00274658203125, -1.9365386962890625, -1.870330810546875, -1.8041229248046875, -1.7379150390625, -1.6717071533203125, -1.605499267578125, -1.5392913818359375, -1.47308349609375, -1.4068756103515625, -1.340667724609375, -1.2744598388671875, -1.208251953125, -1.1420440673828125, -1.075836181640625, -1.0096282958984375, -0.94342041015625, -0.8772125244140625, -0.811004638671875, -0.7447967529296875, -0.6785888671875, -0.6123809814453125, -0.546173095703125, -0.4799652099609375, -0.41375732421875, -0.3475494384765625, -0.281341552734375, -0.2151336669921875, -0.14892578125, -0.0827178955078125, -0.016510009765625, 0.0496978759765625, 0.11590576171875, 0.1821136474609375, 0.248321533203125, 0.3145294189453125, 0.3807373046875, 0.4469451904296875, 0.513153076171875, 0.5793609619140625, 0.64556884765625, 0.7117767333984375, 0.777984619140625, 0.8441925048828125, 0.910400390625, 0.9766082763671875, 1.042816162109375, 1.1090240478515625, 1.17523193359375, 1.2414398193359375, 1.307647705078125, 1.3738555908203125, 1.4400634765625, 1.5062713623046875, 1.572479248046875, 1.6386871337890625, 1.70489501953125, 1.7711029052734375, 1.837310791015625, 1.9035186767578125, 1.9697265625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 5.0, 10.0, 19.0, 42.0, 55.0, 57.0, 84.0, 101.0, 94.0, 90.0, 90.0, 96.0, 76.0, 61.0, 45.0, 25.0, 15.0, 15.0, 12.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39404296875, -0.38376617431640625, -0.3734893798828125, -0.36321258544921875, -0.352935791015625, -0.34265899658203125, -0.3323822021484375, -0.32210540771484375, -0.31182861328125, -0.30155181884765625, -0.2912750244140625, -0.28099822998046875, -0.270721435546875, -0.26044464111328125, -0.2501678466796875, -0.23989105224609375, -0.2296142578125, -0.21933746337890625, -0.2090606689453125, -0.19878387451171875, -0.188507080078125, -0.17823028564453125, -0.1679534912109375, -0.15767669677734375, -0.14739990234375, -0.13712310791015625, -0.1268463134765625, -0.11656951904296875, -0.106292724609375, -0.09601593017578125, -0.0857391357421875, -0.07546234130859375, -0.065185546875, -0.05490875244140625, -0.0446319580078125, -0.03435516357421875, -0.024078369140625, -0.01380157470703125, -0.0035247802734375, 0.00675201416015625, 0.01702880859375, 0.02730560302734375, 0.0375823974609375, 0.04785919189453125, 0.058135986328125, 0.06841278076171875, 0.0786895751953125, 0.08896636962890625, 0.0992431640625, 0.10951995849609375, 0.1197967529296875, 0.13007354736328125, 0.140350341796875, 0.15062713623046875, 0.1609039306640625, 0.17118072509765625, 0.18145751953125, 0.19173431396484375, 0.2020111083984375, 0.21228790283203125, 0.222564697265625, 0.23284149169921875, 0.2431182861328125, 0.25339508056640625, 0.263671875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 9.0, 4.0, 7.0, 13.0, 14.0, 29.0, 41.0, 41.0, 66.0, 104.0, 149.0, 235.0, 304.0, 628.0, 1121.0, 2502.0, 6753.0, 29823.0, 321798.0, 3713541.0, 94094.0, 14738.0, 4243.0, 1819.0, 857.0, 489.0, 327.0, 190.0, 125.0, 64.0, 70.0, 36.0, 19.0, 14.0, 10.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.546875, -0.5293960571289062, -0.5119171142578125, -0.49443817138671875, -0.476959228515625, -0.45948028564453125, -0.4420013427734375, -0.42452239990234375, -0.40704345703125, -0.38956451416015625, -0.3720855712890625, -0.35460662841796875, -0.337127685546875, -0.31964874267578125, -0.3021697998046875, -0.28469085693359375, -0.2672119140625, -0.24973297119140625, -0.2322540283203125, -0.21477508544921875, -0.197296142578125, -0.17981719970703125, -0.1623382568359375, -0.14485931396484375, -0.12738037109375, -0.10990142822265625, -0.0924224853515625, -0.07494354248046875, -0.057464599609375, -0.03998565673828125, -0.0225067138671875, -0.00502777099609375, 0.012451171875, 0.02993011474609375, 0.0474090576171875, 0.06488800048828125, 0.082366943359375, 0.09984588623046875, 0.1173248291015625, 0.13480377197265625, 0.15228271484375, 0.16976165771484375, 0.1872406005859375, 0.20471954345703125, 0.222198486328125, 0.23967742919921875, 0.2571563720703125, 0.27463531494140625, 0.2921142578125, 0.30959320068359375, 0.3270721435546875, 0.34455108642578125, 0.362030029296875, 0.37950897216796875, 0.3969879150390625, 0.41446685791015625, 0.43194580078125, 0.44942474365234375, 0.4669036865234375, 0.48438262939453125, 0.501861572265625, 0.5193405151367188, 0.5368194580078125, 0.5542984008789062, 0.57177734375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 5.0, 12.0, 21.0, 45.0, 53.0, 108.0, 346.0, 2418.0, 706.0, 175.0, 71.0, 39.0, 26.0, 14.0, 8.0, 6.0, 3.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4052734375, -0.3936004638671875, -0.381927490234375, -0.3702545166015625, -0.35858154296875, -0.3469085693359375, -0.335235595703125, -0.3235626220703125, -0.3118896484375, -0.3002166748046875, -0.288543701171875, -0.2768707275390625, -0.26519775390625, -0.2535247802734375, -0.241851806640625, -0.2301788330078125, -0.218505859375, -0.2068328857421875, -0.195159912109375, -0.1834869384765625, -0.17181396484375, -0.1601409912109375, -0.148468017578125, -0.1367950439453125, -0.1251220703125, -0.1134490966796875, -0.101776123046875, -0.0901031494140625, -0.07843017578125, -0.0667572021484375, -0.055084228515625, -0.0434112548828125, -0.03173828125, -0.0200653076171875, -0.008392333984375, 0.0032806396484375, 0.01495361328125, 0.0266265869140625, 0.038299560546875, 0.0499725341796875, 0.0616455078125, 0.0733184814453125, 0.084991455078125, 0.0966644287109375, 0.10833740234375, 0.1200103759765625, 0.131683349609375, 0.1433563232421875, 0.155029296875, 0.1667022705078125, 0.178375244140625, 0.1900482177734375, 0.20172119140625, 0.2133941650390625, 0.225067138671875, 0.2367401123046875, 0.2484130859375, 0.2600860595703125, 0.271759033203125, 0.2834320068359375, 0.29510498046875, 0.3067779541015625, 0.318450927734375, 0.3301239013671875, 0.341796875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 11.0, 26.0, 92.0, 423.0, 365.0, 64.0, 13.0, 5.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2928340435028076, -1.173526406288147, -1.0542187690734863, -0.9349111914634705, -0.8156035542488098, -0.6962959170341492, -0.5769883394241333, -0.45768070220947266, -0.338373064994812, -0.21906544268131256, -0.09975782036781311, 0.019549787044525146, 0.1388574242591858, 0.25816506147384644, 0.3774726390838623, 0.49678027629852295, 0.6160879135131836, 0.7353955507278442, 0.8547031879425049, 0.9740107655525208, 1.0933184623718262, 1.2126259803771973, 1.331933617591858, 1.4512412548065186, 1.5705488920211792, 1.6898565292358398, 1.8091641664505005, 1.9284718036651611, 2.0477793216705322, 2.1670870780944824, 2.2863945960998535, 2.4057021141052246, 2.5250096321105957, 2.644317150115967, 2.763624906539917, 2.882932424545288, 3.0022401809692383, 3.1215476989746094, 3.2408552169799805, 3.3601629734039307, 3.479470729827881, 3.598778247833252, 3.718086004257202, 3.8373935222625732, 3.9567012786865234, 4.0760087966918945, 4.195316314697266, 4.314623832702637, 4.433931350708008, 4.553238868713379, 4.67254638671875, 4.791854381561279, 4.91116189956665, 5.0304694175720215, 5.149776935577393, 5.269084930419922, 5.388392448425293, 5.507699966430664, 5.627007484436035, 5.7463154792785645, 5.8656229972839355, 5.984930515289307, 6.104238033294678, 6.223546028137207, 6.342853546142578]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 3.0, 6.0, 14.0, 10.0, 13.0, 20.0, 25.0, 20.0, 34.0, 27.0, 44.0, 52.0, 42.0, 56.0, 63.0, 59.0, 67.0, 59.0, 42.0, 47.0, 56.0, 36.0, 41.0, 28.0, 29.0, 28.0, 16.0, 16.0, 14.0, 5.0, 4.0, 7.0, 5.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7749946117401123, -0.7453752756118774, -0.7157559394836426, -0.6861366033554077, -0.6565172076225281, -0.6268978714942932, -0.5972785353660583, -0.5676591992378235, -0.5380398035049438, -0.508420467376709, -0.47880110144615173, -0.44918176531791687, -0.4195623993873596, -0.38994306325912476, -0.3603237271308899, -0.33070439100265503, -0.30108505487442017, -0.2714657187461853, -0.24184635281562805, -0.2122270166873932, -0.18260766565799713, -0.15298831462860107, -0.12336897850036621, -0.09374962747097015, -0.0641302764415741, -0.03451092913746834, -0.004891581833362579, 0.02472776174545288, 0.05434711277484894, 0.083966463804245, 0.11358579993247986, 0.14320515096187592, 0.17282450199127197, 0.20244385302066803, 0.2320632040500641, 0.26168254017829895, 0.2913019061088562, 0.32092124223709106, 0.3505405783653259, 0.3801599144935608, 0.40977928042411804, 0.4393986165523529, 0.46901798248291016, 0.498637318611145, 0.5282566547393799, 0.5578759908676147, 0.5874953269958496, 0.6171147227287292, 0.6467340588569641, 0.676353394985199, 0.7059727311134338, 0.7355921268463135, 0.7652114629745483, 0.7948307991027832, 0.8244501352310181, 0.8540694713592529, 0.8836888074874878, 0.9133081436157227, 0.9429274797439575, 0.9725468158721924, 1.0021661520004272, 1.031785488128662, 1.0614049434661865, 1.0910242795944214, 1.1206436157226562]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 8.0, 9.0, 15.0, 11.0, 14.0, 37.0, 50.0, 67.0, 119.0, 183.0, 358.0, 707.0, 1474.0, 3799.0, 12692.0, 66878.0, 626939.0, 288250.0, 34036.0, 7868.0, 2706.0, 1079.0, 514.0, 284.0, 141.0, 102.0, 62.0, 45.0, 31.0, 19.0, 11.0, 11.0, 4.0, 5.0, 6.0, 6.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.87646484375, -0.8505477905273438, -0.8246307373046875, -0.7987136840820312, -0.772796630859375, -0.7468795776367188, -0.7209625244140625, -0.6950454711914062, -0.66912841796875, -0.6432113647460938, -0.6172943115234375, -0.5913772583007812, -0.565460205078125, -0.5395431518554688, -0.5136260986328125, -0.48770904541015625, -0.4617919921875, -0.43587493896484375, -0.4099578857421875, -0.38404083251953125, -0.358123779296875, -0.33220672607421875, -0.3062896728515625, -0.28037261962890625, -0.25445556640625, -0.22853851318359375, -0.2026214599609375, -0.17670440673828125, -0.150787353515625, -0.12487030029296875, -0.0989532470703125, -0.07303619384765625, -0.047119140625, -0.02120208740234375, 0.0047149658203125, 0.03063201904296875, 0.056549072265625, 0.08246612548828125, 0.1083831787109375, 0.13430023193359375, 0.16021728515625, 0.18613433837890625, 0.2120513916015625, 0.23796844482421875, 0.263885498046875, 0.28980255126953125, 0.3157196044921875, 0.34163665771484375, 0.3675537109375, 0.39347076416015625, 0.4193878173828125, 0.44530487060546875, 0.471221923828125, 0.49713897705078125, 0.5230560302734375, 0.5489730834960938, 0.57489013671875, 0.6008071899414062, 0.6267242431640625, 0.6526412963867188, 0.678558349609375, 0.7044754028320312, 0.7303924560546875, 0.7563095092773438, 0.7822265625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 4.0, 4.0, 5.0, 20.0, 23.0, 46.0, 44.0, 58.0, 77.0, 89.0, 98.0, 84.0, 96.0, 87.0, 75.0, 64.0, 51.0, 30.0, 12.0, 18.0, 9.0, 10.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36962890625, -0.35974884033203125, -0.3498687744140625, -0.33998870849609375, -0.330108642578125, -0.32022857666015625, -0.3103485107421875, -0.30046844482421875, -0.29058837890625, -0.28070831298828125, -0.2708282470703125, -0.26094818115234375, -0.251068115234375, -0.24118804931640625, -0.2313079833984375, -0.22142791748046875, -0.2115478515625, -0.20166778564453125, -0.1917877197265625, -0.18190765380859375, -0.172027587890625, -0.16214752197265625, -0.1522674560546875, -0.14238739013671875, -0.13250732421875, -0.12262725830078125, -0.1127471923828125, -0.10286712646484375, -0.092987060546875, -0.08310699462890625, -0.0732269287109375, -0.06334686279296875, -0.053466796875, -0.04358673095703125, -0.0337066650390625, -0.02382659912109375, -0.013946533203125, -0.00406646728515625, 0.0058135986328125, 0.01569366455078125, 0.02557373046875, 0.03545379638671875, 0.0453338623046875, 0.05521392822265625, 0.065093994140625, 0.07497406005859375, 0.0848541259765625, 0.09473419189453125, 0.1046142578125, 0.11449432373046875, 0.1243743896484375, 0.13425445556640625, 0.144134521484375, 0.15401458740234375, 0.1638946533203125, 0.17377471923828125, 0.18365478515625, 0.19353485107421875, 0.2034149169921875, 0.21329498291015625, 0.223175048828125, 0.23305511474609375, 0.2429351806640625, 0.25281524658203125, 0.2626953125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 8.0, 7.0, 2.0, 10.0, 2.0, 11.0, 15.0, 18.0, 12.0, 29.0, 45.0, 56.0, 65.0, 127.0, 164.0, 297.0, 544.0, 1086.0, 2266.0, 5964.0, 19651.0, 92381.0, 552460.0, 304100.0, 49119.0, 12053.0, 4251.0, 1753.0, 797.0, 466.0, 245.0, 147.0, 118.0, 85.0, 58.0, 34.0, 29.0, 18.0, 16.0, 10.0, 14.0, 7.0, 4.0, 8.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 3.0], "bins": [-0.5439453125, -0.5287551879882812, -0.5135650634765625, -0.49837493896484375, -0.483184814453125, -0.46799468994140625, -0.4528045654296875, -0.43761444091796875, -0.42242431640625, -0.40723419189453125, -0.3920440673828125, -0.37685394287109375, -0.361663818359375, -0.34647369384765625, -0.3312835693359375, -0.31609344482421875, -0.3009033203125, -0.28571319580078125, -0.2705230712890625, -0.25533294677734375, -0.240142822265625, -0.22495269775390625, -0.2097625732421875, -0.19457244873046875, -0.17938232421875, -0.16419219970703125, -0.1490020751953125, -0.13381195068359375, -0.118621826171875, -0.10343170166015625, -0.0882415771484375, -0.07305145263671875, -0.057861328125, -0.04267120361328125, -0.0274810791015625, -0.01229095458984375, 0.002899169921875, 0.01808929443359375, 0.0332794189453125, 0.04846954345703125, 0.06365966796875, 0.07884979248046875, 0.0940399169921875, 0.10923004150390625, 0.124420166015625, 0.13961029052734375, 0.1548004150390625, 0.16999053955078125, 0.1851806640625, 0.20037078857421875, 0.2155609130859375, 0.23075103759765625, 0.245941162109375, 0.26113128662109375, 0.2763214111328125, 0.29151153564453125, 0.30670166015625, 0.32189178466796875, 0.3370819091796875, 0.35227203369140625, 0.367462158203125, 0.38265228271484375, 0.3978424072265625, 0.41303253173828125, 0.42822265625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 8.0, 5.0, 9.0, 6.0, 12.0, 13.0, 17.0, 13.0, 26.0, 18.0, 35.0, 35.0, 31.0, 49.0, 39.0, 48.0, 48.0, 57.0, 52.0, 52.0, 45.0, 42.0, 43.0, 43.0, 32.0, 41.0, 41.0, 24.0, 17.0, 21.0, 18.0, 19.0, 12.0, 7.0, 6.0, 7.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.6298828125, -0.608551025390625, -0.58721923828125, -0.565887451171875, -0.5445556640625, -0.523223876953125, -0.50189208984375, -0.480560302734375, -0.459228515625, -0.437896728515625, -0.41656494140625, -0.395233154296875, -0.3739013671875, -0.352569580078125, -0.33123779296875, -0.309906005859375, -0.28857421875, -0.267242431640625, -0.24591064453125, -0.224578857421875, -0.2032470703125, -0.181915283203125, -0.16058349609375, -0.139251708984375, -0.117919921875, -0.096588134765625, -0.07525634765625, -0.053924560546875, -0.0325927734375, -0.011260986328125, 0.01007080078125, 0.031402587890625, 0.052734375, 0.074066162109375, 0.09539794921875, 0.116729736328125, 0.1380615234375, 0.159393310546875, 0.18072509765625, 0.202056884765625, 0.223388671875, 0.244720458984375, 0.26605224609375, 0.287384033203125, 0.3087158203125, 0.330047607421875, 0.35137939453125, 0.372711181640625, 0.39404296875, 0.415374755859375, 0.43670654296875, 0.458038330078125, 0.4793701171875, 0.500701904296875, 0.52203369140625, 0.543365478515625, 0.564697265625, 0.586029052734375, 0.60736083984375, 0.628692626953125, 0.6500244140625, 0.671356201171875, 0.69268798828125, 0.714019775390625, 0.7353515625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 8.0, 4.0, 14.0, 22.0, 75.0, 264.0, 1369.0, 819029.0, 226354.0, 1075.0, 224.0, 68.0, 20.0, 13.0, 12.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1201171875, -1.08270263671875, -1.0452880859375, -1.00787353515625, -0.970458984375, -0.93304443359375, -0.8956298828125, -0.85821533203125, -0.82080078125, -0.78338623046875, -0.7459716796875, -0.70855712890625, -0.671142578125, -0.63372802734375, -0.5963134765625, -0.55889892578125, -0.521484375, -0.48406982421875, -0.4466552734375, -0.40924072265625, -0.371826171875, -0.33441162109375, -0.2969970703125, -0.25958251953125, -0.22216796875, -0.18475341796875, -0.1473388671875, -0.10992431640625, -0.072509765625, -0.03509521484375, 0.0023193359375, 0.03973388671875, 0.0771484375, 0.11456298828125, 0.1519775390625, 0.18939208984375, 0.226806640625, 0.26422119140625, 0.3016357421875, 0.33905029296875, 0.37646484375, 0.41387939453125, 0.4512939453125, 0.48870849609375, 0.526123046875, 0.56353759765625, 0.6009521484375, 0.63836669921875, 0.67578125, 0.71319580078125, 0.7506103515625, 0.78802490234375, 0.825439453125, 0.86285400390625, 0.9002685546875, 0.93768310546875, 0.97509765625, 1.01251220703125, 1.0499267578125, 1.08734130859375, 1.124755859375, 1.16217041015625, 1.1995849609375, 1.23699951171875, 1.2744140625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 9.0, 23.0, 94.0, 455.0, 341.0, 57.0, 18.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0020198822021484375, -0.001982402056455612, -0.0019449219107627869, -0.0019074417650699615, -0.0018699616193771362, -0.001832481473684311, -0.0017950013279914856, -0.0017575211822986603, -0.001720041036605835, -0.0016825608909130096, -0.0016450807452201843, -0.001607600599527359, -0.0015701204538345337, -0.0015326403081417084, -0.001495160162448883, -0.0014576800167560577, -0.0014201998710632324, -0.001382719725370407, -0.0013452395796775818, -0.0013077594339847565, -0.0012702792882919312, -0.0012327991425991058, -0.0011953189969062805, -0.0011578388512134552, -0.0011203587055206299, -0.0010828785598278046, -0.0010453984141349792, -0.001007918268442154, -0.0009704381227493286, -0.0009329579770565033, -0.000895477831363678, -0.0008579976856708527, -0.0008205175399780273, -0.000783037394285202, -0.0007455572485923767, -0.0007080771028995514, -0.0006705969572067261, -0.0006331168115139008, -0.0005956366658210754, -0.0005581565201282501, -0.0005206763744354248, -0.0004831962287425995, -0.00044571608304977417, -0.00040823593735694885, -0.00037075579166412354, -0.0003332756459712982, -0.0002957955002784729, -0.0002583153545856476, -0.00022083520889282227, -0.00018335506319999695, -0.00014587491750717163, -0.00010839477181434631, -7.0914626121521e-05, -3.343448042869568e-05, 4.045665264129639e-06, 4.1525810956954956e-05, 7.900595664978027e-05, 0.00011648610234260559, 0.0001539662480354309, 0.00019144639372825623, 0.00022892653942108154, 0.00026640668511390686, 0.0003038868308067322, 0.0003413669764995575, 0.0003788471221923828]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 3.0, 6.0, 12.0, 34.0, 59.0, 120.0, 223.0, 1086.0, 781437.0, 264365.0, 786.0, 234.0, 82.0, 49.0, 27.0, 13.0, 11.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.564453125, -1.5242919921875, -1.484130859375, -1.4439697265625, -1.40380859375, -1.3636474609375, -1.323486328125, -1.2833251953125, -1.2431640625, -1.2030029296875, -1.162841796875, -1.1226806640625, -1.08251953125, -1.0423583984375, -1.002197265625, -0.9620361328125, -0.921875, -0.8817138671875, -0.841552734375, -0.8013916015625, -0.76123046875, -0.7210693359375, -0.680908203125, -0.6407470703125, -0.6005859375, -0.5604248046875, -0.520263671875, -0.4801025390625, -0.43994140625, -0.3997802734375, -0.359619140625, -0.3194580078125, -0.279296875, -0.2391357421875, -0.198974609375, -0.1588134765625, -0.11865234375, -0.0784912109375, -0.038330078125, 0.0018310546875, 0.0419921875, 0.0821533203125, 0.122314453125, 0.1624755859375, 0.20263671875, 0.2427978515625, 0.282958984375, 0.3231201171875, 0.36328125, 0.4034423828125, 0.443603515625, 0.4837646484375, 0.52392578125, 0.5640869140625, 0.604248046875, 0.6444091796875, 0.6845703125, 0.7247314453125, 0.764892578125, 0.8050537109375, 0.84521484375, 0.8853759765625, 0.925537109375, 0.9656982421875, 1.005859375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 10.0, 47.0, 387.0, 487.0, 67.0, 12.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7109375, -1.668212890625, -1.62548828125, -1.582763671875, -1.5400390625, -1.497314453125, -1.45458984375, -1.411865234375, -1.369140625, -1.326416015625, -1.28369140625, -1.240966796875, -1.1982421875, -1.155517578125, -1.11279296875, -1.070068359375, -1.02734375, -0.984619140625, -0.94189453125, -0.899169921875, -0.8564453125, -0.813720703125, -0.77099609375, -0.728271484375, -0.685546875, -0.642822265625, -0.60009765625, -0.557373046875, -0.5146484375, -0.471923828125, -0.42919921875, -0.386474609375, -0.34375, -0.301025390625, -0.25830078125, -0.215576171875, -0.1728515625, -0.130126953125, -0.08740234375, -0.044677734375, -0.001953125, 0.040771484375, 0.08349609375, 0.126220703125, 0.1689453125, 0.211669921875, 0.25439453125, 0.297119140625, 0.33984375, 0.382568359375, 0.42529296875, 0.468017578125, 0.5107421875, 0.553466796875, 0.59619140625, 0.638916015625, 0.681640625, 0.724365234375, 0.76708984375, 0.809814453125, 0.8525390625, 0.895263671875, 0.93798828125, 0.980712890625, 1.0234375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 7.0, 15.0, 208.0, 558.0, 167.0, 39.0, 11.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.039624214172363, -13.681843757629395, -13.324064254760742, -12.966283798217773, -12.608504295349121, -12.250723838806152, -11.8929443359375, -11.535163879394531, -11.177383422851562, -10.819602966308594, -10.461823463439941, -10.104043006896973, -9.74626350402832, -9.388483047485352, -9.030702590942383, -8.67292308807373, -8.315143585205078, -7.957363605499268, -7.599583625793457, -7.241803169250488, -6.884023666381836, -6.526243209838867, -6.168463230133057, -5.810683250427246, -5.4529032707214355, -5.095123291015625, -4.7373433113098145, -4.379563331604004, -4.021782875061035, -3.6640031337738037, -3.306222915649414, -2.9484429359436035, -2.5906620025634766, -2.232882022857666, -1.875101923942566, -1.5173218250274658, -1.1595418453216553, -0.8017618656158447, -0.4439816474914551, -0.08620166778564453, 0.271578311920166, 0.6293583512306213, 0.9871383905410767, 1.3449184894561768, 1.7026984691619873, 2.060478448867798, 2.4182586669921875, 2.776038646697998, 3.1338186264038086, 3.491598606109619, 3.8493785858154297, 4.207159042358398, 4.564938545227051, 4.9227190017700195, 5.28049898147583, 5.638278961181641, 5.996058940887451, 6.353838920593262, 6.711618900299072, 7.069398880004883, 7.427179336547852, 7.784958839416504, 8.142739295959473, 8.500518798828125, 8.858299255371094]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 5.0, 7.0, 12.0, 6.0, 6.0, 17.0, 15.0, 18.0, 16.0, 18.0, 20.0, 29.0, 21.0, 20.0, 28.0, 41.0, 30.0, 42.0, 28.0, 39.0, 43.0, 32.0, 42.0, 52.0, 45.0, 47.0, 38.0, 38.0, 26.0, 23.0, 34.0, 26.0, 28.0, 11.0, 14.0, 14.0, 12.0, 12.0, 10.0, 8.0, 6.0, 5.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.8073842525482178, -2.716726779937744, -2.6260693073272705, -2.535411834716797, -2.444754123687744, -2.3540966510772705, -2.263439178466797, -2.1727817058563232, -2.0821242332458496, -1.991466760635376, -1.9008092880249023, -1.8101516962051392, -1.7194942235946655, -1.628836750984192, -1.5381791591644287, -1.447521686553955, -1.3568642139434814, -1.2662067413330078, -1.1755492687225342, -1.084891676902771, -0.9942342042922974, -0.9035767316818237, -0.8129191994667053, -0.7222616672515869, -0.6316041946411133, -0.5409467220306396, -0.45028918981552124, -0.3596316874027252, -0.2689741849899292, -0.17831668257713318, -0.08765918016433716, 0.00299835205078125, 0.09365558624267578, 0.1843130886554718, 0.2749705910682678, 0.36562809348106384, 0.45628559589385986, 0.5469430685043335, 0.6376006007194519, 0.7282581329345703, 0.818915605545044, 0.9095730781555176, 1.0002305507659912, 1.0908881425857544, 1.181545615196228, 1.2722030878067017, 1.3628606796264648, 1.4535181522369385, 1.544175624847412, 1.6348330974578857, 1.7254905700683594, 1.8161481618881226, 1.9068056344985962, 1.9974631071090698, 2.088120698928833, 2.1787781715393066, 2.2694356441497803, 2.360093116760254, 2.4507505893707275, 2.541408061981201, 2.632065773010254, 2.7227232456207275, 2.813380718231201, 2.904038190841675, 2.9946956634521484]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 2.0, 3.0, 11.0, 12.0, 7.0, 26.0, 37.0, 55.0, 82.0, 118.0, 191.0, 386.0, 816.0, 2295.0, 9424.0, 100956.0, 4014250.0, 55652.0, 6811.0, 1747.0, 658.0, 326.0, 185.0, 102.0, 52.0, 24.0, 17.0, 13.0, 13.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94189453125, -0.9087295532226562, -0.8755645751953125, -0.8423995971679688, -0.809234619140625, -0.7760696411132812, -0.7429046630859375, -0.7097396850585938, -0.67657470703125, -0.6434097290039062, -0.6102447509765625, -0.5770797729492188, -0.543914794921875, -0.5107498168945312, -0.4775848388671875, -0.44441986083984375, -0.4112548828125, -0.37808990478515625, -0.3449249267578125, -0.31175994873046875, -0.278594970703125, -0.24542999267578125, -0.2122650146484375, -0.17910003662109375, -0.14593505859375, -0.11277008056640625, -0.0796051025390625, -0.04644012451171875, -0.013275146484375, 0.01988983154296875, 0.0530548095703125, 0.08621978759765625, 0.119384765625, 0.15254974365234375, 0.1857147216796875, 0.21887969970703125, 0.252044677734375, 0.28520965576171875, 0.3183746337890625, 0.35153961181640625, 0.38470458984375, 0.41786956787109375, 0.4510345458984375, 0.48419952392578125, 0.517364501953125, 0.5505294799804688, 0.5836944580078125, 0.6168594360351562, 0.6500244140625, 0.6831893920898438, 0.7163543701171875, 0.7495193481445312, 0.782684326171875, 0.8158493041992188, 0.8490142822265625, 0.8821792602539062, 0.91534423828125, 0.9485092163085938, 0.9816741943359375, 1.0148391723632812, 1.048004150390625, 1.0811691284179688, 1.1143341064453125, 1.1474990844726562, 1.1806640625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 7.0, 10.0, 14.0, 27.0, 34.0, 34.0, 51.0, 58.0, 57.0, 78.0, 99.0, 90.0, 87.0, 72.0, 77.0, 55.0, 53.0, 32.0, 25.0, 17.0, 18.0, 2.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.374267578125, -0.36423492431640625, -0.3542022705078125, -0.34416961669921875, -0.334136962890625, -0.32410430908203125, -0.3140716552734375, -0.30403900146484375, -0.29400634765625, -0.28397369384765625, -0.2739410400390625, -0.26390838623046875, -0.253875732421875, -0.24384307861328125, -0.2338104248046875, -0.22377777099609375, -0.2137451171875, -0.20371246337890625, -0.1936798095703125, -0.18364715576171875, -0.173614501953125, -0.16358184814453125, -0.1535491943359375, -0.14351654052734375, -0.13348388671875, -0.12345123291015625, -0.1134185791015625, -0.10338592529296875, -0.093353271484375, -0.08332061767578125, -0.0732879638671875, -0.06325531005859375, -0.05322265625, -0.04319000244140625, -0.0331573486328125, -0.02312469482421875, -0.013092041015625, -0.00305938720703125, 0.0069732666015625, 0.01700592041015625, 0.02703857421875, 0.03707122802734375, 0.0471038818359375, 0.05713653564453125, 0.067169189453125, 0.07720184326171875, 0.0872344970703125, 0.09726715087890625, 0.1072998046875, 0.11733245849609375, 0.1273651123046875, 0.13739776611328125, 0.147430419921875, 0.15746307373046875, 0.1674957275390625, 0.17752838134765625, 0.18756103515625, 0.19759368896484375, 0.2076263427734375, 0.21765899658203125, 0.227691650390625, 0.23772430419921875, 0.2477569580078125, 0.25778961181640625, 0.267822265625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 8.0, 12.0, 9.0, 10.0, 9.0, 20.0, 18.0, 29.0, 38.0, 58.0, 67.0, 100.0, 172.0, 271.0, 544.0, 1136.0, 2979.0, 11607.0, 128478.0, 3969921.0, 65629.0, 8463.0, 2468.0, 1040.0, 483.0, 246.0, 160.0, 103.0, 60.0, 41.0, 29.0, 16.0, 11.0, 16.0, 12.0, 12.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.86474609375, -0.8403167724609375, -0.815887451171875, -0.7914581298828125, -0.76702880859375, -0.7425994873046875, -0.718170166015625, -0.6937408447265625, -0.6693115234375, -0.6448822021484375, -0.620452880859375, -0.5960235595703125, -0.57159423828125, -0.5471649169921875, -0.522735595703125, -0.4983062744140625, -0.473876953125, -0.4494476318359375, -0.425018310546875, -0.4005889892578125, -0.37615966796875, -0.3517303466796875, -0.327301025390625, -0.3028717041015625, -0.2784423828125, -0.2540130615234375, -0.229583740234375, -0.2051544189453125, -0.18072509765625, -0.1562957763671875, -0.131866455078125, -0.1074371337890625, -0.0830078125, -0.0585784912109375, -0.034149169921875, -0.0097198486328125, 0.01470947265625, 0.0391387939453125, 0.063568115234375, 0.0879974365234375, 0.1124267578125, 0.1368560791015625, 0.161285400390625, 0.1857147216796875, 0.21014404296875, 0.2345733642578125, 0.259002685546875, 0.2834320068359375, 0.307861328125, 0.3322906494140625, 0.356719970703125, 0.3811492919921875, 0.40557861328125, 0.4300079345703125, 0.454437255859375, 0.4788665771484375, 0.5032958984375, 0.5277252197265625, 0.552154541015625, 0.5765838623046875, 0.60101318359375, 0.6254425048828125, 0.649871826171875, 0.6743011474609375, 0.69873046875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 12.0, 18.0, 24.0, 56.0, 235.0, 2617.0, 867.0, 142.0, 48.0, 19.0, 14.0, 7.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0], "bins": [-0.697265625, -0.6826953887939453, -0.6681251525878906, -0.6535549163818359, -0.6389846801757812, -0.6244144439697266, -0.6098442077636719, -0.5952739715576172, -0.5807037353515625, -0.5661334991455078, -0.5515632629394531, -0.5369930267333984, -0.5224227905273438, -0.5078525543212891, -0.4932823181152344, -0.4787120819091797, -0.464141845703125, -0.4495716094970703, -0.4350013732910156, -0.42043113708496094, -0.40586090087890625, -0.39129066467285156, -0.3767204284667969, -0.3621501922607422, -0.3475799560546875, -0.3330097198486328, -0.3184394836425781, -0.30386924743652344, -0.28929901123046875, -0.27472877502441406, -0.2601585388183594, -0.2455883026123047, -0.23101806640625, -0.2164478302001953, -0.20187759399414062, -0.18730735778808594, -0.17273712158203125, -0.15816688537597656, -0.14359664916992188, -0.1290264129638672, -0.1144561767578125, -0.09988594055175781, -0.08531570434570312, -0.07074546813964844, -0.05617523193359375, -0.04160499572753906, -0.027034759521484375, -0.012464523315429688, 0.002105712890625, 0.016675949096679688, 0.031246185302734375, 0.04581642150878906, 0.06038665771484375, 0.07495689392089844, 0.08952713012695312, 0.10409736633300781, 0.1186676025390625, 0.1332378387451172, 0.14780807495117188, 0.16237831115722656, 0.17694854736328125, 0.19151878356933594, 0.20608901977539062, 0.2206592559814453, 0.2352294921875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 10.0, 16.0, 44.0, 100.0, 210.0, 298.0, 196.0, 75.0, 29.0, 5.0, 3.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5799061059951782, -1.5246837139129639, -1.469461441040039, -1.4142390489578247, -1.3590166568756104, -1.303794264793396, -1.2485718727111816, -1.1933495998382568, -1.1381272077560425, -1.0829048156738281, -1.0276825428009033, -0.972460150718689, -0.9172377586364746, -0.8620153665542603, -0.8067930340766907, -0.7515707015991211, -0.6963483095169067, -0.6411259174346924, -0.5859035849571228, -0.5306812524795532, -0.47545886039733887, -0.4202364981174469, -0.36501413583755493, -0.30979177355766296, -0.254569411277771, -0.19934704899787903, -0.14412468671798706, -0.08890232443809509, -0.033679962158203125, 0.021542400121688843, 0.07676476240158081, 0.13198712468147278, 0.1872096061706543, 0.24243196845054626, 0.29765433073043823, 0.3528766930103302, 0.40809905529022217, 0.46332141757011414, 0.5185437798500061, 0.5737661123275757, 0.62898850440979, 0.6842108964920044, 0.739433228969574, 0.7946555614471436, 0.8498779535293579, 0.9051003456115723, 0.9603226780891418, 1.0155450105667114, 1.0707674026489258, 1.1259897947311401, 1.1812121868133545, 1.2364344596862793, 1.2916568517684937, 1.346879243850708, 1.4021015167236328, 1.4573239088058472, 1.5125463008880615, 1.5677686929702759, 1.6229910850524902, 1.678213357925415, 1.7334357500076294, 1.7886581420898438, 1.8438804149627686, 1.899102807044983, 1.9543251991271973]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 4.0, 3.0, 4.0, 6.0, 20.0, 14.0, 22.0, 34.0, 32.0, 40.0, 40.0, 43.0, 60.0, 70.0, 57.0, 58.0, 55.0, 56.0, 62.0, 51.0, 51.0, 45.0, 44.0, 31.0, 17.0, 18.0, 16.0, 7.0, 15.0, 6.0, 8.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.018858790397644, -0.9912204742431641, -0.9635821580886841, -0.9359437823295593, -0.9083054661750793, -0.8806671500205994, -0.8530288338661194, -0.8253904581069946, -0.7977521419525146, -0.7701138257980347, -0.7424755096435547, -0.7148371338844299, -0.68719881772995, -0.65956050157547, -0.63192218542099, -0.6042838096618652, -0.5766454935073853, -0.5490071773529053, -0.5213688611984253, -0.4937305152416229, -0.46609216928482056, -0.4384538531303406, -0.4108155369758606, -0.3831771910190582, -0.35553890466690063, -0.32790058851242065, -0.3002622425556183, -0.2726239264011383, -0.24498558044433594, -0.21734726428985596, -0.18970893323421478, -0.1620706021785736, -0.13443225622177124, -0.10679392516613007, -0.07915559411048889, -0.051517270505428314, -0.02387893944978714, 0.0037593841552734375, 0.03139771521091461, 0.059036046266555786, 0.08667437732219696, 0.11431270837783813, 0.1419510394334793, 0.16958937048912048, 0.19722768664360046, 0.22486601769924164, 0.2525043487548828, 0.2801426649093628, 0.30778101086616516, 0.33541932702064514, 0.3630576729774475, 0.3906959891319275, 0.41833433508872986, 0.44597265124320984, 0.4736109972000122, 0.5012493133544922, 0.5288876295089722, 0.5565259456634521, 0.5841642618179321, 0.6118026375770569, 0.6394409537315369, 0.6670792698860168, 0.6947175860404968, 0.7223559617996216, 0.7499942779541016]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 9.0, 4.0, 3.0, 15.0, 16.0, 20.0, 41.0, 76.0, 132.0, 205.0, 402.0, 842.0, 2593.0, 12676.0, 103998.0, 770211.0, 136763.0, 15650.0, 3002.0, 1009.0, 375.0, 208.0, 107.0, 78.0, 53.0, 31.0, 16.0, 9.0, 5.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.96435546875, -0.9356155395507812, -0.9068756103515625, -0.8781356811523438, -0.849395751953125, -0.8206558227539062, -0.7919158935546875, -0.7631759643554688, -0.73443603515625, -0.7056961059570312, -0.6769561767578125, -0.6482162475585938, -0.619476318359375, -0.5907363891601562, -0.5619964599609375, -0.5332565307617188, -0.5045166015625, -0.47577667236328125, -0.4470367431640625, -0.41829681396484375, -0.389556884765625, -0.36081695556640625, -0.3320770263671875, -0.30333709716796875, -0.27459716796875, -0.24585723876953125, -0.2171173095703125, -0.18837738037109375, -0.159637451171875, -0.13089752197265625, -0.1021575927734375, -0.07341766357421875, -0.044677734375, -0.01593780517578125, 0.0128021240234375, 0.04154205322265625, 0.070281982421875, 0.09902191162109375, 0.1277618408203125, 0.15650177001953125, 0.18524169921875, 0.21398162841796875, 0.2427215576171875, 0.27146148681640625, 0.300201416015625, 0.32894134521484375, 0.3576812744140625, 0.38642120361328125, 0.4151611328125, 0.44390106201171875, 0.4726409912109375, 0.5013809204101562, 0.530120849609375, 0.5588607788085938, 0.5876007080078125, 0.6163406372070312, 0.64508056640625, 0.6738204956054688, 0.7025604248046875, 0.7313003540039062, 0.760040283203125, 0.7887802124023438, 0.8175201416015625, 0.8462600708007812, 0.875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 13.0, 19.0, 25.0, 41.0, 46.0, 57.0, 67.0, 75.0, 106.0, 103.0, 74.0, 91.0, 70.0, 68.0, 50.0, 33.0, 30.0, 16.0, 8.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.399658203125, -0.38896942138671875, -0.3782806396484375, -0.36759185791015625, -0.356903076171875, -0.34621429443359375, -0.3355255126953125, -0.32483673095703125, -0.31414794921875, -0.30345916748046875, -0.2927703857421875, -0.28208160400390625, -0.271392822265625, -0.26070404052734375, -0.2500152587890625, -0.23932647705078125, -0.2286376953125, -0.21794891357421875, -0.2072601318359375, -0.19657135009765625, -0.185882568359375, -0.17519378662109375, -0.1645050048828125, -0.15381622314453125, -0.14312744140625, -0.13243865966796875, -0.1217498779296875, -0.11106109619140625, -0.100372314453125, -0.08968353271484375, -0.0789947509765625, -0.06830596923828125, -0.0576171875, -0.04692840576171875, -0.0362396240234375, -0.02555084228515625, -0.014862060546875, -0.00417327880859375, 0.0065155029296875, 0.01720428466796875, 0.02789306640625, 0.03858184814453125, 0.0492706298828125, 0.05995941162109375, 0.070648193359375, 0.08133697509765625, 0.0920257568359375, 0.10271453857421875, 0.1134033203125, 0.12409210205078125, 0.1347808837890625, 0.14546966552734375, 0.156158447265625, 0.16684722900390625, 0.1775360107421875, 0.18822479248046875, 0.19891357421875, 0.20960235595703125, 0.2202911376953125, 0.23097991943359375, 0.241668701171875, 0.25235748291015625, 0.2630462646484375, 0.27373504638671875, 0.284423828125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 9.0, 8.0, 3.0, 9.0, 9.0, 5.0, 14.0, 18.0, 40.0, 57.0, 68.0, 107.0, 166.0, 277.0, 492.0, 1132.0, 3168.0, 10520.0, 47042.0, 306125.0, 558289.0, 94188.0, 18367.0, 4950.0, 1797.0, 707.0, 356.0, 181.0, 135.0, 80.0, 57.0, 38.0, 46.0, 31.0, 17.0, 8.0, 7.0, 9.0, 5.0, 3.0, 8.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46533203125, -0.45041656494140625, -0.4355010986328125, -0.42058563232421875, -0.405670166015625, -0.39075469970703125, -0.3758392333984375, -0.36092376708984375, -0.34600830078125, -0.33109283447265625, -0.3161773681640625, -0.30126190185546875, -0.286346435546875, -0.27143096923828125, -0.2565155029296875, -0.24160003662109375, -0.2266845703125, -0.21176910400390625, -0.1968536376953125, -0.18193817138671875, -0.167022705078125, -0.15210723876953125, -0.1371917724609375, -0.12227630615234375, -0.10736083984375, -0.09244537353515625, -0.0775299072265625, -0.06261444091796875, -0.047698974609375, -0.03278350830078125, -0.0178680419921875, -0.00295257568359375, 0.011962890625, 0.02687835693359375, 0.0417938232421875, 0.05670928955078125, 0.071624755859375, 0.08654022216796875, 0.1014556884765625, 0.11637115478515625, 0.13128662109375, 0.14620208740234375, 0.1611175537109375, 0.17603302001953125, 0.190948486328125, 0.20586395263671875, 0.2207794189453125, 0.23569488525390625, 0.2506103515625, 0.26552581787109375, 0.2804412841796875, 0.29535675048828125, 0.310272216796875, 0.32518768310546875, 0.3401031494140625, 0.35501861572265625, 0.36993408203125, 0.38484954833984375, 0.3997650146484375, 0.41468048095703125, 0.429595947265625, 0.44451141357421875, 0.4594268798828125, 0.47434234619140625, 0.4892578125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 3.0, 7.0, 9.0, 15.0, 13.0, 9.0, 21.0, 20.0, 22.0, 30.0, 36.0, 43.0, 33.0, 52.0, 40.0, 37.0, 46.0, 53.0, 40.0, 54.0, 49.0, 41.0, 41.0, 47.0, 28.0, 36.0, 25.0, 21.0, 27.0, 19.0, 17.0, 11.0, 15.0, 10.0, 3.0, 10.0, 9.0, 7.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.650390625, -0.629425048828125, -0.60845947265625, -0.587493896484375, -0.5665283203125, -0.545562744140625, -0.52459716796875, -0.503631591796875, -0.482666015625, -0.461700439453125, -0.44073486328125, -0.419769287109375, -0.3988037109375, -0.377838134765625, -0.35687255859375, -0.335906982421875, -0.31494140625, -0.293975830078125, -0.27301025390625, -0.252044677734375, -0.2310791015625, -0.210113525390625, -0.18914794921875, -0.168182373046875, -0.147216796875, -0.126251220703125, -0.10528564453125, -0.084320068359375, -0.0633544921875, -0.042388916015625, -0.02142333984375, -0.000457763671875, 0.0205078125, 0.041473388671875, 0.06243896484375, 0.083404541015625, 0.1043701171875, 0.125335693359375, 0.14630126953125, 0.167266845703125, 0.188232421875, 0.209197998046875, 0.23016357421875, 0.251129150390625, 0.2720947265625, 0.293060302734375, 0.31402587890625, 0.334991455078125, 0.35595703125, 0.376922607421875, 0.39788818359375, 0.418853759765625, 0.4398193359375, 0.460784912109375, 0.48175048828125, 0.502716064453125, 0.523681640625, 0.544647216796875, 0.56561279296875, 0.586578369140625, 0.6075439453125, 0.628509521484375, 0.64947509765625, 0.670440673828125, 0.69140625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 6.0, 6.0, 14.0, 25.0, 30.0, 43.0, 52.0, 75.0, 114.0, 130.0, 282.0, 479.0, 1260.0, 5710.0, 59262.0, 704925.0, 256334.0, 15674.0, 2383.0, 790.0, 380.0, 209.0, 116.0, 82.0, 53.0, 45.0, 21.0, 16.0, 7.0, 7.0, 4.0, 10.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.193603515625, -0.18686866760253906, -0.18013381958007812, -0.1733989715576172, -0.16666412353515625, -0.1599292755126953, -0.15319442749023438, -0.14645957946777344, -0.1397247314453125, -0.13298988342285156, -0.12625503540039062, -0.11952018737792969, -0.11278533935546875, -0.10605049133300781, -0.09931564331054688, -0.09258079528808594, -0.085845947265625, -0.07911109924316406, -0.07237625122070312, -0.06564140319824219, -0.05890655517578125, -0.05217170715332031, -0.045436859130859375, -0.03870201110839844, -0.0319671630859375, -0.025232315063476562, -0.018497467041015625, -0.011762619018554688, -0.00502777099609375, 0.0017070770263671875, 0.008441925048828125, 0.015176773071289062, 0.02191162109375, 0.028646469116210938, 0.035381317138671875, 0.04211616516113281, 0.04885101318359375, 0.05558586120605469, 0.062320709228515625, 0.06905555725097656, 0.0757904052734375, 0.08252525329589844, 0.08926010131835938, 0.09599494934082031, 0.10272979736328125, 0.10946464538574219, 0.11619949340820312, 0.12293434143066406, 0.129669189453125, 0.13640403747558594, 0.14313888549804688, 0.1498737335205078, 0.15660858154296875, 0.1633434295654297, 0.17007827758789062, 0.17681312561035156, 0.1835479736328125, 0.19028282165527344, 0.19701766967773438, 0.2037525177001953, 0.21048736572265625, 0.2172222137451172, 0.22395706176757812, 0.23069190979003906, 0.2374267578125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 7.0, 15.0, 31.0, 87.0, 270.0, 358.0, 137.0, 57.0, 24.0, 11.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0008192062377929688, -0.0008028671145439148, -0.0007865279912948608, -0.0007701888680458069, -0.0007538497447967529, -0.000737510621547699, -0.000721171498298645, -0.0007048323750495911, -0.0006884932518005371, -0.0006721541285514832, -0.0006558150053024292, -0.0006394758820533752, -0.0006231367588043213, -0.0006067976355552673, -0.0005904585123062134, -0.0005741193890571594, -0.0005577802658081055, -0.0005414411425590515, -0.0005251020193099976, -0.0005087628960609436, -0.0004924237728118896, -0.0004760846495628357, -0.00045974552631378174, -0.0004434064030647278, -0.00042706727981567383, -0.0004107281565666199, -0.0003943890333175659, -0.00037804991006851196, -0.000361710786819458, -0.00034537166357040405, -0.0003290325403213501, -0.00031269341707229614, -0.0002963542938232422, -0.00028001517057418823, -0.0002636760473251343, -0.0002473369240760803, -0.00023099780082702637, -0.0002146586775779724, -0.00019831955432891846, -0.0001819804310798645, -0.00016564130783081055, -0.0001493021845817566, -0.00013296306133270264, -0.00011662393808364868, -0.00010028481483459473, -8.394569158554077e-05, -6.760656833648682e-05, -5.126744508743286e-05, -3.4928321838378906e-05, -1.858919858932495e-05, -2.250075340270996e-06, 1.4089047908782959e-05, 3.0428171157836914e-05, 4.676729440689087e-05, 6.310641765594482e-05, 7.944554090499878e-05, 9.578466415405273e-05, 0.00011212378740310669, 0.00012846291065216064, 0.0001448020339012146, 0.00016114115715026855, 0.0001774802803993225, 0.00019381940364837646, 0.00021015852689743042, 0.00022649765014648438]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 1.0, 3.0, 4.0, 10.0, 12.0, 26.0, 25.0, 49.0, 83.0, 128.0, 265.0, 568.0, 1418.0, 4315.0, 26251.0, 392611.0, 572882.0, 41242.0, 5591.0, 1690.0, 652.0, 320.0, 159.0, 102.0, 52.0, 34.0, 20.0, 18.0, 7.0, 8.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.189208984375, -0.18270492553710938, -0.17620086669921875, -0.16969680786132812, -0.1631927490234375, -0.15668869018554688, -0.15018463134765625, -0.14368057250976562, -0.137176513671875, -0.13067245483398438, -0.12416839599609375, -0.11766433715820312, -0.1111602783203125, -0.10465621948242188, -0.09815216064453125, -0.09164810180664062, -0.08514404296875, -0.07863998413085938, -0.07213592529296875, -0.06563186645507812, -0.0591278076171875, -0.052623748779296875, -0.04611968994140625, -0.039615631103515625, -0.033111572265625, -0.026607513427734375, -0.02010345458984375, -0.013599395751953125, -0.0070953369140625, -0.000591278076171875, 0.00591278076171875, 0.012416839599609375, 0.0189208984375, 0.025424957275390625, 0.03192901611328125, 0.038433074951171875, 0.0449371337890625, 0.051441192626953125, 0.05794525146484375, 0.06444931030273438, 0.070953369140625, 0.07745742797851562, 0.08396148681640625, 0.09046554565429688, 0.0969696044921875, 0.10347366333007812, 0.10997772216796875, 0.11648178100585938, 0.12298583984375, 0.12948989868164062, 0.13599395751953125, 0.14249801635742188, 0.1490020751953125, 0.15550613403320312, 0.16201019287109375, 0.16851425170898438, 0.175018310546875, 0.18152236938476562, 0.18802642822265625, 0.19453048706054688, 0.2010345458984375, 0.20753860473632812, 0.21404266357421875, 0.22054672241210938, 0.22705078125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 7.0, 19.0, 30.0, 53.0, 96.0, 149.0, 202.0, 175.0, 100.0, 71.0, 40.0, 25.0, 10.0, 11.0, 4.0, 4.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25537109375, -0.2450103759765625, -0.234649658203125, -0.2242889404296875, -0.21392822265625, -0.2035675048828125, -0.193206787109375, -0.1828460693359375, -0.1724853515625, -0.1621246337890625, -0.151763916015625, -0.1414031982421875, -0.13104248046875, -0.1206817626953125, -0.110321044921875, -0.0999603271484375, -0.089599609375, -0.0792388916015625, -0.068878173828125, -0.0585174560546875, -0.04815673828125, -0.0377960205078125, -0.027435302734375, -0.0170745849609375, -0.0067138671875, 0.0036468505859375, 0.014007568359375, 0.0243682861328125, 0.03472900390625, 0.0450897216796875, 0.055450439453125, 0.0658111572265625, 0.076171875, 0.0865325927734375, 0.096893310546875, 0.1072540283203125, 0.11761474609375, 0.1279754638671875, 0.138336181640625, 0.1486968994140625, 0.1590576171875, 0.1694183349609375, 0.179779052734375, 0.1901397705078125, 0.20050048828125, 0.2108612060546875, 0.221221923828125, 0.2315826416015625, 0.241943359375, 0.2523040771484375, 0.262664794921875, 0.2730255126953125, 0.28338623046875, 0.2937469482421875, 0.304107666015625, 0.3144683837890625, 0.3248291015625, 0.3351898193359375, 0.345550537109375, 0.3559112548828125, 0.36627197265625, 0.3766326904296875, 0.386993408203125, 0.3973541259765625, 0.40771484375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 19.0, 145.0, 495.0, 259.0, 62.0, 14.0, 9.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.169074058532715, -6.876773834228516, -6.584473133087158, -6.292172431945801, -5.999872207641602, -5.707571983337402, -5.415271282196045, -5.1229705810546875, -4.830670356750488, -4.538370132446289, -4.246069431304932, -3.9537689685821533, -3.661468505859375, -3.3691680431365967, -3.0768675804138184, -2.78456711769104, -2.4922666549682617, -2.1999661922454834, -1.907665729522705, -1.6153652667999268, -1.3230648040771484, -1.0307643413543701, -0.7384638786315918, -0.4461634159088135, -0.15386295318603516, 0.13843750953674316, 0.4307379722595215, 0.7230384349822998, 1.0153388977050781, 1.3076393604278564, 1.5999398231506348, 1.892240285873413, 2.184539794921875, 2.4768402576446533, 2.7691407203674316, 3.06144118309021, 3.3537416458129883, 3.6460421085357666, 3.938342571258545, 4.230643272399902, 4.522943496704102, 4.815243721008301, 5.107544422149658, 5.399845123291016, 5.692145347595215, 5.984445571899414, 6.2767462730407715, 6.569046974182129, 6.861347198486328, 7.153647422790527, 7.445948123931885, 7.738248825073242, 8.030549049377441, 8.32284927368164, 8.615150451660156, 8.907450675964355, 9.199750900268555, 9.492051124572754, 9.784351348876953, 10.076652526855469, 10.368952751159668, 10.661252975463867, 10.953554153442383, 11.245854377746582, 11.538154602050781]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 6.0, 1.0, 2.0, 9.0, 7.0, 7.0, 7.0, 8.0, 10.0, 9.0, 13.0, 16.0, 21.0, 20.0, 16.0, 37.0, 26.0, 27.0, 34.0, 33.0, 34.0, 31.0, 43.0, 34.0, 43.0, 49.0, 40.0, 36.0, 45.0, 29.0, 30.0, 44.0, 25.0, 23.0, 21.0, 32.0, 22.0, 17.0, 20.0, 14.0, 16.0, 10.0, 11.0, 7.0, 3.0, 9.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.585902214050293, -2.4994189739227295, -2.412935495376587, -2.3264522552490234, -2.239968776702881, -2.1534855365753174, -2.067002296447754, -1.9805189371109009, -1.8940355777740479, -1.8075522184371948, -1.7210688591003418, -1.6345856189727783, -1.5481022596359253, -1.4616189002990723, -1.3751356601715088, -1.2886523008346558, -1.2021689414978027, -1.1156855821609497, -1.0292022228240967, -0.9427189826965332, -0.8562356233596802, -0.7697522640228271, -0.6832689642906189, -0.5967856645584106, -0.5103023052215576, -0.423818975687027, -0.33733564615249634, -0.2508523166179657, -0.16436898708343506, -0.07788565754890442, 0.00859767198562622, 0.09508097171783447, 0.1815643310546875, 0.26804766058921814, 0.3545309901237488, 0.4410143196582794, 0.5274976491928101, 0.6139810085296631, 0.7004643082618713, 0.7869476079940796, 0.8734309673309326, 0.9599143266677856, 1.0463976860046387, 1.1328809261322021, 1.2193642854690552, 1.3058476448059082, 1.3923308849334717, 1.4788142442703247, 1.5652976036071777, 1.6517809629440308, 1.7382643222808838, 1.8247475624084473, 1.9112309217453003, 1.9977142810821533, 2.084197521209717, 2.1706809997558594, 2.257164239883423, 2.3436474800109863, 2.430130958557129, 2.5166141986846924, 2.603097438812256, 2.6895809173583984, 2.776064157485962, 2.8625473976135254, 2.949030876159668]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 9.0, 8.0, 10.0, 18.0, 39.0, 45.0, 70.0, 120.0, 230.0, 444.0, 1026.0, 2250.0, 6045.0, 20469.0, 285254.0, 3832270.0, 32991.0, 7907.0, 2721.0, 1178.0, 531.0, 254.0, 146.0, 85.0, 50.0, 32.0, 21.0, 21.0, 12.0, 5.0, 3.0, 1.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1650390625, -1.1298828125, -1.0947265625, -1.0595703125, -1.0244140625, -0.9892578125, -0.9541015625, -0.9189453125, -0.8837890625, -0.8486328125, -0.8134765625, -0.7783203125, -0.7431640625, -0.7080078125, -0.6728515625, -0.6376953125, -0.6025390625, -0.5673828125, -0.5322265625, -0.4970703125, -0.4619140625, -0.4267578125, -0.3916015625, -0.3564453125, -0.3212890625, -0.2861328125, -0.2509765625, -0.2158203125, -0.1806640625, -0.1455078125, -0.1103515625, -0.0751953125, -0.0400390625, -0.0048828125, 0.0302734375, 0.0654296875, 0.1005859375, 0.1357421875, 0.1708984375, 0.2060546875, 0.2412109375, 0.2763671875, 0.3115234375, 0.3466796875, 0.3818359375, 0.4169921875, 0.4521484375, 0.4873046875, 0.5224609375, 0.5576171875, 0.5927734375, 0.6279296875, 0.6630859375, 0.6982421875, 0.7333984375, 0.7685546875, 0.8037109375, 0.8388671875, 0.8740234375, 0.9091796875, 0.9443359375, 0.9794921875, 1.0146484375, 1.0498046875, 1.0849609375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 4.0, 12.0, 19.0, 12.0, 22.0, 40.0, 40.0, 56.0, 54.0, 64.0, 75.0, 80.0, 79.0, 82.0, 77.0, 59.0, 61.0, 49.0, 38.0, 31.0, 23.0, 12.0, 8.0, 5.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.358154296875, -0.3479766845703125, -0.337799072265625, -0.3276214599609375, -0.31744384765625, -0.3072662353515625, -0.297088623046875, -0.2869110107421875, -0.2767333984375, -0.2665557861328125, -0.256378173828125, -0.2462005615234375, -0.23602294921875, -0.2258453369140625, -0.215667724609375, -0.2054901123046875, -0.1953125, -0.1851348876953125, -0.174957275390625, -0.1647796630859375, -0.15460205078125, -0.1444244384765625, -0.134246826171875, -0.1240692138671875, -0.1138916015625, -0.1037139892578125, -0.093536376953125, -0.0833587646484375, -0.07318115234375, -0.0630035400390625, -0.052825927734375, -0.0426483154296875, -0.032470703125, -0.0222930908203125, -0.012115478515625, -0.0019378662109375, 0.00823974609375, 0.0184173583984375, 0.028594970703125, 0.0387725830078125, 0.0489501953125, 0.0591278076171875, 0.069305419921875, 0.0794830322265625, 0.08966064453125, 0.0998382568359375, 0.110015869140625, 0.1201934814453125, 0.13037109375, 0.1405487060546875, 0.150726318359375, 0.1609039306640625, 0.17108154296875, 0.1812591552734375, 0.191436767578125, 0.2016143798828125, 0.2117919921875, 0.2219696044921875, 0.232147216796875, 0.2423248291015625, 0.25250244140625, 0.2626800537109375, 0.272857666015625, 0.2830352783203125, 0.293212890625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 1.0, 8.0, 11.0, 15.0, 24.0, 28.0, 36.0, 62.0, 94.0, 154.0, 354.0, 685.0, 1738.0, 6766.0, 61963.0, 4047341.0, 64561.0, 7075.0, 1782.0, 734.0, 370.0, 158.0, 110.0, 58.0, 39.0, 36.0, 19.0, 19.0, 16.0, 15.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93798828125, -0.9061965942382812, -0.8744049072265625, -0.8426132202148438, -0.810821533203125, -0.7790298461914062, -0.7472381591796875, -0.7154464721679688, -0.68365478515625, -0.6518630981445312, -0.6200714111328125, -0.5882797241210938, -0.556488037109375, -0.5246963500976562, -0.4929046630859375, -0.46111297607421875, -0.4293212890625, -0.39752960205078125, -0.3657379150390625, -0.33394622802734375, -0.302154541015625, -0.27036285400390625, -0.2385711669921875, -0.20677947998046875, -0.17498779296875, -0.14319610595703125, -0.1114044189453125, -0.07961273193359375, -0.047821044921875, -0.01602935791015625, 0.0157623291015625, 0.04755401611328125, 0.079345703125, 0.11113739013671875, 0.1429290771484375, 0.17472076416015625, 0.206512451171875, 0.23830413818359375, 0.2700958251953125, 0.30188751220703125, 0.33367919921875, 0.36547088623046875, 0.3972625732421875, 0.42905426025390625, 0.460845947265625, 0.49263763427734375, 0.5244293212890625, 0.5562210083007812, 0.5880126953125, 0.6198043823242188, 0.6515960693359375, 0.6833877563476562, 0.715179443359375, 0.7469711303710938, 0.7787628173828125, 0.8105545043945312, 0.84234619140625, 0.8741378784179688, 0.9059295654296875, 0.9377212524414062, 0.969512939453125, 1.0013046264648438, 1.0330963134765625, 1.0648880004882812, 1.0966796875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 6.0, 9.0, 27.0, 21.0, 93.0, 447.0, 3199.0, 152.0, 56.0, 22.0, 23.0, 9.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.374267578125, -0.3557853698730469, -0.33730316162109375, -0.3188209533691406, -0.3003387451171875, -0.2818565368652344, -0.26337432861328125, -0.24489212036132812, -0.226409912109375, -0.20792770385742188, -0.18944549560546875, -0.17096328735351562, -0.1524810791015625, -0.13399887084960938, -0.11551666259765625, -0.09703445434570312, -0.07855224609375, -0.060070037841796875, -0.04158782958984375, -0.023105621337890625, -0.0046234130859375, 0.013858795166015625, 0.03234100341796875, 0.050823211669921875, 0.069305419921875, 0.08778762817382812, 0.10626983642578125, 0.12475204467773438, 0.1432342529296875, 0.16171646118164062, 0.18019866943359375, 0.19868087768554688, 0.2171630859375, 0.23564529418945312, 0.25412750244140625, 0.2726097106933594, 0.2910919189453125, 0.3095741271972656, 0.32805633544921875, 0.3465385437011719, 0.365020751953125, 0.3835029602050781, 0.40198516845703125, 0.4204673767089844, 0.4389495849609375, 0.4574317932128906, 0.47591400146484375, 0.4943962097167969, 0.51287841796875, 0.5313606262207031, 0.5498428344726562, 0.5683250427246094, 0.5868072509765625, 0.6052894592285156, 0.6237716674804688, 0.6422538757324219, 0.660736083984375, 0.6792182922363281, 0.6977005004882812, 0.7161827087402344, 0.7346649169921875, 0.7531471252441406, 0.7716293334960938, 0.7901115417480469, 0.80859375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 14.0, 30.0, 147.0, 493.0, 225.0, 59.0, 11.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8485846519470215, -1.7629787921905518, -1.6773728132247925, -1.5917669534683228, -1.506161093711853, -1.4205551147460938, -1.334949254989624, -1.2493433952331543, -1.1637375354766846, -1.0781316757202148, -0.9925257563591003, -0.9069198369979858, -0.8213139772415161, -0.7357080578804016, -0.6501021385192871, -0.5644962787628174, -0.4788902997970581, -0.393284410238266, -0.3076785206794739, -0.22207260131835938, -0.13646671175956726, -0.050860822200775146, 0.034745097160339355, 0.12035095691680908, 0.20595687627792358, 0.2915627658367157, 0.3771686553955078, 0.4627745747566223, 0.5483804941177368, 0.6339863538742065, 0.719592273235321, 0.8051981329917908, 0.8908040523529053, 0.9764099717140198, 1.0620158910751343, 1.147621750831604, 1.2332276105880737, 1.318833589553833, 1.4044394493103027, 1.4900453090667725, 1.5756511688232422, 1.661257028579712, 1.7468630075454712, 1.832468867301941, 1.9180747270584106, 2.00368070602417, 2.0892865657806396, 2.1748924255371094, 2.260498523712158, 2.346104383468628, 2.4317102432250977, 2.5173163414001465, 2.602922201156616, 2.688528060913086, 2.7741339206695557, 2.8597397804260254, 2.945345640182495, 3.030951499938965, 3.1165573596954346, 3.2021632194519043, 3.287769317626953, 3.373375177383423, 3.4589810371398926, 3.5445868968963623, 3.630192756652832]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 13.0, 5.0, 10.0, 16.0, 24.0, 42.0, 49.0, 54.0, 47.0, 68.0, 78.0, 64.0, 80.0, 61.0, 58.0, 65.0, 60.0, 35.0, 30.0, 38.0, 28.0, 20.0, 13.0, 8.0, 11.0, 12.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.15854811668396, -1.1239628791809082, -1.089377522468567, -1.0547922849655151, -1.0202069282531738, -0.9856216907501221, -0.9510364532470703, -0.9164511561393738, -0.8818658590316772, -0.8472805619239807, -0.8126952648162842, -0.7781100273132324, -0.7435247302055359, -0.7089394330978394, -0.6743541955947876, -0.6397688984870911, -0.6051836013793945, -0.570598304271698, -0.5360130071640015, -0.5014277696609497, -0.4668424725532532, -0.43225717544555664, -0.3976719081401825, -0.36308664083480835, -0.3285013437271118, -0.2939160466194153, -0.25933077931404114, -0.2247454971075058, -0.19016021490097046, -0.15557493269443512, -0.12098965048789978, -0.08640436828136444, -0.0518190860748291, -0.017233803868293762, 0.017351478338241577, 0.051936760544776917, 0.08652204275131226, 0.1211073249578476, 0.15569260716438293, 0.19027788937091827, 0.2248631715774536, 0.25944846868515015, 0.2940337359905243, 0.32861900329589844, 0.36320430040359497, 0.3977895975112915, 0.43237486481666565, 0.4669601321220398, 0.5015454292297363, 0.5361307263374329, 0.5707160234451294, 0.6053012609481812, 0.6398865580558777, 0.6744718551635742, 0.709057092666626, 0.7436423897743225, 0.778227686882019, 0.8128129839897156, 0.8473982810974121, 0.8819835186004639, 0.9165688157081604, 0.9511541128158569, 0.9857393503189087, 1.02032470703125, 1.0549099445343018]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 1.0, 7.0, 7.0, 11.0, 22.0, 29.0, 49.0, 66.0, 114.0, 191.0, 360.0, 684.0, 1570.0, 4413.0, 15428.0, 69977.0, 416285.0, 440600.0, 74658.0, 16097.0, 4644.0, 1748.0, 754.0, 330.0, 176.0, 119.0, 84.0, 43.0, 30.0, 20.0, 12.0, 11.0, 1.0, 3.0, 5.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.705078125, -0.6849441528320312, -0.6648101806640625, -0.6446762084960938, -0.624542236328125, -0.6044082641601562, -0.5842742919921875, -0.5641403198242188, -0.54400634765625, -0.5238723754882812, -0.5037384033203125, -0.48360443115234375, -0.463470458984375, -0.44333648681640625, -0.4232025146484375, -0.40306854248046875, -0.3829345703125, -0.36280059814453125, -0.3426666259765625, -0.32253265380859375, -0.302398681640625, -0.28226470947265625, -0.2621307373046875, -0.24199676513671875, -0.22186279296875, -0.20172882080078125, -0.1815948486328125, -0.16146087646484375, -0.141326904296875, -0.12119293212890625, -0.1010589599609375, -0.08092498779296875, -0.060791015625, -0.04065704345703125, -0.0205230712890625, -0.00038909912109375, 0.019744873046875, 0.03987884521484375, 0.0600128173828125, 0.08014678955078125, 0.10028076171875, 0.12041473388671875, 0.1405487060546875, 0.16068267822265625, 0.180816650390625, 0.20095062255859375, 0.2210845947265625, 0.24121856689453125, 0.2613525390625, 0.28148651123046875, 0.3016204833984375, 0.32175445556640625, 0.341888427734375, 0.36202239990234375, 0.3821563720703125, 0.40229034423828125, 0.42242431640625, 0.44255828857421875, 0.4626922607421875, 0.48282623291015625, 0.502960205078125, 0.5230941772460938, 0.5432281494140625, 0.5633621215820312, 0.58349609375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 6.0, 10.0, 10.0, 17.0, 21.0, 28.0, 40.0, 46.0, 50.0, 60.0, 63.0, 72.0, 76.0, 75.0, 82.0, 83.0, 52.0, 53.0, 33.0, 48.0, 32.0, 23.0, 12.0, 6.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34033203125, -0.33028411865234375, -0.3202362060546875, -0.31018829345703125, -0.300140380859375, -0.29009246826171875, -0.2800445556640625, -0.26999664306640625, -0.25994873046875, -0.24990081787109375, -0.2398529052734375, -0.22980499267578125, -0.219757080078125, -0.20970916748046875, -0.1996612548828125, -0.18961334228515625, -0.1795654296875, -0.16951751708984375, -0.1594696044921875, -0.14942169189453125, -0.139373779296875, -0.12932586669921875, -0.1192779541015625, -0.10923004150390625, -0.09918212890625, -0.08913421630859375, -0.0790863037109375, -0.06903839111328125, -0.058990478515625, -0.04894256591796875, -0.0388946533203125, -0.02884674072265625, -0.018798828125, -0.00875091552734375, 0.0012969970703125, 0.01134490966796875, 0.021392822265625, 0.03144073486328125, 0.0414886474609375, 0.05153656005859375, 0.06158447265625, 0.07163238525390625, 0.0816802978515625, 0.09172821044921875, 0.101776123046875, 0.11182403564453125, 0.1218719482421875, 0.13191986083984375, 0.1419677734375, 0.15201568603515625, 0.1620635986328125, 0.17211151123046875, 0.182159423828125, 0.19220733642578125, 0.2022552490234375, 0.21230316162109375, 0.22235107421875, 0.23239898681640625, 0.2424468994140625, 0.25249481201171875, 0.262542724609375, 0.27259063720703125, 0.2826385498046875, 0.29268646240234375, 0.302734375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 5.0, 3.0, 6.0, 10.0, 7.0, 9.0, 20.0, 17.0, 30.0, 49.0, 53.0, 112.0, 167.0, 264.0, 525.0, 893.0, 1907.0, 4621.0, 14690.0, 69489.0, 498534.0, 384432.0, 52984.0, 11962.0, 3970.0, 1698.0, 893.0, 443.0, 271.0, 145.0, 110.0, 59.0, 52.0, 27.0, 22.0, 16.0, 15.0, 7.0, 8.0, 6.0, 5.0, 3.0, 8.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.5576171875, -0.540679931640625, -0.52374267578125, -0.506805419921875, -0.4898681640625, -0.472930908203125, -0.45599365234375, -0.439056396484375, -0.422119140625, -0.405181884765625, -0.38824462890625, -0.371307373046875, -0.3543701171875, -0.337432861328125, -0.32049560546875, -0.303558349609375, -0.28662109375, -0.269683837890625, -0.25274658203125, -0.235809326171875, -0.2188720703125, -0.201934814453125, -0.18499755859375, -0.168060302734375, -0.151123046875, -0.134185791015625, -0.11724853515625, -0.100311279296875, -0.0833740234375, -0.066436767578125, -0.04949951171875, -0.032562255859375, -0.015625, 0.001312255859375, 0.01824951171875, 0.035186767578125, 0.0521240234375, 0.069061279296875, 0.08599853515625, 0.102935791015625, 0.119873046875, 0.136810302734375, 0.15374755859375, 0.170684814453125, 0.1876220703125, 0.204559326171875, 0.22149658203125, 0.238433837890625, 0.25537109375, 0.272308349609375, 0.28924560546875, 0.306182861328125, 0.3231201171875, 0.340057373046875, 0.35699462890625, 0.373931884765625, 0.390869140625, 0.407806396484375, 0.42474365234375, 0.441680908203125, 0.4586181640625, 0.475555419921875, 0.49249267578125, 0.509429931640625, 0.5263671875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 9.0, 7.0, 6.0, 11.0, 16.0, 21.0, 30.0, 31.0, 39.0, 53.0, 58.0, 59.0, 61.0, 62.0, 55.0, 65.0, 61.0, 68.0, 49.0, 46.0, 40.0, 32.0, 28.0, 18.0, 22.0, 12.0, 9.0, 7.0, 4.0, 3.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.03125, -0.9936676025390625, -0.956085205078125, -0.9185028076171875, -0.88092041015625, -0.8433380126953125, -0.805755615234375, -0.7681732177734375, -0.7305908203125, -0.6930084228515625, -0.655426025390625, -0.6178436279296875, -0.58026123046875, -0.5426788330078125, -0.505096435546875, -0.4675140380859375, -0.429931640625, -0.3923492431640625, -0.354766845703125, -0.3171844482421875, -0.27960205078125, -0.2420196533203125, -0.204437255859375, -0.1668548583984375, -0.1292724609375, -0.0916900634765625, -0.054107666015625, -0.0165252685546875, 0.02105712890625, 0.0586395263671875, 0.096221923828125, 0.1338043212890625, 0.17138671875, 0.2089691162109375, 0.246551513671875, 0.2841339111328125, 0.32171630859375, 0.3592987060546875, 0.396881103515625, 0.4344635009765625, 0.4720458984375, 0.5096282958984375, 0.547210693359375, 0.5847930908203125, 0.62237548828125, 0.6599578857421875, 0.697540283203125, 0.7351226806640625, 0.772705078125, 0.8102874755859375, 0.847869873046875, 0.8854522705078125, 0.92303466796875, 0.9606170654296875, 0.998199462890625, 1.0357818603515625, 1.0733642578125, 1.1109466552734375, 1.148529052734375, 1.1861114501953125, 1.22369384765625, 1.2612762451171875, 1.298858642578125, 1.3364410400390625, 1.3740234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 5.0, 2.0, 10.0, 14.0, 12.0, 32.0, 28.0, 47.0, 76.0, 158.0, 360.0, 864.0, 2877.0, 20156.0, 597151.0, 408264.0, 14670.0, 2385.0, 755.0, 293.0, 157.0, 89.0, 51.0, 32.0, 10.0, 9.0, 16.0, 8.0, 3.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.301513671875, -0.2917671203613281, -0.28202056884765625, -0.2722740173339844, -0.2625274658203125, -0.2527809143066406, -0.24303436279296875, -0.23328781127929688, -0.223541259765625, -0.21379470825195312, -0.20404815673828125, -0.19430160522460938, -0.1845550537109375, -0.17480850219726562, -0.16506195068359375, -0.15531539916992188, -0.14556884765625, -0.13582229614257812, -0.12607574462890625, -0.11632919311523438, -0.1065826416015625, -0.09683609008789062, -0.08708953857421875, -0.07734298706054688, -0.067596435546875, -0.057849884033203125, -0.04810333251953125, -0.038356781005859375, -0.0286102294921875, -0.018863677978515625, -0.00911712646484375, 0.000629425048828125, 0.0103759765625, 0.020122528076171875, 0.02986907958984375, 0.039615631103515625, 0.0493621826171875, 0.059108734130859375, 0.06885528564453125, 0.07860183715820312, 0.088348388671875, 0.09809494018554688, 0.10784149169921875, 0.11758804321289062, 0.1273345947265625, 0.13708114624023438, 0.14682769775390625, 0.15657424926757812, 0.16632080078125, 0.17606735229492188, 0.18581390380859375, 0.19556045532226562, 0.2053070068359375, 0.21505355834960938, 0.22480010986328125, 0.23454666137695312, 0.244293212890625, 0.2540397644042969, 0.26378631591796875, 0.2735328674316406, 0.2832794189453125, 0.2930259704589844, 0.30277252197265625, 0.3125190734863281, 0.322265625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 5.0, 9.0, 14.0, 18.0, 36.0, 38.0, 54.0, 67.0, 112.0, 201.0, 156.0, 89.0, 62.0, 43.0, 35.0, 26.0, 14.0, 9.0, 5.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00030612945556640625, -0.0002986006438732147, -0.0002910718321800232, -0.00028354302048683167, -0.00027601420879364014, -0.0002684853971004486, -0.0002609565854072571, -0.00025342777371406555, -0.000245898962020874, -0.0002383701503276825, -0.00023084133863449097, -0.00022331252694129944, -0.0002157837152481079, -0.00020825490355491638, -0.00020072609186172485, -0.00019319728016853333, -0.0001856684684753418, -0.00017813965678215027, -0.00017061084508895874, -0.0001630820333957672, -0.00015555322170257568, -0.00014802441000938416, -0.00014049559831619263, -0.0001329667866230011, -0.00012543797492980957, -0.00011790916323661804, -0.00011038035154342651, -0.00010285153985023499, -9.532272815704346e-05, -8.779391646385193e-05, -8.02651047706604e-05, -7.273629307746887e-05, -6.520748138427734e-05, -5.7678669691085815e-05, -5.014985799789429e-05, -4.262104630470276e-05, -3.509223461151123e-05, -2.7563422918319702e-05, -2.0034611225128174e-05, -1.2505799531936646e-05, -4.976987838745117e-06, 2.551823854446411e-06, 1.008063554763794e-05, 1.7609447240829468e-05, 2.5138258934020996e-05, 3.2667070627212524e-05, 4.019588232040405e-05, 4.772469401359558e-05, 5.525350570678711e-05, 6.278231739997864e-05, 7.031112909317017e-05, 7.78399407863617e-05, 8.536875247955322e-05, 9.289756417274475e-05, 0.00010042637586593628, 0.00010795518755912781, 0.00011548399925231934, 0.00012301281094551086, 0.0001305416226387024, 0.00013807043433189392, 0.00014559924602508545, 0.00015312805771827698, 0.0001606568694114685, 0.00016818568110466003, 0.00017571449279785156]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 6.0, 6.0, 9.0, 15.0, 31.0, 49.0, 64.0, 177.0, 353.0, 921.0, 2841.0, 14686.0, 167288.0, 752761.0, 95496.0, 10169.0, 2275.0, 751.0, 286.0, 151.0, 98.0, 58.0, 18.0, 17.0, 13.0, 6.0, 8.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.242919921875, -0.23465728759765625, -0.2263946533203125, -0.21813201904296875, -0.209869384765625, -0.20160675048828125, -0.1933441162109375, -0.18508148193359375, -0.17681884765625, -0.16855621337890625, -0.1602935791015625, -0.15203094482421875, -0.143768310546875, -0.13550567626953125, -0.1272430419921875, -0.11898040771484375, -0.1107177734375, -0.10245513916015625, -0.0941925048828125, -0.08592987060546875, -0.077667236328125, -0.06940460205078125, -0.0611419677734375, -0.05287933349609375, -0.04461669921875, -0.03635406494140625, -0.0280914306640625, -0.01982879638671875, -0.011566162109375, -0.00330352783203125, 0.0049591064453125, 0.01322174072265625, 0.021484375, 0.02974700927734375, 0.0380096435546875, 0.04627227783203125, 0.054534912109375, 0.06279754638671875, 0.0710601806640625, 0.07932281494140625, 0.08758544921875, 0.09584808349609375, 0.1041107177734375, 0.11237335205078125, 0.120635986328125, 0.12889862060546875, 0.1371612548828125, 0.14542388916015625, 0.1536865234375, 0.16194915771484375, 0.1702117919921875, 0.17847442626953125, 0.186737060546875, 0.19499969482421875, 0.2032623291015625, 0.21152496337890625, 0.21978759765625, 0.22805023193359375, 0.2363128662109375, 0.24457550048828125, 0.252838134765625, 0.26110076904296875, 0.2693634033203125, 0.27762603759765625, 0.285888671875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 14.0, 14.0, 23.0, 33.0, 33.0, 46.0, 71.0, 111.0, 141.0, 163.0, 120.0, 63.0, 54.0, 30.0, 26.0, 13.0, 17.0, 8.0, 7.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.334716796875, -0.3231315612792969, -0.31154632568359375, -0.2999610900878906, -0.2883758544921875, -0.2767906188964844, -0.26520538330078125, -0.2536201477050781, -0.242034912109375, -0.23044967651367188, -0.21886444091796875, -0.20727920532226562, -0.1956939697265625, -0.18410873413085938, -0.17252349853515625, -0.16093826293945312, -0.14935302734375, -0.13776779174804688, -0.12618255615234375, -0.11459732055664062, -0.1030120849609375, -0.09142684936523438, -0.07984161376953125, -0.06825637817382812, -0.056671142578125, -0.045085906982421875, -0.03350067138671875, -0.021915435791015625, -0.0103302001953125, 0.001255035400390625, 0.01284027099609375, 0.024425506591796875, 0.0360107421875, 0.047595977783203125, 0.05918121337890625, 0.07076644897460938, 0.0823516845703125, 0.09393692016601562, 0.10552215576171875, 0.11710739135742188, 0.128692626953125, 0.14027786254882812, 0.15186309814453125, 0.16344833374023438, 0.1750335693359375, 0.18661880493164062, 0.19820404052734375, 0.20978927612304688, 0.22137451171875, 0.23295974731445312, 0.24454498291015625, 0.2561302185058594, 0.2677154541015625, 0.2793006896972656, 0.29088592529296875, 0.3024711608886719, 0.314056396484375, 0.3256416320800781, 0.33722686767578125, 0.3488121032714844, 0.3603973388671875, 0.3719825744628906, 0.38356781005859375, 0.3951530456542969, 0.40673828125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 7.0, 15.0, 30.0, 45.0, 104.0, 207.0, 253.0, 158.0, 81.0, 46.0, 28.0, 8.0, 6.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.850019931793213, -2.675107717514038, -2.500195264816284, -2.3252830505371094, -2.1503705978393555, -1.9754583835601807, -1.8005461692810059, -1.6256338357925415, -1.4507215023040771, -1.2758091688156128, -1.1008968353271484, -0.9259846210479736, -0.7510722875595093, -0.5761599540710449, -0.4012477397918701, -0.22633540630340576, -0.051423072814941406, 0.12348923087120056, 0.29840153455734253, 0.4733138084411621, 0.6482261419296265, 0.8231384754180908, 0.9980506896972656, 1.17296302318573, 1.3478753566741943, 1.5227876901626587, 1.697700023651123, 1.8726122379302979, 2.0475244522094727, 2.2224369049072266, 2.3973491191864014, 2.572261333465576, 2.7471742630004883, 2.922086477279663, 3.096998929977417, 3.271911144256592, 3.4468235969543457, 3.6217358112335205, 3.7966480255126953, 3.971560478210449, 4.146472930908203, 4.321385383605957, 4.496297359466553, 4.671209812164307, 4.8461222648620605, 5.021034240722656, 5.19594669342041, 5.370859146118164, 5.54577112197876, 5.720683574676514, 5.895595550537109, 6.070508003234863, 6.245420455932617, 6.420332908630371, 6.595244884490967, 6.770157337188721, 6.945069313049316, 7.11998176574707, 7.294893741607666, 7.46980619430542, 7.644718647003174, 7.8196306228637695, 7.994543075561523, 8.169455528259277, 8.344367980957031]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 5.0, 9.0, 6.0, 6.0, 7.0, 22.0, 15.0, 14.0, 18.0, 20.0, 33.0, 17.0, 39.0, 26.0, 35.0, 35.0, 35.0, 48.0, 35.0, 50.0, 52.0, 43.0, 42.0, 35.0, 42.0, 35.0, 35.0, 32.0, 27.0, 28.0, 30.0, 23.0, 15.0, 15.0, 11.0, 10.0, 8.0, 9.0, 10.0, 5.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.188874244689941, -5.028903961181641, -4.868933200836182, -4.708962917327881, -4.54899263381958, -4.389021873474121, -4.22905158996582, -4.0690813064575195, -3.9091107845306396, -3.7491402626037598, -3.589169979095459, -3.429199457168579, -3.269228935241699, -3.1092586517333984, -2.9492881298065186, -2.7893176078796387, -2.629347324371338, -2.469376802444458, -2.3094065189361572, -2.1494359970092773, -1.989465594291687, -1.8294951915740967, -1.6695246696472168, -1.5095542669296265, -1.3495838642120361, -1.1896134614944458, -1.0296430587768555, -0.8696725368499756, -0.7097021341323853, -0.5497317314147949, -0.3897612690925598, -0.2297908067703247, -0.06982040405273438, 0.09015002846717834, 0.25012046098709106, 0.4100908935070038, 0.5700613260269165, 0.7300317287445068, 0.8900021910667419, 1.049972653388977, 1.2099430561065674, 1.3699134588241577, 1.529883861541748, 1.689854383468628, 1.8498247861862183, 2.0097951889038086, 2.1697657108306885, 2.3297362327575684, 2.489706516265869, 2.649677038192749, 2.80964732170105, 2.9696178436279297, 3.1295881271362305, 3.2895586490631104, 3.4495291709899902, 3.609499454498291, 3.769469976425171, 3.929440498352051, 4.089410781860352, 4.249381065368652, 4.409351825714111, 4.569322109222412, 4.729292392730713, 4.889263153076172, 5.049233436584473]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 7.0, 11.0, 8.0, 30.0, 18.0, 36.0, 76.0, 79.0, 138.0, 224.0, 374.0, 635.0, 1038.0, 1754.0, 3468.0, 6708.0, 15074.0, 45428.0, 894545.0, 3139230.0, 53414.0, 16437.0, 6982.0, 3607.0, 1931.0, 1114.0, 696.0, 436.0, 263.0, 160.0, 112.0, 74.0, 64.0, 31.0, 26.0, 20.0, 9.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.76904296875, -0.747100830078125, -0.72515869140625, -0.703216552734375, -0.6812744140625, -0.659332275390625, -0.63739013671875, -0.615447998046875, -0.593505859375, -0.571563720703125, -0.54962158203125, -0.527679443359375, -0.5057373046875, -0.483795166015625, -0.46185302734375, -0.439910888671875, -0.41796875, -0.396026611328125, -0.37408447265625, -0.352142333984375, -0.3302001953125, -0.308258056640625, -0.28631591796875, -0.264373779296875, -0.242431640625, -0.220489501953125, -0.19854736328125, -0.176605224609375, -0.1546630859375, -0.132720947265625, -0.11077880859375, -0.088836669921875, -0.06689453125, -0.044952392578125, -0.02301025390625, -0.001068115234375, 0.0208740234375, 0.042816162109375, 0.06475830078125, 0.086700439453125, 0.108642578125, 0.130584716796875, 0.15252685546875, 0.174468994140625, 0.1964111328125, 0.218353271484375, 0.24029541015625, 0.262237548828125, 0.2841796875, 0.306121826171875, 0.32806396484375, 0.350006103515625, 0.3719482421875, 0.393890380859375, 0.41583251953125, 0.437774658203125, 0.459716796875, 0.481658935546875, 0.50360107421875, 0.525543212890625, 0.5474853515625, 0.569427490234375, 0.59136962890625, 0.613311767578125, 0.63525390625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 7.0, 5.0, 8.0, 13.0, 13.0, 20.0, 33.0, 19.0, 26.0, 40.0, 40.0, 42.0, 43.0, 42.0, 56.0, 75.0, 50.0, 68.0, 50.0, 48.0, 50.0, 59.0, 39.0, 30.0, 27.0, 24.0, 24.0, 17.0, 7.0, 10.0, 8.0, 9.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.331298828125, -0.3213844299316406, -0.31147003173828125, -0.3015556335449219, -0.2916412353515625, -0.2817268371582031, -0.27181243896484375, -0.2618980407714844, -0.251983642578125, -0.24206924438476562, -0.23215484619140625, -0.22224044799804688, -0.2123260498046875, -0.20241165161132812, -0.19249725341796875, -0.18258285522460938, -0.17266845703125, -0.16275405883789062, -0.15283966064453125, -0.14292526245117188, -0.1330108642578125, -0.12309646606445312, -0.11318206787109375, -0.10326766967773438, -0.093353271484375, -0.08343887329101562, -0.07352447509765625, -0.06361007690429688, -0.0536956787109375, -0.043781280517578125, -0.03386688232421875, -0.023952484130859375, -0.0140380859375, -0.004123687744140625, 0.00579071044921875, 0.015705108642578125, 0.0256195068359375, 0.035533905029296875, 0.04544830322265625, 0.055362701416015625, 0.065277099609375, 0.07519149780273438, 0.08510589599609375, 0.09502029418945312, 0.1049346923828125, 0.11484909057617188, 0.12476348876953125, 0.13467788696289062, 0.14459228515625, 0.15450668334960938, 0.16442108154296875, 0.17433547973632812, 0.1842498779296875, 0.19416427612304688, 0.20407867431640625, 0.21399307250976562, 0.223907470703125, 0.23382186889648438, 0.24373626708984375, 0.2536506652832031, 0.2635650634765625, 0.2734794616699219, 0.28339385986328125, 0.2933082580566406, 0.30322265625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 8.0, 6.0, 10.0, 13.0, 29.0, 21.0, 47.0, 73.0, 141.0, 199.0, 303.0, 577.0, 1076.0, 2265.0, 5720.0, 17917.0, 91421.0, 3893109.0, 146005.0, 22806.0, 7076.0, 2721.0, 1142.0, 573.0, 411.0, 202.0, 151.0, 103.0, 52.0, 45.0, 22.0, 17.0, 9.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.62060546875, -0.5988998413085938, -0.5771942138671875, -0.5554885864257812, -0.533782958984375, -0.5120773315429688, -0.4903717041015625, -0.46866607666015625, -0.44696044921875, -0.42525482177734375, -0.4035491943359375, -0.38184356689453125, -0.360137939453125, -0.33843231201171875, -0.3167266845703125, -0.29502105712890625, -0.2733154296875, -0.25160980224609375, -0.2299041748046875, -0.20819854736328125, -0.186492919921875, -0.16478729248046875, -0.1430816650390625, -0.12137603759765625, -0.09967041015625, -0.07796478271484375, -0.0562591552734375, -0.03455352783203125, -0.012847900390625, 0.00885772705078125, 0.0305633544921875, 0.05226898193359375, 0.073974609375, 0.09568023681640625, 0.1173858642578125, 0.13909149169921875, 0.160797119140625, 0.18250274658203125, 0.2042083740234375, 0.22591400146484375, 0.24761962890625, 0.26932525634765625, 0.2910308837890625, 0.31273651123046875, 0.334442138671875, 0.35614776611328125, 0.3778533935546875, 0.39955902099609375, 0.4212646484375, 0.44297027587890625, 0.4646759033203125, 0.48638153076171875, 0.508087158203125, 0.5297927856445312, 0.5514984130859375, 0.5732040405273438, 0.59490966796875, 0.6166152954101562, 0.6383209228515625, 0.6600265502929688, 0.681732177734375, 0.7034378051757812, 0.7251434326171875, 0.7468490600585938, 0.7685546875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 11.0, 3.0, 13.0, 16.0, 13.0, 23.0, 40.0, 89.0, 252.0, 3112.0, 279.0, 82.0, 51.0, 24.0, 21.0, 14.0, 3.0, 9.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7666015625, -0.7461700439453125, -0.725738525390625, -0.7053070068359375, -0.68487548828125, -0.6644439697265625, -0.644012451171875, -0.6235809326171875, -0.6031494140625, -0.5827178955078125, -0.562286376953125, -0.5418548583984375, -0.52142333984375, -0.5009918212890625, -0.480560302734375, -0.4601287841796875, -0.439697265625, -0.4192657470703125, -0.398834228515625, -0.3784027099609375, -0.35797119140625, -0.3375396728515625, -0.317108154296875, -0.2966766357421875, -0.2762451171875, -0.2558135986328125, -0.235382080078125, -0.2149505615234375, -0.19451904296875, -0.1740875244140625, -0.153656005859375, -0.1332244873046875, -0.11279296875, -0.0923614501953125, -0.071929931640625, -0.0514984130859375, -0.03106689453125, -0.0106353759765625, 0.009796142578125, 0.0302276611328125, 0.0506591796875, 0.0710906982421875, 0.091522216796875, 0.1119537353515625, 0.13238525390625, 0.1528167724609375, 0.173248291015625, 0.1936798095703125, 0.214111328125, 0.2345428466796875, 0.254974365234375, 0.2754058837890625, 0.29583740234375, 0.3162689208984375, 0.336700439453125, 0.3571319580078125, 0.3775634765625, 0.3979949951171875, 0.418426513671875, 0.4388580322265625, 0.45928955078125, 0.4797210693359375, 0.500152587890625, 0.5205841064453125, 0.541015625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 6.0, 1.0, 8.0, 28.0, 99.0, 326.0, 377.0, 99.0, 30.0, 13.0, 6.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-5.024125099182129, -4.915098190307617, -4.806070804595947, -4.6970438957214355, -4.588016986846924, -4.478989601135254, -4.369962692260742, -4.2609357833862305, -4.1519083976745605, -4.042881488800049, -3.933854341506958, -3.824827194213867, -3.7158000469207764, -3.6067728996276855, -3.497745990753174, -3.388718843460083, -3.2796919345855713, -3.1706647872924805, -3.0616378784179688, -2.952610731124878, -2.843583583831787, -2.7345566749572754, -2.6255295276641846, -2.5165023803710938, -2.407475471496582, -2.298448324203491, -2.1894214153289795, -2.0803942680358887, -1.9713671207427979, -1.8623400926589966, -1.7533130645751953, -1.6442859172821045, -1.5352587699890137, -1.4262317419052124, -1.3172045946121216, -1.2081775665283203, -1.0991504192352295, -0.9901233911514282, -0.881096363067627, -0.7720692753791809, -0.6630421876907349, -0.5540151000022888, -0.44498804211616516, -0.3359609842300415, -0.22693389654159546, -0.11790680885314941, -0.008879780769348145, 0.1001473069190979, 0.20917439460754395, 0.31820148229599, 0.42722854018211365, 0.5362555980682373, 0.6452826857566833, 0.7543097734451294, 0.8633368015289307, 0.9723638892173767, 1.0813909769058228, 1.190418004989624, 1.2994451522827148, 1.4084721803665161, 1.5174992084503174, 1.6265263557434082, 1.7355533838272095, 1.8445804119110107, 1.9536075592041016]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 8.0, 5.0, 10.0, 14.0, 11.0, 14.0, 23.0, 34.0, 32.0, 30.0, 42.0, 37.0, 33.0, 41.0, 52.0, 51.0, 49.0, 62.0, 52.0, 64.0, 45.0, 42.0, 28.0, 51.0, 35.0, 30.0, 33.0, 24.0, 15.0, 9.0, 4.0, 8.0, 4.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.594771146774292, -1.5484250783920288, -1.5020790100097656, -1.4557329416275024, -1.4093868732452393, -1.3630409240722656, -1.3166948556900024, -1.2703487873077393, -1.224002718925476, -1.177656650543213, -1.1313105821609497, -1.0849645137786865, -1.038618564605713, -0.9922724366188049, -0.9459264278411865, -0.8995803594589233, -0.8532342910766602, -0.806888222694397, -0.7605421543121338, -0.7141961455345154, -0.6678500771522522, -0.621504008769989, -0.5751579999923706, -0.5288119316101074, -0.48246586322784424, -0.43611979484558105, -0.38977375626564026, -0.34342771768569946, -0.2970816493034363, -0.2507355809211731, -0.2043895423412323, -0.1580435037612915, -0.11169755458831787, -0.06535150110721588, -0.01900544762611389, 0.027340605854988098, 0.07368665933609009, 0.12003271281719208, 0.16637876629829407, 0.21272480487823486, 0.25907087326049805, 0.30541694164276123, 0.351762980222702, 0.3981090188026428, 0.444455087184906, 0.4908011555671692, 0.5371471643447876, 0.5834932327270508, 0.629839301109314, 0.6761853694915771, 0.7225314378738403, 0.7688774466514587, 0.8152235150337219, 0.8615695834159851, 0.9079155921936035, 0.9542616605758667, 1.0006077289581299, 1.046953797340393, 1.0932998657226562, 1.1396459341049194, 1.1859920024871826, 1.2323379516601562, 1.2786840200424194, 1.3250300884246826, 1.3713761568069458]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 10.0, 12.0, 13.0, 20.0, 37.0, 35.0, 76.0, 133.0, 253.0, 492.0, 1141.0, 3343.0, 12559.0, 63615.0, 489989.0, 408390.0, 52770.0, 10564.0, 2966.0, 1106.0, 506.0, 198.0, 130.0, 85.0, 38.0, 19.0, 19.0, 11.0, 10.0, 4.0, 8.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8828125, -0.8575515747070312, -0.8322906494140625, -0.8070297241210938, -0.781768798828125, -0.7565078735351562, -0.7312469482421875, -0.7059860229492188, -0.68072509765625, -0.6554641723632812, -0.6302032470703125, -0.6049423217773438, -0.579681396484375, -0.5544204711914062, -0.5291595458984375, -0.5038986206054688, -0.4786376953125, -0.45337677001953125, -0.4281158447265625, -0.40285491943359375, -0.377593994140625, -0.35233306884765625, -0.3270721435546875, -0.30181121826171875, -0.27655029296875, -0.25128936767578125, -0.2260284423828125, -0.20076751708984375, -0.175506591796875, -0.15024566650390625, -0.1249847412109375, -0.09972381591796875, -0.074462890625, -0.04920196533203125, -0.0239410400390625, 0.00131988525390625, 0.026580810546875, 0.05184173583984375, 0.0771026611328125, 0.10236358642578125, 0.12762451171875, 0.15288543701171875, 0.1781463623046875, 0.20340728759765625, 0.228668212890625, 0.25392913818359375, 0.2791900634765625, 0.30445098876953125, 0.3297119140625, 0.35497283935546875, 0.3802337646484375, 0.40549468994140625, 0.430755615234375, 0.45601654052734375, 0.4812774658203125, 0.5065383911132812, 0.53179931640625, 0.5570602416992188, 0.5823211669921875, 0.6075820922851562, 0.632843017578125, 0.6581039428710938, 0.6833648681640625, 0.7086257934570312, 0.73388671875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 7.0, 9.0, 9.0, 13.0, 21.0, 25.0, 25.0, 28.0, 31.0, 32.0, 34.0, 38.0, 41.0, 48.0, 69.0, 57.0, 54.0, 65.0, 58.0, 45.0, 45.0, 46.0, 36.0, 38.0, 26.0, 24.0, 19.0, 13.0, 9.0, 13.0, 9.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3212890625, -0.31159210205078125, -0.3018951416015625, -0.29219818115234375, -0.282501220703125, -0.27280426025390625, -0.2631072998046875, -0.25341033935546875, -0.24371337890625, -0.23401641845703125, -0.2243194580078125, -0.21462249755859375, -0.204925537109375, -0.19522857666015625, -0.1855316162109375, -0.17583465576171875, -0.1661376953125, -0.15644073486328125, -0.1467437744140625, -0.13704681396484375, -0.127349853515625, -0.11765289306640625, -0.1079559326171875, -0.09825897216796875, -0.08856201171875, -0.07886505126953125, -0.0691680908203125, -0.05947113037109375, -0.049774169921875, -0.04007720947265625, -0.0303802490234375, -0.02068328857421875, -0.010986328125, -0.00128936767578125, 0.0084075927734375, 0.01810455322265625, 0.027801513671875, 0.03749847412109375, 0.0471954345703125, 0.05689239501953125, 0.06658935546875, 0.07628631591796875, 0.0859832763671875, 0.09568023681640625, 0.105377197265625, 0.11507415771484375, 0.1247711181640625, 0.13446807861328125, 0.1441650390625, 0.15386199951171875, 0.1635589599609375, 0.17325592041015625, 0.182952880859375, 0.19264984130859375, 0.2023468017578125, 0.21204376220703125, 0.22174072265625, 0.23143768310546875, 0.2411346435546875, 0.25083160400390625, 0.260528564453125, 0.27022552490234375, 0.2799224853515625, 0.28961944580078125, 0.29931640625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 9.0, 13.0, 13.0, 20.0, 42.0, 55.0, 79.0, 156.0, 256.0, 583.0, 1846.0, 8116.0, 66339.0, 832481.0, 122555.0, 12040.0, 2520.0, 740.0, 296.0, 167.0, 83.0, 45.0, 30.0, 26.0, 10.0, 13.0, 7.0, 8.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95361328125, -0.9163742065429688, -0.8791351318359375, -0.8418960571289062, -0.804656982421875, -0.7674179077148438, -0.7301788330078125, -0.6929397583007812, -0.65570068359375, -0.6184616088867188, -0.5812225341796875, -0.5439834594726562, -0.506744384765625, -0.46950531005859375, -0.4322662353515625, -0.39502716064453125, -0.3577880859375, -0.32054901123046875, -0.2833099365234375, -0.24607086181640625, -0.208831787109375, -0.17159271240234375, -0.1343536376953125, -0.09711456298828125, -0.05987548828125, -0.02263641357421875, 0.0146026611328125, 0.05184173583984375, 0.089080810546875, 0.12631988525390625, 0.1635589599609375, 0.20079803466796875, 0.238037109375, 0.27527618408203125, 0.3125152587890625, 0.34975433349609375, 0.386993408203125, 0.42423248291015625, 0.4614715576171875, 0.49871063232421875, 0.53594970703125, 0.5731887817382812, 0.6104278564453125, 0.6476669311523438, 0.684906005859375, 0.7221450805664062, 0.7593841552734375, 0.7966232299804688, 0.8338623046875, 0.8711013793945312, 0.9083404541015625, 0.9455795288085938, 0.982818603515625, 1.0200576782226562, 1.0572967529296875, 1.0945358276367188, 1.13177490234375, 1.1690139770507812, 1.2062530517578125, 1.2434921264648438, 1.280731201171875, 1.3179702758789062, 1.3552093505859375, 1.3924484252929688, 1.4296875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 7.0, 14.0, 10.0, 6.0, 17.0, 19.0, 19.0, 28.0, 31.0, 31.0, 49.0, 48.0, 55.0, 65.0, 67.0, 61.0, 66.0, 64.0, 59.0, 45.0, 40.0, 32.0, 42.0, 33.0, 13.0, 21.0, 9.0, 9.0, 8.0, 2.0, 10.0, 3.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.755859375, -1.701629638671875, -1.64739990234375, -1.593170166015625, -1.5389404296875, -1.484710693359375, -1.43048095703125, -1.376251220703125, -1.322021484375, -1.267791748046875, -1.21356201171875, -1.159332275390625, -1.1051025390625, -1.050872802734375, -0.99664306640625, -0.942413330078125, -0.88818359375, -0.833953857421875, -0.77972412109375, -0.725494384765625, -0.6712646484375, -0.617034912109375, -0.56280517578125, -0.508575439453125, -0.454345703125, -0.400115966796875, -0.34588623046875, -0.291656494140625, -0.2374267578125, -0.183197021484375, -0.12896728515625, -0.074737548828125, -0.0205078125, 0.033721923828125, 0.08795166015625, 0.142181396484375, 0.1964111328125, 0.250640869140625, 0.30487060546875, 0.359100341796875, 0.413330078125, 0.467559814453125, 0.52178955078125, 0.576019287109375, 0.6302490234375, 0.684478759765625, 0.73870849609375, 0.792938232421875, 0.84716796875, 0.901397705078125, 0.95562744140625, 1.009857177734375, 1.0640869140625, 1.118316650390625, 1.17254638671875, 1.226776123046875, 1.281005859375, 1.335235595703125, 1.38946533203125, 1.443695068359375, 1.4979248046875, 1.552154541015625, 1.60638427734375, 1.660614013671875, 1.71484375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 9.0, 5.0, 2.0, 13.0, 23.0, 31.0, 56.0, 110.0, 241.0, 648.0, 2434.0, 24535.0, 943782.0, 71033.0, 4093.0, 886.0, 352.0, 130.0, 67.0, 27.0, 29.0, 10.0, 9.0, 9.0, 4.0, 5.0, 2.0, 0.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.64794921875, -0.627471923828125, -0.60699462890625, -0.586517333984375, -0.5660400390625, -0.545562744140625, -0.52508544921875, -0.504608154296875, -0.484130859375, -0.463653564453125, -0.44317626953125, -0.422698974609375, -0.4022216796875, -0.381744384765625, -0.36126708984375, -0.340789794921875, -0.3203125, -0.299835205078125, -0.27935791015625, -0.258880615234375, -0.2384033203125, -0.217926025390625, -0.19744873046875, -0.176971435546875, -0.156494140625, -0.136016845703125, -0.11553955078125, -0.095062255859375, -0.0745849609375, -0.054107666015625, -0.03363037109375, -0.013153076171875, 0.00732421875, 0.027801513671875, 0.04827880859375, 0.068756103515625, 0.0892333984375, 0.109710693359375, 0.13018798828125, 0.150665283203125, 0.171142578125, 0.191619873046875, 0.21209716796875, 0.232574462890625, 0.2530517578125, 0.273529052734375, 0.29400634765625, 0.314483642578125, 0.3349609375, 0.355438232421875, 0.37591552734375, 0.396392822265625, 0.4168701171875, 0.437347412109375, 0.45782470703125, 0.478302001953125, 0.498779296875, 0.519256591796875, 0.53973388671875, 0.560211181640625, 0.5806884765625, 0.601165771484375, 0.62164306640625, 0.642120361328125, 0.66259765625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 15.0, 16.0, 35.0, 35.0, 52.0, 95.0, 155.0, 210.0, 147.0, 61.0, 49.0, 29.0, 21.0, 22.0, 10.0, 14.0, 5.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023508071899414062, -0.00022409111261367798, -0.00021310150623321533, -0.00020211189985275269, -0.00019112229347229004, -0.0001801326870918274, -0.00016914308071136475, -0.0001581534743309021, -0.00014716386795043945, -0.0001361742615699768, -0.00012518465518951416, -0.00011419504880905151, -0.00010320544242858887, -9.221583604812622e-05, -8.122622966766357e-05, -7.023662328720093e-05, -5.924701690673828e-05, -4.8257410526275635e-05, -3.726780414581299e-05, -2.6278197765350342e-05, -1.5288591384887695e-05, -4.298985004425049e-06, 6.690621376037598e-06, 1.7680227756500244e-05, 2.866983413696289e-05, 3.965944051742554e-05, 5.0649046897888184e-05, 6.163865327835083e-05, 7.262825965881348e-05, 8.361786603927612e-05, 9.460747241973877e-05, 0.00010559707880020142, 0.00011658668518066406, 0.0001275762915611267, 0.00013856589794158936, 0.000149555504322052, 0.00016054511070251465, 0.0001715347170829773, 0.00018252432346343994, 0.0001935139298439026, 0.00020450353622436523, 0.00021549314260482788, 0.00022648274898529053, 0.00023747235536575317, 0.0002484619617462158, 0.00025945156812667847, 0.0002704411745071411, 0.00028143078088760376, 0.0002924203872680664, 0.00030340999364852905, 0.0003143996000289917, 0.00032538920640945435, 0.000336378812789917, 0.00034736841917037964, 0.0003583580255508423, 0.00036934763193130493, 0.0003803372383117676, 0.0003913268446922302, 0.00040231645107269287, 0.0004133060574531555, 0.00042429566383361816, 0.0004352852702140808, 0.00044627487659454346, 0.0004572644829750061, 0.00046825408935546875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 15.0, 22.0, 27.0, 62.0, 137.0, 242.0, 588.0, 2662.0, 44016.0, 963124.0, 34224.0, 2360.0, 606.0, 222.0, 103.0, 54.0, 39.0, 22.0, 7.0, 8.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.6884765625, -0.6685028076171875, -0.648529052734375, -0.6285552978515625, -0.60858154296875, -0.5886077880859375, -0.568634033203125, -0.5486602783203125, -0.5286865234375, -0.5087127685546875, -0.488739013671875, -0.4687652587890625, -0.44879150390625, -0.4288177490234375, -0.408843994140625, -0.3888702392578125, -0.368896484375, -0.3489227294921875, -0.328948974609375, -0.3089752197265625, -0.28900146484375, -0.2690277099609375, -0.249053955078125, -0.2290802001953125, -0.2091064453125, -0.1891326904296875, -0.169158935546875, -0.1491851806640625, -0.12921142578125, -0.1092376708984375, -0.089263916015625, -0.0692901611328125, -0.04931640625, -0.0293426513671875, -0.009368896484375, 0.0106048583984375, 0.03057861328125, 0.0505523681640625, 0.070526123046875, 0.0904998779296875, 0.1104736328125, 0.1304473876953125, 0.150421142578125, 0.1703948974609375, 0.19036865234375, 0.2103424072265625, 0.230316162109375, 0.2502899169921875, 0.270263671875, 0.2902374267578125, 0.310211181640625, 0.3301849365234375, 0.35015869140625, 0.3701324462890625, 0.390106201171875, 0.4100799560546875, 0.4300537109375, 0.4500274658203125, 0.470001220703125, 0.4899749755859375, 0.50994873046875, 0.5299224853515625, 0.549896240234375, 0.5698699951171875, 0.58984375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 7.0, 8.0, 30.0, 33.0, 83.0, 173.0, 285.0, 190.0, 84.0, 47.0, 28.0, 11.0, 12.0, 9.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.119140625, -1.0877151489257812, -1.0562896728515625, -1.0248641967773438, -0.993438720703125, -0.9620132446289062, -0.9305877685546875, -0.8991622924804688, -0.86773681640625, -0.8363113403320312, -0.8048858642578125, -0.7734603881835938, -0.742034912109375, -0.7106094360351562, -0.6791839599609375, -0.6477584838867188, -0.6163330078125, -0.5849075317382812, -0.5534820556640625, -0.5220565795898438, -0.490631103515625, -0.45920562744140625, -0.4277801513671875, -0.39635467529296875, -0.36492919921875, -0.33350372314453125, -0.3020782470703125, -0.27065277099609375, -0.239227294921875, -0.20780181884765625, -0.1763763427734375, -0.14495086669921875, -0.113525390625, -0.08209991455078125, -0.0506744384765625, -0.01924896240234375, 0.012176513671875, 0.04360198974609375, 0.0750274658203125, 0.10645294189453125, 0.13787841796875, 0.16930389404296875, 0.2007293701171875, 0.23215484619140625, 0.263580322265625, 0.29500579833984375, 0.3264312744140625, 0.35785675048828125, 0.3892822265625, 0.42070770263671875, 0.4521331787109375, 0.48355865478515625, 0.514984130859375, 0.5464096069335938, 0.5778350830078125, 0.6092605590820312, 0.64068603515625, 0.6721115112304688, 0.7035369873046875, 0.7349624633789062, 0.766387939453125, 0.7978134155273438, 0.8292388916015625, 0.8606643676757812, 0.89208984375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 4.0, 3.0, 10.0, 16.0, 24.0, 49.0, 129.0, 235.0, 280.0, 139.0, 74.0, 24.0, 12.0, 4.0, 4.0, 3.0, 0.0, 0.0, 3.0], "bins": [-15.32483959197998, -15.036296844482422, -14.747754096984863, -14.459211349487305, -14.170668601989746, -13.882125854492188, -13.593583106994629, -13.30504035949707, -13.016497611999512, -12.727954864501953, -12.439412117004395, -12.150869369506836, -11.862326622009277, -11.573783874511719, -11.28524112701416, -10.996698379516602, -10.708154678344727, -10.419611930847168, -10.13106918334961, -9.84252643585205, -9.553983688354492, -9.265440940856934, -8.976898193359375, -8.688355445861816, -8.399812698364258, -8.1112699508667, -7.822727203369141, -7.534184455871582, -7.245641708374023, -6.957098960876465, -6.668556213378906, -6.380013465881348, -6.091469764709473, -5.802927017211914, -5.5143842697143555, -5.225841522216797, -4.937298774719238, -4.64875602722168, -4.360213279724121, -4.0716705322265625, -3.783127784729004, -3.4945850372314453, -3.2060422897338867, -2.917499542236328, -2.6289567947387695, -2.340414047241211, -2.0518710613250732, -1.7633283138275146, -1.474785566329956, -1.1862428188323975, -0.8977000117301941, -0.6091572046279907, -0.32061445713043213, -0.032071709632873535, 0.2564711570739746, 0.5450139045715332, 0.8335566520690918, 1.1220993995666504, 1.410642147064209, 1.6991850137710571, 1.9877277612686157, 2.2762703895568848, 2.5648133754730225, 2.853356122970581, 3.1418988704681396]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 6.0, 5.0, 6.0, 10.0, 14.0, 15.0, 18.0, 29.0, 24.0, 36.0, 37.0, 44.0, 56.0, 47.0, 71.0, 55.0, 51.0, 56.0, 53.0, 54.0, 31.0, 40.0, 32.0, 33.0, 28.0, 27.0, 27.0, 22.0, 8.0, 10.0, 15.0, 9.0, 11.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.401443481445312, -8.115632057189941, -7.829820156097412, -7.544008731842041, -7.258196830749512, -6.972385406494141, -6.6865739822387695, -6.400762557983398, -6.114950656890869, -5.829139232635498, -5.543327331542969, -5.257515907287598, -4.971704483032227, -4.685892581939697, -4.400081157684326, -4.114269256591797, -3.828457832336426, -3.5426461696624756, -3.2568345069885254, -2.9710230827331543, -2.685211420059204, -2.399399757385254, -2.113588333129883, -1.8277766704559326, -1.5419650077819824, -1.2561533451080322, -0.9703418016433716, -0.6845301985740662, -0.39871859550476074, -0.11290693283081055, 0.1729046106338501, 0.45871615409851074, 0.7445278167724609, 1.0303394794464111, 1.3161510229110718, 1.6019625663757324, 1.8877742290496826, 2.173585891723633, 2.459397315979004, 2.745208978652954, 3.0310206413269043, 3.3168323040008545, 3.6026439666748047, 3.888455390930176, 4.174266815185547, 4.460078716278076, 4.745890140533447, 5.031702041625977, 5.317513465881348, 5.603324890136719, 5.889136791229248, 6.174948215484619, 6.460760116577148, 6.7465715408325195, 7.032382965087891, 7.318194389343262, 7.604006290435791, 7.889817714691162, 8.175629615783691, 8.461441040039062, 8.747252464294434, 9.033063888549805, 9.318876266479492, 9.604687690734863, 9.890499114990234]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 3.0, 5.0, 5.0, 10.0, 10.0, 19.0, 38.0, 71.0, 171.0, 308.0, 719.0, 2057.0, 10999.0, 4026860.0, 144246.0, 6190.0, 1494.0, 614.0, 217.0, 107.0, 67.0, 23.0, 19.0, 13.0, 5.0, 2.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.330078125, -1.2975234985351562, -1.2649688720703125, -1.2324142456054688, -1.199859619140625, -1.1673049926757812, -1.1347503662109375, -1.1021957397460938, -1.06964111328125, -1.0370864868164062, -1.0045318603515625, -0.9719772338867188, -0.939422607421875, -0.9068679809570312, -0.8743133544921875, -0.8417587280273438, -0.8092041015625, -0.7766494750976562, -0.7440948486328125, -0.7115402221679688, -0.678985595703125, -0.6464309692382812, -0.6138763427734375, -0.5813217163085938, -0.54876708984375, -0.5162124633789062, -0.4836578369140625, -0.45110321044921875, -0.418548583984375, -0.38599395751953125, -0.3534393310546875, -0.32088470458984375, -0.288330078125, -0.25577545166015625, -0.2232208251953125, -0.19066619873046875, -0.158111572265625, -0.12555694580078125, -0.0930023193359375, -0.06044769287109375, -0.02789306640625, 0.00466156005859375, 0.0372161865234375, 0.06977081298828125, 0.102325439453125, 0.13488006591796875, 0.1674346923828125, 0.19998931884765625, 0.2325439453125, 0.26509857177734375, 0.2976531982421875, 0.33020782470703125, 0.362762451171875, 0.39531707763671875, 0.4278717041015625, 0.46042633056640625, 0.49298095703125, 0.5255355834960938, 0.5580902099609375, 0.5906448364257812, 0.623199462890625, 0.6557540893554688, 0.6883087158203125, 0.7208633422851562, 0.75341796875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 11.0, 12.0, 13.0, 14.0, 16.0, 30.0, 23.0, 16.0, 30.0, 37.0, 44.0, 43.0, 32.0, 47.0, 43.0, 53.0, 50.0, 50.0, 51.0, 44.0, 35.0, 50.0, 47.0, 32.0, 32.0, 24.0, 16.0, 14.0, 17.0, 21.0, 13.0, 10.0, 9.0, 4.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.4169921875, -0.40517425537109375, -0.3933563232421875, -0.38153839111328125, -0.369720458984375, -0.35790252685546875, -0.3460845947265625, -0.33426666259765625, -0.32244873046875, -0.31063079833984375, -0.2988128662109375, -0.28699493408203125, -0.275177001953125, -0.26335906982421875, -0.2515411376953125, -0.23972320556640625, -0.2279052734375, -0.21608734130859375, -0.2042694091796875, -0.19245147705078125, -0.180633544921875, -0.16881561279296875, -0.1569976806640625, -0.14517974853515625, -0.13336181640625, -0.12154388427734375, -0.1097259521484375, -0.09790802001953125, -0.086090087890625, -0.07427215576171875, -0.0624542236328125, -0.05063629150390625, -0.038818359375, -0.02700042724609375, -0.0151824951171875, -0.00336456298828125, 0.008453369140625, 0.02027130126953125, 0.0320892333984375, 0.04390716552734375, 0.05572509765625, 0.06754302978515625, 0.0793609619140625, 0.09117889404296875, 0.102996826171875, 0.11481475830078125, 0.1266326904296875, 0.13845062255859375, 0.1502685546875, 0.16208648681640625, 0.1739044189453125, 0.18572235107421875, 0.197540283203125, 0.20935821533203125, 0.2211761474609375, 0.23299407958984375, 0.24481201171875, 0.25662994384765625, 0.2684478759765625, 0.28026580810546875, 0.292083740234375, 0.30390167236328125, 0.3157196044921875, 0.32753753662109375, 0.33935546875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 8.0, 6.0, 13.0, 27.0, 43.0, 58.0, 80.0, 162.0, 296.0, 605.0, 1245.0, 3239.0, 14035.0, 3992501.0, 169087.0, 8320.0, 2417.0, 1005.0, 500.0, 267.0, 166.0, 69.0, 37.0, 50.0, 19.0, 11.0, 9.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.181640625, -1.1540756225585938, -1.1265106201171875, -1.0989456176757812, -1.071380615234375, -1.0438156127929688, -1.0162506103515625, -0.9886856079101562, -0.96112060546875, -0.9335556030273438, -0.9059906005859375, -0.8784255981445312, -0.850860595703125, -0.8232955932617188, -0.7957305908203125, -0.7681655883789062, -0.7406005859375, -0.7130355834960938, -0.6854705810546875, -0.6579055786132812, -0.630340576171875, -0.6027755737304688, -0.5752105712890625, -0.5476455688476562, -0.52008056640625, -0.49251556396484375, -0.4649505615234375, -0.43738555908203125, -0.409820556640625, -0.38225555419921875, -0.3546905517578125, -0.32712554931640625, -0.299560546875, -0.27199554443359375, -0.2444305419921875, -0.21686553955078125, -0.189300537109375, -0.16173553466796875, -0.1341705322265625, -0.10660552978515625, -0.07904052734375, -0.05147552490234375, -0.0239105224609375, 0.00365447998046875, 0.031219482421875, 0.05878448486328125, 0.0863494873046875, 0.11391448974609375, 0.1414794921875, 0.16904449462890625, 0.1966094970703125, 0.22417449951171875, 0.251739501953125, 0.27930450439453125, 0.3068695068359375, 0.33443450927734375, 0.36199951171875, 0.38956451416015625, 0.4171295166015625, 0.44469451904296875, 0.472259521484375, 0.49982452392578125, 0.5273895263671875, 0.5549545288085938, 0.58251953125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 6.0, 8.0, 8.0, 35.0, 56.0, 393.0, 3461.0, 60.0, 24.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.331787109375, -0.3235187530517578, -0.3152503967285156, -0.30698204040527344, -0.29871368408203125, -0.29044532775878906, -0.2821769714355469, -0.2739086151123047, -0.2656402587890625, -0.2573719024658203, -0.24910354614257812, -0.24083518981933594, -0.23256683349609375, -0.22429847717285156, -0.21603012084960938, -0.2077617645263672, -0.199493408203125, -0.1912250518798828, -0.18295669555664062, -0.17468833923339844, -0.16641998291015625, -0.15815162658691406, -0.14988327026367188, -0.1416149139404297, -0.1333465576171875, -0.1250782012939453, -0.11680984497070312, -0.10854148864746094, -0.10027313232421875, -0.09200477600097656, -0.08373641967773438, -0.07546806335449219, -0.06719970703125, -0.05893135070800781, -0.050662994384765625, -0.04239463806152344, -0.03412628173828125, -0.025857925415039062, -0.017589569091796875, -0.009321212768554688, -0.0010528564453125, 0.0072154998779296875, 0.015483856201171875, 0.023752212524414062, 0.03202056884765625, 0.04028892517089844, 0.048557281494140625, 0.05682563781738281, 0.065093994140625, 0.07336235046386719, 0.08163070678710938, 0.08989906311035156, 0.09816741943359375, 0.10643577575683594, 0.11470413208007812, 0.12297248840332031, 0.1312408447265625, 0.1395092010498047, 0.14777755737304688, 0.15604591369628906, 0.16431427001953125, 0.17258262634277344, 0.18085098266601562, 0.1891193389892578, 0.1973876953125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 12.0, 34.0, 109.0, 496.0, 320.0, 34.0, 6.0, 2.0, 1.0, 2.0], "bins": [-3.0160655975341797, -2.964134931564331, -2.9122045040130615, -2.860273838043213, -2.8083434104919434, -2.7564127445220947, -2.704482316970825, -2.6525516510009766, -2.600621223449707, -2.5486905574798584, -2.496760129928589, -2.4448294639587402, -2.3928990364074707, -2.340968370437622, -2.2890379428863525, -2.237107276916504, -2.1851768493652344, -2.1332461833953857, -2.081315755844116, -2.0293850898742676, -1.977454662322998, -1.925524115562439, -1.8735935688018799, -1.8216630220413208, -1.7697323560714722, -1.717801809310913, -1.665871262550354, -1.613940715789795, -1.5620101690292358, -1.5100796222686768, -1.4581490755081177, -1.4062185287475586, -1.3542879819869995, -1.3023574352264404, -1.2504268884658813, -1.1984963417053223, -1.1465657949447632, -1.094635248184204, -1.042704701423645, -0.9907741546630859, -0.9388436079025269, -0.8869130611419678, -0.8349825143814087, -0.7830519676208496, -0.7311214208602905, -0.6791908740997314, -0.6272603273391724, -0.5753297805786133, -0.5233991742134094, -0.47146862745285034, -0.41953808069229126, -0.3676075339317322, -0.3156769871711731, -0.2637464106082916, -0.21181586384773254, -0.15988531708717346, -0.10795477032661438, -0.056024219840765, -0.004093669354915619, 0.04783688485622406, 0.09976743161678314, 0.15169799327850342, 0.2036285400390625, 0.2555590867996216, 0.30748963356018066]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 5.0, 8.0, 9.0, 9.0, 8.0, 19.0, 13.0, 14.0, 27.0, 24.0, 29.0, 26.0, 20.0, 38.0, 45.0, 47.0, 34.0, 39.0, 46.0, 45.0, 48.0, 38.0, 33.0, 43.0, 18.0, 42.0, 34.0, 28.0, 25.0, 22.0, 19.0, 26.0, 28.0, 18.0, 16.0, 12.0, 9.0, 13.0, 6.0, 7.0, 6.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32217538356781006, -0.30978909134864807, -0.2974027991294861, -0.2850165367126465, -0.2726302444934845, -0.2602439522743225, -0.24785766005516052, -0.23547138273715973, -0.22308510541915894, -0.21069881319999695, -0.19831253588199615, -0.18592624366283417, -0.17353996634483337, -0.1611536741256714, -0.1487673819065094, -0.1363811045885086, -0.12399481236934662, -0.11160852760076523, -0.09922224283218384, -0.08683595061302185, -0.07444967329502106, -0.06206338480114937, -0.04967709630727768, -0.03729081153869629, -0.0249045267701149, -0.012518241070210934, -0.0001319553703069687, 0.012254331260919571, 0.02464061602950096, 0.03702690079808235, 0.04941318929195404, 0.06179947406053543, 0.07418575882911682, 0.08657204359769821, 0.0989583283662796, 0.11134462058544159, 0.12373089790344238, 0.13611719012260437, 0.14850348234176636, 0.16088975965976715, 0.17327603697776794, 0.18566232919692993, 0.19804860651493073, 0.2104348987340927, 0.2228211760520935, 0.2352074682712555, 0.24759376049041748, 0.2599800229072571, 0.27236634492874146, 0.28475263714790344, 0.29713892936706543, 0.30952519178390503, 0.321911484003067, 0.334297776222229, 0.346684068441391, 0.359070360660553, 0.3714566230773926, 0.38384291529655457, 0.39622920751571655, 0.40861546993255615, 0.42100176215171814, 0.4333880543708801, 0.4457743465900421, 0.4581606388092041, 0.4705469012260437]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 4.0, 11.0, 6.0, 11.0, 12.0, 15.0, 17.0, 38.0, 40.0, 71.0, 111.0, 161.0, 313.0, 609.0, 1465.0, 3693.0, 10713.0, 36885.0, 175171.0, 558455.0, 201001.0, 41219.0, 11582.0, 3904.0, 1589.0, 634.0, 310.0, 165.0, 111.0, 58.0, 53.0, 36.0, 21.0, 16.0, 14.0, 9.0, 7.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66748046875, -0.6463165283203125, -0.625152587890625, -0.6039886474609375, -0.58282470703125, -0.5616607666015625, -0.540496826171875, -0.5193328857421875, -0.4981689453125, -0.4770050048828125, -0.455841064453125, -0.4346771240234375, -0.41351318359375, -0.3923492431640625, -0.371185302734375, -0.3500213623046875, -0.328857421875, -0.3076934814453125, -0.286529541015625, -0.2653656005859375, -0.24420166015625, -0.2230377197265625, -0.201873779296875, -0.1807098388671875, -0.1595458984375, -0.1383819580078125, -0.117218017578125, -0.0960540771484375, -0.07489013671875, -0.0537261962890625, -0.032562255859375, -0.0113983154296875, 0.009765625, 0.0309295654296875, 0.052093505859375, 0.0732574462890625, 0.09442138671875, 0.1155853271484375, 0.136749267578125, 0.1579132080078125, 0.1790771484375, 0.2002410888671875, 0.221405029296875, 0.2425689697265625, 0.26373291015625, 0.2848968505859375, 0.306060791015625, 0.3272247314453125, 0.348388671875, 0.3695526123046875, 0.390716552734375, 0.4118804931640625, 0.43304443359375, 0.4542083740234375, 0.475372314453125, 0.4965362548828125, 0.5177001953125, 0.5388641357421875, 0.560028076171875, 0.5811920166015625, 0.60235595703125, 0.6235198974609375, 0.644683837890625, 0.6658477783203125, 0.68701171875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 9.0, 8.0, 9.0, 13.0, 7.0, 11.0, 11.0, 23.0, 26.0, 31.0, 20.0, 32.0, 33.0, 33.0, 45.0, 39.0, 45.0, 48.0, 48.0, 49.0, 37.0, 57.0, 47.0, 38.0, 48.0, 31.0, 39.0, 29.0, 22.0, 17.0, 16.0, 14.0, 14.0, 18.0, 12.0, 7.0, 7.0, 1.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.365234375, -0.35382080078125, -0.3424072265625, -0.33099365234375, -0.319580078125, -0.30816650390625, -0.2967529296875, -0.28533935546875, -0.27392578125, -0.26251220703125, -0.2510986328125, -0.23968505859375, -0.228271484375, -0.21685791015625, -0.2054443359375, -0.19403076171875, -0.1826171875, -0.17120361328125, -0.1597900390625, -0.14837646484375, -0.136962890625, -0.12554931640625, -0.1141357421875, -0.10272216796875, -0.09130859375, -0.07989501953125, -0.0684814453125, -0.05706787109375, -0.045654296875, -0.03424072265625, -0.0228271484375, -0.01141357421875, 0.0, 0.01141357421875, 0.0228271484375, 0.03424072265625, 0.045654296875, 0.05706787109375, 0.0684814453125, 0.07989501953125, 0.09130859375, 0.10272216796875, 0.1141357421875, 0.12554931640625, 0.136962890625, 0.14837646484375, 0.1597900390625, 0.17120361328125, 0.1826171875, 0.19403076171875, 0.2054443359375, 0.21685791015625, 0.228271484375, 0.23968505859375, 0.2510986328125, 0.26251220703125, 0.27392578125, 0.28533935546875, 0.2967529296875, 0.30816650390625, 0.319580078125, 0.33099365234375, 0.3424072265625, 0.35382080078125, 0.365234375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 5.0, 9.0, 8.0, 10.0, 15.0, 17.0, 32.0, 54.0, 69.0, 124.0, 240.0, 505.0, 1194.0, 3694.0, 14903.0, 106730.0, 781236.0, 117639.0, 15885.0, 3828.0, 1263.0, 475.0, 238.0, 148.0, 82.0, 47.0, 32.0, 24.0, 18.0, 9.0, 7.0, 2.0, 0.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.20703125, -1.1710205078125, -1.135009765625, -1.0989990234375, -1.06298828125, -1.0269775390625, -0.990966796875, -0.9549560546875, -0.9189453125, -0.8829345703125, -0.846923828125, -0.8109130859375, -0.77490234375, -0.7388916015625, -0.702880859375, -0.6668701171875, -0.630859375, -0.5948486328125, -0.558837890625, -0.5228271484375, -0.48681640625, -0.4508056640625, -0.414794921875, -0.3787841796875, -0.3427734375, -0.3067626953125, -0.270751953125, -0.2347412109375, -0.19873046875, -0.1627197265625, -0.126708984375, -0.0906982421875, -0.0546875, -0.0186767578125, 0.017333984375, 0.0533447265625, 0.08935546875, 0.1253662109375, 0.161376953125, 0.1973876953125, 0.2333984375, 0.2694091796875, 0.305419921875, 0.3414306640625, 0.37744140625, 0.4134521484375, 0.449462890625, 0.4854736328125, 0.521484375, 0.5574951171875, 0.593505859375, 0.6295166015625, 0.66552734375, 0.7015380859375, 0.737548828125, 0.7735595703125, 0.8095703125, 0.8455810546875, 0.881591796875, 0.9176025390625, 0.95361328125, 0.9896240234375, 1.025634765625, 1.0616455078125, 1.09765625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 7.0, 8.0, 7.0, 13.0, 26.0, 18.0, 31.0, 29.0, 38.0, 48.0, 54.0, 58.0, 49.0, 71.0, 73.0, 76.0, 60.0, 65.0, 56.0, 31.0, 40.0, 30.0, 22.0, 22.0, 20.0, 12.0, 7.0, 10.0, 6.0, 5.0, 3.0, 4.0, 0.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.955078125, -1.872589111328125, -1.79010009765625, -1.707611083984375, -1.6251220703125, -1.542633056640625, -1.46014404296875, -1.377655029296875, -1.295166015625, -1.212677001953125, -1.13018798828125, -1.047698974609375, -0.9652099609375, -0.882720947265625, -0.80023193359375, -0.717742919921875, -0.63525390625, -0.552764892578125, -0.47027587890625, -0.387786865234375, -0.3052978515625, -0.222808837890625, -0.14031982421875, -0.057830810546875, 0.024658203125, 0.107147216796875, 0.18963623046875, 0.272125244140625, 0.3546142578125, 0.437103271484375, 0.51959228515625, 0.602081298828125, 0.6845703125, 0.767059326171875, 0.84954833984375, 0.932037353515625, 1.0145263671875, 1.097015380859375, 1.17950439453125, 1.261993408203125, 1.344482421875, 1.426971435546875, 1.50946044921875, 1.591949462890625, 1.6744384765625, 1.756927490234375, 1.83941650390625, 1.921905517578125, 2.00439453125, 2.086883544921875, 2.16937255859375, 2.251861572265625, 2.3343505859375, 2.416839599609375, 2.49932861328125, 2.581817626953125, 2.664306640625, 2.746795654296875, 2.82928466796875, 2.911773681640625, 2.9942626953125, 3.076751708984375, 3.15924072265625, 3.241729736328125, 3.32421875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 9.0, 5.0, 8.0, 10.0, 21.0, 55.0, 190.0, 866.0, 184153.0, 861774.0, 1115.0, 215.0, 77.0, 36.0, 7.0, 4.0, 2.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7978515625, -1.7230987548828125, -1.648345947265625, -1.5735931396484375, -1.49884033203125, -1.4240875244140625, -1.349334716796875, -1.2745819091796875, -1.1998291015625, -1.1250762939453125, -1.050323486328125, -0.9755706787109375, -0.90081787109375, -0.8260650634765625, -0.751312255859375, -0.6765594482421875, -0.601806640625, -0.5270538330078125, -0.452301025390625, -0.3775482177734375, -0.30279541015625, -0.2280426025390625, -0.153289794921875, -0.0785369873046875, -0.0037841796875, 0.0709686279296875, 0.145721435546875, 0.2204742431640625, 0.29522705078125, 0.3699798583984375, 0.444732666015625, 0.5194854736328125, 0.59423828125, 0.6689910888671875, 0.743743896484375, 0.8184967041015625, 0.89324951171875, 0.9680023193359375, 1.042755126953125, 1.1175079345703125, 1.1922607421875, 1.2670135498046875, 1.341766357421875, 1.4165191650390625, 1.49127197265625, 1.5660247802734375, 1.640777587890625, 1.7155303955078125, 1.790283203125, 1.8650360107421875, 1.939788818359375, 2.0145416259765625, 2.08929443359375, 2.1640472412109375, 2.238800048828125, 2.3135528564453125, 2.3883056640625, 2.4630584716796875, 2.537811279296875, 2.6125640869140625, 2.68731689453125, 2.7620697021484375, 2.836822509765625, 2.9115753173828125, 2.986328125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 5.0, 12.0, 7.0, 8.0, 18.0, 26.0, 36.0, 50.0, 80.0, 76.0, 102.0, 131.0, 103.0, 87.0, 85.0, 48.0, 38.0, 29.0, 17.0, 5.0, 15.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.733438491821289e-05, -9.35560092329979e-05, -8.97776335477829e-05, -8.59992578625679e-05, -8.22208821773529e-05, -7.844250649213791e-05, -7.466413080692291e-05, -7.088575512170792e-05, -6.710737943649292e-05, -6.332900375127792e-05, -5.955062806606293e-05, -5.577225238084793e-05, -5.1993876695632935e-05, -4.821550101041794e-05, -4.443712532520294e-05, -4.0658749639987946e-05, -3.688037395477295e-05, -3.310199826955795e-05, -2.9323622584342957e-05, -2.554524689912796e-05, -2.1766871213912964e-05, -1.7988495528697968e-05, -1.4210119843482971e-05, -1.0431744158267975e-05, -6.6533684730529785e-06, -2.874992787837982e-06, 9.033828973770142e-07, 4.6817585825920105e-06, 8.460134267807007e-06, 1.2238509953022003e-05, 1.6016885638237e-05, 1.9795261323451996e-05, 2.3573637008666992e-05, 2.735201269388199e-05, 3.1130388379096985e-05, 3.490876406431198e-05, 3.868713974952698e-05, 4.2465515434741974e-05, 4.624389111995697e-05, 5.0022266805171967e-05, 5.380064249038696e-05, 5.757901817560196e-05, 6.135739386081696e-05, 6.513576954603195e-05, 6.891414523124695e-05, 7.269252091646194e-05, 7.647089660167694e-05, 8.024927228689194e-05, 8.402764797210693e-05, 8.780602365732193e-05, 9.158439934253693e-05, 9.536277502775192e-05, 9.914115071296692e-05, 0.00010291952639818192, 0.00010669790208339691, 0.00011047627776861191, 0.0001142546534538269, 0.0001180330291390419, 0.0001218114048242569, 0.0001255897805094719, 0.0001293681561946869, 0.00013314653187990189, 0.00013692490756511688, 0.00014070328325033188, 0.00014448165893554688]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 7.0, 13.0, 17.0, 22.0, 53.0, 73.0, 221.0, 933.0, 23965.0, 1015745.0, 6629.0, 566.0, 160.0, 58.0, 44.0, 22.0, 15.0, 9.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0126953125, -0.979339599609375, -0.94598388671875, -0.912628173828125, -0.8792724609375, -0.845916748046875, -0.81256103515625, -0.779205322265625, -0.745849609375, -0.712493896484375, -0.67913818359375, -0.645782470703125, -0.6124267578125, -0.579071044921875, -0.54571533203125, -0.512359619140625, -0.47900390625, -0.445648193359375, -0.41229248046875, -0.378936767578125, -0.3455810546875, -0.312225341796875, -0.27886962890625, -0.245513916015625, -0.212158203125, -0.178802490234375, -0.14544677734375, -0.112091064453125, -0.0787353515625, -0.045379638671875, -0.01202392578125, 0.021331787109375, 0.0546875, 0.088043212890625, 0.12139892578125, 0.154754638671875, 0.1881103515625, 0.221466064453125, 0.25482177734375, 0.288177490234375, 0.321533203125, 0.354888916015625, 0.38824462890625, 0.421600341796875, 0.4549560546875, 0.488311767578125, 0.52166748046875, 0.555023193359375, 0.58837890625, 0.621734619140625, 0.65509033203125, 0.688446044921875, 0.7218017578125, 0.755157470703125, 0.78851318359375, 0.821868896484375, 0.855224609375, 0.888580322265625, 0.92193603515625, 0.955291748046875, 0.9886474609375, 1.022003173828125, 1.05535888671875, 1.088714599609375, 1.1220703125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 8.0, 8.0, 18.0, 49.0, 224.0, 382.0, 206.0, 70.0, 22.0, 7.0, 8.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.109375, -2.0650177001953125, -2.020660400390625, -1.9763031005859375, -1.93194580078125, -1.8875885009765625, -1.843231201171875, -1.7988739013671875, -1.7545166015625, -1.7101593017578125, -1.665802001953125, -1.6214447021484375, -1.57708740234375, -1.5327301025390625, -1.488372802734375, -1.4440155029296875, -1.399658203125, -1.3553009033203125, -1.310943603515625, -1.2665863037109375, -1.22222900390625, -1.1778717041015625, -1.133514404296875, -1.0891571044921875, -1.0447998046875, -1.0004425048828125, -0.956085205078125, -0.9117279052734375, -0.86737060546875, -0.8230133056640625, -0.778656005859375, -0.7342987060546875, -0.68994140625, -0.6455841064453125, -0.601226806640625, -0.5568695068359375, -0.51251220703125, -0.4681549072265625, -0.423797607421875, -0.3794403076171875, -0.3350830078125, -0.2907257080078125, -0.246368408203125, -0.2020111083984375, -0.15765380859375, -0.1132965087890625, -0.068939208984375, -0.0245819091796875, 0.019775390625, 0.0641326904296875, 0.108489990234375, 0.1528472900390625, 0.19720458984375, 0.2415618896484375, 0.285919189453125, 0.3302764892578125, 0.3746337890625, 0.4189910888671875, 0.463348388671875, 0.5077056884765625, 0.55206298828125, 0.5964202880859375, 0.640777587890625, 0.6851348876953125, 0.7294921875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 12.0, 12.0, 32.0, 33.0, 65.0, 102.0, 180.0, 166.0, 157.0, 87.0, 65.0, 35.0, 27.0, 17.0, 7.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4891886711120605, -5.271323204040527, -5.053457736968994, -4.835592269897461, -4.617727279663086, -4.3998613357543945, -4.1819963455200195, -3.9641308784484863, -3.746265411376953, -3.52839994430542, -3.3105344772338867, -3.0926692485809326, -2.8748037815093994, -2.656938314437866, -2.439073085784912, -2.221207618713379, -2.0033421516418457, -1.7854766845703125, -1.5676113367080688, -1.3497459888458252, -1.131880521774292, -0.9140150547027588, -0.6961497068405151, -0.4782843589782715, -0.2604188919067383, -0.042553484439849854, 0.17531192302703857, 0.393177330493927, 0.6110427379608154, 0.8289082050323486, 1.0467735528945923, 1.264638900756836, 1.482503890991211, 1.7003693580627441, 1.9182347059249878, 2.1361000537872314, 2.3539655208587646, 2.571830987930298, 2.789696216583252, 3.007561683654785, 3.2254271507263184, 3.4432926177978516, 3.6611580848693848, 3.879023313522339, 4.096888542175293, 4.314754486083984, 4.532619476318359, 4.750484943389893, 4.968350410461426, 5.186215877532959, 5.404081344604492, 5.621946811676025, 5.839812278747559, 6.057677268981934, 6.275542736053467, 6.493408203125, 6.711273670196533, 6.929139137268066, 7.1470046043396, 7.364870071411133, 7.582735061645508, 7.800601005554199, 8.018465995788574, 8.236331939697266, 8.45419692993164]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 7.0, 3.0, 7.0, 9.0, 12.0, 11.0, 23.0, 10.0, 21.0, 10.0, 23.0, 26.0, 25.0, 35.0, 35.0, 47.0, 54.0, 46.0, 56.0, 51.0, 49.0, 58.0, 45.0, 36.0, 47.0, 42.0, 40.0, 37.0, 23.0, 22.0, 18.0, 14.0, 13.0, 10.0, 8.0, 4.0, 4.0, 5.0, 7.0, 2.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.621416091918945, -9.329771995544434, -9.038126945495605, -8.746482849121094, -8.454837799072266, -8.163193702697754, -7.871549129486084, -7.579904556274414, -7.288260459899902, -6.996615886688232, -6.7049713134765625, -6.413327217102051, -6.121682643890381, -5.830038070678711, -5.538393497467041, -5.246748924255371, -4.955104351043701, -4.663459777832031, -4.371815204620361, -4.080170631408691, -3.7885265350341797, -3.4968819618225098, -3.20523738861084, -2.913593053817749, -2.621948480606079, -2.330303907394409, -2.0386595726013184, -1.7470149993896484, -1.455370545387268, -1.1637260913848877, -0.8720815181732178, -0.580437183380127, -0.28879261016845703, 0.0028518736362457275, 0.2944963574409485, 0.5861408710479736, 0.877785325050354, 1.1694297790527344, 1.4610743522644043, 1.7527186870574951, 2.044363260269165, 2.336007833480835, 2.627652168273926, 2.9192967414855957, 3.2109413146972656, 3.5025856494903564, 3.7942302227020264, 4.085874557495117, 4.377519130706787, 4.669163703918457, 4.960808277130127, 5.252452850341797, 5.544096946716309, 5.8357415199279785, 6.127386093139648, 6.41903018951416, 6.710675239562988, 7.002319812774658, 7.293964385986328, 7.58560848236084, 7.87725305557251, 8.16889762878418, 8.460542678833008, 8.75218677520752, 9.043830871582031]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 4.0, 3.0, 2.0, 6.0, 9.0, 9.0, 8.0, 22.0, 34.0, 42.0, 58.0, 87.0, 139.0, 246.0, 473.0, 1070.0, 2844.0, 12698.0, 847141.0, 3311650.0, 12887.0, 2848.0, 986.0, 431.0, 241.0, 133.0, 80.0, 51.0, 29.0, 15.0, 10.0, 13.0, 6.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8955078125, -0.8699264526367188, -0.8443450927734375, -0.8187637329101562, -0.793182373046875, -0.7676010131835938, -0.7420196533203125, -0.7164382934570312, -0.69085693359375, -0.6652755737304688, -0.6396942138671875, -0.6141128540039062, -0.588531494140625, -0.5629501342773438, -0.5373687744140625, -0.5117874145507812, -0.4862060546875, -0.46062469482421875, -0.4350433349609375, -0.40946197509765625, -0.383880615234375, -0.35829925537109375, -0.3327178955078125, -0.30713653564453125, -0.28155517578125, -0.25597381591796875, -0.2303924560546875, -0.20481109619140625, -0.179229736328125, -0.15364837646484375, -0.1280670166015625, -0.10248565673828125, -0.076904296875, -0.05132293701171875, -0.0257415771484375, -0.00016021728515625, 0.025421142578125, 0.05100250244140625, 0.0765838623046875, 0.10216522216796875, 0.12774658203125, 0.15332794189453125, 0.1789093017578125, 0.20449066162109375, 0.230072021484375, 0.25565338134765625, 0.2812347412109375, 0.30681610107421875, 0.3323974609375, 0.35797882080078125, 0.3835601806640625, 0.40914154052734375, 0.434722900390625, 0.46030426025390625, 0.4858856201171875, 0.5114669799804688, 0.53704833984375, 0.5626296997070312, 0.5882110595703125, 0.6137924194335938, 0.639373779296875, 0.6649551391601562, 0.6905364990234375, 0.7161178588867188, 0.74169921875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 11.0, 7.0, 7.0, 12.0, 20.0, 22.0, 25.0, 31.0, 23.0, 39.0, 44.0, 52.0, 54.0, 46.0, 60.0, 60.0, 62.0, 56.0, 45.0, 55.0, 44.0, 39.0, 30.0, 29.0, 22.0, 18.0, 29.0, 13.0, 8.0, 11.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.513671875, -0.4992103576660156, -0.48474884033203125, -0.4702873229980469, -0.4558258056640625, -0.4413642883300781, -0.42690277099609375, -0.4124412536621094, -0.397979736328125, -0.3835182189941406, -0.36905670166015625, -0.3545951843261719, -0.3401336669921875, -0.3256721496582031, -0.31121063232421875, -0.2967491149902344, -0.28228759765625, -0.2678260803222656, -0.25336456298828125, -0.23890304565429688, -0.2244415283203125, -0.20998001098632812, -0.19551849365234375, -0.18105697631835938, -0.166595458984375, -0.15213394165039062, -0.13767242431640625, -0.12321090698242188, -0.1087493896484375, -0.09428787231445312, -0.07982635498046875, -0.06536483764648438, -0.0509033203125, -0.036441802978515625, -0.02198028564453125, -0.007518768310546875, 0.0069427490234375, 0.021404266357421875, 0.03586578369140625, 0.050327301025390625, 0.064788818359375, 0.07925033569335938, 0.09371185302734375, 0.10817337036132812, 0.1226348876953125, 0.13709640502929688, 0.15155792236328125, 0.16601943969726562, 0.18048095703125, 0.19494247436523438, 0.20940399169921875, 0.22386550903320312, 0.2383270263671875, 0.2527885437011719, 0.26725006103515625, 0.2817115783691406, 0.296173095703125, 0.3106346130371094, 0.32509613037109375, 0.3395576477050781, 0.3540191650390625, 0.3684806823730469, 0.38294219970703125, 0.3974037170410156, 0.411865234375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 4.0, 2.0, 5.0, 4.0, 10.0, 13.0, 11.0, 21.0, 28.0, 38.0, 46.0, 66.0, 107.0, 111.0, 156.0, 237.0, 486.0, 725.0, 1377.0, 2818.0, 6711.0, 23421.0, 219023.0, 3854448.0, 63048.0, 12408.0, 4341.0, 1966.0, 1023.0, 578.0, 324.0, 214.0, 119.0, 94.0, 68.0, 57.0, 50.0, 27.0, 31.0, 18.0, 16.0, 9.0, 11.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.417724609375, -0.4034538269042969, -0.38918304443359375, -0.3749122619628906, -0.3606414794921875, -0.3463706970214844, -0.33209991455078125, -0.3178291320800781, -0.303558349609375, -0.2892875671386719, -0.27501678466796875, -0.2607460021972656, -0.2464752197265625, -0.23220443725585938, -0.21793365478515625, -0.20366287231445312, -0.18939208984375, -0.17512130737304688, -0.16085052490234375, -0.14657974243164062, -0.1323089599609375, -0.11803817749023438, -0.10376739501953125, -0.08949661254882812, -0.075225830078125, -0.060955047607421875, -0.04668426513671875, -0.032413482666015625, -0.0181427001953125, -0.003871917724609375, 0.01039886474609375, 0.024669647216796875, 0.0389404296875, 0.053211212158203125, 0.06748199462890625, 0.08175277709960938, 0.0960235595703125, 0.11029434204101562, 0.12456512451171875, 0.13883590698242188, 0.153106689453125, 0.16737747192382812, 0.18164825439453125, 0.19591903686523438, 0.2101898193359375, 0.22446060180664062, 0.23873138427734375, 0.2530021667480469, 0.26727294921875, 0.2815437316894531, 0.29581451416015625, 0.3100852966308594, 0.3243560791015625, 0.3386268615722656, 0.35289764404296875, 0.3671684265136719, 0.381439208984375, 0.3957099914550781, 0.40998077392578125, 0.4242515563964844, 0.4385223388671875, 0.4527931213378906, 0.46706390380859375, 0.4813346862792969, 0.49560546875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 10.0, 15.0, 18.0, 50.0, 198.0, 3442.0, 240.0, 55.0, 17.0, 11.0, 9.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.290771484375, -0.2818450927734375, -0.272918701171875, -0.2639923095703125, -0.25506591796875, -0.2461395263671875, -0.237213134765625, -0.2282867431640625, -0.2193603515625, -0.2104339599609375, -0.201507568359375, -0.1925811767578125, -0.18365478515625, -0.1747283935546875, -0.165802001953125, -0.1568756103515625, -0.14794921875, -0.1390228271484375, -0.130096435546875, -0.1211700439453125, -0.11224365234375, -0.1033172607421875, -0.094390869140625, -0.0854644775390625, -0.0765380859375, -0.0676116943359375, -0.058685302734375, -0.0497589111328125, -0.04083251953125, -0.0319061279296875, -0.022979736328125, -0.0140533447265625, -0.005126953125, 0.0037994384765625, 0.012725830078125, 0.0216522216796875, 0.03057861328125, 0.0395050048828125, 0.048431396484375, 0.0573577880859375, 0.0662841796875, 0.0752105712890625, 0.084136962890625, 0.0930633544921875, 0.10198974609375, 0.1109161376953125, 0.119842529296875, 0.1287689208984375, 0.1376953125, 0.1466217041015625, 0.155548095703125, 0.1644744873046875, 0.17340087890625, 0.1823272705078125, 0.191253662109375, 0.2001800537109375, 0.2091064453125, 0.2180328369140625, 0.226959228515625, 0.2358856201171875, 0.24481201171875, 0.2537384033203125, 0.262664794921875, 0.2715911865234375, 0.280517578125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 7.0, 19.0, 61.0, 186.0, 296.0, 256.0, 137.0, 33.0, 12.0, 7.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8239659070968628, -0.791095495223999, -0.75822514295578, -0.7253547310829163, -0.6924843788146973, -0.6596139669418335, -0.6267435550689697, -0.593873143196106, -0.561002790927887, -0.5281323790550232, -0.4952620267868042, -0.46239161491394043, -0.42952123284339905, -0.39665085077285767, -0.3637804388999939, -0.3309100568294525, -0.29803967475891113, -0.26516929268836975, -0.23229889571666718, -0.1994284987449646, -0.16655811667442322, -0.13368773460388184, -0.10081733763217926, -0.06794694066047668, -0.0350765585899353, -0.002206169068813324, 0.030664220452308655, 0.06353460997343063, 0.09640499949455261, 0.129275381565094, 0.16214577853679657, 0.19501617550849915, 0.22788643836975098, 0.26075682044029236, 0.29362720251083374, 0.3264976143836975, 0.3593679964542389, 0.3922383785247803, 0.42510879039764404, 0.4579791724681854, 0.4908495545387268, 0.5237199664115906, 0.5565903186798096, 0.5894607305526733, 0.6223311424255371, 0.6552014946937561, 0.6880719065666199, 0.7209422588348389, 0.7538126707077026, 0.7866830825805664, 0.8195534348487854, 0.8524238467216492, 0.8852941989898682, 0.9181646108627319, 0.9510350227355957, 0.9839054346084595, 1.0167758464813232, 1.049646258354187, 1.0825166702270508, 1.115386962890625, 1.1482573747634888, 1.1811277866363525, 1.2139981985092163, 1.24686861038208, 1.2797389030456543]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 4.0, 6.0, 6.0, 14.0, 16.0, 13.0, 23.0, 24.0, 29.0, 32.0, 38.0, 37.0, 40.0, 42.0, 43.0, 52.0, 54.0, 55.0, 58.0, 50.0, 55.0, 32.0, 48.0, 34.0, 29.0, 35.0, 20.0, 28.0, 18.0, 16.0, 18.0, 10.0, 5.0, 4.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3616759181022644, -0.34910592436790466, -0.3365359306335449, -0.32396596670150757, -0.3113959729671478, -0.2988259792327881, -0.28625598549842834, -0.2736859917640686, -0.26111602783203125, -0.2485460340976715, -0.23597605526447296, -0.22340606153011322, -0.21083608269691467, -0.19826608896255493, -0.1856960952281952, -0.17312610149383545, -0.1605561077594757, -0.14798611402511597, -0.13541613519191742, -0.12284614145755768, -0.11027615517377853, -0.09770616888999939, -0.08513617515563965, -0.0725661888718605, -0.05999620258808136, -0.047426216304302216, -0.03485622629523277, -0.02228623628616333, -0.009716250002384186, 0.0028537362813949585, 0.0154237300157547, 0.027993716299533844, 0.04056370258331299, 0.05313368886709213, 0.06570367515087128, 0.07827366888523102, 0.09084365516901016, 0.1034136414527893, 0.11598363518714905, 0.1285536289215088, 0.14112360775470734, 0.15369360148906708, 0.16626358032226562, 0.17883357405662537, 0.1914035677909851, 0.20397354662418365, 0.2165435403585434, 0.22911351919174194, 0.24168351292610168, 0.2542535066604614, 0.26682350039482117, 0.2793934941291809, 0.29196345806121826, 0.304533451795578, 0.31710344552993774, 0.3296734392642975, 0.3422434329986572, 0.35481342673301697, 0.3673834204673767, 0.37995338439941406, 0.3925233781337738, 0.40509337186813354, 0.4176633656024933, 0.430233359336853, 0.4428033232688904]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 11.0, 11.0, 17.0, 25.0, 37.0, 78.0, 123.0, 266.0, 535.0, 1285.0, 3519.0, 11558.0, 50822.0, 305097.0, 543072.0, 102342.0, 20661.0, 5647.0, 1876.0, 788.0, 367.0, 188.0, 85.0, 56.0, 35.0, 19.0, 14.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5537109375, -0.5308380126953125, -0.507965087890625, -0.4850921630859375, -0.46221923828125, -0.4393463134765625, -0.416473388671875, -0.3936004638671875, -0.3707275390625, -0.3478546142578125, -0.324981689453125, -0.3021087646484375, -0.27923583984375, -0.2563629150390625, -0.233489990234375, -0.2106170654296875, -0.187744140625, -0.1648712158203125, -0.141998291015625, -0.1191253662109375, -0.09625244140625, -0.0733795166015625, -0.050506591796875, -0.0276336669921875, -0.0047607421875, 0.0181121826171875, 0.040985107421875, 0.0638580322265625, 0.08673095703125, 0.1096038818359375, 0.132476806640625, 0.1553497314453125, 0.17822265625, 0.2010955810546875, 0.223968505859375, 0.2468414306640625, 0.26971435546875, 0.2925872802734375, 0.315460205078125, 0.3383331298828125, 0.3612060546875, 0.3840789794921875, 0.406951904296875, 0.4298248291015625, 0.45269775390625, 0.4755706787109375, 0.498443603515625, 0.5213165283203125, 0.544189453125, 0.5670623779296875, 0.589935302734375, 0.6128082275390625, 0.63568115234375, 0.6585540771484375, 0.681427001953125, 0.7042999267578125, 0.7271728515625, 0.7500457763671875, 0.772918701171875, 0.7957916259765625, 0.81866455078125, 0.8415374755859375, 0.864410400390625, 0.8872833251953125, 0.91015625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 6.0, 13.0, 8.0, 18.0, 21.0, 15.0, 23.0, 32.0, 19.0, 40.0, 48.0, 37.0, 49.0, 58.0, 54.0, 58.0, 52.0, 63.0, 53.0, 41.0, 37.0, 43.0, 42.0, 23.0, 29.0, 26.0, 17.0, 20.0, 11.0, 16.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.48974609375, -0.4760704040527344, -0.46239471435546875, -0.4487190246582031, -0.4350433349609375, -0.4213676452636719, -0.40769195556640625, -0.3940162658691406, -0.380340576171875, -0.3666648864746094, -0.35298919677734375, -0.3393135070800781, -0.3256378173828125, -0.3119621276855469, -0.29828643798828125, -0.2846107482910156, -0.27093505859375, -0.2572593688964844, -0.24358367919921875, -0.22990798950195312, -0.2162322998046875, -0.20255661010742188, -0.18888092041015625, -0.17520523071289062, -0.161529541015625, -0.14785385131835938, -0.13417816162109375, -0.12050247192382812, -0.1068267822265625, -0.09315109252929688, -0.07947540283203125, -0.06579971313476562, -0.0521240234375, -0.038448333740234375, -0.02477264404296875, -0.011096954345703125, 0.0025787353515625, 0.016254425048828125, 0.02993011474609375, 0.043605804443359375, 0.057281494140625, 0.07095718383789062, 0.08463287353515625, 0.09830856323242188, 0.1119842529296875, 0.12565994262695312, 0.13933563232421875, 0.15301132202148438, 0.16668701171875, 0.18036270141601562, 0.19403839111328125, 0.20771408081054688, 0.2213897705078125, 0.23506546020507812, 0.24874114990234375, 0.2624168395996094, 0.276092529296875, 0.2897682189941406, 0.30344390869140625, 0.3171195983886719, 0.3307952880859375, 0.3444709777832031, 0.35814666748046875, 0.3718223571777344, 0.385498046875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 6.0, 4.0, 5.0, 7.0, 9.0, 24.0, 39.0, 67.0, 119.0, 289.0, 712.0, 2946.0, 29303.0, 841453.0, 163411.0, 7936.0, 1386.0, 436.0, 151.0, 96.0, 61.0, 32.0, 13.0, 15.0, 13.0, 3.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-1.9326171875, -1.8827362060546875, -1.832855224609375, -1.7829742431640625, -1.73309326171875, -1.6832122802734375, -1.633331298828125, -1.5834503173828125, -1.5335693359375, -1.4836883544921875, -1.433807373046875, -1.3839263916015625, -1.33404541015625, -1.2841644287109375, -1.234283447265625, -1.1844024658203125, -1.134521484375, -1.0846405029296875, -1.034759521484375, -0.9848785400390625, -0.93499755859375, -0.8851165771484375, -0.835235595703125, -0.7853546142578125, -0.7354736328125, -0.6855926513671875, -0.635711669921875, -0.5858306884765625, -0.53594970703125, -0.4860687255859375, -0.436187744140625, -0.3863067626953125, -0.33642578125, -0.2865447998046875, -0.236663818359375, -0.1867828369140625, -0.13690185546875, -0.0870208740234375, -0.037139892578125, 0.0127410888671875, 0.0626220703125, 0.1125030517578125, 0.162384033203125, 0.2122650146484375, 0.26214599609375, 0.3120269775390625, 0.361907958984375, 0.4117889404296875, 0.461669921875, 0.5115509033203125, 0.561431884765625, 0.6113128662109375, 0.66119384765625, 0.7110748291015625, 0.760955810546875, 0.8108367919921875, 0.8607177734375, 0.9105987548828125, 0.960479736328125, 1.0103607177734375, 1.06024169921875, 1.1101226806640625, 1.160003662109375, 1.2098846435546875, 1.259765625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 10.0, 8.0, 14.0, 16.0, 19.0, 28.0, 33.0, 53.0, 37.0, 58.0, 57.0, 53.0, 67.0, 58.0, 83.0, 63.0, 67.0, 56.0, 46.0, 37.0, 32.0, 39.0, 15.0, 19.0, 8.0, 10.0, 4.0, 2.0, 3.0, 5.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.443359375, -2.36749267578125, -2.2916259765625, -2.21575927734375, -2.139892578125, -2.06402587890625, -1.9881591796875, -1.91229248046875, -1.83642578125, -1.76055908203125, -1.6846923828125, -1.60882568359375, -1.532958984375, -1.45709228515625, -1.3812255859375, -1.30535888671875, -1.2294921875, -1.15362548828125, -1.0777587890625, -1.00189208984375, -0.926025390625, -0.85015869140625, -0.7742919921875, -0.69842529296875, -0.62255859375, -0.54669189453125, -0.4708251953125, -0.39495849609375, -0.319091796875, -0.24322509765625, -0.1673583984375, -0.09149169921875, -0.015625, 0.06024169921875, 0.1361083984375, 0.21197509765625, 0.287841796875, 0.36370849609375, 0.4395751953125, 0.51544189453125, 0.59130859375, 0.66717529296875, 0.7430419921875, 0.81890869140625, 0.894775390625, 0.97064208984375, 1.0465087890625, 1.12237548828125, 1.1982421875, 1.27410888671875, 1.3499755859375, 1.42584228515625, 1.501708984375, 1.57757568359375, 1.6534423828125, 1.72930908203125, 1.80517578125, 1.88104248046875, 1.9569091796875, 2.03277587890625, 2.108642578125, 2.18450927734375, 2.2603759765625, 2.33624267578125, 2.412109375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 26.0, 68.0, 193.0, 1625.0, 1039715.0, 6486.0, 316.0, 77.0, 27.0, 10.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.857421875, -3.771026611328125, -3.68463134765625, -3.598236083984375, -3.5118408203125, -3.425445556640625, -3.33905029296875, -3.252655029296875, -3.166259765625, -3.079864501953125, -2.99346923828125, -2.907073974609375, -2.8206787109375, -2.734283447265625, -2.64788818359375, -2.561492919921875, -2.47509765625, -2.388702392578125, -2.30230712890625, -2.215911865234375, -2.1295166015625, -2.043121337890625, -1.95672607421875, -1.870330810546875, -1.783935546875, -1.697540283203125, -1.61114501953125, -1.524749755859375, -1.4383544921875, -1.351959228515625, -1.26556396484375, -1.179168701171875, -1.0927734375, -1.006378173828125, -0.91998291015625, -0.833587646484375, -0.7471923828125, -0.660797119140625, -0.57440185546875, -0.488006591796875, -0.401611328125, -0.315216064453125, -0.22882080078125, -0.142425537109375, -0.0560302734375, 0.030364990234375, 0.11676025390625, 0.203155517578125, 0.28955078125, 0.375946044921875, 0.46234130859375, 0.548736572265625, 0.6351318359375, 0.721527099609375, 0.80792236328125, 0.894317626953125, 0.980712890625, 1.067108154296875, 1.15350341796875, 1.239898681640625, 1.3262939453125, 1.412689208984375, 1.49908447265625, 1.585479736328125, 1.671875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 2.0, 4.0, 8.0, 6.0, 15.0, 25.0, 28.0, 32.0, 38.0, 58.0, 66.0, 81.0, 118.0, 97.0, 102.0, 79.0, 48.0, 39.0, 32.0, 21.0, 21.0, 15.0, 23.0, 7.0, 6.0, 7.0, 9.0, 2.0, 1.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.5789947509765625e-05, -5.357526242733002e-05, -5.136057734489441e-05, -4.91458922624588e-05, -4.693120718002319e-05, -4.4716522097587585e-05, -4.250183701515198e-05, -4.028715193271637e-05, -3.807246685028076e-05, -3.5857781767845154e-05, -3.3643096685409546e-05, -3.142841160297394e-05, -2.921372652053833e-05, -2.6999041438102722e-05, -2.4784356355667114e-05, -2.2569671273231506e-05, -2.03549861907959e-05, -1.814030110836029e-05, -1.5925616025924683e-05, -1.3710930943489075e-05, -1.1496245861053467e-05, -9.281560778617859e-06, -7.066875696182251e-06, -4.852190613746643e-06, -2.637505531311035e-06, -4.2282044887542725e-07, 1.7918646335601807e-06, 4.0065497159957886e-06, 6.2212347984313965e-06, 8.435919880867004e-06, 1.0650604963302612e-05, 1.286529004573822e-05, 1.5079975128173828e-05, 1.7294660210609436e-05, 1.9509345293045044e-05, 2.1724030375480652e-05, 2.393871545791626e-05, 2.6153400540351868e-05, 2.8368085622787476e-05, 3.0582770705223083e-05, 3.279745578765869e-05, 3.50121408700943e-05, 3.722682595252991e-05, 3.9441511034965515e-05, 4.165619611740112e-05, 4.387088119983673e-05, 4.608556628227234e-05, 4.830025136470795e-05, 5.0514936447143555e-05, 5.272962152957916e-05, 5.494430661201477e-05, 5.715899169445038e-05, 5.9373676776885986e-05, 6.15883618593216e-05, 6.38030469417572e-05, 6.601773202419281e-05, 6.823241710662842e-05, 7.044710218906403e-05, 7.266178727149963e-05, 7.487647235393524e-05, 7.709115743637085e-05, 7.930584251880646e-05, 8.152052760124207e-05, 8.373521268367767e-05, 8.594989776611328e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 15.0, 31.0, 57.0, 139.0, 521.0, 28629.0, 1017289.0, 1477.0, 225.0, 88.0, 38.0, 19.0, 11.0, 4.0, 8.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.439453125, -2.3720703125, -2.3046875, -2.2373046875, -2.169921875, -2.1025390625, -2.03515625, -1.9677734375, -1.900390625, -1.8330078125, -1.765625, -1.6982421875, -1.630859375, -1.5634765625, -1.49609375, -1.4287109375, -1.361328125, -1.2939453125, -1.2265625, -1.1591796875, -1.091796875, -1.0244140625, -0.95703125, -0.8896484375, -0.822265625, -0.7548828125, -0.6875, -0.6201171875, -0.552734375, -0.4853515625, -0.41796875, -0.3505859375, -0.283203125, -0.2158203125, -0.1484375, -0.0810546875, -0.013671875, 0.0537109375, 0.12109375, 0.1884765625, 0.255859375, 0.3232421875, 0.390625, 0.4580078125, 0.525390625, 0.5927734375, 0.66015625, 0.7275390625, 0.794921875, 0.8623046875, 0.9296875, 0.9970703125, 1.064453125, 1.1318359375, 1.19921875, 1.2666015625, 1.333984375, 1.4013671875, 1.46875, 1.5361328125, 1.603515625, 1.6708984375, 1.73828125, 1.8056640625, 1.873046875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 6.0, 11.0, 15.0, 95.0, 349.0, 383.0, 115.0, 22.0, 10.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52294921875, -0.46521759033203125, -0.4074859619140625, -0.34975433349609375, -0.292022705078125, -0.23429107666015625, -0.1765594482421875, -0.11882781982421875, -0.06109619140625, -0.00336456298828125, 0.0543670654296875, 0.11209869384765625, 0.169830322265625, 0.22756195068359375, 0.2852935791015625, 0.34302520751953125, 0.4007568359375, 0.45848846435546875, 0.5162200927734375, 0.5739517211914062, 0.631683349609375, 0.6894149780273438, 0.7471466064453125, 0.8048782348632812, 0.86260986328125, 0.9203414916992188, 0.9780731201171875, 1.0358047485351562, 1.093536376953125, 1.1512680053710938, 1.2089996337890625, 1.2667312622070312, 1.324462890625, 1.3821945190429688, 1.4399261474609375, 1.4976577758789062, 1.555389404296875, 1.6131210327148438, 1.6708526611328125, 1.7285842895507812, 1.78631591796875, 1.8440475463867188, 1.9017791748046875, 1.9595108032226562, 2.017242431640625, 2.0749740600585938, 2.1327056884765625, 2.1904373168945312, 2.2481689453125, 2.3059005737304688, 2.3636322021484375, 2.4213638305664062, 2.479095458984375, 2.5368270874023438, 2.5945587158203125, 2.6522903442382812, 2.71002197265625, 2.7677536010742188, 2.8254852294921875, 2.8832168579101562, 2.940948486328125, 2.9986801147460938, 3.0564117431640625, 3.1141433715820312, 3.171875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 9.0, 16.0, 57.0, 196.0, 328.0, 246.0, 78.0, 31.0, 13.0, 11.0, 4.0, 6.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8080573081970215, -7.326276779174805, -6.844496250152588, -6.362715721130371, -5.880935192108154, -5.3991546630859375, -4.9173736572265625, -4.435593605041504, -3.953812837600708, -3.472032308578491, -2.9902517795562744, -2.5084710121154785, -2.0266904830932617, -1.544909954071045, -1.0631294250488281, -0.5813488960266113, -0.09956836700439453, 0.38221219182014465, 0.8639927506446838, 1.3457733392715454, 1.8275538682937622, 2.3093345165252686, 2.7911150455474854, 3.272895574569702, 3.754676103591919, 4.236456871032715, 4.718237400054932, 5.200017929077148, 5.681798458099365, 6.163578987121582, 6.645359516143799, 7.127140045166016, 7.608920097351074, 8.09070110321045, 8.572481155395508, 9.054262161254883, 9.536042213439941, 10.017823219299316, 10.499603271484375, 10.98138427734375, 11.463164329528809, 11.944945335388184, 12.426725387573242, 12.908506393432617, 13.390286445617676, 13.87206745147705, 14.35384750366211, 14.835628509521484, 15.31740951538086, 15.799190521240234, 16.28097152709961, 16.76275062561035, 17.244531631469727, 17.7263126373291, 18.208093643188477, 18.68987274169922, 19.171653747558594, 19.65343475341797, 20.135215759277344, 20.616994857788086, 21.09877586364746, 21.580556869506836, 22.06233787536621, 22.544116973876953, 23.025897979736328]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 7.0, 3.0, 3.0, 9.0, 6.0, 6.0, 16.0, 7.0, 25.0, 19.0, 32.0, 26.0, 21.0, 38.0, 27.0, 40.0, 46.0, 66.0, 43.0, 43.0, 65.0, 43.0, 44.0, 45.0, 39.0, 33.0, 37.0, 36.0, 26.0, 24.0, 17.0, 14.0, 22.0, 14.0, 15.0, 7.0, 5.0, 5.0, 4.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 4.0, 0.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.860803604125977, -7.61000394821167, -7.3592047691345215, -7.108405113220215, -6.857605934143066, -6.60680627822876, -6.356006622314453, -6.105207443237305, -5.854407787322998, -5.603608131408691, -5.352808952331543, -5.102009296417236, -4.85120964050293, -4.600410461425781, -4.349610805511475, -4.098811149597168, -3.8480119705200195, -3.597212553024292, -3.3464131355285645, -3.095613479614258, -2.8448140621185303, -2.5940146446228027, -2.343214988708496, -2.0924155712127686, -1.841616153717041, -1.5908167362213135, -1.3400171995162964, -1.0892176628112793, -0.8384182453155518, -0.5876188278198242, -0.33681929111480713, -0.08601975440979004, 0.1647796630859375, 0.4155791401863098, 0.6663786172866821, 0.9171780943870544, 1.1679775714874268, 1.4187769889831543, 1.6695765256881714, 1.9203760623931885, 2.171175479888916, 2.4219748973846436, 2.672774314880371, 2.9235739707946777, 3.1743733882904053, 3.425172805786133, 3.6759724617004395, 3.926771879196167, 4.1775712966918945, 4.428370952606201, 4.67917013168335, 4.929969787597656, 5.180768966674805, 5.431568622589111, 5.682368278503418, 5.933167457580566, 6.183967113494873, 6.43476676940918, 6.685565948486328, 6.936365604400635, 7.187165260314941, 7.43796443939209, 7.6887640953063965, 7.939563751220703, 8.190362930297852]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 3.0, 5.0, 4.0, 11.0, 6.0, 9.0, 15.0, 16.0, 27.0, 32.0, 45.0, 78.0, 138.0, 221.0, 464.0, 1312.0, 5341.0, 78339.0, 4087748.0, 16682.0, 2332.0, 721.0, 310.0, 150.0, 87.0, 67.0, 33.0, 25.0, 15.0, 9.0, 8.0, 2.0, 7.0, 6.0, 5.0, 3.0, 1.0, 3.0, 3.0], "bins": [-1.3779296875, -1.3460845947265625, -1.314239501953125, -1.2823944091796875, -1.25054931640625, -1.2187042236328125, -1.186859130859375, -1.1550140380859375, -1.1231689453125, -1.0913238525390625, -1.059478759765625, -1.0276336669921875, -0.99578857421875, -0.9639434814453125, -0.932098388671875, -0.9002532958984375, -0.868408203125, -0.8365631103515625, -0.804718017578125, -0.7728729248046875, -0.74102783203125, -0.7091827392578125, -0.677337646484375, -0.6454925537109375, -0.6136474609375, -0.5818023681640625, -0.549957275390625, -0.5181121826171875, -0.48626708984375, -0.4544219970703125, -0.422576904296875, -0.3907318115234375, -0.35888671875, -0.3270416259765625, -0.295196533203125, -0.2633514404296875, -0.23150634765625, -0.1996612548828125, -0.167816162109375, -0.1359710693359375, -0.1041259765625, -0.0722808837890625, -0.040435791015625, -0.0085906982421875, 0.02325439453125, 0.0550994873046875, 0.086944580078125, 0.1187896728515625, 0.150634765625, 0.1824798583984375, 0.214324951171875, 0.2461700439453125, 0.27801513671875, 0.3098602294921875, 0.341705322265625, 0.3735504150390625, 0.4053955078125, 0.4372406005859375, 0.469085693359375, 0.5009307861328125, 0.53277587890625, 0.5646209716796875, 0.596466064453125, 0.6283111572265625, 0.66015625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 4.0, 8.0, 9.0, 6.0, 10.0, 16.0, 8.0, 22.0, 26.0, 37.0, 28.0, 20.0, 31.0, 37.0, 50.0, 53.0, 60.0, 57.0, 65.0, 58.0, 54.0, 54.0, 43.0, 43.0, 35.0, 25.0, 29.0, 26.0, 17.0, 19.0, 12.0, 7.0, 7.0, 12.0, 3.0, 10.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.355712890625, -0.3415565490722656, -0.32740020751953125, -0.3132438659667969, -0.2990875244140625, -0.2849311828613281, -0.27077484130859375, -0.2566184997558594, -0.242462158203125, -0.22830581665039062, -0.21414947509765625, -0.19999313354492188, -0.1858367919921875, -0.17168045043945312, -0.15752410888671875, -0.14336776733398438, -0.12921142578125, -0.11505508422851562, -0.10089874267578125, -0.08674240112304688, -0.0725860595703125, -0.058429718017578125, -0.04427337646484375, -0.030117034912109375, -0.015960693359375, -0.001804351806640625, 0.01235198974609375, 0.026508331298828125, 0.0406646728515625, 0.054821014404296875, 0.06897735595703125, 0.08313369750976562, 0.0972900390625, 0.11144638061523438, 0.12560272216796875, 0.13975906372070312, 0.1539154052734375, 0.16807174682617188, 0.18222808837890625, 0.19638442993164062, 0.210540771484375, 0.22469711303710938, 0.23885345458984375, 0.2530097961425781, 0.2671661376953125, 0.2813224792480469, 0.29547882080078125, 0.3096351623535156, 0.32379150390625, 0.3379478454589844, 0.35210418701171875, 0.3662605285644531, 0.3804168701171875, 0.3945732116699219, 0.40872955322265625, 0.4228858947753906, 0.437042236328125, 0.4511985778808594, 0.46535491943359375, 0.4795112609863281, 0.4936676025390625, 0.5078239440917969, 0.5219802856445312, 0.5361366271972656, 0.55029296875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 9.0, 10.0, 21.0, 30.0, 55.0, 75.0, 127.0, 185.0, 314.0, 568.0, 1080.0, 2372.0, 7883.0, 79961.0, 4051127.0, 40383.0, 5805.0, 2113.0, 941.0, 505.0, 274.0, 165.0, 90.0, 69.0, 44.0, 15.0, 16.0, 11.0, 5.0, 6.0, 2.0, 1.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6845703125, -0.6634368896484375, -0.642303466796875, -0.6211700439453125, -0.60003662109375, -0.5789031982421875, -0.557769775390625, -0.5366363525390625, -0.5155029296875, -0.4943695068359375, -0.473236083984375, -0.4521026611328125, -0.43096923828125, -0.4098358154296875, -0.388702392578125, -0.3675689697265625, -0.346435546875, -0.3253021240234375, -0.304168701171875, -0.2830352783203125, -0.26190185546875, -0.2407684326171875, -0.219635009765625, -0.1985015869140625, -0.1773681640625, -0.1562347412109375, -0.135101318359375, -0.1139678955078125, -0.09283447265625, -0.0717010498046875, -0.050567626953125, -0.0294342041015625, -0.00830078125, 0.0128326416015625, 0.033966064453125, 0.0550994873046875, 0.07623291015625, 0.0973663330078125, 0.118499755859375, 0.1396331787109375, 0.1607666015625, 0.1819000244140625, 0.203033447265625, 0.2241668701171875, 0.24530029296875, 0.2664337158203125, 0.287567138671875, 0.3087005615234375, 0.329833984375, 0.3509674072265625, 0.372100830078125, 0.3932342529296875, 0.41436767578125, 0.4355010986328125, 0.456634521484375, 0.4777679443359375, 0.4989013671875, 0.5200347900390625, 0.541168212890625, 0.5623016357421875, 0.58343505859375, 0.6045684814453125, 0.625701904296875, 0.6468353271484375, 0.66796875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 4.0, 5.0, 12.0, 34.0, 81.0, 284.0, 3422.0, 139.0, 47.0, 20.0, 9.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2587890625, -0.25237464904785156, -0.24596023559570312, -0.2395458221435547, -0.23313140869140625, -0.2267169952392578, -0.22030258178710938, -0.21388816833496094, -0.2074737548828125, -0.20105934143066406, -0.19464492797851562, -0.1882305145263672, -0.18181610107421875, -0.1754016876220703, -0.16898727416992188, -0.16257286071777344, -0.156158447265625, -0.14974403381347656, -0.14332962036132812, -0.1369152069091797, -0.13050079345703125, -0.12408638000488281, -0.11767196655273438, -0.11125755310058594, -0.1048431396484375, -0.09842872619628906, -0.09201431274414062, -0.08559989929199219, -0.07918548583984375, -0.07277107238769531, -0.06635665893554688, -0.05994224548339844, -0.05352783203125, -0.04711341857910156, -0.040699005126953125, -0.03428459167480469, -0.02787017822265625, -0.021455764770507812, -0.015041351318359375, -0.008626937866210938, -0.0022125244140625, 0.0042018890380859375, 0.010616302490234375, 0.017030715942382812, 0.02344512939453125, 0.029859542846679688, 0.036273956298828125, 0.04268836975097656, 0.049102783203125, 0.05551719665527344, 0.061931610107421875, 0.06834602355957031, 0.07476043701171875, 0.08117485046386719, 0.08758926391601562, 0.09400367736816406, 0.1004180908203125, 0.10683250427246094, 0.11324691772460938, 0.11966133117675781, 0.12607574462890625, 0.1324901580810547, 0.13890457153320312, 0.14531898498535156, 0.1517333984375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 8.0, 15.0, 35.0, 163.0, 437.0, 289.0, 56.0, 11.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1942410469055176, -2.1520349979400635, -2.1098289489746094, -2.0676229000091553, -2.025416851043701, -1.9832109212875366, -1.9410048723220825, -1.8987988233566284, -1.8565927743911743, -1.8143867254257202, -1.7721806764602661, -1.7299747467041016, -1.6877686977386475, -1.6455626487731934, -1.6033565998077393, -1.5611505508422852, -1.518944501876831, -1.476738452911377, -1.4345324039459229, -1.3923263549804688, -1.3501204252243042, -1.30791437625885, -1.265708327293396, -1.223502278327942, -1.1812963485717773, -1.1390902996063232, -1.0968842506408691, -1.054678201675415, -1.0124722719192505, -0.9702662229537964, -0.9280601739883423, -0.8858541250228882, -0.8436480760574341, -0.80144202709198, -0.7592360377311707, -0.7170299887657166, -0.6748239398002625, -0.6326179504394531, -0.590411901473999, -0.5482058525085449, -0.5059998035430908, -0.4637937843799591, -0.421587735414505, -0.3793817162513733, -0.3371756672859192, -0.2949696481227875, -0.25276362895965576, -0.21055757999420166, -0.16835159063339233, -0.12614555656909943, -0.08393952995538712, -0.041733503341674805, 0.00047253072261810303, 0.04267856478691101, 0.08488458395004272, 0.12709063291549683, 0.16929665207862854, 0.21150268614292145, 0.25370872020721436, 0.29591473937034607, 0.3381207585334778, 0.3803268074989319, 0.4225328266620636, 0.4647388756275177, 0.5069448947906494]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 6.0, 8.0, 3.0, 12.0, 10.0, 14.0, 17.0, 28.0, 35.0, 33.0, 36.0, 33.0, 56.0, 58.0, 75.0, 66.0, 64.0, 55.0, 45.0, 45.0, 57.0, 58.0, 38.0, 30.0, 28.0, 26.0, 16.0, 10.0, 14.0, 10.0, 6.0, 1.0, 8.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33589857816696167, -0.32257235050201416, -0.30924612283706665, -0.29591989517211914, -0.28259366750717163, -0.2692674398422241, -0.2559412121772766, -0.2426149696111679, -0.2292887419462204, -0.2159625142812729, -0.20263628661632538, -0.18931004405021667, -0.17598381638526917, -0.16265758872032166, -0.14933136105537415, -0.13600513339042664, -0.12267890572547913, -0.10935267806053162, -0.0960264503955841, -0.082700215280056, -0.06937398761510849, -0.05604775995016098, -0.042721524834632874, -0.029395297169685364, -0.016069069504737854, -0.002742839977145195, 0.010583389550447464, 0.023909620940685272, 0.03723584860563278, 0.05056207627058029, 0.0638883113861084, 0.07721453905105591, 0.09054076671600342, 0.10386699438095093, 0.11719322204589844, 0.13051944971084595, 0.14384567737579346, 0.15717190504074097, 0.17049814760684967, 0.18382437527179718, 0.1971506029367447, 0.2104768306016922, 0.2238030582666397, 0.2371293008327484, 0.2504555284976959, 0.26378175616264343, 0.27710798382759094, 0.29043421149253845, 0.30376043915748596, 0.31708666682243347, 0.330412894487381, 0.3437391221523285, 0.357065349817276, 0.3703915774822235, 0.3837178349494934, 0.3970440626144409, 0.4103702902793884, 0.42369651794433594, 0.43702274560928345, 0.45034897327423096, 0.46367520093917847, 0.477001428604126, 0.4903276562690735, 0.503653883934021, 0.5169801115989685]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 10.0, 10.0, 19.0, 22.0, 38.0, 42.0, 73.0, 104.0, 139.0, 279.0, 519.0, 1145.0, 2766.0, 7994.0, 26172.0, 107056.0, 505767.0, 309272.0, 61509.0, 16368.0, 5345.0, 2026.0, 866.0, 414.0, 226.0, 146.0, 66.0, 59.0, 36.0, 17.0, 20.0, 9.0, 4.0, 9.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6064453125, -0.5861053466796875, -0.565765380859375, -0.5454254150390625, -0.52508544921875, -0.5047454833984375, -0.484405517578125, -0.4640655517578125, -0.4437255859375, -0.4233856201171875, -0.403045654296875, -0.3827056884765625, -0.36236572265625, -0.3420257568359375, -0.321685791015625, -0.3013458251953125, -0.281005859375, -0.2606658935546875, -0.240325927734375, -0.2199859619140625, -0.19964599609375, -0.1793060302734375, -0.158966064453125, -0.1386260986328125, -0.1182861328125, -0.0979461669921875, -0.077606201171875, -0.0572662353515625, -0.03692626953125, -0.0165863037109375, 0.003753662109375, 0.0240936279296875, 0.04443359375, 0.0647735595703125, 0.085113525390625, 0.1054534912109375, 0.12579345703125, 0.1461334228515625, 0.166473388671875, 0.1868133544921875, 0.2071533203125, 0.2274932861328125, 0.247833251953125, 0.2681732177734375, 0.28851318359375, 0.3088531494140625, 0.329193115234375, 0.3495330810546875, 0.369873046875, 0.3902130126953125, 0.410552978515625, 0.4308929443359375, 0.45123291015625, 0.4715728759765625, 0.491912841796875, 0.5122528076171875, 0.5325927734375, 0.5529327392578125, 0.573272705078125, 0.5936126708984375, 0.61395263671875, 0.6342926025390625, 0.654632568359375, 0.6749725341796875, 0.6953125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 8.0, 10.0, 10.0, 10.0, 11.0, 15.0, 17.0, 23.0, 35.0, 28.0, 20.0, 47.0, 43.0, 49.0, 62.0, 62.0, 73.0, 66.0, 60.0, 53.0, 47.0, 47.0, 40.0, 32.0, 22.0, 35.0, 19.0, 16.0, 14.0, 9.0, 8.0, 8.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.379150390625, -0.3638343811035156, -0.34851837158203125, -0.3332023620605469, -0.3178863525390625, -0.3025703430175781, -0.28725433349609375, -0.2719383239746094, -0.256622314453125, -0.24130630493164062, -0.22599029541015625, -0.21067428588867188, -0.1953582763671875, -0.18004226684570312, -0.16472625732421875, -0.14941024780273438, -0.13409423828125, -0.11877822875976562, -0.10346221923828125, -0.08814620971679688, -0.0728302001953125, -0.057514190673828125, -0.04219818115234375, -0.026882171630859375, -0.011566162109375, 0.003749847412109375, 0.01906585693359375, 0.034381866455078125, 0.0496978759765625, 0.06501388549804688, 0.08032989501953125, 0.09564590454101562, 0.1109619140625, 0.12627792358398438, 0.14159393310546875, 0.15690994262695312, 0.1722259521484375, 0.18754196166992188, 0.20285797119140625, 0.21817398071289062, 0.233489990234375, 0.24880599975585938, 0.26412200927734375, 0.2794380187988281, 0.2947540283203125, 0.3100700378417969, 0.32538604736328125, 0.3407020568847656, 0.35601806640625, 0.3713340759277344, 0.38665008544921875, 0.4019660949707031, 0.4172821044921875, 0.4325981140136719, 0.44791412353515625, 0.4632301330566406, 0.478546142578125, 0.4938621520996094, 0.5091781616210938, 0.5244941711425781, 0.5398101806640625, 0.5551261901855469, 0.5704421997070312, 0.5857582092285156, 0.60107421875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 10.0, 11.0, 9.0, 7.0, 26.0, 27.0, 36.0, 30.0, 57.0, 85.0, 135.0, 208.0, 458.0, 993.0, 3176.0, 15080.0, 154572.0, 791858.0, 69076.0, 8858.0, 2215.0, 729.0, 337.0, 181.0, 97.0, 72.0, 47.0, 31.0, 29.0, 23.0, 15.0, 12.0, 11.0, 15.0, 7.0, 4.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.2177734375, -1.1823272705078125, -1.146881103515625, -1.1114349365234375, -1.07598876953125, -1.0405426025390625, -1.005096435546875, -0.9696502685546875, -0.9342041015625, -0.8987579345703125, -0.863311767578125, -0.8278656005859375, -0.79241943359375, -0.7569732666015625, -0.721527099609375, -0.6860809326171875, -0.650634765625, -0.6151885986328125, -0.579742431640625, -0.5442962646484375, -0.50885009765625, -0.4734039306640625, -0.437957763671875, -0.4025115966796875, -0.3670654296875, -0.3316192626953125, -0.296173095703125, -0.2607269287109375, -0.22528076171875, -0.1898345947265625, -0.154388427734375, -0.1189422607421875, -0.08349609375, -0.0480499267578125, -0.012603759765625, 0.0228424072265625, 0.05828857421875, 0.0937347412109375, 0.129180908203125, 0.1646270751953125, 0.2000732421875, 0.2355194091796875, 0.270965576171875, 0.3064117431640625, 0.34185791015625, 0.3773040771484375, 0.412750244140625, 0.4481964111328125, 0.483642578125, 0.5190887451171875, 0.554534912109375, 0.5899810791015625, 0.62542724609375, 0.6608734130859375, 0.696319580078125, 0.7317657470703125, 0.7672119140625, 0.8026580810546875, 0.838104248046875, 0.8735504150390625, 0.90899658203125, 0.9444427490234375, 0.979888916015625, 1.0153350830078125, 1.05078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 10.0, 10.0, 10.0, 15.0, 26.0, 28.0, 46.0, 45.0, 58.0, 46.0, 65.0, 66.0, 57.0, 73.0, 57.0, 61.0, 69.0, 52.0, 40.0, 30.0, 34.0, 23.0, 14.0, 12.0, 12.0, 12.0, 6.0, 6.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.169921875, -3.0893707275390625, -3.008819580078125, -2.9282684326171875, -2.84771728515625, -2.7671661376953125, -2.686614990234375, -2.6060638427734375, -2.5255126953125, -2.4449615478515625, -2.364410400390625, -2.2838592529296875, -2.20330810546875, -2.1227569580078125, -2.042205810546875, -1.9616546630859375, -1.881103515625, -1.8005523681640625, -1.720001220703125, -1.6394500732421875, -1.55889892578125, -1.4783477783203125, -1.397796630859375, -1.3172454833984375, -1.2366943359375, -1.1561431884765625, -1.075592041015625, -0.9950408935546875, -0.91448974609375, -0.8339385986328125, -0.753387451171875, -0.6728363037109375, -0.59228515625, -0.5117340087890625, -0.431182861328125, -0.3506317138671875, -0.27008056640625, -0.1895294189453125, -0.108978271484375, -0.0284271240234375, 0.0521240234375, 0.1326751708984375, 0.213226318359375, 0.2937774658203125, 0.37432861328125, 0.4548797607421875, 0.535430908203125, 0.6159820556640625, 0.696533203125, 0.7770843505859375, 0.857635498046875, 0.9381866455078125, 1.01873779296875, 1.0992889404296875, 1.179840087890625, 1.2603912353515625, 1.3409423828125, 1.4214935302734375, 1.502044677734375, 1.5825958251953125, 1.66314697265625, 1.7436981201171875, 1.824249267578125, 1.9048004150390625, 1.9853515625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 4.0, 9.0, 14.0, 30.0, 106.0, 1023.0, 1033082.0, 13816.0, 330.0, 71.0, 32.0, 10.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.365234375, -2.26580810546875, -2.1663818359375, -2.06695556640625, -1.967529296875, -1.86810302734375, -1.7686767578125, -1.66925048828125, -1.56982421875, -1.47039794921875, -1.3709716796875, -1.27154541015625, -1.172119140625, -1.07269287109375, -0.9732666015625, -0.87384033203125, -0.7744140625, -0.67498779296875, -0.5755615234375, -0.47613525390625, -0.376708984375, -0.27728271484375, -0.1778564453125, -0.07843017578125, 0.02099609375, 0.12042236328125, 0.2198486328125, 0.31927490234375, 0.418701171875, 0.51812744140625, 0.6175537109375, 0.71697998046875, 0.81640625, 0.91583251953125, 1.0152587890625, 1.11468505859375, 1.214111328125, 1.31353759765625, 1.4129638671875, 1.51239013671875, 1.61181640625, 1.71124267578125, 1.8106689453125, 1.91009521484375, 2.009521484375, 2.10894775390625, 2.2083740234375, 2.30780029296875, 2.4072265625, 2.50665283203125, 2.6060791015625, 2.70550537109375, 2.804931640625, 2.90435791015625, 3.0037841796875, 3.10321044921875, 3.20263671875, 3.30206298828125, 3.4014892578125, 3.50091552734375, 3.600341796875, 3.69976806640625, 3.7991943359375, 3.89862060546875, 3.998046875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 12.0, 12.0, 15.0, 18.0, 26.0, 24.0, 30.0, 47.0, 52.0, 93.0, 117.0, 112.0, 110.0, 77.0, 59.0, 50.0, 41.0, 30.0, 20.0, 18.0, 6.0, 9.0, 6.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.955862045288086e-05, -6.752181798219681e-05, -6.548501551151276e-05, -6.34482130408287e-05, -6.141141057014465e-05, -5.93746080994606e-05, -5.733780562877655e-05, -5.53010031580925e-05, -5.326420068740845e-05, -5.1227398216724396e-05, -4.9190595746040344e-05, -4.715379327535629e-05, -4.511699080467224e-05, -4.308018833398819e-05, -4.104338586330414e-05, -3.900658339262009e-05, -3.6969780921936035e-05, -3.4932978451251984e-05, -3.289617598056793e-05, -3.085937350988388e-05, -2.882257103919983e-05, -2.6785768568515778e-05, -2.4748966097831726e-05, -2.2712163627147675e-05, -2.0675361156463623e-05, -1.863855868577957e-05, -1.660175621509552e-05, -1.4564953744411469e-05, -1.2528151273727417e-05, -1.0491348803043365e-05, -8.454546332359314e-06, -6.4177438616752625e-06, -4.380941390991211e-06, -2.3441389203071594e-06, -3.073364496231079e-07, 1.7294660210609436e-06, 3.766268491744995e-06, 5.803070962429047e-06, 7.839873433113098e-06, 9.87667590379715e-06, 1.1913478374481201e-05, 1.3950280845165253e-05, 1.5987083315849304e-05, 1.8023885786533356e-05, 2.0060688257217407e-05, 2.209749072790146e-05, 2.413429319858551e-05, 2.6171095669269562e-05, 2.8207898139953613e-05, 3.0244700610637665e-05, 3.2281503081321716e-05, 3.431830555200577e-05, 3.635510802268982e-05, 3.839191049337387e-05, 4.042871296405792e-05, 4.2465515434741974e-05, 4.4502317905426025e-05, 4.653912037611008e-05, 4.857592284679413e-05, 5.061272531747818e-05, 5.264952778816223e-05, 5.468633025884628e-05, 5.6723132729530334e-05, 5.8759935200214386e-05, 6.079673767089844e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 5.0, 1.0, 4.0, 4.0, 10.0, 9.0, 18.0, 29.0, 64.0, 114.0, 291.0, 945.0, 4909.0, 269784.0, 762898.0, 7606.0, 1173.0, 376.0, 156.0, 81.0, 32.0, 19.0, 12.0, 8.0, 2.0, 4.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5400390625, -0.515594482421875, -0.49114990234375, -0.466705322265625, -0.4422607421875, -0.417816162109375, -0.39337158203125, -0.368927001953125, -0.344482421875, -0.320037841796875, -0.29559326171875, -0.271148681640625, -0.2467041015625, -0.222259521484375, -0.19781494140625, -0.173370361328125, -0.14892578125, -0.124481201171875, -0.10003662109375, -0.075592041015625, -0.0511474609375, -0.026702880859375, -0.00225830078125, 0.022186279296875, 0.046630859375, 0.071075439453125, 0.09552001953125, 0.119964599609375, 0.1444091796875, 0.168853759765625, 0.19329833984375, 0.217742919921875, 0.2421875, 0.266632080078125, 0.29107666015625, 0.315521240234375, 0.3399658203125, 0.364410400390625, 0.38885498046875, 0.413299560546875, 0.437744140625, 0.462188720703125, 0.48663330078125, 0.511077880859375, 0.5355224609375, 0.559967041015625, 0.58441162109375, 0.608856201171875, 0.63330078125, 0.657745361328125, 0.68218994140625, 0.706634521484375, 0.7310791015625, 0.755523681640625, 0.77996826171875, 0.804412841796875, 0.828857421875, 0.853302001953125, 0.87774658203125, 0.902191162109375, 0.9266357421875, 0.951080322265625, 0.97552490234375, 0.999969482421875, 1.0244140625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 5.0, 8.0, 13.0, 25.0, 72.0, 147.0, 226.0, 248.0, 140.0, 47.0, 29.0, 15.0, 6.0, 3.0, 2.0, 2.0, 5.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.60791015625, -0.5740737915039062, -0.5402374267578125, -0.5064010620117188, -0.472564697265625, -0.43872833251953125, -0.4048919677734375, -0.37105560302734375, -0.33721923828125, -0.30338287353515625, -0.2695465087890625, -0.23571014404296875, -0.201873779296875, -0.16803741455078125, -0.1342010498046875, -0.10036468505859375, -0.0665283203125, -0.03269195556640625, 0.0011444091796875, 0.03498077392578125, 0.068817138671875, 0.10265350341796875, 0.1364898681640625, 0.17032623291015625, 0.20416259765625, 0.23799896240234375, 0.2718353271484375, 0.30567169189453125, 0.339508056640625, 0.37334442138671875, 0.4071807861328125, 0.44101715087890625, 0.474853515625, 0.5086898803710938, 0.5425262451171875, 0.5763626098632812, 0.610198974609375, 0.6440353393554688, 0.6778717041015625, 0.7117080688476562, 0.74554443359375, 0.7793807983398438, 0.8132171630859375, 0.8470535278320312, 0.880889892578125, 0.9147262573242188, 0.9485626220703125, 0.9823989868164062, 1.0162353515625, 1.0500717163085938, 1.0839080810546875, 1.1177444458007812, 1.151580810546875, 1.1854171752929688, 1.2192535400390625, 1.2530899047851562, 1.28692626953125, 1.3207626342773438, 1.3545989990234375, 1.3884353637695312, 1.422271728515625, 1.4561080932617188, 1.4899444580078125, 1.5237808227539062, 1.5576171875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 29.0, 77.0, 347.0, 405.0, 111.0, 20.0, 13.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.353656768798828, -9.783933639526367, -9.214211463928223, -8.644489288330078, -8.074766159057617, -7.5050435066223145, -6.935320854187012, -6.365598201751709, -5.795875549316406, -5.2261528968811035, -4.656430244445801, -4.086707592010498, -3.5169849395751953, -2.9472622871398926, -2.37753963470459, -1.807816982269287, -1.2380943298339844, -0.6683716773986816, -0.0986490249633789, 0.47107362747192383, 1.0407962799072266, 1.6105189323425293, 2.180241584777832, 2.7499642372131348, 3.3196868896484375, 3.8894095420837402, 4.459132194519043, 5.028854846954346, 5.598577499389648, 6.168300151824951, 6.738022804260254, 7.307745456695557, 7.877468109130859, 8.44719123840332, 9.016913414001465, 9.58663558959961, 10.15635871887207, 10.726081848144531, 11.295804023742676, 11.86552619934082, 12.435249328613281, 13.004972457885742, 13.574694633483887, 14.144416809082031, 14.714139938354492, 15.283863067626953, 15.853585243225098, 16.423307418823242, 16.993030548095703, 17.562753677368164, 18.132476806640625, 18.702198028564453, 19.271921157836914, 19.841644287109375, 20.411365509033203, 20.981088638305664, 21.550811767578125, 22.120534896850586, 22.690258026123047, 23.259979248046875, 23.829702377319336, 24.399425506591797, 24.969146728515625, 25.538869857788086, 26.108592987060547]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 1.0, 4.0, 5.0, 7.0, 2.0, 6.0, 8.0, 11.0, 8.0, 13.0, 11.0, 15.0, 17.0, 21.0, 25.0, 25.0, 30.0, 25.0, 34.0, 26.0, 38.0, 29.0, 42.0, 46.0, 49.0, 44.0, 53.0, 48.0, 37.0, 35.0, 32.0, 30.0, 23.0, 16.0, 21.0, 21.0, 25.0, 18.0, 13.0, 10.0, 19.0, 13.0, 7.0, 6.0, 6.0, 4.0, 7.0, 9.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-8.002874374389648, -7.768739223480225, -7.534604072570801, -7.300469398498535, -7.066334247589111, -6.8321990966796875, -6.598063945770264, -6.36392879486084, -6.129794120788574, -5.89565896987915, -5.661523818969727, -5.427389144897461, -5.193253993988037, -4.959118843078613, -4.7249836921691895, -4.490848541259766, -4.2567138671875, -4.022578716278076, -3.7884438037872314, -3.5543086528778076, -3.320173740386963, -3.086038589477539, -2.8519034385681152, -2.6177685260772705, -2.3836331367492676, -2.1494979858398438, -1.915363073348999, -1.6812279224395752, -1.4470930099487305, -1.2129578590393066, -0.9788228273391724, -0.7446877956390381, -0.5105528831481934, -0.2764178514480591, -0.04228278994560242, 0.19185227155685425, 0.4259873032569885, 0.6601223945617676, 0.8942574262619019, 1.1283924579620361, 1.3625274896621704, 1.5966625213623047, 1.830797553062439, 2.0649325847625732, 2.299067735671997, 2.533202648162842, 2.7673377990722656, 3.0014729499816895, 3.235607862472534, 3.469743013381958, 3.7038779258728027, 3.9380130767822266, 4.17214822769165, 4.406283378601074, 4.64041805267334, 4.874553203582764, 5.1086883544921875, 5.342823505401611, 5.576958656311035, 5.811093330383301, 6.045228481292725, 6.279363632202148, 6.513498783111572, 6.747633934020996, 6.981768608093262]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 10.0, 14.0, 13.0, 34.0, 42.0, 82.0, 221.0, 580.0, 2117.0, 29103.0, 4139465.0, 20231.0, 1658.0, 406.0, 135.0, 65.0, 44.0, 17.0, 11.0, 9.0, 8.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5078125, -1.4652862548828125, -1.422760009765625, -1.3802337646484375, -1.33770751953125, -1.2951812744140625, -1.252655029296875, -1.2101287841796875, -1.1676025390625, -1.1250762939453125, -1.082550048828125, -1.0400238037109375, -0.99749755859375, -0.9549713134765625, -0.912445068359375, -0.8699188232421875, -0.827392578125, -0.7848663330078125, -0.742340087890625, -0.6998138427734375, -0.65728759765625, -0.6147613525390625, -0.572235107421875, -0.5297088623046875, -0.4871826171875, -0.4446563720703125, -0.402130126953125, -0.3596038818359375, -0.31707763671875, -0.2745513916015625, -0.232025146484375, -0.1894989013671875, -0.14697265625, -0.1044464111328125, -0.061920166015625, -0.0193939208984375, 0.02313232421875, 0.0656585693359375, 0.108184814453125, 0.1507110595703125, 0.1932373046875, 0.2357635498046875, 0.278289794921875, 0.3208160400390625, 0.36334228515625, 0.4058685302734375, 0.448394775390625, 0.4909210205078125, 0.533447265625, 0.5759735107421875, 0.618499755859375, 0.6610260009765625, 0.70355224609375, 0.7460784912109375, 0.788604736328125, 0.8311309814453125, 0.8736572265625, 0.9161834716796875, 0.958709716796875, 1.0012359619140625, 1.04376220703125, 1.0862884521484375, 1.128814697265625, 1.1713409423828125, 1.2138671875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 2.0, 13.0, 12.0, 10.0, 25.0, 27.0, 30.0, 49.0, 36.0, 48.0, 57.0, 55.0, 67.0, 90.0, 69.0, 80.0, 65.0, 42.0, 49.0, 44.0, 24.0, 34.0, 17.0, 13.0, 11.0, 3.0, 4.0, 6.0, 0.0, 1.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.54296875, -0.5261688232421875, -0.509368896484375, -0.4925689697265625, -0.47576904296875, -0.4589691162109375, -0.442169189453125, -0.4253692626953125, -0.4085693359375, -0.3917694091796875, -0.374969482421875, -0.3581695556640625, -0.34136962890625, -0.3245697021484375, -0.307769775390625, -0.2909698486328125, -0.274169921875, -0.2573699951171875, -0.240570068359375, -0.2237701416015625, -0.20697021484375, -0.1901702880859375, -0.173370361328125, -0.1565704345703125, -0.1397705078125, -0.1229705810546875, -0.106170654296875, -0.0893707275390625, -0.07257080078125, -0.0557708740234375, -0.038970947265625, -0.0221710205078125, -0.00537109375, 0.0114288330078125, 0.028228759765625, 0.0450286865234375, 0.06182861328125, 0.0786285400390625, 0.095428466796875, 0.1122283935546875, 0.1290283203125, 0.1458282470703125, 0.162628173828125, 0.1794281005859375, 0.19622802734375, 0.2130279541015625, 0.229827880859375, 0.2466278076171875, 0.263427734375, 0.2802276611328125, 0.297027587890625, 0.3138275146484375, 0.33062744140625, 0.3474273681640625, 0.364227294921875, 0.3810272216796875, 0.3978271484375, 0.4146270751953125, 0.431427001953125, 0.4482269287109375, 0.46502685546875, 0.4818267822265625, 0.498626708984375, 0.5154266357421875, 0.5322265625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 7.0, 11.0, 18.0, 17.0, 27.0, 20.0, 35.0, 37.0, 35.0, 39.0, 40.0, 42.0, 93.0, 741.0, 4181473.0, 11009.0, 227.0, 67.0, 48.0, 41.0, 51.0, 37.0, 36.0, 22.0, 24.0, 25.0, 17.0, 16.0, 6.0, 5.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.56640625, -3.43310546875, -3.2998046875, -3.16650390625, -3.033203125, -2.89990234375, -2.7666015625, -2.63330078125, -2.5, -2.36669921875, -2.2333984375, -2.10009765625, -1.966796875, -1.83349609375, -1.7001953125, -1.56689453125, -1.43359375, -1.30029296875, -1.1669921875, -1.03369140625, -0.900390625, -0.76708984375, -0.6337890625, -0.50048828125, -0.3671875, -0.23388671875, -0.1005859375, 0.03271484375, 0.166015625, 0.29931640625, 0.4326171875, 0.56591796875, 0.69921875, 0.83251953125, 0.9658203125, 1.09912109375, 1.232421875, 1.36572265625, 1.4990234375, 1.63232421875, 1.765625, 1.89892578125, 2.0322265625, 2.16552734375, 2.298828125, 2.43212890625, 2.5654296875, 2.69873046875, 2.83203125, 2.96533203125, 3.0986328125, 3.23193359375, 3.365234375, 3.49853515625, 3.6318359375, 3.76513671875, 3.8984375, 4.03173828125, 4.1650390625, 4.29833984375, 4.431640625, 4.56494140625, 4.6982421875, 4.83154296875, 4.96484375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 42.0, 3918.0, 112.0, 10.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35205078125, -0.29000091552734375, -0.2279510498046875, -0.16590118408203125, -0.103851318359375, -0.04180145263671875, 0.0202484130859375, 0.08229827880859375, 0.14434814453125, 0.20639801025390625, 0.2684478759765625, 0.33049774169921875, 0.392547607421875, 0.45459747314453125, 0.5166473388671875, 0.5786972045898438, 0.6407470703125, 0.7027969360351562, 0.7648468017578125, 0.8268966674804688, 0.888946533203125, 0.9509963989257812, 1.0130462646484375, 1.0750961303710938, 1.13714599609375, 1.1991958618164062, 1.2612457275390625, 1.3232955932617188, 1.385345458984375, 1.4473953247070312, 1.5094451904296875, 1.5714950561523438, 1.633544921875, 1.6955947875976562, 1.7576446533203125, 1.8196945190429688, 1.881744384765625, 1.9437942504882812, 2.0058441162109375, 2.0678939819335938, 2.12994384765625, 2.1919937133789062, 2.2540435791015625, 2.3160934448242188, 2.378143310546875, 2.4401931762695312, 2.5022430419921875, 2.5642929077148438, 2.6263427734375, 2.6883926391601562, 2.7504425048828125, 2.8124923706054688, 2.874542236328125, 2.9365921020507812, 2.9986419677734375, 3.0606918334960938, 3.12274169921875, 3.1847915649414062, 3.2468414306640625, 3.3088912963867188, 3.370941162109375, 3.4329910278320312, 3.4950408935546875, 3.5570907592773438, 3.619140625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 4.0, 4.0, 26.0, 150.0, 689.0, 116.0, 15.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1708192825317383, -1.8895900249481201, -1.608360767364502, -1.3271315097808838, -1.0459022521972656, -0.7646729946136475, -0.4834437370300293, -0.20221447944641113, 0.07901477813720703, 0.3602440357208252, 0.6414732933044434, 0.9227025508880615, 1.2039318084716797, 1.4851610660552979, 1.766390323638916, 2.047619581222534, 2.3288488388061523, 2.6100780963897705, 2.8913073539733887, 3.172536611557007, 3.453765869140625, 3.734995126724243, 4.016224384307861, 4.297453880310059, 4.578682899475098, 4.859911918640137, 5.141141414642334, 5.422370910644531, 5.70359992980957, 5.984828948974609, 6.266058444976807, 6.547287940979004, 6.828516960144043, 7.109745979309082, 7.390975475311279, 7.672204971313477, 7.953433990478516, 8.234663009643555, 8.515892028808594, 8.79712200164795, 9.078351020812988, 9.359580039978027, 9.640810012817383, 9.922039031982422, 10.203268051147461, 10.4844970703125, 10.765726089477539, 11.046956062316895, 11.328185081481934, 11.609414100646973, 11.890644073486328, 12.171873092651367, 12.453102111816406, 12.734331130981445, 13.015560150146484, 13.29679012298584, 13.578019142150879, 13.859248161315918, 14.140478134155273, 14.421707153320312, 14.702936172485352, 14.98416519165039, 15.26539421081543, 15.546624183654785, 15.827853202819824]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 6.0, 16.0, 20.0, 42.0, 62.0, 103.0, 142.0, 158.0, 165.0, 102.0, 86.0, 36.0, 29.0, 19.0, 7.0, 5.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3709845542907715, -7.169337749481201, -6.967691421508789, -6.766044616699219, -6.564397811889648, -6.362751007080078, -6.161104202270508, -5.959457874298096, -5.757811069488525, -5.556164264678955, -5.354517936706543, -5.152871131896973, -4.951224327087402, -4.749577522277832, -4.547930717468262, -4.34628438949585, -4.144637584686279, -3.942990779876709, -3.7413442134857178, -3.5396976470947266, -3.3380508422851562, -3.136404037475586, -2.9347574710845947, -2.7331109046936035, -2.531464099884033, -2.329817295074463, -2.1281707286834717, -1.926524043083191, -1.7248773574829102, -1.5232306718826294, -1.3215839862823486, -1.1199373006820679, -0.9182901382446289, -0.7166434526443481, -0.5149967670440674, -0.3133500814437866, -0.11170339584350586, 0.0899432897567749, 0.29158997535705566, 0.4932366609573364, 0.6948833465576172, 0.896530032157898, 1.0981767177581787, 1.2998234033584595, 1.5014700889587402, 1.703116774559021, 1.9047634601593018, 2.106410026550293, 2.3080568313598633, 2.5097036361694336, 2.711350202560425, 2.912996768951416, 3.1146435737609863, 3.3162903785705566, 3.517936944961548, 3.719583511352539, 3.9212303161621094, 4.12287712097168, 4.32452392578125, 4.526170253753662, 4.727817058563232, 4.929463863372803, 5.131110191345215, 5.332756996154785, 5.5344038009643555]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 7.0, 11.0, 8.0, 13.0, 32.0, 36.0, 70.0, 141.0, 249.0, 597.0, 1755.0, 6593.0, 42995.0, 639703.0, 325389.0, 24160.0, 4491.0, 1346.0, 493.0, 212.0, 109.0, 55.0, 37.0, 20.0, 11.0, 13.0, 7.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95703125, -0.91693115234375, -0.8768310546875, -0.83673095703125, -0.796630859375, -0.75653076171875, -0.7164306640625, -0.67633056640625, -0.63623046875, -0.59613037109375, -0.5560302734375, -0.51593017578125, -0.475830078125, -0.43572998046875, -0.3956298828125, -0.35552978515625, -0.3154296875, -0.27532958984375, -0.2352294921875, -0.19512939453125, -0.155029296875, -0.11492919921875, -0.0748291015625, -0.03472900390625, 0.00537109375, 0.04547119140625, 0.0855712890625, 0.12567138671875, 0.165771484375, 0.20587158203125, 0.2459716796875, 0.28607177734375, 0.326171875, 0.36627197265625, 0.4063720703125, 0.44647216796875, 0.486572265625, 0.52667236328125, 0.5667724609375, 0.60687255859375, 0.64697265625, 0.68707275390625, 0.7271728515625, 0.76727294921875, 0.807373046875, 0.84747314453125, 0.8875732421875, 0.92767333984375, 0.9677734375, 1.00787353515625, 1.0479736328125, 1.08807373046875, 1.128173828125, 1.16827392578125, 1.2083740234375, 1.24847412109375, 1.28857421875, 1.32867431640625, 1.3687744140625, 1.40887451171875, 1.448974609375, 1.48907470703125, 1.5291748046875, 1.56927490234375, 1.609375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 6.0, 5.0, 6.0, 7.0, 10.0, 20.0, 17.0, 17.0, 25.0, 43.0, 43.0, 45.0, 59.0, 47.0, 53.0, 61.0, 72.0, 70.0, 65.0, 53.0, 56.0, 53.0, 29.0, 32.0, 22.0, 14.0, 16.0, 19.0, 8.0, 4.0, 6.0, 4.0, 6.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6044921875, -0.5878105163574219, -0.5711288452148438, -0.5544471740722656, -0.5377655029296875, -0.5210838317871094, -0.5044021606445312, -0.4877204895019531, -0.471038818359375, -0.4543571472167969, -0.43767547607421875, -0.4209938049316406, -0.4043121337890625, -0.3876304626464844, -0.37094879150390625, -0.3542671203613281, -0.33758544921875, -0.3209037780761719, -0.30422210693359375, -0.2875404357910156, -0.2708587646484375, -0.2541770935058594, -0.23749542236328125, -0.22081375122070312, -0.204132080078125, -0.18745040893554688, -0.17076873779296875, -0.15408706665039062, -0.1374053955078125, -0.12072372436523438, -0.10404205322265625, -0.08736038208007812, -0.0706787109375, -0.053997039794921875, -0.03731536865234375, -0.020633697509765625, -0.0039520263671875, 0.012729644775390625, 0.02941131591796875, 0.046092987060546875, 0.062774658203125, 0.07945632934570312, 0.09613800048828125, 0.11281967163085938, 0.1295013427734375, 0.14618301391601562, 0.16286468505859375, 0.17954635620117188, 0.19622802734375, 0.21290969848632812, 0.22959136962890625, 0.24627304077148438, 0.2629547119140625, 0.2796363830566406, 0.29631805419921875, 0.3129997253417969, 0.329681396484375, 0.3463630676269531, 0.36304473876953125, 0.3797264099121094, 0.3964080810546875, 0.4130897521972656, 0.42977142333984375, 0.4464530944824219, 0.463134765625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 4.0, 8.0, 6.0, 14.0, 33.0, 61.0, 157.0, 565.0, 4193.0, 1016323.0, 25627.0, 1139.0, 258.0, 90.0, 30.0, 21.0, 10.0, 4.0, 7.0, 3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6328125, -3.49676513671875, -3.3607177734375, -3.22467041015625, -3.088623046875, -2.95257568359375, -2.8165283203125, -2.68048095703125, -2.54443359375, -2.40838623046875, -2.2723388671875, -2.13629150390625, -2.000244140625, -1.86419677734375, -1.7281494140625, -1.59210205078125, -1.4560546875, -1.32000732421875, -1.1839599609375, -1.04791259765625, -0.911865234375, -0.77581787109375, -0.6397705078125, -0.50372314453125, -0.36767578125, -0.23162841796875, -0.0955810546875, 0.04046630859375, 0.176513671875, 0.31256103515625, 0.4486083984375, 0.58465576171875, 0.720703125, 0.85675048828125, 0.9927978515625, 1.12884521484375, 1.264892578125, 1.40093994140625, 1.5369873046875, 1.67303466796875, 1.80908203125, 1.94512939453125, 2.0811767578125, 2.21722412109375, 2.353271484375, 2.48931884765625, 2.6253662109375, 2.76141357421875, 2.8974609375, 3.03350830078125, 3.1695556640625, 3.30560302734375, 3.441650390625, 3.57769775390625, 3.7137451171875, 3.84979248046875, 3.98583984375, 4.12188720703125, 4.2579345703125, 4.39398193359375, 4.530029296875, 4.66607666015625, 4.8021240234375, 4.93817138671875, 5.07421875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 11.0, 24.0, 39.0, 63.0, 92.0, 130.0, 168.0, 151.0, 131.0, 81.0, 52.0, 32.0, 21.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.73828125, -3.58154296875, -3.4248046875, -3.26806640625, -3.111328125, -2.95458984375, -2.7978515625, -2.64111328125, -2.484375, -2.32763671875, -2.1708984375, -2.01416015625, -1.857421875, -1.70068359375, -1.5439453125, -1.38720703125, -1.23046875, -1.07373046875, -0.9169921875, -0.76025390625, -0.603515625, -0.44677734375, -0.2900390625, -0.13330078125, 0.0234375, 0.18017578125, 0.3369140625, 0.49365234375, 0.650390625, 0.80712890625, 0.9638671875, 1.12060546875, 1.27734375, 1.43408203125, 1.5908203125, 1.74755859375, 1.904296875, 2.06103515625, 2.2177734375, 2.37451171875, 2.53125, 2.68798828125, 2.8447265625, 3.00146484375, 3.158203125, 3.31494140625, 3.4716796875, 3.62841796875, 3.78515625, 3.94189453125, 4.0986328125, 4.25537109375, 4.412109375, 4.56884765625, 4.7255859375, 4.88232421875, 5.0390625, 5.19580078125, 5.3525390625, 5.50927734375, 5.666015625, 5.82275390625, 5.9794921875, 6.13623046875, 6.29296875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 2.0, 7.0, 11.0, 13.0, 37.0, 83.0, 290.0, 1235.0, 54041.0, 987664.0, 4387.0, 522.0, 165.0, 61.0, 14.0, 12.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5322265625, -0.5045623779296875, -0.476898193359375, -0.4492340087890625, -0.42156982421875, -0.3939056396484375, -0.366241455078125, -0.3385772705078125, -0.3109130859375, -0.2832489013671875, -0.255584716796875, -0.2279205322265625, -0.20025634765625, -0.1725921630859375, -0.144927978515625, -0.1172637939453125, -0.089599609375, -0.0619354248046875, -0.034271240234375, -0.0066070556640625, 0.02105712890625, 0.0487213134765625, 0.076385498046875, 0.1040496826171875, 0.1317138671875, 0.1593780517578125, 0.187042236328125, 0.2147064208984375, 0.24237060546875, 0.2700347900390625, 0.297698974609375, 0.3253631591796875, 0.35302734375, 0.3806915283203125, 0.408355712890625, 0.4360198974609375, 0.46368408203125, 0.4913482666015625, 0.519012451171875, 0.5466766357421875, 0.5743408203125, 0.6020050048828125, 0.629669189453125, 0.6573333740234375, 0.68499755859375, 0.7126617431640625, 0.740325927734375, 0.7679901123046875, 0.795654296875, 0.8233184814453125, 0.850982666015625, 0.8786468505859375, 0.90631103515625, 0.9339752197265625, 0.961639404296875, 0.9893035888671875, 1.0169677734375, 1.0446319580078125, 1.072296142578125, 1.0999603271484375, 1.12762451171875, 1.1552886962890625, 1.182952880859375, 1.2106170654296875, 1.23828125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 2.0, 4.0, 11.0, 8.0, 6.0, 8.0, 11.0, 12.0, 16.0, 23.0, 24.0, 29.0, 49.0, 64.0, 68.0, 85.0, 93.0, 102.0, 81.0, 59.0, 43.0, 37.0, 30.0, 38.0, 22.0, 18.0, 12.0, 7.0, 10.0, 7.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.118680953979492e-05, -3.959052264690399e-05, -3.799423575401306e-05, -3.639794886112213e-05, -3.48016619682312e-05, -3.320537507534027e-05, -3.160908818244934e-05, -3.001280128955841e-05, -2.841651439666748e-05, -2.682022750377655e-05, -2.522394061088562e-05, -2.362765371799469e-05, -2.203136682510376e-05, -2.043507993221283e-05, -1.88387930393219e-05, -1.724250614643097e-05, -1.564621925354004e-05, -1.4049932360649109e-05, -1.2453645467758179e-05, -1.0857358574867249e-05, -9.261071681976318e-06, -7.664784789085388e-06, -6.068497896194458e-06, -4.472211003303528e-06, -2.8759241104125977e-06, -1.2796372175216675e-06, 3.166496753692627e-07, 1.912936568260193e-06, 3.509223461151123e-06, 5.105510354042053e-06, 6.701797246932983e-06, 8.298084139823914e-06, 9.894371032714844e-06, 1.1490657925605774e-05, 1.3086944818496704e-05, 1.4683231711387634e-05, 1.6279518604278564e-05, 1.7875805497169495e-05, 1.9472092390060425e-05, 2.1068379282951355e-05, 2.2664666175842285e-05, 2.4260953068733215e-05, 2.5857239961624146e-05, 2.7453526854515076e-05, 2.9049813747406006e-05, 3.0646100640296936e-05, 3.2242387533187866e-05, 3.3838674426078796e-05, 3.5434961318969727e-05, 3.703124821186066e-05, 3.862753510475159e-05, 4.022382199764252e-05, 4.182010889053345e-05, 4.341639578342438e-05, 4.501268267631531e-05, 4.660896956920624e-05, 4.820525646209717e-05, 4.98015433549881e-05, 5.139783024787903e-05, 5.299411714076996e-05, 5.459040403366089e-05, 5.618669092655182e-05, 5.778297781944275e-05, 5.937926471233368e-05, 6.097555160522461e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 5.0, 2.0, 9.0, 19.0, 71.0, 360.0, 41090.0, 1006260.0, 613.0, 90.0, 22.0, 13.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.521484375, -2.458648681640625, -2.39581298828125, -2.332977294921875, -2.2701416015625, -2.207305908203125, -2.14447021484375, -2.081634521484375, -2.018798828125, -1.955963134765625, -1.89312744140625, -1.830291748046875, -1.7674560546875, -1.704620361328125, -1.64178466796875, -1.578948974609375, -1.51611328125, -1.453277587890625, -1.39044189453125, -1.327606201171875, -1.2647705078125, -1.201934814453125, -1.13909912109375, -1.076263427734375, -1.013427734375, -0.950592041015625, -0.88775634765625, -0.824920654296875, -0.7620849609375, -0.699249267578125, -0.63641357421875, -0.573577880859375, -0.5107421875, -0.447906494140625, -0.38507080078125, -0.322235107421875, -0.2593994140625, -0.196563720703125, -0.13372802734375, -0.070892333984375, -0.008056640625, 0.054779052734375, 0.11761474609375, 0.180450439453125, 0.2432861328125, 0.306121826171875, 0.36895751953125, 0.431793212890625, 0.49462890625, 0.557464599609375, 0.62030029296875, 0.683135986328125, 0.7459716796875, 0.808807373046875, 0.87164306640625, 0.934478759765625, 0.997314453125, 1.060150146484375, 1.12298583984375, 1.185821533203125, 1.2486572265625, 1.311492919921875, 1.37432861328125, 1.437164306640625, 1.5]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 7.0, 10.0, 20.0, 22.0, 40.0, 55.0, 93.0, 95.0, 111.0, 153.0, 125.0, 96.0, 52.0, 32.0, 25.0, 18.0, 14.0, 12.0, 3.0, 8.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.348388671875, -0.33597564697265625, -0.3235626220703125, -0.31114959716796875, -0.298736572265625, -0.28632354736328125, -0.2739105224609375, -0.26149749755859375, -0.24908447265625, -0.23667144775390625, -0.2242584228515625, -0.21184539794921875, -0.199432373046875, -0.18701934814453125, -0.1746063232421875, -0.16219329833984375, -0.1497802734375, -0.13736724853515625, -0.1249542236328125, -0.11254119873046875, -0.100128173828125, -0.08771514892578125, -0.0753021240234375, -0.06288909912109375, -0.05047607421875, -0.03806304931640625, -0.0256500244140625, -0.01323699951171875, -0.000823974609375, 0.01158905029296875, 0.0240020751953125, 0.03641510009765625, 0.048828125, 0.06124114990234375, 0.0736541748046875, 0.08606719970703125, 0.098480224609375, 0.11089324951171875, 0.1233062744140625, 0.13571929931640625, 0.14813232421875, 0.16054534912109375, 0.1729583740234375, 0.18537139892578125, 0.197784423828125, 0.21019744873046875, 0.2226104736328125, 0.23502349853515625, 0.2474365234375, 0.25984954833984375, 0.2722625732421875, 0.28467559814453125, 0.297088623046875, 0.30950164794921875, 0.3219146728515625, 0.33432769775390625, 0.34674072265625, 0.35915374755859375, 0.3715667724609375, 0.38397979736328125, 0.396392822265625, 0.40880584716796875, 0.4212188720703125, 0.43363189697265625, 0.446044921875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 43.0, 255.0, 540.0, 119.0, 25.0, 11.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.860916137695312, -29.035783767700195, -28.210649490356445, -27.385517120361328, -26.560382843017578, -25.73525047302246, -24.91011619567871, -24.084983825683594, -23.259849548339844, -22.434717178344727, -21.609582901000977, -20.78445053100586, -19.95931625366211, -19.134183883666992, -18.309049606323242, -17.483917236328125, -16.658782958984375, -15.833649635314941, -15.008516311645508, -14.183382987976074, -13.35824966430664, -12.533117294311523, -11.707983016967773, -10.882850646972656, -10.057718276977539, -9.232584953308105, -8.407451629638672, -7.582318305969238, -6.757184982299805, -5.932052135467529, -5.106918811798096, -4.281785488128662, -3.4566516876220703, -2.6315183639526367, -1.8063851594924927, -0.9812519550323486, -0.15611863136291504, 0.6690144538879395, 1.494147777557373, 2.3192811012268066, 3.1444144248962402, 3.969547748565674, 4.794681072235107, 5.619813919067383, 6.444947242736816, 7.27008056640625, 8.095213890075684, 8.920347213745117, 9.74548053741455, 10.570613861083984, 11.395747184753418, 12.220880508422852, 13.046013832092285, 13.871147155761719, 14.696279525756836, 15.521413803100586, 16.346546173095703, 17.17167854309082, 17.99681282043457, 18.821945190429688, 19.647079467773438, 20.472211837768555, 21.297346115112305, 22.122478485107422, 22.947612762451172]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 7.0, 11.0, 13.0, 13.0, 17.0, 20.0, 15.0, 18.0, 20.0, 27.0, 27.0, 41.0, 42.0, 42.0, 56.0, 73.0, 64.0, 57.0, 51.0, 35.0, 41.0, 48.0, 41.0, 34.0, 33.0, 33.0, 15.0, 10.0, 21.0, 13.0, 12.0, 7.0, 10.0, 12.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.649940490722656, -8.339446067810059, -8.028952598571777, -7.71845817565918, -7.40796422958374, -7.097470283508301, -6.786975860595703, -6.476481914520264, -6.165987968444824, -5.855494022369385, -5.545000076293945, -5.234505653381348, -4.924011707305908, -4.613517761230469, -4.303023338317871, -3.9925293922424316, -3.682035446166992, -3.3715415000915527, -3.061047315597534, -2.7505531311035156, -2.440059185028076, -2.1295652389526367, -1.8190710544586182, -1.5085768699645996, -1.1980829238891602, -0.8875888586044312, -0.5770947933197021, -0.26660072803497314, 0.04389333724975586, 0.35438740253448486, 0.6648814678192139, 0.9753756523132324, 1.2858695983886719, 1.5963636636734009, 1.9068577289581299, 2.2173519134521484, 2.527845859527588, 2.8383398056030273, 3.148833990097046, 3.4593281745910645, 3.769822120666504, 4.080316066741943, 4.390810012817383, 4.7013044357299805, 5.01179838180542, 5.322292327880859, 5.632786750793457, 5.9432806968688965, 6.253774642944336, 6.564268589019775, 6.874762535095215, 7.1852569580078125, 7.495750904083252, 7.806244850158691, 8.116739273071289, 8.42723274230957, 8.737727165222168, 9.048221588134766, 9.358715057373047, 9.669209480285645, 9.979703903198242, 10.290197372436523, 10.600691795349121, 10.911186218261719, 11.2216796875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 2.0, 5.0, 8.0, 15.0, 23.0, 28.0, 59.0, 104.0, 221.0, 585.0, 1697.0, 6730.0, 52782.0, 4001312.0, 117295.0, 9492.0, 2386.0, 845.0, 333.0, 170.0, 76.0, 49.0, 26.0, 13.0, 7.0, 8.0, 5.0, 4.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6787109375, -0.645782470703125, -0.61285400390625, -0.579925537109375, -0.5469970703125, -0.514068603515625, -0.48114013671875, -0.448211669921875, -0.415283203125, -0.382354736328125, -0.34942626953125, -0.316497802734375, -0.2835693359375, -0.250640869140625, -0.21771240234375, -0.184783935546875, -0.15185546875, -0.118927001953125, -0.08599853515625, -0.053070068359375, -0.0201416015625, 0.012786865234375, 0.04571533203125, 0.078643798828125, 0.111572265625, 0.144500732421875, 0.17742919921875, 0.210357666015625, 0.2432861328125, 0.276214599609375, 0.30914306640625, 0.342071533203125, 0.375, 0.407928466796875, 0.44085693359375, 0.473785400390625, 0.5067138671875, 0.539642333984375, 0.57257080078125, 0.605499267578125, 0.638427734375, 0.671356201171875, 0.70428466796875, 0.737213134765625, 0.7701416015625, 0.803070068359375, 0.83599853515625, 0.868927001953125, 0.90185546875, 0.934783935546875, 0.96771240234375, 1.000640869140625, 1.0335693359375, 1.066497802734375, 1.09942626953125, 1.132354736328125, 1.165283203125, 1.198211669921875, 1.23114013671875, 1.264068603515625, 1.2969970703125, 1.329925537109375, 1.36285400390625, 1.395782470703125, 1.4287109375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 9.0, 12.0, 11.0, 13.0, 24.0, 35.0, 29.0, 38.0, 52.0, 37.0, 51.0, 57.0, 78.0, 77.0, 55.0, 59.0, 61.0, 48.0, 49.0, 48.0, 36.0, 23.0, 29.0, 18.0, 14.0, 8.0, 6.0, 1.0, 7.0, 5.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3994140625, -0.385040283203125, -0.37066650390625, -0.356292724609375, -0.3419189453125, -0.327545166015625, -0.31317138671875, -0.298797607421875, -0.284423828125, -0.270050048828125, -0.25567626953125, -0.241302490234375, -0.2269287109375, -0.212554931640625, -0.19818115234375, -0.183807373046875, -0.16943359375, -0.155059814453125, -0.14068603515625, -0.126312255859375, -0.1119384765625, -0.097564697265625, -0.08319091796875, -0.068817138671875, -0.054443359375, -0.040069580078125, -0.02569580078125, -0.011322021484375, 0.0030517578125, 0.017425537109375, 0.03179931640625, 0.046173095703125, 0.060546875, 0.074920654296875, 0.08929443359375, 0.103668212890625, 0.1180419921875, 0.132415771484375, 0.14678955078125, 0.161163330078125, 0.175537109375, 0.189910888671875, 0.20428466796875, 0.218658447265625, 0.2330322265625, 0.247406005859375, 0.26177978515625, 0.276153564453125, 0.29052734375, 0.304901123046875, 0.31927490234375, 0.333648681640625, 0.3480224609375, 0.362396240234375, 0.37677001953125, 0.391143798828125, 0.405517578125, 0.419891357421875, 0.43426513671875, 0.448638916015625, 0.4630126953125, 0.477386474609375, 0.49176025390625, 0.506134033203125, 0.5205078125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 8.0, 13.0, 13.0, 18.0, 17.0, 58.0, 148.0, 519.0, 2803.0, 45298.0, 4116796.0, 26073.0, 1976.0, 352.0, 87.0, 37.0, 30.0, 12.0, 9.0, 5.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3857421875, -1.3312530517578125, -1.276763916015625, -1.2222747802734375, -1.16778564453125, -1.1132965087890625, -1.058807373046875, -1.0043182373046875, -0.9498291015625, -0.8953399658203125, -0.840850830078125, -0.7863616943359375, -0.73187255859375, -0.6773834228515625, -0.622894287109375, -0.5684051513671875, -0.513916015625, -0.4594268798828125, -0.404937744140625, -0.3504486083984375, -0.29595947265625, -0.2414703369140625, -0.186981201171875, -0.1324920654296875, -0.0780029296875, -0.0235137939453125, 0.030975341796875, 0.0854644775390625, 0.13995361328125, 0.1944427490234375, 0.248931884765625, 0.3034210205078125, 0.35791015625, 0.4123992919921875, 0.466888427734375, 0.5213775634765625, 0.57586669921875, 0.6303558349609375, 0.684844970703125, 0.7393341064453125, 0.7938232421875, 0.8483123779296875, 0.902801513671875, 0.9572906494140625, 1.01177978515625, 1.0662689208984375, 1.120758056640625, 1.1752471923828125, 1.229736328125, 1.2842254638671875, 1.338714599609375, 1.3932037353515625, 1.44769287109375, 1.5021820068359375, 1.556671142578125, 1.6111602783203125, 1.6656494140625, 1.7201385498046875, 1.774627685546875, 1.8291168212890625, 1.88360595703125, 1.9380950927734375, 1.992584228515625, 2.0470733642578125, 2.1015625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 3.0, 6.0, 5.0, 8.0, 11.0, 10.0, 11.0, 14.0, 23.0, 32.0, 45.0, 98.0, 301.0, 1295.0, 1599.0, 376.0, 93.0, 55.0, 24.0, 18.0, 10.0, 11.0, 7.0, 1.0, 5.0, 5.0, 4.0, 0.0, 1.0, 4.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.1826171875, -1.1523971557617188, -1.1221771240234375, -1.0919570922851562, -1.061737060546875, -1.0315170288085938, -1.0012969970703125, -0.9710769653320312, -0.94085693359375, -0.9106369018554688, -0.8804168701171875, -0.8501968383789062, -0.819976806640625, -0.7897567749023438, -0.7595367431640625, -0.7293167114257812, -0.6990966796875, -0.6688766479492188, -0.6386566162109375, -0.6084365844726562, -0.578216552734375, -0.5479965209960938, -0.5177764892578125, -0.48755645751953125, -0.45733642578125, -0.42711639404296875, -0.3968963623046875, -0.36667633056640625, -0.336456298828125, -0.30623626708984375, -0.2760162353515625, -0.24579620361328125, -0.215576171875, -0.18535614013671875, -0.1551361083984375, -0.12491607666015625, -0.094696044921875, -0.06447601318359375, -0.0342559814453125, -0.00403594970703125, 0.02618408203125, 0.05640411376953125, 0.0866241455078125, 0.11684417724609375, 0.147064208984375, 0.17728424072265625, 0.2075042724609375, 0.23772430419921875, 0.2679443359375, 0.29816436767578125, 0.3283843994140625, 0.35860443115234375, 0.388824462890625, 0.41904449462890625, 0.4492645263671875, 0.47948455810546875, 0.50970458984375, 0.5399246215820312, 0.5701446533203125, 0.6003646850585938, 0.630584716796875, 0.6608047485351562, 0.6910247802734375, 0.7212448120117188, 0.75146484375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 3.0, 7.0, 11.0, 18.0, 45.0, 152.0, 269.0, 288.0, 134.0, 39.0, 11.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.934274673461914, -8.717409133911133, -8.500543594360352, -8.28367805480957, -8.066812515258789, -7.849946975708008, -7.633081912994385, -7.4162163734436035, -7.199350833892822, -6.982485294342041, -6.76561975479126, -6.5487542152404785, -6.3318891525268555, -6.115023612976074, -5.898158073425293, -5.681292533874512, -5.4644269943237305, -5.247561454772949, -5.030695915222168, -4.813830375671387, -4.5969648361206055, -4.380099296569824, -4.163234233856201, -3.94636869430542, -3.7295031547546387, -3.5126376152038574, -3.295772075653076, -3.078906774520874, -2.8620412349700928, -2.6451756954193115, -2.4283103942871094, -2.211444854736328, -1.9945788383483887, -1.7777132987976074, -1.5608478784561157, -1.343982458114624, -1.1271169185638428, -0.9102513790130615, -0.6933859586715698, -0.4765205383300781, -0.2596549987792969, -0.0427895188331604, 0.17407596111297607, 0.39094144105911255, 0.607806921005249, 0.8246724605560303, 1.041537880897522, 1.2584033012390137, 1.475268840789795, 1.6921343803405762, 1.9089998006820679, 2.1258652210235596, 2.342730760574341, 2.559596300125122, 2.776461601257324, 2.9933271408081055, 3.2101926803588867, 3.427058219909668, 3.643923759460449, 3.8607890605926514, 4.077654838562012, 4.294520378112793, 4.511385440826416, 4.728250980377197, 4.9451165199279785]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 9.0, 5.0, 7.0, 18.0, 12.0, 21.0, 13.0, 23.0, 27.0, 33.0, 27.0, 39.0, 46.0, 51.0, 46.0, 49.0, 60.0, 37.0, 54.0, 47.0, 54.0, 48.0, 39.0, 35.0, 32.0, 34.0, 31.0, 21.0, 14.0, 11.0, 12.0, 7.0, 5.0, 11.0, 6.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-4.226373672485352, -4.113289833068848, -4.0002055168151855, -3.8871214389801025, -3.7740373611450195, -3.6609535217285156, -3.5478692054748535, -3.4347853660583496, -3.3217012882232666, -3.2086172103881836, -3.0955331325531006, -2.9824490547180176, -2.8693649768829346, -2.7562808990478516, -2.6431970596313477, -2.5301129817962646, -2.4170289039611816, -2.3039448261260986, -2.1908607482910156, -2.0777766704559326, -1.9646927118301392, -1.8516086339950562, -1.7385245561599731, -1.6254405975341797, -1.5123562812805176, -1.3992722034454346, -1.2861881256103516, -1.1731040477752686, -1.060020089149475, -0.9469360113143921, -0.8338519334793091, -0.7207679152488708, -0.6076838970184326, -0.494599848985672, -0.3815158009529114, -0.26843172311782837, -0.15534767508506775, -0.04226362705230713, 0.07082045078277588, 0.1839044690132141, 0.2969885468482971, 0.41007259488105774, 0.5231566429138184, 0.6362407207489014, 0.7493247985839844, 0.8624088168144226, 0.9754928946495056, 1.0885769128799438, 1.2016609907150269, 1.3147450685501099, 1.4278291463851929, 1.5409131050109863, 1.6539971828460693, 1.7670812606811523, 1.8801653385162354, 1.9932494163513184, 2.1063334941864014, 2.2194175720214844, 2.3325016498565674, 2.4455857276916504, 2.5586698055267334, 2.6717538833618164, 2.7848377227783203, 2.8979218006134033, 3.0110058784484863]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 7.0, 7.0, 15.0, 34.0, 26.0, 53.0, 72.0, 111.0, 142.0, 218.0, 359.0, 534.0, 855.0, 1517.0, 2430.0, 4340.0, 8104.0, 15859.0, 33339.0, 75341.0, 183625.0, 340089.0, 215784.0, 88227.0, 38286.0, 18115.0, 9153.0, 4873.0, 2727.0, 1624.0, 979.0, 602.0, 379.0, 246.0, 159.0, 96.0, 71.0, 44.0, 30.0, 25.0, 18.0, 14.0, 6.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.29150390625, -0.28197479248046875, -0.2724456787109375, -0.26291656494140625, -0.253387451171875, -0.24385833740234375, -0.2343292236328125, -0.22480010986328125, -0.21527099609375, -0.20574188232421875, -0.1962127685546875, -0.18668365478515625, -0.177154541015625, -0.16762542724609375, -0.1580963134765625, -0.14856719970703125, -0.1390380859375, -0.12950897216796875, -0.1199798583984375, -0.11045074462890625, -0.100921630859375, -0.09139251708984375, -0.0818634033203125, -0.07233428955078125, -0.06280517578125, -0.05327606201171875, -0.0437469482421875, -0.03421783447265625, -0.024688720703125, -0.01515960693359375, -0.0056304931640625, 0.00389862060546875, 0.013427734375, 0.02295684814453125, 0.0324859619140625, 0.04201507568359375, 0.051544189453125, 0.06107330322265625, 0.0706024169921875, 0.08013153076171875, 0.08966064453125, 0.09918975830078125, 0.1087188720703125, 0.11824798583984375, 0.127777099609375, 0.13730621337890625, 0.1468353271484375, 0.15636444091796875, 0.1658935546875, 0.17542266845703125, 0.1849517822265625, 0.19448089599609375, 0.204010009765625, 0.21353912353515625, 0.2230682373046875, 0.23259735107421875, 0.24212646484375, 0.25165557861328125, 0.2611846923828125, 0.27071380615234375, 0.280242919921875, 0.28977203369140625, 0.2993011474609375, 0.30883026123046875, 0.318359375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 12.0, 7.0, 14.0, 16.0, 12.0, 17.0, 24.0, 17.0, 28.0, 25.0, 36.0, 46.0, 59.0, 43.0, 39.0, 61.0, 56.0, 46.0, 62.0, 40.0, 46.0, 48.0, 45.0, 32.0, 31.0, 27.0, 21.0, 13.0, 22.0, 8.0, 12.0, 7.0, 7.0, 4.0, 6.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34619140625, -0.33492279052734375, -0.3236541748046875, -0.31238555908203125, -0.301116943359375, -0.28984832763671875, -0.2785797119140625, -0.26731109619140625, -0.25604248046875, -0.24477386474609375, -0.2335052490234375, -0.22223663330078125, -0.210968017578125, -0.19969940185546875, -0.1884307861328125, -0.17716217041015625, -0.1658935546875, -0.15462493896484375, -0.1433563232421875, -0.13208770751953125, -0.120819091796875, -0.10955047607421875, -0.0982818603515625, -0.08701324462890625, -0.07574462890625, -0.06447601318359375, -0.0532073974609375, -0.04193878173828125, -0.030670166015625, -0.01940155029296875, -0.0081329345703125, 0.00313568115234375, 0.014404296875, 0.02567291259765625, 0.0369415283203125, 0.04821014404296875, 0.059478759765625, 0.07074737548828125, 0.0820159912109375, 0.09328460693359375, 0.10455322265625, 0.11582183837890625, 0.1270904541015625, 0.13835906982421875, 0.149627685546875, 0.16089630126953125, 0.1721649169921875, 0.18343353271484375, 0.1947021484375, 0.20597076416015625, 0.2172393798828125, 0.22850799560546875, 0.239776611328125, 0.25104522705078125, 0.2623138427734375, 0.27358245849609375, 0.28485107421875, 0.29611968994140625, 0.3073883056640625, 0.31865692138671875, 0.329925537109375, 0.34119415283203125, 0.3524627685546875, 0.36373138427734375, 0.375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 1.0, 4.0, 13.0, 9.0, 11.0, 9.0, 20.0, 31.0, 66.0, 56.0, 123.0, 207.0, 380.0, 702.0, 1894.0, 9539.0, 230640.0, 778746.0, 21190.0, 2877.0, 937.0, 474.0, 250.0, 162.0, 78.0, 55.0, 26.0, 18.0, 18.0, 9.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.505859375, -1.466400146484375, -1.42694091796875, -1.387481689453125, -1.3480224609375, -1.308563232421875, -1.26910400390625, -1.229644775390625, -1.190185546875, -1.150726318359375, -1.11126708984375, -1.071807861328125, -1.0323486328125, -0.992889404296875, -0.95343017578125, -0.913970947265625, -0.87451171875, -0.835052490234375, -0.79559326171875, -0.756134033203125, -0.7166748046875, -0.677215576171875, -0.63775634765625, -0.598297119140625, -0.558837890625, -0.519378662109375, -0.47991943359375, -0.440460205078125, -0.4010009765625, -0.361541748046875, -0.32208251953125, -0.282623291015625, -0.2431640625, -0.203704833984375, -0.16424560546875, -0.124786376953125, -0.0853271484375, -0.045867919921875, -0.00640869140625, 0.033050537109375, 0.072509765625, 0.111968994140625, 0.15142822265625, 0.190887451171875, 0.2303466796875, 0.269805908203125, 0.30926513671875, 0.348724365234375, 0.38818359375, 0.427642822265625, 0.46710205078125, 0.506561279296875, 0.5460205078125, 0.585479736328125, 0.62493896484375, 0.664398193359375, 0.703857421875, 0.743316650390625, 0.78277587890625, 0.822235107421875, 0.8616943359375, 0.901153564453125, 0.94061279296875, 0.980072021484375, 1.01953125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 4.0, 9.0, 10.0, 8.0, 6.0, 16.0, 23.0, 19.0, 16.0, 25.0, 29.0, 45.0, 59.0, 68.0, 54.0, 52.0, 37.0, 59.0, 56.0, 43.0, 41.0, 41.0, 47.0, 39.0, 43.0, 25.0, 37.0, 16.0, 24.0, 15.0, 7.0, 8.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.390625, -1.34478759765625, -1.2989501953125, -1.25311279296875, -1.207275390625, -1.16143798828125, -1.1156005859375, -1.06976318359375, -1.02392578125, -0.97808837890625, -0.9322509765625, -0.88641357421875, -0.840576171875, -0.79473876953125, -0.7489013671875, -0.70306396484375, -0.6572265625, -0.61138916015625, -0.5655517578125, -0.51971435546875, -0.473876953125, -0.42803955078125, -0.3822021484375, -0.33636474609375, -0.29052734375, -0.24468994140625, -0.1988525390625, -0.15301513671875, -0.107177734375, -0.06134033203125, -0.0155029296875, 0.03033447265625, 0.076171875, 0.12200927734375, 0.1678466796875, 0.21368408203125, 0.259521484375, 0.30535888671875, 0.3511962890625, 0.39703369140625, 0.44287109375, 0.48870849609375, 0.5345458984375, 0.58038330078125, 0.626220703125, 0.67205810546875, 0.7178955078125, 0.76373291015625, 0.8095703125, 0.85540771484375, 0.9012451171875, 0.94708251953125, 0.992919921875, 1.03875732421875, 1.0845947265625, 1.13043212890625, 1.17626953125, 1.22210693359375, 1.2679443359375, 1.31378173828125, 1.359619140625, 1.40545654296875, 1.4512939453125, 1.49713134765625, 1.54296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 4.0, 12.0, 20.0, 37.0, 58.0, 119.0, 231.0, 770.0, 4367.0, 401056.0, 635590.0, 5009.0, 768.0, 250.0, 105.0, 54.0, 32.0, 24.0, 12.0, 10.0, 9.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.359619140625, -0.3416633605957031, -0.32370758056640625, -0.3057518005371094, -0.2877960205078125, -0.2698402404785156, -0.25188446044921875, -0.23392868041992188, -0.215972900390625, -0.19801712036132812, -0.18006134033203125, -0.16210556030273438, -0.1441497802734375, -0.12619400024414062, -0.10823822021484375, -0.09028244018554688, -0.07232666015625, -0.054370880126953125, -0.03641510009765625, -0.018459320068359375, -0.0005035400390625, 0.017452239990234375, 0.03540802001953125, 0.053363800048828125, 0.071319580078125, 0.08927536010742188, 0.10723114013671875, 0.12518692016601562, 0.1431427001953125, 0.16109848022460938, 0.17905426025390625, 0.19701004028320312, 0.2149658203125, 0.23292160034179688, 0.25087738037109375, 0.2688331604003906, 0.2867889404296875, 0.3047447204589844, 0.32270050048828125, 0.3406562805175781, 0.358612060546875, 0.3765678405761719, 0.39452362060546875, 0.4124794006347656, 0.4304351806640625, 0.4483909606933594, 0.46634674072265625, 0.4843025207519531, 0.50225830078125, 0.5202140808105469, 0.5381698608398438, 0.5561256408691406, 0.5740814208984375, 0.5920372009277344, 0.6099929809570312, 0.6279487609863281, 0.645904541015625, 0.6638603210449219, 0.6818161010742188, 0.6997718811035156, 0.7177276611328125, 0.7356834411621094, 0.7536392211914062, 0.7715950012207031, 0.78955078125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 11.0, 7.0, 7.0, 7.0, 15.0, 18.0, 19.0, 20.0, 31.0, 53.0, 62.0, 61.0, 89.0, 103.0, 101.0, 88.0, 84.0, 50.0, 45.0, 27.0, 13.0, 17.0, 21.0, 6.0, 10.0, 5.0, 6.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.263090133666992e-05, -5.09209930896759e-05, -4.9211084842681885e-05, -4.7501176595687866e-05, -4.579126834869385e-05, -4.408136010169983e-05, -4.237145185470581e-05, -4.066154360771179e-05, -3.8951635360717773e-05, -3.7241727113723755e-05, -3.5531818866729736e-05, -3.382191061973572e-05, -3.21120023727417e-05, -3.040209412574768e-05, -2.8692185878753662e-05, -2.6982277631759644e-05, -2.5272369384765625e-05, -2.3562461137771606e-05, -2.1852552890777588e-05, -2.014264464378357e-05, -1.843273639678955e-05, -1.6722828149795532e-05, -1.5012919902801514e-05, -1.3303011655807495e-05, -1.1593103408813477e-05, -9.883195161819458e-06, -8.17328691482544e-06, -6.463378667831421e-06, -4.753470420837402e-06, -3.043562173843384e-06, -1.3336539268493652e-06, 3.762543201446533e-07, 2.086162567138672e-06, 3.7960708141326904e-06, 5.505979061126709e-06, 7.2158873081207275e-06, 8.925795555114746e-06, 1.0635703802108765e-05, 1.2345612049102783e-05, 1.4055520296096802e-05, 1.576542854309082e-05, 1.747533679008484e-05, 1.9185245037078857e-05, 2.0895153284072876e-05, 2.2605061531066895e-05, 2.4314969778060913e-05, 2.602487802505493e-05, 2.773478627204895e-05, 2.944469451904297e-05, 3.115460276603699e-05, 3.2864511013031006e-05, 3.4574419260025024e-05, 3.628432750701904e-05, 3.799423575401306e-05, 3.970414400100708e-05, 4.14140522480011e-05, 4.312396049499512e-05, 4.4833868741989136e-05, 4.6543776988983154e-05, 4.825368523597717e-05, 4.996359348297119e-05, 5.167350172996521e-05, 5.338340997695923e-05, 5.509331822395325e-05, 5.6803226470947266e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 11.0, 16.0, 20.0, 31.0, 69.0, 85.0, 157.0, 240.0, 577.0, 1504.0, 5554.0, 49707.0, 855046.0, 123237.0, 8695.0, 2063.0, 729.0, 330.0, 168.0, 105.0, 62.0, 34.0, 29.0, 21.0, 17.0, 9.0, 11.0, 6.0, 5.0, 8.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35400390625, -0.3440704345703125, -0.334136962890625, -0.3242034912109375, -0.31427001953125, -0.3043365478515625, -0.294403076171875, -0.2844696044921875, -0.2745361328125, -0.2646026611328125, -0.254669189453125, -0.2447357177734375, -0.23480224609375, -0.2248687744140625, -0.214935302734375, -0.2050018310546875, -0.195068359375, -0.1851348876953125, -0.175201416015625, -0.1652679443359375, -0.15533447265625, -0.1454010009765625, -0.135467529296875, -0.1255340576171875, -0.1156005859375, -0.1056671142578125, -0.095733642578125, -0.0858001708984375, -0.07586669921875, -0.0659332275390625, -0.055999755859375, -0.0460662841796875, -0.0361328125, -0.0261993408203125, -0.016265869140625, -0.0063323974609375, 0.00360107421875, 0.0135345458984375, 0.023468017578125, 0.0334014892578125, 0.0433349609375, 0.0532684326171875, 0.063201904296875, 0.0731353759765625, 0.08306884765625, 0.0930023193359375, 0.102935791015625, 0.1128692626953125, 0.122802734375, 0.1327362060546875, 0.142669677734375, 0.1526031494140625, 0.16253662109375, 0.1724700927734375, 0.182403564453125, 0.1923370361328125, 0.2022705078125, 0.2122039794921875, 0.222137451171875, 0.2320709228515625, 0.24200439453125, 0.2519378662109375, 0.261871337890625, 0.2718048095703125, 0.28173828125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 6.0, 6.0, 4.0, 8.0, 8.0, 15.0, 18.0, 24.0, 39.0, 30.0, 51.0, 67.0, 75.0, 76.0, 91.0, 87.0, 64.0, 71.0, 61.0, 39.0, 31.0, 36.0, 20.0, 21.0, 12.0, 11.0, 3.0, 6.0, 2.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.2310791015625, -0.22271156311035156, -0.21434402465820312, -0.2059764862060547, -0.19760894775390625, -0.1892414093017578, -0.18087387084960938, -0.17250633239746094, -0.1641387939453125, -0.15577125549316406, -0.14740371704101562, -0.1390361785888672, -0.13066864013671875, -0.12230110168457031, -0.11393356323242188, -0.10556602478027344, -0.097198486328125, -0.08883094787597656, -0.08046340942382812, -0.07209587097167969, -0.06372833251953125, -0.05536079406738281, -0.046993255615234375, -0.03862571716308594, -0.0302581787109375, -0.021890640258789062, -0.013523101806640625, -0.0051555633544921875, 0.00321197509765625, 0.011579513549804688, 0.019947052001953125, 0.028314590454101562, 0.03668212890625, 0.04504966735839844, 0.053417205810546875, 0.06178474426269531, 0.07015228271484375, 0.07851982116699219, 0.08688735961914062, 0.09525489807128906, 0.1036224365234375, 0.11198997497558594, 0.12035751342773438, 0.1287250518798828, 0.13709259033203125, 0.1454601287841797, 0.15382766723632812, 0.16219520568847656, 0.170562744140625, 0.17893028259277344, 0.18729782104492188, 0.1956653594970703, 0.20403289794921875, 0.2124004364013672, 0.22076797485351562, 0.22913551330566406, 0.2375030517578125, 0.24587059020996094, 0.2542381286621094, 0.2626056671142578, 0.27097320556640625, 0.2793407440185547, 0.2877082824707031, 0.29607582092285156, 0.304443359375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 2.0, 8.0, 13.0, 8.0, 56.0, 141.0, 389.0, 296.0, 60.0, 19.0, 7.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.575984954833984, -5.2640790939331055, -4.952172756195068, -4.640266418457031, -4.328360557556152, -4.016454696655273, -3.7045483589172363, -3.3926422595977783, -3.0807361602783203, -2.7688300609588623, -2.4569239616394043, -2.1450178623199463, -1.8331117630004883, -1.5212056636810303, -1.2092995643615723, -0.8973934650421143, -0.5854873657226562, -0.27358126640319824, 0.038324832916259766, 0.3502309322357178, 0.6621370315551758, 0.9740431308746338, 1.2859492301940918, 1.5978553295135498, 1.9097614288330078, 2.221667528152466, 2.533573627471924, 2.845479726791382, 3.15738582611084, 3.469291925430298, 3.781198024749756, 4.093104362487793, 4.405011177062988, 4.716917037963867, 5.028823375701904, 5.340729713439941, 5.65263557434082, 5.964541435241699, 6.276447772979736, 6.588354110717773, 6.900259971618652, 7.212165832519531, 7.524072170257568, 7.8359785079956055, 8.147884368896484, 8.459790229797363, 8.771696090698242, 9.083602905273438, 9.395508766174316, 9.707414627075195, 10.01932144165039, 10.33122730255127, 10.643133163452148, 10.955039024353027, 11.266944885253906, 11.578851699829102, 11.89075756072998, 12.20266342163086, 12.514570236206055, 12.826476097106934, 13.138381958007812, 13.450287818908691, 13.76219367980957, 14.074100494384766, 14.386006355285645]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 12.0, 15.0, 20.0, 18.0, 19.0, 27.0, 32.0, 45.0, 35.0, 48.0, 46.0, 53.0, 75.0, 63.0, 72.0, 67.0, 49.0, 51.0, 48.0, 38.0, 33.0, 23.0, 24.0, 12.0, 27.0, 18.0, 11.0, 3.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0], "bins": [-8.951157569885254, -8.741640090942383, -8.532122611999512, -8.32260513305664, -8.113086700439453, -7.903569221496582, -7.694051742553711, -7.48453426361084, -7.275016784667969, -7.065499305725098, -6.855981349945068, -6.646463871002197, -6.436946392059326, -6.227428436279297, -6.017910957336426, -5.808393478393555, -5.598875522613525, -5.389358043670654, -5.179840087890625, -4.970322608947754, -4.760805130004883, -4.551287651062012, -4.341769695281982, -4.132252216339111, -3.922734498977661, -3.713216781616211, -3.50369930267334, -3.2941815853118896, -3.0846638679504395, -2.8751463890075684, -2.665628671646118, -2.456110954284668, -2.246593475341797, -2.0370757579803467, -1.8275582790374756, -1.6180405616760254, -1.4085229635238647, -1.199005365371704, -0.9894876480102539, -0.7799700498580933, -0.5704524517059326, -0.3609348237514496, -0.15141719579696655, 0.05810046195983887, 0.2676180601119995, 0.47713565826416016, 0.6866533756256104, 0.896170973777771, 1.1056885719299316, 1.3152061700820923, 1.524723768234253, 1.7342414855957031, 1.9437590837478638, 2.1532766819000244, 2.3627943992614746, 2.5723118782043457, 2.781829595565796, 2.991347312927246, 3.200864791870117, 3.4103825092315674, 3.6199002265930176, 3.8294177055358887, 4.038935661315918, 4.248453140258789, 4.45797061920166]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 6.0, 4.0, 9.0, 10.0, 21.0, 22.0, 36.0, 34.0, 47.0, 78.0, 96.0, 154.0, 274.0, 576.0, 3393.0, 2916750.0, 1267795.0, 3770.0, 548.0, 218.0, 122.0, 80.0, 58.0, 50.0, 25.0, 23.0, 21.0, 21.0, 8.0, 6.0, 8.0, 3.0, 3.0, 6.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.60546875, -1.550048828125, -1.49462890625, -1.439208984375, -1.3837890625, -1.328369140625, -1.27294921875, -1.217529296875, -1.162109375, -1.106689453125, -1.05126953125, -0.995849609375, -0.9404296875, -0.885009765625, -0.82958984375, -0.774169921875, -0.71875, -0.663330078125, -0.60791015625, -0.552490234375, -0.4970703125, -0.441650390625, -0.38623046875, -0.330810546875, -0.275390625, -0.219970703125, -0.16455078125, -0.109130859375, -0.0537109375, 0.001708984375, 0.05712890625, 0.112548828125, 0.16796875, 0.223388671875, 0.27880859375, 0.334228515625, 0.3896484375, 0.445068359375, 0.50048828125, 0.555908203125, 0.611328125, 0.666748046875, 0.72216796875, 0.777587890625, 0.8330078125, 0.888427734375, 0.94384765625, 0.999267578125, 1.0546875, 1.110107421875, 1.16552734375, 1.220947265625, 1.2763671875, 1.331787109375, 1.38720703125, 1.442626953125, 1.498046875, 1.553466796875, 1.60888671875, 1.664306640625, 1.7197265625, 1.775146484375, 1.83056640625, 1.885986328125, 1.94140625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 9.0, 16.0, 26.0, 41.0, 62.0, 71.0, 100.0, 118.0, 123.0, 122.0, 101.0, 88.0, 53.0, 39.0, 18.0, 15.0, 10.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.177734375, -1.1543693542480469, -1.1310043334960938, -1.1076393127441406, -1.0842742919921875, -1.0609092712402344, -1.0375442504882812, -1.0141792297363281, -0.990814208984375, -0.9674491882324219, -0.9440841674804688, -0.9207191467285156, -0.8973541259765625, -0.8739891052246094, -0.8506240844726562, -0.8272590637207031, -0.80389404296875, -0.7805290222167969, -0.7571640014648438, -0.7337989807128906, -0.7104339599609375, -0.6870689392089844, -0.6637039184570312, -0.6403388977050781, -0.616973876953125, -0.5936088562011719, -0.5702438354492188, -0.5468788146972656, -0.5235137939453125, -0.5001487731933594, -0.47678375244140625, -0.4534187316894531, -0.4300537109375, -0.4066886901855469, -0.38332366943359375, -0.3599586486816406, -0.3365936279296875, -0.3132286071777344, -0.28986358642578125, -0.2664985656738281, -0.243133544921875, -0.21976852416992188, -0.19640350341796875, -0.17303848266601562, -0.1496734619140625, -0.12630844116210938, -0.10294342041015625, -0.07957839965820312, -0.05621337890625, -0.032848358154296875, -0.00948333740234375, 0.013881683349609375, 0.0372467041015625, 0.060611724853515625, 0.08397674560546875, 0.10734176635742188, 0.130706787109375, 0.15407180786132812, 0.17743682861328125, 0.20080184936523438, 0.2241668701171875, 0.24753189086914062, 0.27089691162109375, 0.2942619323730469, 0.317626953125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 14.0, 9.0, 13.0, 20.0, 38.0, 54.0, 91.0, 120.0, 207.0, 323.0, 559.0, 1003.0, 2158.0, 4897.0, 13425.0, 54437.0, 1470335.0, 2549161.0, 70091.0, 15976.0, 5775.0, 2601.0, 1285.0, 618.0, 400.0, 245.0, 142.0, 103.0, 50.0, 47.0, 22.0, 21.0, 8.0, 6.0, 7.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44091796875, -0.4271659851074219, -0.41341400146484375, -0.3996620178222656, -0.3859100341796875, -0.3721580505371094, -0.35840606689453125, -0.3446540832519531, -0.330902099609375, -0.3171501159667969, -0.30339813232421875, -0.2896461486816406, -0.2758941650390625, -0.2621421813964844, -0.24839019775390625, -0.23463821411132812, -0.22088623046875, -0.20713424682617188, -0.19338226318359375, -0.17963027954101562, -0.1658782958984375, -0.15212631225585938, -0.13837432861328125, -0.12462234497070312, -0.110870361328125, -0.09711837768554688, -0.08336639404296875, -0.06961441040039062, -0.0558624267578125, -0.042110443115234375, -0.02835845947265625, -0.014606475830078125, -0.0008544921875, 0.012897491455078125, 0.02664947509765625, 0.040401458740234375, 0.0541534423828125, 0.06790542602539062, 0.08165740966796875, 0.09540939331054688, 0.109161376953125, 0.12291336059570312, 0.13666534423828125, 0.15041732788085938, 0.1641693115234375, 0.17792129516601562, 0.19167327880859375, 0.20542526245117188, 0.21917724609375, 0.23292922973632812, 0.24668121337890625, 0.2604331970214844, 0.2741851806640625, 0.2879371643066406, 0.30168914794921875, 0.3154411315917969, 0.329193115234375, 0.3429450988769531, 0.35669708251953125, 0.3704490661621094, 0.3842010498046875, 0.3979530334472656, 0.41170501708984375, 0.4254570007324219, 0.439208984375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 6.0, 8.0, 3.0, 7.0, 13.0, 11.0, 34.0, 36.0, 113.0, 382.0, 1400.0, 1425.0, 384.0, 103.0, 54.0, 29.0, 31.0, 7.0, 4.0, 7.0, 3.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.85205078125, -0.8270111083984375, -0.801971435546875, -0.7769317626953125, -0.75189208984375, -0.7268524169921875, -0.701812744140625, -0.6767730712890625, -0.6517333984375, -0.6266937255859375, -0.601654052734375, -0.5766143798828125, -0.55157470703125, -0.5265350341796875, -0.501495361328125, -0.4764556884765625, -0.451416015625, -0.4263763427734375, -0.401336669921875, -0.3762969970703125, -0.35125732421875, -0.3262176513671875, -0.301177978515625, -0.2761383056640625, -0.2510986328125, -0.2260589599609375, -0.201019287109375, -0.1759796142578125, -0.15093994140625, -0.1259002685546875, -0.100860595703125, -0.0758209228515625, -0.05078125, -0.0257415771484375, -0.000701904296875, 0.0243377685546875, 0.04937744140625, 0.0744171142578125, 0.099456787109375, 0.1244964599609375, 0.1495361328125, 0.1745758056640625, 0.199615478515625, 0.2246551513671875, 0.24969482421875, 0.2747344970703125, 0.299774169921875, 0.3248138427734375, 0.349853515625, 0.3748931884765625, 0.399932861328125, 0.4249725341796875, 0.45001220703125, 0.4750518798828125, 0.500091552734375, 0.5251312255859375, 0.5501708984375, 0.5752105712890625, 0.600250244140625, 0.6252899169921875, 0.65032958984375, 0.6753692626953125, 0.700408935546875, 0.7254486083984375, 0.75048828125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 11.0, 33.0, 77.0, 180.0, 327.0, 235.0, 78.0, 32.0, 13.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.667299270629883, -5.51667594909668, -5.366052627563477, -5.215429306030273, -5.06480598449707, -4.914182662963867, -4.763559341430664, -4.612936019897461, -4.462312698364258, -4.311689376831055, -4.161066055297852, -4.010442733764648, -3.8598194122314453, -3.709196090698242, -3.558572769165039, -3.407949447631836, -3.2573258876800537, -3.1067025661468506, -2.9560792446136475, -2.8054559230804443, -2.654832601547241, -2.504209280014038, -2.353585720062256, -2.2029623985290527, -2.0523390769958496, -1.9017157554626465, -1.7510924339294434, -1.6004691123962402, -1.449845790863037, -1.299222469329834, -1.1485990285873413, -0.9979757070541382, -0.8473525047302246, -0.6967291831970215, -0.5461058616638184, -0.39548248052597046, -0.24485915899276733, -0.09423583745956421, 0.05638754367828369, 0.20701086521148682, 0.35763418674468994, 0.5082575082778931, 0.6588808298110962, 0.8095042109489441, 0.9601275324821472, 1.1107509136199951, 1.2613742351531982, 1.4119975566864014, 1.5626208782196045, 1.7132441997528076, 1.8638675212860107, 2.014490842819214, 2.165114164352417, 2.31573748588562, 2.4663610458374023, 2.6169843673706055, 2.7676076889038086, 2.9182310104370117, 3.068854331970215, 3.219477653503418, 3.370100975036621, 3.520724296569824, 3.6713476181030273, 3.8219709396362305, 3.9725942611694336]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 11.0, 13.0, 20.0, 22.0, 41.0, 52.0, 68.0, 91.0, 77.0, 80.0, 103.0, 84.0, 75.0, 63.0, 46.0, 47.0, 33.0, 28.0, 18.0, 13.0, 6.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2218856811523438, -2.1032114028930664, -1.9845373630523682, -1.8658630847930908, -1.7471890449523926, -1.6285147666931152, -1.5098406076431274, -1.3911664485931396, -1.2724922895431519, -1.153818130493164, -1.0351439714431763, -0.9164697527885437, -0.7977955937385559, -0.6791214346885681, -0.5604472160339355, -0.44177305698394775, -0.32309889793395996, -0.20442472398281097, -0.08575055003166199, 0.03292363882064819, 0.151597797870636, 0.2702719569206238, 0.38894617557525635, 0.5076203346252441, 0.6262944936752319, 0.7449686527252197, 0.8636428117752075, 0.9823170304298401, 1.1009912490844727, 1.219665288925171, 1.3383395671844482, 1.457013726234436, 1.5756878852844238, 1.6943620443344116, 1.8130362033843994, 1.9317104816436768, 2.050384521484375, 2.1690587997436523, 2.2877330780029297, 2.406407117843628, 2.525081157684326, 2.6437554359436035, 2.7624294757843018, 2.881103754043579, 2.9997777938842773, 3.1184520721435547, 3.237126350402832, 3.3558003902435303, 3.4744746685028076, 3.593148946762085, 3.711822986602783, 3.8304972648620605, 3.949171304702759, 4.067845344543457, 4.186519622802734, 4.305193901062012, 4.423868179321289, 4.542542457580566, 4.661216735839844, 4.779890537261963, 4.89856481552124, 5.017239093780518, 5.135913372039795, 5.254587173461914, 5.373261451721191]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 7.0, 3.0, 5.0, 3.0, 11.0, 14.0, 17.0, 29.0, 40.0, 64.0, 109.0, 147.0, 250.0, 397.0, 710.0, 1205.0, 2547.0, 5061.0, 11733.0, 28457.0, 76295.0, 225806.0, 405289.0, 184016.0, 63088.0, 24010.0, 9930.0, 4365.0, 2175.0, 1136.0, 632.0, 373.0, 239.0, 156.0, 75.0, 70.0, 31.0, 27.0, 13.0, 11.0, 4.0, 2.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.31201171875, -0.30175018310546875, -0.2914886474609375, -0.28122711181640625, -0.270965576171875, -0.26070404052734375, -0.2504425048828125, -0.24018096923828125, -0.22991943359375, -0.21965789794921875, -0.2093963623046875, -0.19913482666015625, -0.188873291015625, -0.17861175537109375, -0.1683502197265625, -0.15808868408203125, -0.1478271484375, -0.13756561279296875, -0.1273040771484375, -0.11704254150390625, -0.106781005859375, -0.09651947021484375, -0.0862579345703125, -0.07599639892578125, -0.06573486328125, -0.05547332763671875, -0.0452117919921875, -0.03495025634765625, -0.024688720703125, -0.01442718505859375, -0.0041656494140625, 0.00609588623046875, 0.016357421875, 0.02661895751953125, 0.0368804931640625, 0.04714202880859375, 0.057403564453125, 0.06766510009765625, 0.0779266357421875, 0.08818817138671875, 0.09844970703125, 0.10871124267578125, 0.1189727783203125, 0.12923431396484375, 0.139495849609375, 0.14975738525390625, 0.1600189208984375, 0.17028045654296875, 0.1805419921875, 0.19080352783203125, 0.2010650634765625, 0.21132659912109375, 0.221588134765625, 0.23184967041015625, 0.2421112060546875, 0.25237274169921875, 0.26263427734375, 0.27289581298828125, 0.2831573486328125, 0.29341888427734375, 0.303680419921875, 0.31394195556640625, 0.3242034912109375, 0.33446502685546875, 0.3447265625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 10.0, 14.0, 15.0, 15.0, 19.0, 29.0, 20.0, 38.0, 49.0, 44.0, 45.0, 50.0, 52.0, 52.0, 69.0, 64.0, 50.0, 53.0, 44.0, 49.0, 42.0, 36.0, 26.0, 23.0, 24.0, 15.0, 15.0, 12.0, 6.0, 5.0, 10.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.39892578125, -0.38800811767578125, -0.3770904541015625, -0.36617279052734375, -0.355255126953125, -0.34433746337890625, -0.3334197998046875, -0.32250213623046875, -0.31158447265625, -0.30066680908203125, -0.2897491455078125, -0.27883148193359375, -0.267913818359375, -0.25699615478515625, -0.2460784912109375, -0.23516082763671875, -0.2242431640625, -0.21332550048828125, -0.2024078369140625, -0.19149017333984375, -0.180572509765625, -0.16965484619140625, -0.1587371826171875, -0.14781951904296875, -0.13690185546875, -0.12598419189453125, -0.1150665283203125, -0.10414886474609375, -0.093231201171875, -0.08231353759765625, -0.0713958740234375, -0.06047821044921875, -0.049560546875, -0.03864288330078125, -0.0277252197265625, -0.01680755615234375, -0.005889892578125, 0.00502777099609375, 0.0159454345703125, 0.02686309814453125, 0.03778076171875, 0.04869842529296875, 0.0596160888671875, 0.07053375244140625, 0.081451416015625, 0.09236907958984375, 0.1032867431640625, 0.11420440673828125, 0.1251220703125, 0.13603973388671875, 0.1469573974609375, 0.15787506103515625, 0.168792724609375, 0.17971038818359375, 0.1906280517578125, 0.20154571533203125, 0.21246337890625, 0.22338104248046875, 0.2342987060546875, 0.24521636962890625, 0.256134033203125, 0.26705169677734375, 0.2779693603515625, 0.28888702392578125, 0.2998046875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 7.0, 5.0, 6.0, 15.0, 25.0, 22.0, 32.0, 49.0, 84.0, 110.0, 158.0, 320.0, 548.0, 1171.0, 3521.0, 22202.0, 405695.0, 580135.0, 27621.0, 4065.0, 1247.0, 546.0, 342.0, 215.0, 128.0, 75.0, 57.0, 40.0, 29.0, 21.0, 11.0, 10.0, 11.0, 9.0, 4.0, 5.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.88818359375, -0.8604660034179688, -0.8327484130859375, -0.8050308227539062, -0.777313232421875, -0.7495956420898438, -0.7218780517578125, -0.6941604614257812, -0.66644287109375, -0.6387252807617188, -0.6110076904296875, -0.5832901000976562, -0.555572509765625, -0.5278549194335938, -0.5001373291015625, -0.47241973876953125, -0.4447021484375, -0.41698455810546875, -0.3892669677734375, -0.36154937744140625, -0.333831787109375, -0.30611419677734375, -0.2783966064453125, -0.25067901611328125, -0.22296142578125, -0.19524383544921875, -0.1675262451171875, -0.13980865478515625, -0.112091064453125, -0.08437347412109375, -0.0566558837890625, -0.02893829345703125, -0.001220703125, 0.02649688720703125, 0.0542144775390625, 0.08193206787109375, 0.109649658203125, 0.13736724853515625, 0.1650848388671875, 0.19280242919921875, 0.22052001953125, 0.24823760986328125, 0.2759552001953125, 0.30367279052734375, 0.331390380859375, 0.35910797119140625, 0.3868255615234375, 0.41454315185546875, 0.4422607421875, 0.46997833251953125, 0.4976959228515625, 0.5254135131835938, 0.553131103515625, 0.5808486938476562, 0.6085662841796875, 0.6362838745117188, 0.66400146484375, 0.6917190551757812, 0.7194366455078125, 0.7471542358398438, 0.774871826171875, 0.8025894165039062, 0.8303070068359375, 0.8580245971679688, 0.8857421875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 5.0, 3.0, 0.0, 7.0, 5.0, 8.0, 12.0, 10.0, 11.0, 14.0, 18.0, 27.0, 42.0, 35.0, 33.0, 42.0, 50.0, 39.0, 41.0, 53.0, 43.0, 55.0, 40.0, 54.0, 58.0, 50.0, 35.0, 34.0, 30.0, 29.0, 26.0, 19.0, 18.0, 17.0, 5.0, 11.0, 6.0, 6.0, 3.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.857421875, -0.8229522705078125, -0.788482666015625, -0.7540130615234375, -0.71954345703125, -0.6850738525390625, -0.650604248046875, -0.6161346435546875, -0.5816650390625, -0.5471954345703125, -0.512725830078125, -0.4782562255859375, -0.44378662109375, -0.4093170166015625, -0.374847412109375, -0.3403778076171875, -0.305908203125, -0.2714385986328125, -0.236968994140625, -0.2024993896484375, -0.16802978515625, -0.1335601806640625, -0.099090576171875, -0.0646209716796875, -0.0301513671875, 0.0043182373046875, 0.038787841796875, 0.0732574462890625, 0.10772705078125, 0.1421966552734375, 0.176666259765625, 0.2111358642578125, 0.24560546875, 0.2800750732421875, 0.314544677734375, 0.3490142822265625, 0.38348388671875, 0.4179534912109375, 0.452423095703125, 0.4868927001953125, 0.5213623046875, 0.5558319091796875, 0.590301513671875, 0.6247711181640625, 0.65924072265625, 0.6937103271484375, 0.728179931640625, 0.7626495361328125, 0.797119140625, 0.8315887451171875, 0.866058349609375, 0.9005279541015625, 0.93499755859375, 0.9694671630859375, 1.003936767578125, 1.0384063720703125, 1.0728759765625, 1.1073455810546875, 1.141815185546875, 1.1762847900390625, 1.21075439453125, 1.2452239990234375, 1.279693603515625, 1.3141632080078125, 1.3486328125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 7.0, 6.0, 3.0, 7.0, 5.0, 8.0, 16.0, 22.0, 47.0, 86.0, 150.0, 409.0, 1453.0, 11745.0, 910768.0, 118786.0, 3717.0, 745.0, 257.0, 117.0, 69.0, 49.0, 21.0, 21.0, 16.0, 7.0, 6.0, 6.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.447998046875, -0.4324302673339844, -0.41686248779296875, -0.4012947082519531, -0.3857269287109375, -0.3701591491699219, -0.35459136962890625, -0.3390235900878906, -0.323455810546875, -0.3078880310058594, -0.29232025146484375, -0.2767524719238281, -0.2611846923828125, -0.24561691284179688, -0.23004913330078125, -0.21448135375976562, -0.19891357421875, -0.18334579467773438, -0.16777801513671875, -0.15221023559570312, -0.1366424560546875, -0.12107467651367188, -0.10550689697265625, -0.08993911743164062, -0.074371337890625, -0.058803558349609375, -0.04323577880859375, -0.027667999267578125, -0.0121002197265625, 0.003467559814453125, 0.01903533935546875, 0.034603118896484375, 0.0501708984375, 0.06573867797851562, 0.08130645751953125, 0.09687423706054688, 0.1124420166015625, 0.12800979614257812, 0.14357757568359375, 0.15914535522460938, 0.174713134765625, 0.19028091430664062, 0.20584869384765625, 0.22141647338867188, 0.2369842529296875, 0.2525520324707031, 0.26811981201171875, 0.2836875915527344, 0.29925537109375, 0.3148231506347656, 0.33039093017578125, 0.3459587097167969, 0.3615264892578125, 0.3770942687988281, 0.39266204833984375, 0.4082298278808594, 0.423797607421875, 0.4393653869628906, 0.45493316650390625, 0.4705009460449219, 0.4860687255859375, 0.5016365051269531, 0.5172042846679688, 0.5327720642089844, 0.54833984375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 4.0, 4.0, 4.0, 2.0, 4.0, 7.0, 4.0, 6.0, 12.0, 19.0, 20.0, 24.0, 28.0, 56.0, 61.0, 85.0, 127.0, 95.0, 116.0, 91.0, 69.0, 43.0, 28.0, 21.0, 15.0, 14.0, 7.0, 6.0, 9.0, 4.0, 3.0, 4.0, 4.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.608797073364258e-05, -5.430355668067932e-05, -5.2519142627716064e-05, -5.073472857475281e-05, -4.895031452178955e-05, -4.7165900468826294e-05, -4.538148641586304e-05, -4.359707236289978e-05, -4.1812658309936523e-05, -4.0028244256973267e-05, -3.824383020401001e-05, -3.645941615104675e-05, -3.4675002098083496e-05, -3.289058804512024e-05, -3.110617399215698e-05, -2.9321759939193726e-05, -2.753734588623047e-05, -2.5752931833267212e-05, -2.3968517780303955e-05, -2.2184103727340698e-05, -2.039968967437744e-05, -1.8615275621414185e-05, -1.6830861568450928e-05, -1.5046447515487671e-05, -1.3262033462524414e-05, -1.1477619409561157e-05, -9.6932053565979e-06, -7.908791303634644e-06, -6.124377250671387e-06, -4.33996319770813e-06, -2.555549144744873e-06, -7.711350917816162e-07, 1.0132789611816406e-06, 2.7976930141448975e-06, 4.582107067108154e-06, 6.366521120071411e-06, 8.150935173034668e-06, 9.935349225997925e-06, 1.1719763278961182e-05, 1.3504177331924438e-05, 1.5288591384887695e-05, 1.7073005437850952e-05, 1.885741949081421e-05, 2.0641833543777466e-05, 2.2426247596740723e-05, 2.421066164970398e-05, 2.5995075702667236e-05, 2.7779489755630493e-05, 2.956390380859375e-05, 3.134831786155701e-05, 3.3132731914520264e-05, 3.491714596748352e-05, 3.670156002044678e-05, 3.8485974073410034e-05, 4.027038812637329e-05, 4.205480217933655e-05, 4.3839216232299805e-05, 4.562363028526306e-05, 4.740804433822632e-05, 4.9192458391189575e-05, 5.097687244415283e-05, 5.276128649711609e-05, 5.4545700550079346e-05, 5.63301146030426e-05, 5.811452865600586e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 13.0, 18.0, 21.0, 56.0, 110.0, 263.0, 869.0, 6183.0, 416733.0, 615731.0, 7060.0, 965.0, 283.0, 116.0, 62.0, 25.0, 16.0, 10.0, 5.0, 1.0, 1.0, 4.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55224609375, -0.5377235412597656, -0.5232009887695312, -0.5086784362792969, -0.4941558837890625, -0.4796333312988281, -0.46511077880859375, -0.4505882263183594, -0.436065673828125, -0.4215431213378906, -0.40702056884765625, -0.3924980163574219, -0.3779754638671875, -0.3634529113769531, -0.34893035888671875, -0.3344078063964844, -0.31988525390625, -0.3053627014160156, -0.29084014892578125, -0.2763175964355469, -0.2617950439453125, -0.24727249145507812, -0.23274993896484375, -0.21822738647460938, -0.203704833984375, -0.18918228149414062, -0.17465972900390625, -0.16013717651367188, -0.1456146240234375, -0.13109207153320312, -0.11656951904296875, -0.10204696655273438, -0.0875244140625, -0.07300186157226562, -0.05847930908203125, -0.043956756591796875, -0.0294342041015625, -0.014911651611328125, -0.00038909912109375, 0.014133453369140625, 0.028656005859375, 0.043178558349609375, 0.05770111083984375, 0.07222366333007812, 0.0867462158203125, 0.10126876831054688, 0.11579132080078125, 0.13031387329101562, 0.14483642578125, 0.15935897827148438, 0.17388153076171875, 0.18840408325195312, 0.2029266357421875, 0.21744918823242188, 0.23197174072265625, 0.24649429321289062, 0.261016845703125, 0.2755393981933594, 0.29006195068359375, 0.3045845031738281, 0.3191070556640625, 0.3336296081542969, 0.34815216064453125, 0.3626747131347656, 0.377197265625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 9.0, 12.0, 17.0, 23.0, 34.0, 47.0, 82.0, 60.0, 114.0, 104.0, 94.0, 112.0, 70.0, 60.0, 40.0, 36.0, 29.0, 10.0, 9.0, 10.0, 7.0, 4.0, 4.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.288330078125, -0.280914306640625, -0.27349853515625, -0.266082763671875, -0.2586669921875, -0.251251220703125, -0.24383544921875, -0.236419677734375, -0.22900390625, -0.221588134765625, -0.21417236328125, -0.206756591796875, -0.1993408203125, -0.191925048828125, -0.18450927734375, -0.177093505859375, -0.169677734375, -0.162261962890625, -0.15484619140625, -0.147430419921875, -0.1400146484375, -0.132598876953125, -0.12518310546875, -0.117767333984375, -0.1103515625, -0.102935791015625, -0.09552001953125, -0.088104248046875, -0.0806884765625, -0.073272705078125, -0.06585693359375, -0.058441162109375, -0.051025390625, -0.043609619140625, -0.03619384765625, -0.028778076171875, -0.0213623046875, -0.013946533203125, -0.00653076171875, 0.000885009765625, 0.00830078125, 0.015716552734375, 0.02313232421875, 0.030548095703125, 0.0379638671875, 0.045379638671875, 0.05279541015625, 0.060211181640625, 0.067626953125, 0.075042724609375, 0.08245849609375, 0.089874267578125, 0.0972900390625, 0.104705810546875, 0.11212158203125, 0.119537353515625, 0.126953125, 0.134368896484375, 0.14178466796875, 0.149200439453125, 0.1566162109375, 0.164031982421875, 0.17144775390625, 0.178863525390625, 0.186279296875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 4.0, 36.0, 153.0, 488.0, 241.0, 47.0, 13.0, 7.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.478628158569336, -5.1472625732421875, -4.815897464752197, -4.484532356262207, -4.153166770935059, -3.8218014240264893, -3.49043607711792, -3.1590707302093506, -2.8277053833007812, -2.496340036392212, -2.1649746894836426, -1.8336093425750732, -1.502243995666504, -1.1708786487579346, -0.8395133018493652, -0.5081479549407959, -0.17678260803222656, 0.15458273887634277, 0.4859480857849121, 0.8173134326934814, 1.1486787796020508, 1.4800441265106201, 1.8114094734191895, 2.142774820327759, 2.474140167236328, 2.8055055141448975, 3.136870861053467, 3.468236207962036, 3.7996015548706055, 4.130967140197754, 4.462332248687744, 4.793697357177734, 5.125063896179199, 5.456429481506348, 5.787794589996338, 6.119159698486328, 6.450525283813477, 6.781890869140625, 7.113255977630615, 7.4446210861206055, 7.775986671447754, 8.107352256774902, 8.438716888427734, 8.770082473754883, 9.101448059082031, 9.43281364440918, 9.764179229736328, 10.09554386138916, 10.426909446716309, 10.758275032043457, 11.089639663696289, 11.421005249023438, 11.752370834350586, 12.083736419677734, 12.415102005004883, 12.746466636657715, 13.077832221984863, 13.409197807312012, 13.740562438964844, 14.071928024291992, 14.40329360961914, 14.734659194946289, 15.066024780273438, 15.39738941192627, 15.728754997253418]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 5.0, 14.0, 13.0, 7.0, 16.0, 13.0, 12.0, 29.0, 22.0, 21.0, 38.0, 45.0, 42.0, 46.0, 43.0, 58.0, 73.0, 59.0, 62.0, 57.0, 39.0, 46.0, 31.0, 28.0, 31.0, 28.0, 27.0, 18.0, 15.0, 8.0, 12.0, 7.0, 9.0, 7.0, 5.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.1485066413879395, -5.001501083374023, -4.854495525360107, -4.707489490509033, -4.560483932495117, -4.413478374481201, -4.266472816467285, -4.119467258453369, -3.972461462020874, -3.825455904006958, -3.678450107574463, -3.531444549560547, -3.384438991546631, -3.2374331951141357, -3.0904276371002197, -2.9434218406677246, -2.7964162826538086, -2.6494107246398926, -2.5024049282073975, -2.3553993701934814, -2.2083935737609863, -2.0613880157470703, -1.9143824577331543, -1.7673767805099487, -1.6203711032867432, -1.4733654260635376, -1.326359748840332, -1.179354190826416, -1.0323485136032104, -0.8853428363800049, -0.7383372187614441, -0.5913316011428833, -0.44432640075683594, -0.29732075333595276, -0.15031510591506958, -0.0033094584941864014, 0.14369618892669678, 0.29070186614990234, 0.43770748376846313, 0.5847131013870239, 0.7317187786102295, 0.8787244558334351, 1.0257301330566406, 1.1727356910705566, 1.3197413682937622, 1.4667470455169678, 1.6137526035308838, 1.7607582807540894, 1.907763957977295, 2.054769515991211, 2.201775312423706, 2.348780870437622, 2.495786666870117, 2.642792224884033, 2.789797782897949, 2.9368033409118652, 3.0838091373443604, 3.2308146953582764, 3.3778204917907715, 3.5248260498046875, 3.6718316078186035, 3.8188374042510986, 3.9658429622650146, 4.11284875869751, 4.259854316711426]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 3.0, 16.0, 17.0, 41.0, 47.0, 62.0, 106.0, 188.0, 368.0, 724.0, 1593.0, 4365.0, 17276.0, 232017.0, 3456607.0, 445604.0, 25747.0, 5792.0, 1884.0, 868.0, 409.0, 223.0, 119.0, 74.0, 45.0, 32.0, 15.0, 19.0, 9.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4677734375, -0.4542503356933594, -0.44072723388671875, -0.4272041320800781, -0.4136810302734375, -0.4001579284667969, -0.38663482666015625, -0.3731117248535156, -0.359588623046875, -0.3460655212402344, -0.33254241943359375, -0.3190193176269531, -0.3054962158203125, -0.2919731140136719, -0.27845001220703125, -0.2649269104003906, -0.25140380859375, -0.23788070678710938, -0.22435760498046875, -0.21083450317382812, -0.1973114013671875, -0.18378829956054688, -0.17026519775390625, -0.15674209594726562, -0.143218994140625, -0.12969589233398438, -0.11617279052734375, -0.10264968872070312, -0.0891265869140625, -0.07560348510742188, -0.06208038330078125, -0.048557281494140625, -0.0350341796875, -0.021511077880859375, -0.00798797607421875, 0.005535125732421875, 0.0190582275390625, 0.032581329345703125, 0.04610443115234375, 0.059627532958984375, 0.073150634765625, 0.08667373657226562, 0.10019683837890625, 0.11371994018554688, 0.1272430419921875, 0.14076614379882812, 0.15428924560546875, 0.16781234741210938, 0.18133544921875, 0.19485855102539062, 0.20838165283203125, 0.22190475463867188, 0.2354278564453125, 0.24895095825195312, 0.26247406005859375, 0.2759971618652344, 0.289520263671875, 0.3030433654785156, 0.31656646728515625, 0.3300895690917969, 0.3436126708984375, 0.3571357727050781, 0.37065887451171875, 0.3841819763183594, 0.397705078125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 2.0, 8.0, 4.0, 10.0, 7.0, 8.0, 12.0, 18.0, 15.0, 21.0, 27.0, 30.0, 53.0, 48.0, 41.0, 42.0, 54.0, 56.0, 54.0, 54.0, 48.0, 49.0, 34.0, 52.0, 47.0, 31.0, 37.0, 23.0, 33.0, 18.0, 11.0, 14.0, 12.0, 8.0, 9.0, 10.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2578125, -0.24920654296875, -0.2406005859375, -0.23199462890625, -0.223388671875, -0.21478271484375, -0.2061767578125, -0.19757080078125, -0.18896484375, -0.18035888671875, -0.1717529296875, -0.16314697265625, -0.154541015625, -0.14593505859375, -0.1373291015625, -0.12872314453125, -0.1201171875, -0.11151123046875, -0.1029052734375, -0.09429931640625, -0.085693359375, -0.07708740234375, -0.0684814453125, -0.05987548828125, -0.05126953125, -0.04266357421875, -0.0340576171875, -0.02545166015625, -0.016845703125, -0.00823974609375, 0.0003662109375, 0.00897216796875, 0.017578125, 0.02618408203125, 0.0347900390625, 0.04339599609375, 0.052001953125, 0.06060791015625, 0.0692138671875, 0.07781982421875, 0.08642578125, 0.09503173828125, 0.1036376953125, 0.11224365234375, 0.120849609375, 0.12945556640625, 0.1380615234375, 0.14666748046875, 0.1552734375, 0.16387939453125, 0.1724853515625, 0.18109130859375, 0.189697265625, 0.19830322265625, 0.2069091796875, 0.21551513671875, 0.22412109375, 0.23272705078125, 0.2413330078125, 0.24993896484375, 0.258544921875, 0.26715087890625, 0.2757568359375, 0.28436279296875, 0.29296875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 8.0, 21.0, 26.0, 31.0, 39.0, 59.0, 107.0, 163.0, 301.0, 583.0, 1341.0, 3933.0, 15875.0, 96728.0, 3334394.0, 682698.0, 44435.0, 8898.0, 2584.0, 1008.0, 470.0, 221.0, 123.0, 74.0, 45.0, 25.0, 22.0, 21.0, 13.0, 7.0, 8.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41455078125, -0.40064239501953125, -0.3867340087890625, -0.37282562255859375, -0.358917236328125, -0.34500885009765625, -0.3311004638671875, -0.31719207763671875, -0.30328369140625, -0.28937530517578125, -0.2754669189453125, -0.26155853271484375, -0.247650146484375, -0.23374176025390625, -0.2198333740234375, -0.20592498779296875, -0.1920166015625, -0.17810821533203125, -0.1641998291015625, -0.15029144287109375, -0.136383056640625, -0.12247467041015625, -0.1085662841796875, -0.09465789794921875, -0.08074951171875, -0.06684112548828125, -0.0529327392578125, -0.03902435302734375, -0.025115966796875, -0.01120758056640625, 0.0027008056640625, 0.01660919189453125, 0.030517578125, 0.04442596435546875, 0.0583343505859375, 0.07224273681640625, 0.086151123046875, 0.10005950927734375, 0.1139678955078125, 0.12787628173828125, 0.14178466796875, 0.15569305419921875, 0.1696014404296875, 0.18350982666015625, 0.197418212890625, 0.21132659912109375, 0.2252349853515625, 0.23914337158203125, 0.2530517578125, 0.26696014404296875, 0.2808685302734375, 0.29477691650390625, 0.308685302734375, 0.32259368896484375, 0.3365020751953125, 0.35041046142578125, 0.36431884765625, 0.37822723388671875, 0.3921356201171875, 0.40604400634765625, 0.419952392578125, 0.43386077880859375, 0.4477691650390625, 0.46167755126953125, 0.4755859375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 4.0, 2.0, 7.0, 7.0, 10.0, 14.0, 27.0, 38.0, 43.0, 73.0, 122.0, 254.0, 677.0, 1209.0, 830.0, 332.0, 141.0, 86.0, 54.0, 43.0, 36.0, 13.0, 20.0, 12.0, 5.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.61328125, -0.5956039428710938, -0.5779266357421875, -0.5602493286132812, -0.542572021484375, -0.5248947143554688, -0.5072174072265625, -0.48954010009765625, -0.47186279296875, -0.45418548583984375, -0.4365081787109375, -0.41883087158203125, -0.401153564453125, -0.38347625732421875, -0.3657989501953125, -0.34812164306640625, -0.3304443359375, -0.31276702880859375, -0.2950897216796875, -0.27741241455078125, -0.259735107421875, -0.24205780029296875, -0.2243804931640625, -0.20670318603515625, -0.18902587890625, -0.17134857177734375, -0.1536712646484375, -0.13599395751953125, -0.118316650390625, -0.10063934326171875, -0.0829620361328125, -0.06528472900390625, -0.047607421875, -0.02993011474609375, -0.0122528076171875, 0.00542449951171875, 0.023101806640625, 0.04077911376953125, 0.0584564208984375, 0.07613372802734375, 0.09381103515625, 0.11148834228515625, 0.1291656494140625, 0.14684295654296875, 0.164520263671875, 0.18219757080078125, 0.1998748779296875, 0.21755218505859375, 0.2352294921875, 0.25290679931640625, 0.2705841064453125, 0.28826141357421875, 0.305938720703125, 0.32361602783203125, 0.3412933349609375, 0.35897064208984375, 0.37664794921875, 0.39432525634765625, 0.4120025634765625, 0.42967987060546875, 0.447357177734375, 0.46503448486328125, 0.4827117919921875, 0.5003890991210938, 0.51806640625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 1.0, 3.0, 1.0, 6.0, 16.0, 33.0, 98.0, 187.0, 220.0, 235.0, 111.0, 42.0, 15.0, 8.0, 7.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.7039122581481934, -3.5741631984710693, -3.4444143772125244, -3.3146653175354004, -3.1849164962768555, -3.0551674365997314, -2.9254183769226074, -2.7956695556640625, -2.6659204959869385, -2.5361714363098145, -2.4064226150512695, -2.2766735553741455, -2.1469244956970215, -2.0171756744384766, -1.8874266147613525, -1.757677674293518, -1.6279287338256836, -1.4981797933578491, -1.3684308528900146, -1.2386817932128906, -1.1089328527450562, -0.9791839122772217, -0.8494349122047424, -0.7196859121322632, -0.5899369716644287, -0.46018800139427185, -0.330439031124115, -0.20069006085395813, -0.07094109058380127, 0.0588078498840332, 0.18855684995651245, 0.3183058500289917, 0.44805431365966797, 0.5778032541275024, 0.7075522541999817, 0.8373012542724609, 0.9670501947402954, 1.0967991352081299, 1.226548194885254, 1.3562971353530884, 1.4860460758209229, 1.6157950162887573, 1.7455439567565918, 1.8752930164337158, 2.00504207611084, 2.1347908973693848, 2.264539957046509, 2.394289016723633, 2.5240378379821777, 2.6537868976593018, 2.7835357189178467, 2.9132847785949707, 3.0430335998535156, 3.1727826595306396, 3.3025317192077637, 3.4322805404663086, 3.5620296001434326, 3.6917786598205566, 3.8215274810791016, 3.9512765407562256, 4.08102560043335, 4.2107744216918945, 4.3405232429504395, 4.470272541046143, 4.6000213623046875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 5.0, 2.0, 6.0, 11.0, 12.0, 24.0, 19.0, 29.0, 27.0, 30.0, 39.0, 39.0, 45.0, 65.0, 64.0, 56.0, 58.0, 59.0, 59.0, 55.0, 46.0, 58.0, 44.0, 29.0, 25.0, 26.0, 21.0, 12.0, 11.0, 4.0, 8.0, 2.0, 11.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8198716640472412, -1.7408299446105957, -1.6617882251739502, -1.5827466249465942, -1.5037049055099487, -1.4246631860733032, -1.3456215858459473, -1.2665798664093018, -1.1875381469726562, -1.1084964275360107, -1.0294547080993652, -0.9504131078720093, -0.8713713884353638, -0.7923296689987183, -0.7132880091667175, -0.6342463493347168, -0.5552046298980713, -0.47616294026374817, -0.39712125062942505, -0.31807956099510193, -0.2390378713607788, -0.1599961817264557, -0.08095449209213257, -0.001912832260131836, 0.07712888717651367, 0.1561705768108368, 0.2352122664451599, 0.31425395607948303, 0.39329564571380615, 0.4723373353481293, 0.5513790249824524, 0.6304206848144531, 0.7094626426696777, 0.7885043621063232, 0.867546021938324, 0.9465876817703247, 1.0256294012069702, 1.1046711206436157, 1.1837127208709717, 1.2627544403076172, 1.3417961597442627, 1.4208378791809082, 1.4998795986175537, 1.5789211988449097, 1.6579629182815552, 1.7370046377182007, 1.8160462379455566, 1.8950879573822021, 1.9741296768188477, 2.053171396255493, 2.1322131156921387, 2.211254835128784, 2.2902965545654297, 2.369338035583496, 2.4483797550201416, 2.527421474456787, 2.6064631938934326, 2.685504913330078, 2.7645466327667236, 2.843588352203369, 2.9226298332214355, 3.001671552658081, 3.0807132720947266, 3.159754991531372, 3.2387967109680176]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 5.0, 8.0, 7.0, 23.0, 24.0, 40.0, 59.0, 75.0, 150.0, 246.0, 326.0, 664.0, 1112.0, 2051.0, 3969.0, 7979.0, 16053.0, 34439.0, 74984.0, 159115.0, 276252.0, 239778.0, 122667.0, 56494.0, 26253.0, 12378.0, 6140.0, 3244.0, 1716.0, 929.0, 525.0, 314.0, 187.0, 108.0, 78.0, 52.0, 32.0, 23.0, 17.0, 15.0, 8.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.20849609375, -0.20194435119628906, -0.19539260864257812, -0.1888408660888672, -0.18228912353515625, -0.1757373809814453, -0.16918563842773438, -0.16263389587402344, -0.1560821533203125, -0.14953041076660156, -0.14297866821289062, -0.1364269256591797, -0.12987518310546875, -0.12332344055175781, -0.11677169799804688, -0.11021995544433594, -0.103668212890625, -0.09711647033691406, -0.09056472778320312, -0.08401298522949219, -0.07746124267578125, -0.07090950012207031, -0.06435775756835938, -0.05780601501464844, -0.0512542724609375, -0.04470252990722656, -0.038150787353515625, -0.03159904479980469, -0.02504730224609375, -0.018495559692382812, -0.011943817138671875, -0.0053920745849609375, 0.00115966796875, 0.0077114105224609375, 0.014263153076171875, 0.020814895629882812, 0.02736663818359375, 0.03391838073730469, 0.040470123291015625, 0.04702186584472656, 0.0535736083984375, 0.06012535095214844, 0.06667709350585938, 0.07322883605957031, 0.07978057861328125, 0.08633232116699219, 0.09288406372070312, 0.09943580627441406, 0.105987548828125, 0.11253929138183594, 0.11909103393554688, 0.1256427764892578, 0.13219451904296875, 0.1387462615966797, 0.14529800415039062, 0.15184974670410156, 0.1584014892578125, 0.16495323181152344, 0.17150497436523438, 0.1780567169189453, 0.18460845947265625, 0.1911602020263672, 0.19771194458007812, 0.20426368713378906, 0.2108154296875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 7.0, 7.0, 14.0, 7.0, 12.0, 20.0, 19.0, 18.0, 35.0, 48.0, 36.0, 47.0, 49.0, 52.0, 47.0, 50.0, 54.0, 70.0, 46.0, 55.0, 50.0, 42.0, 39.0, 30.0, 33.0, 23.0, 20.0, 17.0, 14.0, 9.0, 10.0, 7.0, 7.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2646484375, -0.2559623718261719, -0.24727630615234375, -0.23859024047851562, -0.2299041748046875, -0.22121810913085938, -0.21253204345703125, -0.20384597778320312, -0.195159912109375, -0.18647384643554688, -0.17778778076171875, -0.16910171508789062, -0.1604156494140625, -0.15172958374023438, -0.14304351806640625, -0.13435745239257812, -0.12567138671875, -0.11698532104492188, -0.10829925537109375, -0.09961318969726562, -0.0909271240234375, -0.08224105834960938, -0.07355499267578125, -0.06486892700195312, -0.056182861328125, -0.047496795654296875, -0.03881072998046875, -0.030124664306640625, -0.0214385986328125, -0.012752532958984375, -0.00406646728515625, 0.004619598388671875, 0.0133056640625, 0.021991729736328125, 0.03067779541015625, 0.039363861083984375, 0.0480499267578125, 0.056735992431640625, 0.06542205810546875, 0.07410812377929688, 0.082794189453125, 0.09148025512695312, 0.10016632080078125, 0.10885238647460938, 0.1175384521484375, 0.12622451782226562, 0.13491058349609375, 0.14359664916992188, 0.15228271484375, 0.16096878051757812, 0.16965484619140625, 0.17834091186523438, 0.1870269775390625, 0.19571304321289062, 0.20439910888671875, 0.21308517456054688, 0.221771240234375, 0.23045730590820312, 0.23914337158203125, 0.24782943725585938, 0.2565155029296875, 0.2652015686035156, 0.27388763427734375, 0.2825736999511719, 0.291259765625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 8.0, 12.0, 10.0, 21.0, 20.0, 33.0, 37.0, 61.0, 83.0, 101.0, 148.0, 206.0, 239.0, 432.0, 658.0, 1185.0, 3232.0, 18517.0, 479331.0, 518689.0, 18991.0, 3231.0, 1220.0, 595.0, 447.0, 294.0, 188.0, 160.0, 108.0, 90.0, 66.0, 37.0, 28.0, 21.0, 23.0, 15.0, 8.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.72314453125, -0.698211669921875, -0.67327880859375, -0.648345947265625, -0.6234130859375, -0.598480224609375, -0.57354736328125, -0.548614501953125, -0.523681640625, -0.498748779296875, -0.47381591796875, -0.448883056640625, -0.4239501953125, -0.399017333984375, -0.37408447265625, -0.349151611328125, -0.32421875, -0.299285888671875, -0.27435302734375, -0.249420166015625, -0.2244873046875, -0.199554443359375, -0.17462158203125, -0.149688720703125, -0.124755859375, -0.099822998046875, -0.07489013671875, -0.049957275390625, -0.0250244140625, -9.1552734375e-05, 0.02484130859375, 0.049774169921875, 0.07470703125, 0.099639892578125, 0.12457275390625, 0.149505615234375, 0.1744384765625, 0.199371337890625, 0.22430419921875, 0.249237060546875, 0.274169921875, 0.299102783203125, 0.32403564453125, 0.348968505859375, 0.3739013671875, 0.398834228515625, 0.42376708984375, 0.448699951171875, 0.4736328125, 0.498565673828125, 0.52349853515625, 0.548431396484375, 0.5733642578125, 0.598297119140625, 0.62322998046875, 0.648162841796875, 0.673095703125, 0.698028564453125, 0.72296142578125, 0.747894287109375, 0.7728271484375, 0.797760009765625, 0.82269287109375, 0.847625732421875, 0.87255859375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 10.0, 3.0, 5.0, 10.0, 14.0, 13.0, 22.0, 16.0, 21.0, 33.0, 33.0, 56.0, 45.0, 59.0, 42.0, 65.0, 44.0, 58.0, 48.0, 61.0, 52.0, 55.0, 39.0, 37.0, 28.0, 36.0, 27.0, 20.0, 10.0, 11.0, 11.0, 10.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98095703125, -0.9457473754882812, -0.9105377197265625, -0.8753280639648438, -0.840118408203125, -0.8049087524414062, -0.7696990966796875, -0.7344894409179688, -0.69927978515625, -0.6640701293945312, -0.6288604736328125, -0.5936508178710938, -0.558441162109375, -0.5232315063476562, -0.4880218505859375, -0.45281219482421875, -0.4176025390625, -0.38239288330078125, -0.3471832275390625, -0.31197357177734375, -0.276763916015625, -0.24155426025390625, -0.2063446044921875, -0.17113494873046875, -0.13592529296875, -0.10071563720703125, -0.0655059814453125, -0.03029632568359375, 0.004913330078125, 0.04012298583984375, 0.0753326416015625, 0.11054229736328125, 0.145751953125, 0.18096160888671875, 0.2161712646484375, 0.25138092041015625, 0.286590576171875, 0.32180023193359375, 0.3570098876953125, 0.39221954345703125, 0.42742919921875, 0.46263885498046875, 0.4978485107421875, 0.5330581665039062, 0.568267822265625, 0.6034774780273438, 0.6386871337890625, 0.6738967895507812, 0.7091064453125, 0.7443161010742188, 0.7795257568359375, 0.8147354125976562, 0.849945068359375, 0.8851547241210938, 0.9203643798828125, 0.9555740356445312, 0.99078369140625, 1.0259933471679688, 1.0612030029296875, 1.0964126586914062, 1.131622314453125, 1.1668319702148438, 1.2020416259765625, 1.2372512817382812, 1.2724609375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 3.0, 4.0, 12.0, 21.0, 45.0, 76.0, 147.0, 314.0, 928.0, 3538.0, 25962.0, 826766.0, 177600.0, 10140.0, 1924.0, 586.0, 227.0, 115.0, 66.0, 31.0, 15.0, 11.0, 13.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3134765625, -0.30446624755859375, -0.2954559326171875, -0.28644561767578125, -0.277435302734375, -0.26842498779296875, -0.2594146728515625, -0.25040435791015625, -0.24139404296875, -0.23238372802734375, -0.2233734130859375, -0.21436309814453125, -0.205352783203125, -0.19634246826171875, -0.1873321533203125, -0.17832183837890625, -0.1693115234375, -0.16030120849609375, -0.1512908935546875, -0.14228057861328125, -0.133270263671875, -0.12425994873046875, -0.1152496337890625, -0.10623931884765625, -0.09722900390625, -0.08821868896484375, -0.0792083740234375, -0.07019805908203125, -0.061187744140625, -0.05217742919921875, -0.0431671142578125, -0.03415679931640625, -0.025146484375, -0.01613616943359375, -0.0071258544921875, 0.00188446044921875, 0.010894775390625, 0.01990509033203125, 0.0289154052734375, 0.03792572021484375, 0.04693603515625, 0.05594635009765625, 0.0649566650390625, 0.07396697998046875, 0.082977294921875, 0.09198760986328125, 0.1009979248046875, 0.11000823974609375, 0.1190185546875, 0.12802886962890625, 0.1370391845703125, 0.14604949951171875, 0.155059814453125, 0.16407012939453125, 0.1730804443359375, 0.18209075927734375, 0.19110107421875, 0.20011138916015625, 0.2091217041015625, 0.21813201904296875, 0.227142333984375, 0.23615264892578125, 0.2451629638671875, 0.25417327880859375, 0.26318359375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 7.0, 3.0, 2.0, 5.0, 8.0, 6.0, 9.0, 11.0, 15.0, 18.0, 28.0, 24.0, 28.0, 39.0, 57.0, 71.0, 108.0, 108.0, 97.0, 75.0, 63.0, 50.0, 33.0, 24.0, 21.0, 12.0, 13.0, 13.0, 13.0, 7.0, 8.0, 5.0, 4.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.449222564697266e-05, -6.256252527236938e-05, -6.063282489776611e-05, -5.870312452316284e-05, -5.677342414855957e-05, -5.48437237739563e-05, -5.291402339935303e-05, -5.0984323024749756e-05, -4.9054622650146484e-05, -4.712492227554321e-05, -4.519522190093994e-05, -4.326552152633667e-05, -4.13358211517334e-05, -3.940612077713013e-05, -3.7476420402526855e-05, -3.5546720027923584e-05, -3.361701965332031e-05, -3.168731927871704e-05, -2.975761890411377e-05, -2.7827918529510498e-05, -2.5898218154907227e-05, -2.3968517780303955e-05, -2.2038817405700684e-05, -2.0109117031097412e-05, -1.817941665649414e-05, -1.624971628189087e-05, -1.4320015907287598e-05, -1.2390315532684326e-05, -1.0460615158081055e-05, -8.530914783477783e-06, -6.601214408874512e-06, -4.67151403427124e-06, -2.7418136596679688e-06, -8.121132850646973e-07, 1.1175870895385742e-06, 3.0472874641418457e-06, 4.976987838745117e-06, 6.906688213348389e-06, 8.83638858795166e-06, 1.0766088962554932e-05, 1.2695789337158203e-05, 1.4625489711761475e-05, 1.6555190086364746e-05, 1.8484890460968018e-05, 2.041459083557129e-05, 2.234429121017456e-05, 2.4273991584777832e-05, 2.6203691959381104e-05, 2.8133392333984375e-05, 3.0063092708587646e-05, 3.199279308319092e-05, 3.392249345779419e-05, 3.585219383239746e-05, 3.778189420700073e-05, 3.9711594581604004e-05, 4.1641294956207275e-05, 4.357099533081055e-05, 4.550069570541382e-05, 4.743039608001709e-05, 4.936009645462036e-05, 5.128979682922363e-05, 5.3219497203826904e-05, 5.5149197578430176e-05, 5.707889795303345e-05, 5.900859832763672e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 10.0, 7.0, 12.0, 27.0, 39.0, 78.0, 116.0, 222.0, 557.0, 1529.0, 6044.0, 44924.0, 859394.0, 121037.0, 10948.0, 2238.0, 730.0, 311.0, 166.0, 81.0, 29.0, 28.0, 16.0, 9.0, 8.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.222900390625, -0.21484375, -0.206787109375, -0.19873046875, -0.190673828125, -0.1826171875, -0.174560546875, -0.16650390625, -0.158447265625, -0.150390625, -0.142333984375, -0.13427734375, -0.126220703125, -0.1181640625, -0.110107421875, -0.10205078125, -0.093994140625, -0.0859375, -0.077880859375, -0.06982421875, -0.061767578125, -0.0537109375, -0.045654296875, -0.03759765625, -0.029541015625, -0.021484375, -0.013427734375, -0.00537109375, 0.002685546875, 0.0107421875, 0.018798828125, 0.02685546875, 0.034912109375, 0.04296875, 0.051025390625, 0.05908203125, 0.067138671875, 0.0751953125, 0.083251953125, 0.09130859375, 0.099365234375, 0.107421875, 0.115478515625, 0.12353515625, 0.131591796875, 0.1396484375, 0.147705078125, 0.15576171875, 0.163818359375, 0.171875, 0.179931640625, 0.18798828125, 0.196044921875, 0.2041015625, 0.212158203125, 0.22021484375, 0.228271484375, 0.236328125, 0.244384765625, 0.25244140625, 0.260498046875, 0.2685546875, 0.276611328125, 0.28466796875, 0.292724609375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 3.0, 5.0, 6.0, 10.0, 10.0, 16.0, 18.0, 26.0, 17.0, 36.0, 48.0, 45.0, 55.0, 66.0, 67.0, 83.0, 77.0, 57.0, 70.0, 44.0, 36.0, 36.0, 29.0, 27.0, 26.0, 14.0, 16.0, 14.0, 9.0, 5.0, 7.0, 5.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15673828125, -0.1522235870361328, -0.14770889282226562, -0.14319419860839844, -0.13867950439453125, -0.13416481018066406, -0.12965011596679688, -0.1251354217529297, -0.1206207275390625, -0.11610603332519531, -0.11159133911132812, -0.10707664489746094, -0.10256195068359375, -0.09804725646972656, -0.09353256225585938, -0.08901786804199219, -0.084503173828125, -0.07998847961425781, -0.07547378540039062, -0.07095909118652344, -0.06644439697265625, -0.06192970275878906, -0.057415008544921875, -0.05290031433105469, -0.0483856201171875, -0.04387092590332031, -0.039356231689453125, -0.03484153747558594, -0.03032684326171875, -0.025812149047851562, -0.021297454833984375, -0.016782760620117188, -0.01226806640625, -0.0077533721923828125, -0.003238677978515625, 0.0012760162353515625, 0.00579071044921875, 0.010305404663085938, 0.014820098876953125, 0.019334793090820312, 0.0238494873046875, 0.028364181518554688, 0.032878875732421875, 0.03739356994628906, 0.04190826416015625, 0.04642295837402344, 0.050937652587890625, 0.05545234680175781, 0.059967041015625, 0.06448173522949219, 0.06899642944335938, 0.07351112365722656, 0.07802581787109375, 0.08254051208496094, 0.08705520629882812, 0.09156990051269531, 0.0960845947265625, 0.10059928894042969, 0.10511398315429688, 0.10962867736816406, 0.11414337158203125, 0.11865806579589844, 0.12317276000976562, 0.1276874542236328, 0.1322021484375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 6.0, 4.0, 8.0, 9.0, 9.0, 24.0, 36.0, 83.0, 175.0, 297.0, 178.0, 94.0, 38.0, 16.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.317379951477051, -5.1720967292785645, -5.026813507080078, -4.881530284881592, -4.7362470626831055, -4.590964317321777, -4.445681095123291, -4.300397872924805, -4.155114650726318, -4.009831428527832, -3.8645482063293457, -3.7192652225494385, -3.573982000350952, -3.428698778152466, -3.2834157943725586, -3.1381325721740723, -2.992849349975586, -2.8475661277770996, -2.7022829055786133, -2.556999921798706, -2.4117166996002197, -2.2664334774017334, -2.121150493621826, -1.9758672714233398, -1.8305840492248535, -1.6853008270263672, -1.5400177240371704, -1.3947346210479736, -1.2494513988494873, -1.104168176651001, -0.9588850736618042, -0.8136019706726074, -0.6683192253112793, -0.5230360627174377, -0.3777529001235962, -0.23246973752975464, -0.08718657493591309, 0.05809658765792847, 0.20337975025177002, 0.3486628532409668, 0.4939460754394531, 0.6392292380332947, 0.7845124006271362, 0.9297955632209778, 1.0750787258148193, 1.2203619480133057, 1.3656450510025024, 1.5109281539916992, 1.6562113761901855, 1.8014945983886719, 1.9467777013778687, 2.0920608043670654, 2.2373440265655518, 2.382627248764038, 2.5279102325439453, 2.6731934547424316, 2.818476676940918, 2.9637598991394043, 3.1090431213378906, 3.254326105117798, 3.399609327316284, 3.5448925495147705, 3.6901755332946777, 3.835458755493164, 3.9807419776916504]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 6.0, 7.0, 6.0, 8.0, 8.0, 12.0, 10.0, 8.0, 14.0, 14.0, 14.0, 17.0, 17.0, 17.0, 23.0, 27.0, 27.0, 22.0, 28.0, 49.0, 45.0, 63.0, 60.0, 61.0, 40.0, 46.0, 35.0, 35.0, 31.0, 37.0, 23.0, 24.0, 25.0, 19.0, 24.0, 17.0, 11.0, 12.0, 12.0, 9.0, 8.0, 9.0, 3.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 1.0, 3.0], "bins": [-2.8981740474700928, -2.8045549392700195, -2.7109358310699463, -2.617316722869873, -2.523697853088379, -2.4300787448883057, -2.3364596366882324, -2.242840528488159, -2.149221420288086, -2.0556023120880127, -1.961983323097229, -1.8683642148971558, -1.774745225906372, -1.6811261177062988, -1.5875070095062256, -1.4938879013061523, -1.4002690315246582, -1.306649923324585, -1.2130309343338013, -1.119411826133728, -1.0257928371429443, -0.9321737289428711, -0.8385546207427979, -0.7449355721473694, -0.6513165235519409, -0.5576974749565125, -0.4640783965587616, -0.37045931816101074, -0.2768402695655823, -0.1832212209701538, -0.08960211277008057, 0.0040169358253479, 0.09763622283935547, 0.19125528633594513, 0.2848743498325348, 0.37849342823028564, 0.4721124768257141, 0.5657315254211426, 0.6593506336212158, 0.7529696822166443, 0.8465887308120728, 0.9402077794075012, 1.0338268280029297, 1.127445936203003, 1.2210650444030762, 1.3146840333938599, 1.408303141593933, 1.5019221305847168, 1.59554123878479, 1.6891603469848633, 1.782779335975647, 1.8763984441757202, 1.970017433166504, 2.063636541366577, 2.1572556495666504, 2.2508747577667236, 2.344493865966797, 2.43811297416687, 2.5317320823669434, 2.6253509521484375, 2.7189700603485107, 2.812589168548584, 2.9062082767486572, 2.9998273849487305, 3.0934462547302246]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 9.0, 8.0, 8.0, 9.0, 17.0, 16.0, 25.0, 37.0, 46.0, 59.0, 76.0, 88.0, 123.0, 203.0, 266.0, 459.0, 759.0, 1453.0, 3203.0, 8427.0, 26571.0, 144425.0, 1106969.0, 2360965.0, 448352.0, 63736.0, 16395.0, 5931.0, 2562.0, 1164.0, 706.0, 341.0, 257.0, 161.0, 115.0, 84.0, 61.0, 46.0, 37.0, 28.0, 16.0, 19.0, 11.0, 12.0, 7.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2440185546875, -0.23690032958984375, -0.2297821044921875, -0.22266387939453125, -0.215545654296875, -0.20842742919921875, -0.2013092041015625, -0.19419097900390625, -0.18707275390625, -0.17995452880859375, -0.1728363037109375, -0.16571807861328125, -0.158599853515625, -0.15148162841796875, -0.1443634033203125, -0.13724517822265625, -0.130126953125, -0.12300872802734375, -0.1158905029296875, -0.10877227783203125, -0.101654052734375, -0.09453582763671875, -0.0874176025390625, -0.08029937744140625, -0.07318115234375, -0.06606292724609375, -0.0589447021484375, -0.05182647705078125, -0.044708251953125, -0.03759002685546875, -0.0304718017578125, -0.02335357666015625, -0.0162353515625, -0.00911712646484375, -0.0019989013671875, 0.00511932373046875, 0.012237548828125, 0.01935577392578125, 0.0264739990234375, 0.03359222412109375, 0.04071044921875, 0.04782867431640625, 0.0549468994140625, 0.06206512451171875, 0.069183349609375, 0.07630157470703125, 0.0834197998046875, 0.09053802490234375, 0.09765625, 0.10477447509765625, 0.1118927001953125, 0.11901092529296875, 0.126129150390625, 0.13324737548828125, 0.1403656005859375, 0.14748382568359375, 0.15460205078125, 0.16172027587890625, 0.1688385009765625, 0.17595672607421875, 0.183074951171875, 0.19019317626953125, 0.1973114013671875, 0.20442962646484375, 0.2115478515625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 15.0, 6.0, 16.0, 13.0, 16.0, 28.0, 30.0, 38.0, 38.0, 49.0, 53.0, 57.0, 73.0, 56.0, 54.0, 61.0, 60.0, 55.0, 49.0, 40.0, 49.0, 26.0, 26.0, 25.0, 15.0, 18.0, 8.0, 9.0, 6.0, 5.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2822265625, -0.2731895446777344, -0.26415252685546875, -0.2551155090332031, -0.2460784912109375, -0.23704147338867188, -0.22800445556640625, -0.21896743774414062, -0.209930419921875, -0.20089340209960938, -0.19185638427734375, -0.18281936645507812, -0.1737823486328125, -0.16474533081054688, -0.15570831298828125, -0.14667129516601562, -0.13763427734375, -0.12859725952148438, -0.11956024169921875, -0.11052322387695312, -0.1014862060546875, -0.09244918823242188, -0.08341217041015625, -0.07437515258789062, -0.065338134765625, -0.056301116943359375, -0.04726409912109375, -0.038227081298828125, -0.0291900634765625, -0.020153045654296875, -0.01111602783203125, -0.002079010009765625, 0.0069580078125, 0.015995025634765625, 0.02503204345703125, 0.034069061279296875, 0.0431060791015625, 0.052143096923828125, 0.06118011474609375, 0.07021713256835938, 0.079254150390625, 0.08829116821289062, 0.09732818603515625, 0.10636520385742188, 0.1154022216796875, 0.12443923950195312, 0.13347625732421875, 0.14251327514648438, 0.15155029296875, 0.16058731079101562, 0.16962432861328125, 0.17866134643554688, 0.1876983642578125, 0.19673538208007812, 0.20577239990234375, 0.21480941772460938, 0.223846435546875, 0.23288345336914062, 0.24192047119140625, 0.2509574890136719, 0.2599945068359375, 0.2690315246582031, 0.27806854248046875, 0.2871055603027344, 0.296142578125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 10.0, 5.0, 13.0, 22.0, 25.0, 32.0, 45.0, 100.0, 215.0, 400.0, 812.0, 1981.0, 6227.0, 29650.0, 387054.0, 3591285.0, 147931.0, 19799.0, 5183.0, 1851.0, 775.0, 384.0, 199.0, 100.0, 56.0, 43.0, 33.0, 15.0, 8.0, 9.0, 11.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33935546875, -0.3269500732421875, -0.314544677734375, -0.3021392822265625, -0.28973388671875, -0.2773284912109375, -0.264923095703125, -0.2525177001953125, -0.2401123046875, -0.2277069091796875, -0.215301513671875, -0.2028961181640625, -0.19049072265625, -0.1780853271484375, -0.165679931640625, -0.1532745361328125, -0.140869140625, -0.1284637451171875, -0.116058349609375, -0.1036529541015625, -0.09124755859375, -0.0788421630859375, -0.066436767578125, -0.0540313720703125, -0.0416259765625, -0.0292205810546875, -0.016815185546875, -0.0044097900390625, 0.00799560546875, 0.0204010009765625, 0.032806396484375, 0.0452117919921875, 0.0576171875, 0.0700225830078125, 0.082427978515625, 0.0948333740234375, 0.10723876953125, 0.1196441650390625, 0.132049560546875, 0.1444549560546875, 0.1568603515625, 0.1692657470703125, 0.181671142578125, 0.1940765380859375, 0.20648193359375, 0.2188873291015625, 0.231292724609375, 0.2436981201171875, 0.256103515625, 0.2685089111328125, 0.280914306640625, 0.2933197021484375, 0.30572509765625, 0.3181304931640625, 0.330535888671875, 0.3429412841796875, 0.3553466796875, 0.3677520751953125, 0.380157470703125, 0.3925628662109375, 0.40496826171875, 0.4173736572265625, 0.429779052734375, 0.4421844482421875, 0.45458984375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 6.0, 10.0, 8.0, 24.0, 28.0, 49.0, 122.0, 186.0, 400.0, 904.0, 1129.0, 644.0, 267.0, 114.0, 52.0, 31.0, 34.0, 19.0, 8.0, 9.0, 11.0, 1.0, 5.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5751953125, -0.557861328125, -0.54052734375, -0.523193359375, -0.505859375, -0.488525390625, -0.47119140625, -0.453857421875, -0.4365234375, -0.419189453125, -0.40185546875, -0.384521484375, -0.3671875, -0.349853515625, -0.33251953125, -0.315185546875, -0.2978515625, -0.280517578125, -0.26318359375, -0.245849609375, -0.228515625, -0.211181640625, -0.19384765625, -0.176513671875, -0.1591796875, -0.141845703125, -0.12451171875, -0.107177734375, -0.08984375, -0.072509765625, -0.05517578125, -0.037841796875, -0.0205078125, -0.003173828125, 0.01416015625, 0.031494140625, 0.048828125, 0.066162109375, 0.08349609375, 0.100830078125, 0.1181640625, 0.135498046875, 0.15283203125, 0.170166015625, 0.1875, 0.204833984375, 0.22216796875, 0.239501953125, 0.2568359375, 0.274169921875, 0.29150390625, 0.308837890625, 0.326171875, 0.343505859375, 0.36083984375, 0.378173828125, 0.3955078125, 0.412841796875, 0.43017578125, 0.447509765625, 0.46484375, 0.482177734375, 0.49951171875, 0.516845703125, 0.5341796875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 8.0, 12.0, 29.0, 75.0, 174.0, 209.0, 237.0, 126.0, 72.0, 23.0, 10.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.06421422958374, -4.9465765953063965, -4.828939437866211, -4.711301803588867, -4.593664169311523, -4.47602653503418, -4.358389377593994, -4.24075174331665, -4.123114585876465, -4.005476951599121, -3.8878395557403564, -3.770202159881592, -3.652564525604248, -3.5349271297454834, -3.4172897338867188, -3.299652099609375, -3.1820144653320312, -3.0643770694732666, -2.946739435195923, -2.829102039337158, -2.7114644050598145, -2.59382700920105, -2.476189613342285, -2.3585519790649414, -2.2409145832061768, -2.123277187347412, -2.0056395530700684, -1.8880021572113037, -1.7703646421432495, -1.6527271270751953, -1.5350897312164307, -1.4174522161483765, -1.2998147010803223, -1.182177186012268, -1.0645396709442139, -0.9469022750854492, -0.829264760017395, -0.7116272449493408, -0.5939897894859314, -0.476352334022522, -0.3587148189544678, -0.24107733368873596, -0.12343984842300415, -0.005802363157272339, 0.11183512210845947, 0.22947263717651367, 0.3471100926399231, 0.4647475481033325, 0.5823850631713867, 0.7000225782394409, 0.8176600337028503, 0.9352974891662598, 1.052935004234314, 1.1705725193023682, 1.2882099151611328, 1.405847430229187, 1.5234849452972412, 1.6411224603652954, 1.7587599754333496, 1.8763973712921143, 1.9940348863601685, 2.1116724014282227, 2.2293097972869873, 2.346947193145752, 2.4645848274230957]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 10.0, 8.0, 6.0, 7.0, 17.0, 17.0, 17.0, 24.0, 19.0, 26.0, 30.0, 44.0, 41.0, 42.0, 49.0, 59.0, 65.0, 49.0, 50.0, 45.0, 57.0, 43.0, 35.0, 44.0, 24.0, 25.0, 32.0, 22.0, 15.0, 15.0, 17.0, 10.0, 12.0, 8.0, 2.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.379817485809326, -2.3186392784118652, -2.257460832595825, -2.1962826251983643, -2.1351044178009033, -2.0739259719848633, -2.0127477645874023, -1.9515695571899414, -1.890391230583191, -1.8292129039764404, -1.7680346965789795, -1.706856369972229, -1.6456780433654785, -1.5844998359680176, -1.523321509361267, -1.4621431827545166, -1.4009649753570557, -1.3397866487503052, -1.2786084413528442, -1.2174301147460938, -1.1562519073486328, -1.0950735807418823, -1.0338952541351318, -0.9727169871330261, -0.9115387201309204, -0.8503604531288147, -0.789182186126709, -0.7280038595199585, -0.6668255925178528, -0.6056473255157471, -0.5444689989089966, -0.48329073190689087, -0.42211246490478516, -0.36093419790267944, -0.29975590109825134, -0.23857761919498444, -0.17739933729171753, -0.11622107028961182, -0.055042773485183716, 0.006135523319244385, 0.0673137903213501, 0.128492072224617, 0.1896703541278839, 0.250848650932312, 0.3120269179344177, 0.37320518493652344, 0.43438348174095154, 0.49556177854537964, 0.5567400455474854, 0.6179183125495911, 0.6790965795516968, 0.7402749061584473, 0.801453173160553, 0.8626314401626587, 0.9238097667694092, 0.9849880337715149, 1.0461663007736206, 1.107344627380371, 1.168522834777832, 1.2297011613845825, 1.290879487991333, 1.352057695388794, 1.4132360219955444, 1.474414348602295, 1.5355925559997559]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 4.0, 3.0, 4.0, 10.0, 6.0, 7.0, 16.0, 17.0, 26.0, 32.0, 49.0, 71.0, 106.0, 172.0, 260.0, 442.0, 768.0, 1274.0, 2436.0, 4524.0, 9545.0, 21436.0, 50927.0, 126314.0, 289853.0, 304704.0, 136278.0, 55075.0, 22973.0, 10237.0, 5043.0, 2573.0, 1398.0, 755.0, 456.0, 273.0, 169.0, 104.0, 63.0, 39.0, 24.0, 31.0, 18.0, 10.0, 11.0, 7.0, 10.0, 3.0, 4.0, 2.0, 1.0, 3.0], "bins": [-0.265869140625, -0.25869178771972656, -0.2515144348144531, -0.2443370819091797, -0.23715972900390625, -0.2299823760986328, -0.22280502319335938, -0.21562767028808594, -0.2084503173828125, -0.20127296447753906, -0.19409561157226562, -0.1869182586669922, -0.17974090576171875, -0.1725635528564453, -0.16538619995117188, -0.15820884704589844, -0.151031494140625, -0.14385414123535156, -0.13667678833007812, -0.1294994354248047, -0.12232208251953125, -0.11514472961425781, -0.10796737670898438, -0.10079002380371094, -0.0936126708984375, -0.08643531799316406, -0.07925796508789062, -0.07208061218261719, -0.06490325927734375, -0.05772590637207031, -0.050548553466796875, -0.04337120056152344, -0.03619384765625, -0.029016494750976562, -0.021839141845703125, -0.014661788940429688, -0.00748443603515625, -0.0003070831298828125, 0.006870269775390625, 0.014047622680664062, 0.0212249755859375, 0.028402328491210938, 0.035579681396484375, 0.04275703430175781, 0.04993438720703125, 0.05711174011230469, 0.06428909301757812, 0.07146644592285156, 0.078643798828125, 0.08582115173339844, 0.09299850463867188, 0.10017585754394531, 0.10735321044921875, 0.11453056335449219, 0.12170791625976562, 0.12888526916503906, 0.1360626220703125, 0.14323997497558594, 0.15041732788085938, 0.1575946807861328, 0.16477203369140625, 0.1719493865966797, 0.17912673950195312, 0.18630409240722656, 0.1934814453125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 13.0, 13.0, 17.0, 14.0, 29.0, 31.0, 29.0, 34.0, 52.0, 60.0, 61.0, 62.0, 59.0, 60.0, 54.0, 62.0, 47.0, 50.0, 60.0, 40.0, 35.0, 27.0, 20.0, 18.0, 15.0, 7.0, 8.0, 9.0, 8.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.268798828125, -0.2599372863769531, -0.25107574462890625, -0.24221420288085938, -0.2333526611328125, -0.22449111938476562, -0.21562957763671875, -0.20676803588867188, -0.197906494140625, -0.18904495239257812, -0.18018341064453125, -0.17132186889648438, -0.1624603271484375, -0.15359878540039062, -0.14473724365234375, -0.13587570190429688, -0.12701416015625, -0.11815261840820312, -0.10929107666015625, -0.10042953491210938, -0.0915679931640625, -0.08270645141601562, -0.07384490966796875, -0.06498336791992188, -0.056121826171875, -0.047260284423828125, -0.03839874267578125, -0.029537200927734375, -0.0206756591796875, -0.011814117431640625, -0.00295257568359375, 0.005908966064453125, 0.0147705078125, 0.023632049560546875, 0.03249359130859375, 0.041355133056640625, 0.0502166748046875, 0.059078216552734375, 0.06793975830078125, 0.07680130004882812, 0.085662841796875, 0.09452438354492188, 0.10338592529296875, 0.11224746704101562, 0.1211090087890625, 0.12997055053710938, 0.13883209228515625, 0.14769363403320312, 0.15655517578125, 0.16541671752929688, 0.17427825927734375, 0.18313980102539062, 0.1920013427734375, 0.20086288452148438, 0.20972442626953125, 0.21858596801757812, 0.227447509765625, 0.23630905151367188, 0.24517059326171875, 0.2540321350097656, 0.2628936767578125, 0.2717552185058594, 0.28061676025390625, 0.2894783020019531, 0.29833984375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 4.0, 1.0, 8.0, 8.0, 9.0, 21.0, 22.0, 28.0, 45.0, 50.0, 58.0, 109.0, 143.0, 192.0, 242.0, 327.0, 518.0, 875.0, 1711.0, 4832.0, 31766.0, 648754.0, 329762.0, 20877.0, 4085.0, 1525.0, 769.0, 470.0, 348.0, 270.0, 175.0, 141.0, 114.0, 89.0, 61.0, 35.0, 34.0, 21.0, 17.0, 5.0, 10.0, 7.0, 9.0, 6.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5947265625, -0.57415771484375, -0.5535888671875, -0.53302001953125, -0.512451171875, -0.49188232421875, -0.4713134765625, -0.45074462890625, -0.43017578125, -0.40960693359375, -0.3890380859375, -0.36846923828125, -0.347900390625, -0.32733154296875, -0.3067626953125, -0.28619384765625, -0.265625, -0.24505615234375, -0.2244873046875, -0.20391845703125, -0.183349609375, -0.16278076171875, -0.1422119140625, -0.12164306640625, -0.10107421875, -0.08050537109375, -0.0599365234375, -0.03936767578125, -0.018798828125, 0.00177001953125, 0.0223388671875, 0.04290771484375, 0.0634765625, 0.08404541015625, 0.1046142578125, 0.12518310546875, 0.145751953125, 0.16632080078125, 0.1868896484375, 0.20745849609375, 0.22802734375, 0.24859619140625, 0.2691650390625, 0.28973388671875, 0.310302734375, 0.33087158203125, 0.3514404296875, 0.37200927734375, 0.392578125, 0.41314697265625, 0.4337158203125, 0.45428466796875, 0.474853515625, 0.49542236328125, 0.5159912109375, 0.53656005859375, 0.55712890625, 0.57769775390625, 0.5982666015625, 0.61883544921875, 0.639404296875, 0.65997314453125, 0.6805419921875, 0.70111083984375, 0.7216796875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 7.0, 6.0, 7.0, 13.0, 12.0, 18.0, 10.0, 16.0, 26.0, 30.0, 30.0, 36.0, 38.0, 33.0, 57.0, 44.0, 58.0, 60.0, 49.0, 50.0, 52.0, 47.0, 40.0, 37.0, 33.0, 31.0, 29.0, 25.0, 27.0, 23.0, 22.0, 10.0, 6.0, 5.0, 7.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70166015625, -0.67529296875, -0.64892578125, -0.62255859375, -0.59619140625, -0.56982421875, -0.54345703125, -0.51708984375, -0.49072265625, -0.46435546875, -0.43798828125, -0.41162109375, -0.38525390625, -0.35888671875, -0.33251953125, -0.30615234375, -0.27978515625, -0.25341796875, -0.22705078125, -0.20068359375, -0.17431640625, -0.14794921875, -0.12158203125, -0.09521484375, -0.06884765625, -0.04248046875, -0.01611328125, 0.01025390625, 0.03662109375, 0.06298828125, 0.08935546875, 0.11572265625, 0.14208984375, 0.16845703125, 0.19482421875, 0.22119140625, 0.24755859375, 0.27392578125, 0.30029296875, 0.32666015625, 0.35302734375, 0.37939453125, 0.40576171875, 0.43212890625, 0.45849609375, 0.48486328125, 0.51123046875, 0.53759765625, 0.56396484375, 0.59033203125, 0.61669921875, 0.64306640625, 0.66943359375, 0.69580078125, 0.72216796875, 0.74853515625, 0.77490234375, 0.80126953125, 0.82763671875, 0.85400390625, 0.88037109375, 0.90673828125, 0.93310546875, 0.95947265625, 0.98583984375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 7.0, 5.0, 8.0, 10.0, 13.0, 19.0, 22.0, 45.0, 78.0, 154.0, 364.0, 1106.0, 7554.0, 181899.0, 828228.0, 25593.0, 2389.0, 557.0, 229.0, 91.0, 56.0, 35.0, 26.0, 23.0, 16.0, 4.0, 7.0, 7.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.246826171875, -0.23865890502929688, -0.23049163818359375, -0.22232437133789062, -0.2141571044921875, -0.20598983764648438, -0.19782257080078125, -0.18965530395507812, -0.181488037109375, -0.17332077026367188, -0.16515350341796875, -0.15698623657226562, -0.1488189697265625, -0.14065170288085938, -0.13248443603515625, -0.12431716918945312, -0.11614990234375, -0.10798263549804688, -0.09981536865234375, -0.09164810180664062, -0.0834808349609375, -0.07531356811523438, -0.06714630126953125, -0.058979034423828125, -0.050811767578125, -0.042644500732421875, -0.03447723388671875, -0.026309967041015625, -0.0181427001953125, -0.009975433349609375, -0.00180816650390625, 0.006359100341796875, 0.0145263671875, 0.022693634033203125, 0.03086090087890625, 0.039028167724609375, 0.0471954345703125, 0.055362701416015625, 0.06352996826171875, 0.07169723510742188, 0.079864501953125, 0.08803176879882812, 0.09619903564453125, 0.10436630249023438, 0.1125335693359375, 0.12070083618164062, 0.12886810302734375, 0.13703536987304688, 0.14520263671875, 0.15336990356445312, 0.16153717041015625, 0.16970443725585938, 0.1778717041015625, 0.18603897094726562, 0.19420623779296875, 0.20237350463867188, 0.210540771484375, 0.21870803833007812, 0.22687530517578125, 0.23504257202148438, 0.2432098388671875, 0.2513771057128906, 0.25954437255859375, 0.2677116394042969, 0.27587890625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 2.0, 7.0, 4.0, 5.0, 7.0, 9.0, 5.0, 12.0, 15.0, 18.0, 31.0, 43.0, 52.0, 70.0, 105.0, 131.0, 117.0, 86.0, 88.0, 41.0, 34.0, 27.0, 19.0, 8.0, 6.0, 17.0, 10.0, 4.0, 7.0, 6.0, 4.0, 0.0, 1.0, 5.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.687641143798828e-05, -6.476230919361115e-05, -6.264820694923401e-05, -6.053410470485687e-05, -5.8420002460479736e-05, -5.63059002161026e-05, -5.4191797971725464e-05, -5.207769572734833e-05, -4.996359348297119e-05, -4.7849491238594055e-05, -4.573538899421692e-05, -4.362128674983978e-05, -4.1507184505462646e-05, -3.939308226108551e-05, -3.7278980016708374e-05, -3.516487777233124e-05, -3.30507755279541e-05, -3.0936673283576965e-05, -2.882257103919983e-05, -2.6708468794822693e-05, -2.4594366550445557e-05, -2.248026430606842e-05, -2.0366162061691284e-05, -1.8252059817314148e-05, -1.6137957572937012e-05, -1.4023855328559875e-05, -1.190975308418274e-05, -9.795650839805603e-06, -7.681548595428467e-06, -5.5674463510513306e-06, -3.4533441066741943e-06, -1.339241862297058e-06, 7.748603820800781e-07, 2.8889626264572144e-06, 5.003064870834351e-06, 7.117167115211487e-06, 9.231269359588623e-06, 1.134537160396576e-05, 1.3459473848342896e-05, 1.5573576092720032e-05, 1.7687678337097168e-05, 1.9801780581474304e-05, 2.191588282585144e-05, 2.4029985070228577e-05, 2.6144087314605713e-05, 2.825818955898285e-05, 3.0372291803359985e-05, 3.248639404773712e-05, 3.460049629211426e-05, 3.6714598536491394e-05, 3.882870078086853e-05, 4.0942803025245667e-05, 4.30569052696228e-05, 4.517100751399994e-05, 4.7285109758377075e-05, 4.939921200275421e-05, 5.151331424713135e-05, 5.3627416491508484e-05, 5.574151873588562e-05, 5.7855620980262756e-05, 5.996972322463989e-05, 6.208382546901703e-05, 6.419792771339417e-05, 6.63120299577713e-05, 6.842613220214844e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 4.0, 6.0, 8.0, 11.0, 23.0, 20.0, 48.0, 63.0, 132.0, 206.0, 334.0, 639.0, 1481.0, 4523.0, 23280.0, 226260.0, 714068.0, 63876.0, 9161.0, 2370.0, 962.0, 458.0, 216.0, 149.0, 92.0, 50.0, 43.0, 23.0, 18.0, 12.0, 6.0, 3.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1873779296875, -0.1824779510498047, -0.17757797241210938, -0.17267799377441406, -0.16777801513671875, -0.16287803649902344, -0.15797805786132812, -0.1530780792236328, -0.1481781005859375, -0.1432781219482422, -0.13837814331054688, -0.13347816467285156, -0.12857818603515625, -0.12367820739746094, -0.11877822875976562, -0.11387825012207031, -0.108978271484375, -0.10407829284667969, -0.09917831420898438, -0.09427833557128906, -0.08937835693359375, -0.08447837829589844, -0.07957839965820312, -0.07467842102050781, -0.0697784423828125, -0.06487846374511719, -0.059978485107421875, -0.05507850646972656, -0.05017852783203125, -0.04527854919433594, -0.040378570556640625, -0.03547859191894531, -0.03057861328125, -0.025678634643554688, -0.020778656005859375, -0.015878677368164062, -0.01097869873046875, -0.0060787200927734375, -0.001178741455078125, 0.0037212371826171875, 0.0086212158203125, 0.013521194458007812, 0.018421173095703125, 0.023321151733398438, 0.02822113037109375, 0.03312110900878906, 0.038021087646484375, 0.04292106628417969, 0.047821044921875, 0.05272102355957031, 0.057621002197265625, 0.06252098083496094, 0.06742095947265625, 0.07232093811035156, 0.07722091674804688, 0.08212089538574219, 0.0870208740234375, 0.09192085266113281, 0.09682083129882812, 0.10172080993652344, 0.10662078857421875, 0.11152076721191406, 0.11642074584960938, 0.12132072448730469, 0.126220703125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 6.0, 12.0, 14.0, 14.0, 24.0, 28.0, 33.0, 58.0, 79.0, 114.0, 121.0, 98.0, 117.0, 72.0, 64.0, 43.0, 36.0, 22.0, 21.0, 11.0, 9.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26123046875, -0.255340576171875, -0.24945068359375, -0.243560791015625, -0.2376708984375, -0.231781005859375, -0.22589111328125, -0.220001220703125, -0.214111328125, -0.208221435546875, -0.20233154296875, -0.196441650390625, -0.1905517578125, -0.184661865234375, -0.17877197265625, -0.172882080078125, -0.1669921875, -0.161102294921875, -0.15521240234375, -0.149322509765625, -0.1434326171875, -0.137542724609375, -0.13165283203125, -0.125762939453125, -0.119873046875, -0.113983154296875, -0.10809326171875, -0.102203369140625, -0.0963134765625, -0.090423583984375, -0.08453369140625, -0.078643798828125, -0.07275390625, -0.066864013671875, -0.06097412109375, -0.055084228515625, -0.0491943359375, -0.043304443359375, -0.03741455078125, -0.031524658203125, -0.025634765625, -0.019744873046875, -0.01385498046875, -0.007965087890625, -0.0020751953125, 0.003814697265625, 0.00970458984375, 0.015594482421875, 0.021484375, 0.027374267578125, 0.03326416015625, 0.039154052734375, 0.0450439453125, 0.050933837890625, 0.05682373046875, 0.062713623046875, 0.068603515625, 0.074493408203125, 0.08038330078125, 0.086273193359375, 0.0921630859375, 0.098052978515625, 0.10394287109375, 0.109832763671875, 0.11572265625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 5.0, 8.0, 7.0, 14.0, 28.0, 63.0, 155.0, 339.0, 207.0, 94.0, 37.0, 18.0, 7.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.472559928894043, -4.334954261779785, -4.197348594665527, -4.059742450714111, -3.9221367835998535, -3.7845311164855957, -3.646925449371338, -3.50931978225708, -3.371713876724243, -3.2341082096099854, -3.0965023040771484, -2.9588966369628906, -2.821290969848633, -2.683685064315796, -2.546079397201538, -2.408473491668701, -2.2708678245544434, -2.1332621574401855, -1.9956562519073486, -1.8580505847930908, -1.7204447984695435, -1.582839012145996, -1.4452333450317383, -1.307627558708191, -1.1700217723846436, -1.0324159860610962, -0.8948102593421936, -0.757204532623291, -0.6195987462997437, -0.4819929599761963, -0.3443872332572937, -0.2067815065383911, -0.06917619705200195, 0.06842955946922302, 0.206035315990448, 0.343641072511673, 0.48124682903289795, 0.6188526153564453, 0.7564583420753479, 0.8940640687942505, 1.0316698551177979, 1.1692756414413452, 1.3068814277648926, 1.4444870948791504, 1.5820928812026978, 1.7196986675262451, 1.857304334640503, 1.9949101209640503, 2.1325159072875977, 2.2701215744018555, 2.4077274799346924, 2.54533314704895, 2.682939052581787, 2.820544719696045, 2.9581503868103027, 3.0957560539245605, 3.2333619594573975, 3.3709676265716553, 3.508573532104492, 3.64617919921875, 3.783784866333008, 3.9213907718658447, 4.058996677398682, 4.1966023445129395, 4.334208011627197]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 3.0, 5.0, 8.0, 14.0, 13.0, 13.0, 15.0, 22.0, 23.0, 27.0, 30.0, 41.0, 49.0, 53.0, 59.0, 76.0, 111.0, 69.0, 63.0, 45.0, 42.0, 40.0, 27.0, 28.0, 23.0, 19.0, 19.0, 18.0, 15.0, 11.0, 10.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.347200870513916, -3.2330715656280518, -3.1189424991607666, -3.0048131942749023, -2.890684127807617, -2.776554822921753, -2.6624255180358887, -2.5482964515686035, -2.4341673851013184, -2.320038080215454, -2.205909013748169, -2.0917797088623047, -1.9776506423950195, -1.8635213375091553, -1.7493921518325806, -1.6352629661560059, -1.5211336612701416, -1.407004475593567, -1.2928752899169922, -1.178745985031128, -1.0646169185638428, -0.9504876732826233, -0.8363584280014038, -0.7222292423248291, -0.6081000566482544, -0.4939708709716797, -0.3798416554927826, -0.2657124400138855, -0.1515832543373108, -0.037454068660736084, 0.0766751766204834, 0.1908043622970581, 0.3049333095550537, 0.4190624952316284, 0.5331916809082031, 0.6473209261894226, 0.7614501118659973, 0.875579297542572, 0.9897085428237915, 1.1038377285003662, 1.217966914176941, 1.3320960998535156, 1.4462252855300903, 1.560354471206665, 1.6744837760925293, 1.7886128425598145, 1.9027421474456787, 2.016871452331543, 2.131000518798828, 2.2451298236846924, 2.3592588901519775, 2.473388195037842, 2.587517261505127, 2.701646566390991, 2.8157758712768555, 2.9299049377441406, 3.044034004211426, 3.15816330909729, 3.272292375564575, 3.3864216804504395, 3.5005507469177246, 3.614680051803589, 3.728809356689453, 3.8429384231567383, 3.9570677280426025]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 7.0, 6.0, 7.0, 10.0, 26.0, 38.0, 31.0, 64.0, 95.0, 148.0, 263.0, 573.0, 1607.0, 6485.0, 57089.0, 1948131.0, 2102848.0, 65662.0, 8003.0, 1824.0, 660.0, 288.0, 153.0, 79.0, 60.0, 45.0, 17.0, 24.0, 20.0, 9.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.36376953125, -0.3516502380371094, -0.33953094482421875, -0.3274116516113281, -0.3152923583984375, -0.3031730651855469, -0.29105377197265625, -0.2789344787597656, -0.266815185546875, -0.2546958923339844, -0.24257659912109375, -0.23045730590820312, -0.2183380126953125, -0.20621871948242188, -0.19409942626953125, -0.18198013305664062, -0.16986083984375, -0.15774154663085938, -0.14562225341796875, -0.13350296020507812, -0.1213836669921875, -0.10926437377929688, -0.09714508056640625, -0.08502578735351562, -0.072906494140625, -0.060787200927734375, -0.04866790771484375, -0.036548614501953125, -0.0244293212890625, -0.012310028076171875, -0.00019073486328125, 0.011928558349609375, 0.0240478515625, 0.036167144775390625, 0.04828643798828125, 0.060405731201171875, 0.0725250244140625, 0.08464431762695312, 0.09676361083984375, 0.10888290405273438, 0.121002197265625, 0.13312149047851562, 0.14524078369140625, 0.15736007690429688, 0.1694793701171875, 0.18159866333007812, 0.19371795654296875, 0.20583724975585938, 0.21795654296875, 0.23007583618164062, 0.24219512939453125, 0.2543144226074219, 0.2664337158203125, 0.2785530090332031, 0.29067230224609375, 0.3027915954589844, 0.314910888671875, 0.3270301818847656, 0.33914947509765625, 0.3512687683105469, 0.3633880615234375, 0.3755073547363281, 0.38762664794921875, 0.3997459411621094, 0.411865234375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 9.0, 17.0, 21.0, 20.0, 26.0, 28.0, 40.0, 43.0, 61.0, 55.0, 78.0, 80.0, 55.0, 68.0, 74.0, 50.0, 54.0, 41.0, 43.0, 37.0, 27.0, 21.0, 16.0, 11.0, 7.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.272705078125, -0.263702392578125, -0.25469970703125, -0.245697021484375, -0.2366943359375, -0.227691650390625, -0.21868896484375, -0.209686279296875, -0.20068359375, -0.191680908203125, -0.18267822265625, -0.173675537109375, -0.1646728515625, -0.155670166015625, -0.14666748046875, -0.137664794921875, -0.128662109375, -0.119659423828125, -0.11065673828125, -0.101654052734375, -0.0926513671875, -0.083648681640625, -0.07464599609375, -0.065643310546875, -0.056640625, -0.047637939453125, -0.03863525390625, -0.029632568359375, -0.0206298828125, -0.011627197265625, -0.00262451171875, 0.006378173828125, 0.015380859375, 0.024383544921875, 0.03338623046875, 0.042388916015625, 0.0513916015625, 0.060394287109375, 0.06939697265625, 0.078399658203125, 0.08740234375, 0.096405029296875, 0.10540771484375, 0.114410400390625, 0.1234130859375, 0.132415771484375, 0.14141845703125, 0.150421142578125, 0.159423828125, 0.168426513671875, 0.17742919921875, 0.186431884765625, 0.1954345703125, 0.204437255859375, 0.21343994140625, 0.222442626953125, 0.2314453125, 0.240447998046875, 0.24945068359375, 0.258453369140625, 0.2674560546875, 0.276458740234375, 0.28546142578125, 0.294464111328125, 0.303466796875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 6.0, 3.0, 6.0, 15.0, 28.0, 63.0, 125.0, 255.0, 571.0, 1952.0, 11668.0, 562236.0, 3584142.0, 27898.0, 3629.0, 1051.0, 363.0, 138.0, 73.0, 26.0, 11.0, 12.0, 7.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.63232421875, -0.612030029296875, -0.59173583984375, -0.571441650390625, -0.5511474609375, -0.530853271484375, -0.51055908203125, -0.490264892578125, -0.469970703125, -0.449676513671875, -0.42938232421875, -0.409088134765625, -0.3887939453125, -0.368499755859375, -0.34820556640625, -0.327911376953125, -0.3076171875, -0.287322998046875, -0.26702880859375, -0.246734619140625, -0.2264404296875, -0.206146240234375, -0.18585205078125, -0.165557861328125, -0.145263671875, -0.124969482421875, -0.10467529296875, -0.084381103515625, -0.0640869140625, -0.043792724609375, -0.02349853515625, -0.003204345703125, 0.01708984375, 0.037384033203125, 0.05767822265625, 0.077972412109375, 0.0982666015625, 0.118560791015625, 0.13885498046875, 0.159149169921875, 0.179443359375, 0.199737548828125, 0.22003173828125, 0.240325927734375, 0.2606201171875, 0.280914306640625, 0.30120849609375, 0.321502685546875, 0.341796875, 0.362091064453125, 0.38238525390625, 0.402679443359375, 0.4229736328125, 0.443267822265625, 0.46356201171875, 0.483856201171875, 0.504150390625, 0.524444580078125, 0.54473876953125, 0.565032958984375, 0.5853271484375, 0.605621337890625, 0.62591552734375, 0.646209716796875, 0.66650390625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 8.0, 13.0, 22.0, 33.0, 42.0, 104.0, 217.0, 553.0, 1135.0, 1087.0, 456.0, 200.0, 95.0, 48.0, 19.0, 13.0, 8.0, 3.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5771484375, -0.559539794921875, -0.54193115234375, -0.524322509765625, -0.5067138671875, -0.489105224609375, -0.47149658203125, -0.453887939453125, -0.436279296875, -0.418670654296875, -0.40106201171875, -0.383453369140625, -0.3658447265625, -0.348236083984375, -0.33062744140625, -0.313018798828125, -0.29541015625, -0.277801513671875, -0.26019287109375, -0.242584228515625, -0.2249755859375, -0.207366943359375, -0.18975830078125, -0.172149658203125, -0.154541015625, -0.136932373046875, -0.11932373046875, -0.101715087890625, -0.0841064453125, -0.066497802734375, -0.04888916015625, -0.031280517578125, -0.013671875, 0.003936767578125, 0.02154541015625, 0.039154052734375, 0.0567626953125, 0.074371337890625, 0.09197998046875, 0.109588623046875, 0.127197265625, 0.144805908203125, 0.16241455078125, 0.180023193359375, 0.1976318359375, 0.215240478515625, 0.23284912109375, 0.250457763671875, 0.26806640625, 0.285675048828125, 0.30328369140625, 0.320892333984375, 0.3385009765625, 0.356109619140625, 0.37371826171875, 0.391326904296875, 0.408935546875, 0.426544189453125, 0.44415283203125, 0.461761474609375, 0.4793701171875, 0.496978759765625, 0.51458740234375, 0.532196044921875, 0.5498046875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 12.0, 12.0, 47.0, 185.0, 404.0, 247.0, 62.0, 17.0, 9.0, 5.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7105021476745605, -4.518747329711914, -4.326992511749268, -4.135237693786621, -3.9434828758239746, -3.751728057861328, -3.5599732398986816, -3.368218421936035, -3.1764636039733887, -2.984708786010742, -2.7929539680480957, -2.601199150085449, -2.4094443321228027, -2.2176895141601562, -2.0259346961975098, -1.8341798782348633, -1.6424250602722168, -1.4506702423095703, -1.2589154243469238, -1.0671606063842773, -0.8754057884216309, -0.6836509704589844, -0.4918961524963379, -0.3001413345336914, -0.10838651657104492, 0.08336830139160156, 0.27512311935424805, 0.46687793731689453, 0.658632755279541, 0.8503875732421875, 1.042142391204834, 1.2338972091674805, 1.4256515502929688, 1.6174063682556152, 1.8091611862182617, 2.000916004180908, 2.1926708221435547, 2.384425640106201, 2.5761804580688477, 2.767935276031494, 2.9596900939941406, 3.151444911956787, 3.3431997299194336, 3.53495454788208, 3.7267093658447266, 3.918464183807373, 4.1102190017700195, 4.301973819732666, 4.4937286376953125, 4.685483455657959, 4.8772382736206055, 5.068993091583252, 5.260747909545898, 5.452502727508545, 5.644257545471191, 5.836012363433838, 6.027767181396484, 6.219521999359131, 6.411276817321777, 6.603031635284424, 6.79478645324707, 6.986541271209717, 7.178296089172363, 7.37005090713501, 7.561805725097656]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 5.0, 1.0, 2.0, 4.0, 7.0, 16.0, 12.0, 17.0, 25.0, 29.0, 28.0, 40.0, 52.0, 61.0, 59.0, 49.0, 48.0, 68.0, 49.0, 60.0, 48.0, 50.0, 56.0, 34.0, 40.0, 32.0, 23.0, 16.0, 19.0, 15.0, 9.0, 9.0, 9.0, 6.0, 5.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.606874465942383, -2.5371897220611572, -2.4675049781799316, -2.397820234298706, -2.3281354904174805, -2.258450746536255, -2.1887660026550293, -2.1190812587738037, -2.049396514892578, -1.9797117710113525, -1.910027027130127, -1.8403422832489014, -1.7706575393676758, -1.7009727954864502, -1.6312880516052246, -1.561603307723999, -1.4919184446334839, -1.4222337007522583, -1.3525489568710327, -1.2828642129898071, -1.2131794691085815, -1.143494725227356, -1.0738098621368408, -1.0041251182556152, -0.9344404339790344, -0.8647556900978088, -0.7950709462165833, -0.7253861427307129, -0.6557013988494873, -0.5860166549682617, -0.5163319110870361, -0.44664716720581055, -0.37696242332458496, -0.3072776794433594, -0.2375929206609726, -0.16790816187858582, -0.09822341799736023, -0.028538674116134644, 0.04114609956741333, 0.11083084344863892, 0.1805155873298645, 0.2502003312110901, 0.3198850750923157, 0.38956984877586365, 0.45925459265708923, 0.5289393663406372, 0.5986241102218628, 0.6683088541030884, 0.737993597984314, 0.8076783418655396, 0.8773630857467651, 0.9470478296279907, 1.0167325735092163, 1.086417317390442, 1.156102180480957, 1.2257869243621826, 1.2954716682434082, 1.3651564121246338, 1.4348411560058594, 1.504525899887085, 1.5742106437683105, 1.6438953876495361, 1.7135801315307617, 1.7832648754119873, 1.852949619293213]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 8.0, 17.0, 18.0, 32.0, 52.0, 79.0, 137.0, 323.0, 544.0, 1305.0, 3127.0, 8953.0, 30398.0, 125894.0, 438162.0, 329125.0, 79084.0, 20514.0, 6426.0, 2271.0, 1017.0, 483.0, 233.0, 148.0, 53.0, 45.0, 26.0, 14.0, 15.0, 11.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.332275390625, -0.3221588134765625, -0.312042236328125, -0.3019256591796875, -0.29180908203125, -0.2816925048828125, -0.271575927734375, -0.2614593505859375, -0.2513427734375, -0.2412261962890625, -0.231109619140625, -0.2209930419921875, -0.21087646484375, -0.2007598876953125, -0.190643310546875, -0.1805267333984375, -0.17041015625, -0.1602935791015625, -0.150177001953125, -0.1400604248046875, -0.12994384765625, -0.1198272705078125, -0.109710693359375, -0.0995941162109375, -0.0894775390625, -0.0793609619140625, -0.069244384765625, -0.0591278076171875, -0.04901123046875, -0.0388946533203125, -0.028778076171875, -0.0186614990234375, -0.008544921875, 0.0015716552734375, 0.011688232421875, 0.0218048095703125, 0.03192138671875, 0.0420379638671875, 0.052154541015625, 0.0622711181640625, 0.0723876953125, 0.0825042724609375, 0.092620849609375, 0.1027374267578125, 0.11285400390625, 0.1229705810546875, 0.133087158203125, 0.1432037353515625, 0.1533203125, 0.1634368896484375, 0.173553466796875, 0.1836700439453125, 0.19378662109375, 0.2039031982421875, 0.214019775390625, 0.2241363525390625, 0.2342529296875, 0.2443695068359375, 0.254486083984375, 0.2646026611328125, 0.27471923828125, 0.2848358154296875, 0.294952392578125, 0.3050689697265625, 0.315185546875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 3.0, 12.0, 12.0, 21.0, 21.0, 24.0, 47.0, 44.0, 49.0, 55.0, 68.0, 67.0, 74.0, 60.0, 67.0, 56.0, 43.0, 64.0, 48.0, 45.0, 31.0, 24.0, 22.0, 15.0, 7.0, 10.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.270263671875, -0.261260986328125, -0.25225830078125, -0.243255615234375, -0.2342529296875, -0.225250244140625, -0.21624755859375, -0.207244873046875, -0.1982421875, -0.189239501953125, -0.18023681640625, -0.171234130859375, -0.1622314453125, -0.153228759765625, -0.14422607421875, -0.135223388671875, -0.126220703125, -0.117218017578125, -0.10821533203125, -0.099212646484375, -0.0902099609375, -0.081207275390625, -0.07220458984375, -0.063201904296875, -0.05419921875, -0.045196533203125, -0.03619384765625, -0.027191162109375, -0.0181884765625, -0.009185791015625, -0.00018310546875, 0.008819580078125, 0.017822265625, 0.026824951171875, 0.03582763671875, 0.044830322265625, 0.0538330078125, 0.062835693359375, 0.07183837890625, 0.080841064453125, 0.08984375, 0.098846435546875, 0.10784912109375, 0.116851806640625, 0.1258544921875, 0.134857177734375, 0.14385986328125, 0.152862548828125, 0.161865234375, 0.170867919921875, 0.17987060546875, 0.188873291015625, 0.1978759765625, 0.206878662109375, 0.21588134765625, 0.224884033203125, 0.23388671875, 0.242889404296875, 0.25189208984375, 0.260894775390625, 0.2698974609375, 0.278900146484375, 0.28790283203125, 0.296905517578125, 0.305908203125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 4.0, 5.0, 10.0, 14.0, 3.0, 8.0, 11.0, 10.0, 32.0, 33.0, 46.0, 69.0, 72.0, 117.0, 182.0, 318.0, 603.0, 1420.0, 4335.0, 17485.0, 104056.0, 693736.0, 188225.0, 27785.0, 6213.0, 1944.0, 761.0, 366.0, 197.0, 148.0, 97.0, 54.0, 54.0, 39.0, 25.0, 18.0, 14.0, 7.0, 7.0, 11.0, 5.0, 6.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.399169921875, -0.38570404052734375, -0.3722381591796875, -0.35877227783203125, -0.345306396484375, -0.33184051513671875, -0.3183746337890625, -0.30490875244140625, -0.29144287109375, -0.27797698974609375, -0.2645111083984375, -0.25104522705078125, -0.237579345703125, -0.22411346435546875, -0.2106475830078125, -0.19718170166015625, -0.1837158203125, -0.17024993896484375, -0.1567840576171875, -0.14331817626953125, -0.129852294921875, -0.11638641357421875, -0.1029205322265625, -0.08945465087890625, -0.07598876953125, -0.06252288818359375, -0.0490570068359375, -0.03559112548828125, -0.022125244140625, -0.00865936279296875, 0.0048065185546875, 0.01827239990234375, 0.03173828125, 0.04520416259765625, 0.0586700439453125, 0.07213592529296875, 0.085601806640625, 0.09906768798828125, 0.1125335693359375, 0.12599945068359375, 0.13946533203125, 0.15293121337890625, 0.1663970947265625, 0.17986297607421875, 0.193328857421875, 0.20679473876953125, 0.2202606201171875, 0.23372650146484375, 0.2471923828125, 0.26065826416015625, 0.2741241455078125, 0.28759002685546875, 0.301055908203125, 0.31452178955078125, 0.3279876708984375, 0.34145355224609375, 0.35491943359375, 0.36838531494140625, 0.3818511962890625, 0.39531707763671875, 0.408782958984375, 0.42224884033203125, 0.4357147216796875, 0.44918060302734375, 0.462646484375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 9.0, 13.0, 8.0, 11.0, 7.0, 6.0, 19.0, 22.0, 22.0, 24.0, 23.0, 37.0, 27.0, 44.0, 49.0, 65.0, 45.0, 51.0, 50.0, 43.0, 52.0, 40.0, 34.0, 29.0, 32.0, 33.0, 26.0, 34.0, 23.0, 17.0, 24.0, 16.0, 11.0, 11.0, 6.0, 7.0, 8.0, 7.0, 1.0, 2.0, 5.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6484375, -0.62799072265625, -0.6075439453125, -0.58709716796875, -0.566650390625, -0.54620361328125, -0.5257568359375, -0.50531005859375, -0.48486328125, -0.46441650390625, -0.4439697265625, -0.42352294921875, -0.403076171875, -0.38262939453125, -0.3621826171875, -0.34173583984375, -0.3212890625, -0.30084228515625, -0.2803955078125, -0.25994873046875, -0.239501953125, -0.21905517578125, -0.1986083984375, -0.17816162109375, -0.15771484375, -0.13726806640625, -0.1168212890625, -0.09637451171875, -0.075927734375, -0.05548095703125, -0.0350341796875, -0.01458740234375, 0.005859375, 0.02630615234375, 0.0467529296875, 0.06719970703125, 0.087646484375, 0.10809326171875, 0.1285400390625, 0.14898681640625, 0.16943359375, 0.18988037109375, 0.2103271484375, 0.23077392578125, 0.251220703125, 0.27166748046875, 0.2921142578125, 0.31256103515625, 0.3330078125, 0.35345458984375, 0.3739013671875, 0.39434814453125, 0.414794921875, 0.43524169921875, 0.4556884765625, 0.47613525390625, 0.49658203125, 0.51702880859375, 0.5374755859375, 0.55792236328125, 0.578369140625, 0.59881591796875, 0.6192626953125, 0.63970947265625, 0.66015625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 6.0, 6.0, 13.0, 15.0, 29.0, 51.0, 116.0, 269.0, 753.0, 2577.0, 12042.0, 82742.0, 742912.0, 179063.0, 22074.0, 4113.0, 1083.0, 367.0, 147.0, 78.0, 36.0, 25.0, 19.0, 9.0, 7.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1612548828125, -0.1564655303955078, -0.15167617797851562, -0.14688682556152344, -0.14209747314453125, -0.13730812072753906, -0.13251876831054688, -0.1277294158935547, -0.1229400634765625, -0.11815071105957031, -0.11336135864257812, -0.10857200622558594, -0.10378265380859375, -0.09899330139160156, -0.09420394897460938, -0.08941459655761719, -0.084625244140625, -0.07983589172363281, -0.07504653930664062, -0.07025718688964844, -0.06546783447265625, -0.06067848205566406, -0.055889129638671875, -0.05109977722167969, -0.0463104248046875, -0.04152107238769531, -0.036731719970703125, -0.03194236755371094, -0.02715301513671875, -0.022363662719726562, -0.017574310302734375, -0.012784957885742188, -0.00799560546875, -0.0032062530517578125, 0.001583099365234375, 0.0063724517822265625, 0.01116180419921875, 0.015951156616210938, 0.020740509033203125, 0.025529861450195312, 0.0303192138671875, 0.03510856628417969, 0.039897918701171875, 0.04468727111816406, 0.04947662353515625, 0.05426597595214844, 0.059055328369140625, 0.06384468078613281, 0.068634033203125, 0.07342338562011719, 0.07821273803710938, 0.08300209045410156, 0.08779144287109375, 0.09258079528808594, 0.09737014770507812, 0.10215950012207031, 0.1069488525390625, 0.11173820495605469, 0.11652755737304688, 0.12131690979003906, 0.12610626220703125, 0.13089561462402344, 0.13568496704101562, 0.1404743194580078, 0.145263671875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 5.0, 12.0, 8.0, 14.0, 24.0, 20.0, 15.0, 30.0, 44.0, 61.0, 77.0, 77.0, 75.0, 79.0, 89.0, 65.0, 66.0, 54.0, 47.0, 30.0, 21.0, 25.0, 17.0, 11.0, 5.0, 3.0, 5.0, 0.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.088878631591797e-05, -3.963429480791092e-05, -3.837980329990387e-05, -3.712531179189682e-05, -3.587082028388977e-05, -3.461632877588272e-05, -3.336183726787567e-05, -3.210734575986862e-05, -3.085285425186157e-05, -2.9598362743854523e-05, -2.8343871235847473e-05, -2.7089379727840424e-05, -2.5834888219833374e-05, -2.4580396711826324e-05, -2.3325905203819275e-05, -2.2071413695812225e-05, -2.0816922187805176e-05, -1.9562430679798126e-05, -1.8307939171791077e-05, -1.7053447663784027e-05, -1.5798956155776978e-05, -1.4544464647769928e-05, -1.3289973139762878e-05, -1.2035481631755829e-05, -1.078099012374878e-05, -9.52649861574173e-06, -8.27200710773468e-06, -7.017515599727631e-06, -5.763024091720581e-06, -4.5085325837135315e-06, -3.254041075706482e-06, -1.9995495676994324e-06, -7.450580596923828e-07, 5.094334483146667e-07, 1.7639249563217163e-06, 3.018416464328766e-06, 4.2729079723358154e-06, 5.527399480342865e-06, 6.7818909883499146e-06, 8.036382496356964e-06, 9.290874004364014e-06, 1.0545365512371063e-05, 1.1799857020378113e-05, 1.3054348528385162e-05, 1.4308840036392212e-05, 1.556333154439926e-05, 1.681782305240631e-05, 1.807231456041336e-05, 1.932680606842041e-05, 2.058129757642746e-05, 2.183578908443451e-05, 2.309028059244156e-05, 2.434477210044861e-05, 2.5599263608455658e-05, 2.6853755116462708e-05, 2.8108246624469757e-05, 2.9362738132476807e-05, 3.0617229640483856e-05, 3.1871721148490906e-05, 3.3126212656497955e-05, 3.4380704164505005e-05, 3.5635195672512054e-05, 3.6889687180519104e-05, 3.8144178688526154e-05, 3.93986701965332e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 9.0, 8.0, 18.0, 28.0, 30.0, 74.0, 114.0, 216.0, 507.0, 1433.0, 5988.0, 35643.0, 358562.0, 592340.0, 44064.0, 6808.0, 1656.0, 534.0, 235.0, 119.0, 73.0, 32.0, 20.0, 12.0, 11.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1549072265625, -0.1499176025390625, -0.144927978515625, -0.1399383544921875, -0.13494873046875, -0.1299591064453125, -0.124969482421875, -0.1199798583984375, -0.114990234375, -0.1100006103515625, -0.105010986328125, -0.1000213623046875, -0.09503173828125, -0.0900421142578125, -0.085052490234375, -0.0800628662109375, -0.0750732421875, -0.0700836181640625, -0.065093994140625, -0.0601043701171875, -0.05511474609375, -0.0501251220703125, -0.045135498046875, -0.0401458740234375, -0.03515625, -0.0301666259765625, -0.025177001953125, -0.0201873779296875, -0.01519775390625, -0.0102081298828125, -0.005218505859375, -0.0002288818359375, 0.0047607421875, 0.0097503662109375, 0.014739990234375, 0.0197296142578125, 0.02471923828125, 0.0297088623046875, 0.034698486328125, 0.0396881103515625, 0.044677734375, 0.0496673583984375, 0.054656982421875, 0.0596466064453125, 0.06463623046875, 0.0696258544921875, 0.074615478515625, 0.0796051025390625, 0.0845947265625, 0.0895843505859375, 0.094573974609375, 0.0995635986328125, 0.10455322265625, 0.1095428466796875, 0.114532470703125, 0.1195220947265625, 0.12451171875, 0.1295013427734375, 0.134490966796875, 0.1394805908203125, 0.14447021484375, 0.1494598388671875, 0.154449462890625, 0.1594390869140625, 0.1644287109375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 7.0, 5.0, 5.0, 17.0, 15.0, 29.0, 24.0, 50.0, 56.0, 64.0, 80.0, 103.0, 92.0, 99.0, 78.0, 61.0, 60.0, 44.0, 31.0, 25.0, 11.0, 7.0, 10.0, 7.0, 4.0, 8.0, 1.0, 4.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1793212890625, -0.17478561401367188, -0.17024993896484375, -0.16571426391601562, -0.1611785888671875, -0.15664291381835938, -0.15210723876953125, -0.14757156372070312, -0.143035888671875, -0.13850021362304688, -0.13396453857421875, -0.12942886352539062, -0.1248931884765625, -0.12035751342773438, -0.11582183837890625, -0.11128616333007812, -0.10675048828125, -0.10221481323242188, -0.09767913818359375, -0.09314346313476562, -0.0886077880859375, -0.08407211303710938, -0.07953643798828125, -0.07500076293945312, -0.070465087890625, -0.06592941284179688, -0.06139373779296875, -0.056858062744140625, -0.0523223876953125, -0.047786712646484375, -0.04325103759765625, -0.038715362548828125, -0.0341796875, -0.029644012451171875, -0.02510833740234375, -0.020572662353515625, -0.0160369873046875, -0.011501312255859375, -0.00696563720703125, -0.002429962158203125, 0.002105712890625, 0.006641387939453125, 0.01117706298828125, 0.015712738037109375, 0.0202484130859375, 0.024784088134765625, 0.02931976318359375, 0.033855438232421875, 0.03839111328125, 0.042926788330078125, 0.04746246337890625, 0.051998138427734375, 0.0565338134765625, 0.061069488525390625, 0.06560516357421875, 0.07014083862304688, 0.074676513671875, 0.07921218872070312, 0.08374786376953125, 0.08828353881835938, 0.0928192138671875, 0.09735488891601562, 0.10189056396484375, 0.10642623901367188, 0.1109619140625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 12.0, 12.0, 41.0, 109.0, 297.0, 272.0, 136.0, 51.0, 24.0, 15.0, 9.0, 4.0, 7.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.741288185119629, -2.6102638244628906, -2.4792394638061523, -2.348215103149414, -2.217190742492676, -2.0861663818359375, -1.9551421403884888, -1.8241177797317505, -1.6930934190750122, -1.562069058418274, -1.4310446977615356, -1.300020456314087, -1.1689960956573486, -1.0379717350006104, -0.9069473743438721, -0.7759230136871338, -0.6448986530303955, -0.5138742923736572, -0.38284996151924133, -0.25182563066482544, -0.12080127000808716, 0.010223090648651123, 0.14124739170074463, 0.2722717523574829, 0.4032961130142212, 0.5343204736709595, 0.6653448343276978, 0.7963691353797913, 0.9273934960365295, 1.058417797088623, 1.1894421577453613, 1.3204665184020996, 1.451490879058838, 1.5825152397155762, 1.7135396003723145, 1.8445639610290527, 1.975588321685791, 2.1066126823425293, 2.2376370429992676, 2.368661403656006, 2.499685764312744, 2.6307101249694824, 2.7617344856262207, 2.892758846282959, 3.0237832069396973, 3.1548075675964355, 3.285831928253174, 3.416856288909912, 3.5478804111480713, 3.6789047718048096, 3.809929132461548, 3.940953493118286, 4.071977615356445, 4.203001976013184, 4.334026336669922, 4.46505069732666, 4.596075057983398, 4.727099418640137, 4.858123779296875, 4.989148139953613, 5.120172500610352, 5.25119686126709, 5.382221221923828, 5.513245582580566, 5.644269943237305]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 4.0, 4.0, 6.0, 12.0, 3.0, 5.0, 9.0, 13.0, 13.0, 20.0, 18.0, 22.0, 33.0, 24.0, 20.0, 28.0, 50.0, 48.0, 68.0, 71.0, 83.0, 82.0, 46.0, 45.0, 32.0, 46.0, 28.0, 20.0, 28.0, 26.0, 23.0, 15.0, 10.0, 16.0, 11.0, 7.0, 7.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7512314319610596, -2.662660598754883, -2.574089765548706, -2.4855189323425293, -2.3969478607177734, -2.3083770275115967, -2.21980619430542, -2.131235361099243, -2.0426645278930664, -1.9540936946868896, -1.865522861480713, -1.7769519090652466, -1.6883810758590698, -1.599810242652893, -1.5112392902374268, -1.42266845703125, -1.3340976238250732, -1.2455267906188965, -1.1569559574127197, -1.0683850049972534, -0.9798141717910767, -0.8912433385848999, -0.8026724457740784, -0.7141015529632568, -0.6255307197570801, -0.5369598865509033, -0.4483889937400818, -0.35981813073158264, -0.2712472677230835, -0.18267640471458435, -0.0941055417060852, -0.005534648895263672, 0.08303594589233398, 0.17160680890083313, 0.2601776719093323, 0.3487485349178314, 0.43731939792633057, 0.5258902311325073, 0.6144611239433289, 0.7030320167541504, 0.7916028499603271, 0.8801736831665039, 0.9687445759773254, 1.057315468788147, 1.1458863019943237, 1.2344571352005005, 1.3230280876159668, 1.4115989208221436, 1.5001697540283203, 1.588740587234497, 1.6773114204406738, 1.7658823728561401, 1.854453206062317, 1.9430240392684937, 2.03159499168396, 2.1201658248901367, 2.2087366580963135, 2.2973074913024902, 2.385878324508667, 2.4744491577148438, 2.5630202293395996, 2.6515910625457764, 2.740161895751953, 2.82873272895813, 2.9173035621643066]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 11.0, 8.0, 14.0, 23.0, 31.0, 30.0, 52.0, 82.0, 142.0, 211.0, 362.0, 641.0, 1375.0, 3330.0, 9631.0, 44013.0, 377073.0, 2360043.0, 1218643.0, 143936.0, 23383.0, 6474.0, 2433.0, 989.0, 490.0, 284.0, 202.0, 121.0, 74.0, 61.0, 37.0, 28.0, 14.0, 11.0, 9.0, 9.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.205322265625, -0.1984272003173828, -0.19153213500976562, -0.18463706970214844, -0.17774200439453125, -0.17084693908691406, -0.16395187377929688, -0.1570568084716797, -0.1501617431640625, -0.1432666778564453, -0.13637161254882812, -0.12947654724121094, -0.12258148193359375, -0.11568641662597656, -0.10879135131835938, -0.10189628601074219, -0.095001220703125, -0.08810615539550781, -0.08121109008789062, -0.07431602478027344, -0.06742095947265625, -0.06052589416503906, -0.053630828857421875, -0.04673576354980469, -0.0398406982421875, -0.03294563293457031, -0.026050567626953125, -0.019155502319335938, -0.01226043701171875, -0.0053653717041015625, 0.001529693603515625, 0.008424758911132812, 0.01531982421875, 0.022214889526367188, 0.029109954833984375, 0.03600502014160156, 0.04290008544921875, 0.04979515075683594, 0.056690216064453125, 0.06358528137207031, 0.0704803466796875, 0.07737541198730469, 0.08427047729492188, 0.09116554260253906, 0.09806060791015625, 0.10495567321777344, 0.11185073852539062, 0.11874580383300781, 0.125640869140625, 0.1325359344482422, 0.13943099975585938, 0.14632606506347656, 0.15322113037109375, 0.16011619567871094, 0.16701126098632812, 0.1739063262939453, 0.1808013916015625, 0.1876964569091797, 0.19459152221679688, 0.20148658752441406, 0.20838165283203125, 0.21527671813964844, 0.22217178344726562, 0.2290668487548828, 0.2359619140625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 3.0, 10.0, 8.0, 17.0, 24.0, 19.0, 27.0, 38.0, 55.0, 55.0, 75.0, 67.0, 65.0, 79.0, 81.0, 70.0, 54.0, 53.0, 45.0, 48.0, 28.0, 24.0, 22.0, 14.0, 7.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.265625, -0.2565345764160156, -0.24744415283203125, -0.23835372924804688, -0.2292633056640625, -0.22017288208007812, -0.21108245849609375, -0.20199203491210938, -0.192901611328125, -0.18381118774414062, -0.17472076416015625, -0.16563034057617188, -0.1565399169921875, -0.14744949340820312, -0.13835906982421875, -0.12926864624023438, -0.12017822265625, -0.11108779907226562, -0.10199737548828125, -0.09290695190429688, -0.0838165283203125, -0.07472610473632812, -0.06563568115234375, -0.056545257568359375, -0.047454833984375, -0.038364410400390625, -0.02927398681640625, -0.020183563232421875, -0.0110931396484375, -0.002002716064453125, 0.00708770751953125, 0.016178131103515625, 0.0252685546875, 0.034358978271484375, 0.04344940185546875, 0.052539825439453125, 0.0616302490234375, 0.07072067260742188, 0.07981109619140625, 0.08890151977539062, 0.097991943359375, 0.10708236694335938, 0.11617279052734375, 0.12526321411132812, 0.1343536376953125, 0.14344406127929688, 0.15253448486328125, 0.16162490844726562, 0.17071533203125, 0.17980575561523438, 0.18889617919921875, 0.19798660278320312, 0.2070770263671875, 0.21616744995117188, 0.22525787353515625, 0.23434829711914062, 0.243438720703125, 0.2525291442871094, 0.26161956787109375, 0.2707099914550781, 0.2798004150390625, 0.2888908386230469, 0.29798126220703125, 0.3070716857910156, 0.316162109375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 2.0, 13.0, 18.0, 22.0, 52.0, 111.0, 296.0, 837.0, 3742.0, 63409.0, 3996318.0, 123052.0, 4890.0, 950.0, 328.0, 121.0, 49.0, 19.0, 26.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.638671875, -0.6190643310546875, -0.599456787109375, -0.5798492431640625, -0.56024169921875, -0.5406341552734375, -0.521026611328125, -0.5014190673828125, -0.4818115234375, -0.4622039794921875, -0.442596435546875, -0.4229888916015625, -0.40338134765625, -0.3837738037109375, -0.364166259765625, -0.3445587158203125, -0.324951171875, -0.3053436279296875, -0.285736083984375, -0.2661285400390625, -0.24652099609375, -0.2269134521484375, -0.207305908203125, -0.1876983642578125, -0.1680908203125, -0.1484832763671875, -0.128875732421875, -0.1092681884765625, -0.08966064453125, -0.0700531005859375, -0.050445556640625, -0.0308380126953125, -0.01123046875, 0.0083770751953125, 0.027984619140625, 0.0475921630859375, 0.06719970703125, 0.0868072509765625, 0.106414794921875, 0.1260223388671875, 0.1456298828125, 0.1652374267578125, 0.184844970703125, 0.2044525146484375, 0.22406005859375, 0.2436676025390625, 0.263275146484375, 0.2828826904296875, 0.302490234375, 0.3220977783203125, 0.341705322265625, 0.3613128662109375, 0.38092041015625, 0.4005279541015625, 0.420135498046875, 0.4397430419921875, 0.4593505859375, 0.4789581298828125, 0.498565673828125, 0.5181732177734375, 0.53778076171875, 0.5573883056640625, 0.576995849609375, 0.5966033935546875, 0.6162109375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 5.0, 5.0, 6.0, 7.0, 6.0, 18.0, 37.0, 55.0, 69.0, 106.0, 196.0, 362.0, 670.0, 820.0, 711.0, 418.0, 245.0, 123.0, 76.0, 53.0, 33.0, 21.0, 13.0, 5.0, 5.0, 1.0, 3.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38037109375, -0.36904144287109375, -0.3577117919921875, -0.34638214111328125, -0.335052490234375, -0.32372283935546875, -0.3123931884765625, -0.30106353759765625, -0.28973388671875, -0.27840423583984375, -0.2670745849609375, -0.25574493408203125, -0.244415283203125, -0.23308563232421875, -0.2217559814453125, -0.21042633056640625, -0.1990966796875, -0.18776702880859375, -0.1764373779296875, -0.16510772705078125, -0.153778076171875, -0.14244842529296875, -0.1311187744140625, -0.11978912353515625, -0.10845947265625, -0.09712982177734375, -0.0858001708984375, -0.07447052001953125, -0.063140869140625, -0.05181121826171875, -0.0404815673828125, -0.02915191650390625, -0.017822265625, -0.00649261474609375, 0.0048370361328125, 0.01616668701171875, 0.027496337890625, 0.03882598876953125, 0.0501556396484375, 0.06148529052734375, 0.07281494140625, 0.08414459228515625, 0.0954742431640625, 0.10680389404296875, 0.118133544921875, 0.12946319580078125, 0.1407928466796875, 0.15212249755859375, 0.1634521484375, 0.17478179931640625, 0.1861114501953125, 0.19744110107421875, 0.208770751953125, 0.22010040283203125, 0.2314300537109375, 0.24275970458984375, 0.25408935546875, 0.26541900634765625, 0.2767486572265625, 0.28807830810546875, 0.299407958984375, 0.31073760986328125, 0.3220672607421875, 0.33339691162109375, 0.3447265625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 10.0, 16.0, 63.0, 147.0, 260.0, 260.0, 132.0, 67.0, 28.0, 14.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.03072452545166, -5.904982566833496, -5.779240131378174, -5.65349817276001, -5.527756214141846, -5.402013778686523, -5.276271820068359, -5.150529861450195, -5.024787902832031, -4.899045944213867, -4.773303508758545, -4.647561550140381, -4.521819591522217, -4.3960771560668945, -4.2703351974487305, -4.144593238830566, -4.018850803375244, -3.893108606338501, -3.767366647720337, -3.6416244506835938, -3.5158824920654297, -3.3901402950286865, -3.2643980979919434, -3.1386561393737793, -3.012913942337036, -2.887171745300293, -2.761429786682129, -2.6356875896453857, -2.5099453926086426, -2.3842034339904785, -2.2584612369537354, -2.132719039916992, -2.006977081298828, -1.8812350034713745, -1.755492925643921, -1.6297507286071777, -1.5040086507797241, -1.3782665729522705, -1.2525243759155273, -1.1267822980880737, -1.0010402202606201, -0.8752981424331665, -0.7495560050010681, -0.6238138675689697, -0.4980717897415161, -0.3723297119140625, -0.2465875744819641, -0.12084543704986572, 0.004896640777587891, 0.1306387484073639, 0.2563808560371399, 0.3821229636669159, 0.5078650712966919, 0.6336071491241455, 0.7593492865562439, 0.8850914239883423, 1.010833501815796, 1.1365755796432495, 1.2623176574707031, 1.3880598545074463, 1.5138019323349, 1.6395440101623535, 1.7652862071990967, 1.8910282850265503, 2.016770362854004]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 3.0, 4.0, 9.0, 15.0, 11.0, 10.0, 16.0, 16.0, 16.0, 28.0, 20.0, 30.0, 49.0, 41.0, 41.0, 46.0, 50.0, 56.0, 69.0, 45.0, 45.0, 58.0, 35.0, 47.0, 27.0, 36.0, 33.0, 24.0, 16.0, 16.0, 17.0, 19.0, 5.0, 9.0, 7.0, 5.0, 7.0, 3.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4121918678283691, -1.3658236265182495, -1.3194552659988403, -1.2730870246887207, -1.2267186641693115, -1.180350422859192, -1.1339821815490723, -1.087613821029663, -1.041245460510254, -0.9948771595954895, -0.9485088586807251, -0.9021406173706055, -0.8557722568511963, -0.8094040155410767, -0.7630357146263123, -0.7166674137115479, -0.6702991724014282, -0.6239308714866638, -0.5775625705718994, -0.5311943292617798, -0.484825998544693, -0.4384576976299286, -0.3920894265174866, -0.34572112560272217, -0.29935282468795776, -0.25298452377319336, -0.20661623775959015, -0.16024795174598694, -0.11387965083122253, -0.06751134991645813, -0.021143078804016113, 0.02522522211074829, 0.07159340381622314, 0.11796169728040695, 0.16432999074459076, 0.21069827675819397, 0.2570665776729584, 0.3034348785877228, 0.3498031497001648, 0.3961714506149292, 0.4425397515296936, 0.488908052444458, 0.5352763533592224, 0.5816446542739868, 0.6280128955841064, 0.6743812561035156, 0.7207494974136353, 0.7671177983283997, 0.8134860992431641, 0.8598544001579285, 0.9062227010726929, 0.9525909423828125, 0.9989593029022217, 1.0453275442123413, 1.091695785522461, 1.1380641460418701, 1.1844325065612793, 1.230800747871399, 1.277169108390808, 1.3235373497009277, 1.369905710220337, 1.4162739515304565, 1.4626421928405762, 1.5090105533599854, 1.555378794670105]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 10.0, 6.0, 15.0, 12.0, 26.0, 40.0, 69.0, 82.0, 120.0, 161.0, 235.0, 423.0, 758.0, 1434.0, 2821.0, 6093.0, 14520.0, 37390.0, 103375.0, 287266.0, 358851.0, 147177.0, 52044.0, 19799.0, 8228.0, 3647.0, 1669.0, 914.0, 508.0, 280.0, 196.0, 137.0, 65.0, 48.0, 35.0, 33.0, 14.0, 12.0, 7.0, 8.0, 13.0, 3.0, 4.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.20068359375, -0.194244384765625, -0.18780517578125, -0.181365966796875, -0.1749267578125, -0.168487548828125, -0.16204833984375, -0.155609130859375, -0.149169921875, -0.142730712890625, -0.13629150390625, -0.129852294921875, -0.1234130859375, -0.116973876953125, -0.11053466796875, -0.104095458984375, -0.09765625, -0.091217041015625, -0.08477783203125, -0.078338623046875, -0.0718994140625, -0.065460205078125, -0.05902099609375, -0.052581787109375, -0.046142578125, -0.039703369140625, -0.03326416015625, -0.026824951171875, -0.0203857421875, -0.013946533203125, -0.00750732421875, -0.001068115234375, 0.00537109375, 0.011810302734375, 0.01824951171875, 0.024688720703125, 0.0311279296875, 0.037567138671875, 0.04400634765625, 0.050445556640625, 0.056884765625, 0.063323974609375, 0.06976318359375, 0.076202392578125, 0.0826416015625, 0.089080810546875, 0.09552001953125, 0.101959228515625, 0.1083984375, 0.114837646484375, 0.12127685546875, 0.127716064453125, 0.1341552734375, 0.140594482421875, 0.14703369140625, 0.153472900390625, 0.159912109375, 0.166351318359375, 0.17279052734375, 0.179229736328125, 0.1856689453125, 0.192108154296875, 0.19854736328125, 0.204986572265625, 0.21142578125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 9.0, 7.0, 10.0, 22.0, 19.0, 27.0, 39.0, 45.0, 48.0, 64.0, 76.0, 88.0, 65.0, 74.0, 55.0, 57.0, 64.0, 48.0, 48.0, 28.0, 30.0, 30.0, 11.0, 19.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.265625, -0.2566871643066406, -0.24774932861328125, -0.23881149291992188, -0.2298736572265625, -0.22093582153320312, -0.21199798583984375, -0.20306015014648438, -0.194122314453125, -0.18518447875976562, -0.17624664306640625, -0.16730880737304688, -0.1583709716796875, -0.14943313598632812, -0.14049530029296875, -0.13155746459960938, -0.12261962890625, -0.11368179321289062, -0.10474395751953125, -0.09580612182617188, -0.0868682861328125, -0.07793045043945312, -0.06899261474609375, -0.060054779052734375, -0.051116943359375, -0.042179107666015625, -0.03324127197265625, -0.024303436279296875, -0.0153656005859375, -0.006427764892578125, 0.00251007080078125, 0.011447906494140625, 0.0203857421875, 0.029323577880859375, 0.03826141357421875, 0.047199249267578125, 0.0561370849609375, 0.06507492065429688, 0.07401275634765625, 0.08295059204101562, 0.091888427734375, 0.10082626342773438, 0.10976409912109375, 0.11870193481445312, 0.1276397705078125, 0.13657760620117188, 0.14551544189453125, 0.15445327758789062, 0.16339111328125, 0.17232894897460938, 0.18126678466796875, 0.19020462036132812, 0.1991424560546875, 0.20808029174804688, 0.21701812744140625, 0.22595596313476562, 0.234893798828125, 0.24383163452148438, 0.25276947021484375, 0.2617073059082031, 0.2706451416015625, 0.2795829772949219, 0.28852081298828125, 0.2974586486816406, 0.306396484375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 7.0, 7.0, 8.0, 7.0, 15.0, 11.0, 16.0, 25.0, 37.0, 31.0, 52.0, 81.0, 130.0, 148.0, 213.0, 307.0, 445.0, 737.0, 1569.0, 4468.0, 20885.0, 185139.0, 749846.0, 68463.0, 10148.0, 2696.0, 1128.0, 577.0, 372.0, 281.0, 198.0, 148.0, 85.0, 67.0, 56.0, 30.0, 33.0, 23.0, 16.0, 9.0, 7.0, 12.0, 6.0, 5.0, 4.0, 2.0, 2.0, 5.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.47900390625, -0.46503448486328125, -0.4510650634765625, -0.43709564208984375, -0.423126220703125, -0.40915679931640625, -0.3951873779296875, -0.38121795654296875, -0.36724853515625, -0.35327911376953125, -0.3393096923828125, -0.32534027099609375, -0.311370849609375, -0.29740142822265625, -0.2834320068359375, -0.26946258544921875, -0.2554931640625, -0.24152374267578125, -0.2275543212890625, -0.21358489990234375, -0.199615478515625, -0.18564605712890625, -0.1716766357421875, -0.15770721435546875, -0.14373779296875, -0.12976837158203125, -0.1157989501953125, -0.10182952880859375, -0.087860107421875, -0.07389068603515625, -0.0599212646484375, -0.04595184326171875, -0.031982421875, -0.01801300048828125, -0.0040435791015625, 0.00992584228515625, 0.023895263671875, 0.03786468505859375, 0.0518341064453125, 0.06580352783203125, 0.07977294921875, 0.09374237060546875, 0.1077117919921875, 0.12168121337890625, 0.135650634765625, 0.14962005615234375, 0.1635894775390625, 0.17755889892578125, 0.1915283203125, 0.20549774169921875, 0.2194671630859375, 0.23343658447265625, 0.247406005859375, 0.26137542724609375, 0.2753448486328125, 0.28931427001953125, 0.30328369140625, 0.31725311279296875, 0.3312225341796875, 0.34519195556640625, 0.359161376953125, 0.37313079833984375, 0.3871002197265625, 0.40106964111328125, 0.4150390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 5.0, 5.0, 13.0, 13.0, 16.0, 21.0, 24.0, 33.0, 37.0, 28.0, 49.0, 47.0, 61.0, 77.0, 53.0, 61.0, 63.0, 53.0, 50.0, 50.0, 39.0, 36.0, 29.0, 26.0, 20.0, 19.0, 16.0, 8.0, 7.0, 9.0, 8.0, 8.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.81591796875, -0.7920150756835938, -0.7681121826171875, -0.7442092895507812, -0.720306396484375, -0.6964035034179688, -0.6725006103515625, -0.6485977172851562, -0.62469482421875, -0.6007919311523438, -0.5768890380859375, -0.5529861450195312, -0.529083251953125, -0.5051803588867188, -0.4812774658203125, -0.45737457275390625, -0.4334716796875, -0.40956878662109375, -0.3856658935546875, -0.36176300048828125, -0.337860107421875, -0.31395721435546875, -0.2900543212890625, -0.26615142822265625, -0.24224853515625, -0.21834564208984375, -0.1944427490234375, -0.17053985595703125, -0.146636962890625, -0.12273406982421875, -0.0988311767578125, -0.07492828369140625, -0.051025390625, -0.02712249755859375, -0.0032196044921875, 0.02068328857421875, 0.044586181640625, 0.06848907470703125, 0.0923919677734375, 0.11629486083984375, 0.14019775390625, 0.16410064697265625, 0.1880035400390625, 0.21190643310546875, 0.235809326171875, 0.25971221923828125, 0.2836151123046875, 0.30751800537109375, 0.3314208984375, 0.35532379150390625, 0.3792266845703125, 0.40312957763671875, 0.427032470703125, 0.45093536376953125, 0.4748382568359375, 0.49874114990234375, 0.52264404296875, 0.5465469360351562, 0.5704498291015625, 0.5943527221679688, 0.618255615234375, 0.6421585083007812, 0.6660614013671875, 0.6899642944335938, 0.7138671875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 7.0, 7.0, 13.0, 13.0, 10.0, 24.0, 18.0, 54.0, 100.0, 168.0, 312.0, 725.0, 2059.0, 6908.0, 29040.0, 169001.0, 737141.0, 80028.0, 16109.0, 4292.0, 1356.0, 553.0, 260.0, 130.0, 74.0, 43.0, 25.0, 17.0, 15.0, 13.0, 13.0, 4.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.107666015625, -0.10372352600097656, -0.09978103637695312, -0.09583854675292969, -0.09189605712890625, -0.08795356750488281, -0.08401107788085938, -0.08006858825683594, -0.0761260986328125, -0.07218360900878906, -0.06824111938476562, -0.06429862976074219, -0.06035614013671875, -0.05641365051269531, -0.052471160888671875, -0.04852867126464844, -0.044586181640625, -0.04064369201660156, -0.036701202392578125, -0.03275871276855469, -0.02881622314453125, -0.024873733520507812, -0.020931243896484375, -0.016988754272460938, -0.0130462646484375, -0.009103775024414062, -0.005161285400390625, -0.0012187957763671875, 0.00272369384765625, 0.0066661834716796875, 0.010608673095703125, 0.014551162719726562, 0.01849365234375, 0.022436141967773438, 0.026378631591796875, 0.030321121215820312, 0.03426361083984375, 0.03820610046386719, 0.042148590087890625, 0.04609107971191406, 0.0500335693359375, 0.05397605895996094, 0.057918548583984375, 0.06186103820800781, 0.06580352783203125, 0.06974601745605469, 0.07368850708007812, 0.07763099670410156, 0.081573486328125, 0.08551597595214844, 0.08945846557617188, 0.09340095520019531, 0.09734344482421875, 0.10128593444824219, 0.10522842407226562, 0.10917091369628906, 0.1131134033203125, 0.11705589294433594, 0.12099838256835938, 0.12494087219238281, 0.12888336181640625, 0.1328258514404297, 0.13676834106445312, 0.14071083068847656, 0.1446533203125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 7.0, 10.0, 4.0, 8.0, 12.0, 12.0, 9.0, 17.0, 25.0, 21.0, 21.0, 33.0, 35.0, 53.0, 48.0, 76.0, 68.0, 82.0, 91.0, 71.0, 52.0, 44.0, 41.0, 36.0, 21.0, 16.0, 16.0, 17.0, 17.0, 14.0, 6.0, 8.0, 2.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.427267074584961e-05, -3.3272430300712585e-05, -3.227218985557556e-05, -3.127194941043854e-05, -3.0271708965301514e-05, -2.927146852016449e-05, -2.8271228075027466e-05, -2.7270987629890442e-05, -2.6270747184753418e-05, -2.5270506739616394e-05, -2.427026629447937e-05, -2.3270025849342346e-05, -2.2269785404205322e-05, -2.12695449590683e-05, -2.0269304513931274e-05, -1.926906406879425e-05, -1.8268823623657227e-05, -1.7268583178520203e-05, -1.626834273338318e-05, -1.5268102288246155e-05, -1.4267861843109131e-05, -1.3267621397972107e-05, -1.2267380952835083e-05, -1.1267140507698059e-05, -1.0266900062561035e-05, -9.266659617424011e-06, -8.266419172286987e-06, -7.266178727149963e-06, -6.2659382820129395e-06, -5.2656978368759155e-06, -4.265457391738892e-06, -3.2652169466018677e-06, -2.2649765014648438e-06, -1.2647360563278198e-06, -2.644956111907959e-07, 7.35744833946228e-07, 1.735985279083252e-06, 2.736225724220276e-06, 3.7364661693573e-06, 4.736706614494324e-06, 5.736947059631348e-06, 6.737187504768372e-06, 7.737427949905396e-06, 8.73766839504242e-06, 9.737908840179443e-06, 1.0738149285316467e-05, 1.1738389730453491e-05, 1.2738630175590515e-05, 1.3738870620727539e-05, 1.4739111065864563e-05, 1.5739351511001587e-05, 1.673959195613861e-05, 1.7739832401275635e-05, 1.874007284641266e-05, 1.9740313291549683e-05, 2.0740553736686707e-05, 2.174079418182373e-05, 2.2741034626960754e-05, 2.374127507209778e-05, 2.4741515517234802e-05, 2.5741755962371826e-05, 2.674199640750885e-05, 2.7742236852645874e-05, 2.8742477297782898e-05, 2.9742717742919922e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 7.0, 7.0, 9.0, 10.0, 10.0, 19.0, 25.0, 34.0, 96.0, 119.0, 200.0, 375.0, 623.0, 1455.0, 4131.0, 14641.0, 67919.0, 647172.0, 255069.0, 41527.0, 9637.0, 3021.0, 1212.0, 512.0, 292.0, 157.0, 98.0, 53.0, 48.0, 22.0, 17.0, 14.0, 10.0, 7.0, 8.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.110595703125, -0.10712337493896484, -0.10365104675292969, -0.10017871856689453, -0.09670639038085938, -0.09323406219482422, -0.08976173400878906, -0.0862894058227539, -0.08281707763671875, -0.0793447494506836, -0.07587242126464844, -0.07240009307861328, -0.06892776489257812, -0.06545543670654297, -0.06198310852050781, -0.058510780334472656, -0.0550384521484375, -0.051566123962402344, -0.04809379577636719, -0.04462146759033203, -0.041149139404296875, -0.03767681121826172, -0.03420448303222656, -0.030732154846191406, -0.02725982666015625, -0.023787498474121094, -0.020315170288085938, -0.01684284210205078, -0.013370513916015625, -0.009898185729980469, -0.0064258575439453125, -0.0029535293579101562, 0.000518798828125, 0.003991127014160156, 0.0074634552001953125, 0.010935783386230469, 0.014408111572265625, 0.01788043975830078, 0.021352767944335938, 0.024825096130371094, 0.02829742431640625, 0.031769752502441406, 0.03524208068847656, 0.03871440887451172, 0.042186737060546875, 0.04565906524658203, 0.04913139343261719, 0.052603721618652344, 0.0560760498046875, 0.059548377990722656, 0.06302070617675781, 0.06649303436279297, 0.06996536254882812, 0.07343769073486328, 0.07691001892089844, 0.0803823471069336, 0.08385467529296875, 0.0873270034790039, 0.09079933166503906, 0.09427165985107422, 0.09774398803710938, 0.10121631622314453, 0.10468864440917969, 0.10816097259521484, 0.11163330078125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 2.0, 1.0, 4.0, 3.0, 9.0, 11.0, 14.0, 17.0, 21.0, 27.0, 48.0, 58.0, 74.0, 115.0, 129.0, 125.0, 87.0, 82.0, 53.0, 23.0, 27.0, 21.0, 16.0, 11.0, 11.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1861572265625, -0.18160629272460938, -0.17705535888671875, -0.17250442504882812, -0.1679534912109375, -0.16340255737304688, -0.15885162353515625, -0.15430068969726562, -0.149749755859375, -0.14519882202148438, -0.14064788818359375, -0.13609695434570312, -0.1315460205078125, -0.12699508666992188, -0.12244415283203125, -0.11789321899414062, -0.11334228515625, -0.10879135131835938, -0.10424041748046875, -0.09968948364257812, -0.0951385498046875, -0.09058761596679688, -0.08603668212890625, -0.08148574829101562, -0.076934814453125, -0.07238388061523438, -0.06783294677734375, -0.06328201293945312, -0.0587310791015625, -0.054180145263671875, -0.04962921142578125, -0.045078277587890625, -0.04052734375, -0.035976409912109375, -0.03142547607421875, -0.026874542236328125, -0.0223236083984375, -0.017772674560546875, -0.01322174072265625, -0.008670806884765625, -0.004119873046875, 0.000431060791015625, 0.00498199462890625, 0.009532928466796875, 0.0140838623046875, 0.018634796142578125, 0.02318572998046875, 0.027736663818359375, 0.03228759765625, 0.036838531494140625, 0.04138946533203125, 0.045940399169921875, 0.0504913330078125, 0.055042266845703125, 0.05959320068359375, 0.06414413452148438, 0.068695068359375, 0.07324600219726562, 0.07779693603515625, 0.08234786987304688, 0.0868988037109375, 0.09144973754882812, 0.09600067138671875, 0.10055160522460938, 0.1051025390625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 3.0, 12.0, 22.0, 47.0, 89.0, 297.0, 273.0, 117.0, 66.0, 30.0, 15.0, 7.0, 9.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.2032394409179688, -2.093127489089966, -1.9830154180526733, -1.8729033470153809, -1.762791395187378, -1.6526793241500854, -1.542567253112793, -1.43245530128479, -1.3223432302474976, -1.212231159210205, -1.1021192073822021, -0.9920071363449097, -0.881895124912262, -0.7717831134796143, -0.6616710424423218, -0.5515590310096741, -0.44144701957702637, -0.33133500814437866, -0.22122296690940857, -0.11111092567443848, -0.0009989142417907715, 0.10911309719085693, 0.21922516822814941, 0.3293371796607971, 0.4394491910934448, 0.5495612025260925, 0.6596732139587402, 0.7697852849960327, 0.8798972964286804, 0.9900093078613281, 1.1001213788986206, 1.210233449935913, 1.320345401763916, 1.4304574728012085, 1.5405694246292114, 1.650681495666504, 1.7607934474945068, 1.8709055185317993, 1.9810175895690918, 2.0911295413970947, 2.2012414932250977, 2.3113534450531006, 2.4214656352996826, 2.5315775871276855, 2.6416895389556885, 2.7518014907836914, 2.8619136810302734, 2.9720256328582764, 3.0821378231048584, 3.1922497749328613, 3.3023619651794434, 3.4124739170074463, 3.522585868835449, 3.6326980590820312, 3.742810010910034, 3.852921962738037, 3.963034152984619, 4.073146343231201, 4.183258056640625, 4.293370246887207, 4.403482437133789, 4.513594150543213, 4.623706340789795, 4.733818531036377, 4.843930244445801]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 11.0, 3.0, 8.0, 8.0, 10.0, 10.0, 12.0, 14.0, 19.0, 15.0, 17.0, 22.0, 20.0, 29.0, 25.0, 25.0, 36.0, 57.0, 69.0, 102.0, 97.0, 57.0, 41.0, 26.0, 36.0, 24.0, 29.0, 24.0, 22.0, 16.0, 17.0, 11.0, 11.0, 13.0, 7.0, 10.0, 8.0, 5.0, 11.0, 6.0, 1.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.97845458984375, -1.909497857093811, -1.840541124343872, -1.771584391593933, -1.7026276588439941, -1.6336709260940552, -1.5647141933441162, -1.4957575798034668, -1.4268007278442383, -1.3578439950942993, -1.2888872623443604, -1.2199305295944214, -1.1509737968444824, -1.0820170640945435, -1.0130603313446045, -0.9441036581993103, -0.8751469850540161, -0.8061902523040771, -0.7372335195541382, -0.6682767868041992, -0.5993200540542603, -0.5303633213043213, -0.4614066481590271, -0.39244991540908813, -0.32349318265914917, -0.2545364499092102, -0.18557973206043243, -0.11662301421165466, -0.0476662814617157, 0.021290451288223267, 0.09024715423583984, 0.1592038869857788, 0.22816061973571777, 0.29711735248565674, 0.3660740852355957, 0.4350307881832123, 0.5039875507354736, 0.5729442834854126, 0.6419009566307068, 0.7108576893806458, 0.7798144221305847, 0.8487711548805237, 0.9177278876304626, 0.9866845607757568, 1.0556412935256958, 1.1245980262756348, 1.1935547590255737, 1.2625114917755127, 1.3314682245254517, 1.4004249572753906, 1.4693816900253296, 1.5383384227752686, 1.6072951555252075, 1.6762518882751465, 1.745208501815796, 1.8141653537750244, 1.8831219673156738, 1.9520787000656128, 2.0210354328155518, 2.089992046356201, 2.1589488983154297, 2.227905511856079, 2.2968623638153076, 2.365818977355957, 2.4347758293151855]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 6.0, 7.0, 10.0, 8.0, 11.0, 21.0, 19.0, 25.0, 54.0, 63.0, 75.0, 109.0, 167.0, 258.0, 346.0, 590.0, 1312.0, 2850.0, 7708.0, 28274.0, 174845.0, 1177710.0, 2177794.0, 520985.0, 75410.0, 15974.0, 5138.0, 2053.0, 983.0, 515.0, 295.0, 224.0, 127.0, 96.0, 49.0, 38.0, 40.0, 27.0, 21.0, 15.0, 9.0, 4.0, 8.0, 3.0, 8.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.206298828125, -0.1999073028564453, -0.19351577758789062, -0.18712425231933594, -0.18073272705078125, -0.17434120178222656, -0.16794967651367188, -0.1615581512451172, -0.1551666259765625, -0.1487751007080078, -0.14238357543945312, -0.13599205017089844, -0.12960052490234375, -0.12320899963378906, -0.11681747436523438, -0.11042594909667969, -0.104034423828125, -0.09764289855957031, -0.09125137329101562, -0.08485984802246094, -0.07846832275390625, -0.07207679748535156, -0.06568527221679688, -0.05929374694824219, -0.0529022216796875, -0.04651069641113281, -0.040119171142578125, -0.03372764587402344, -0.02733612060546875, -0.020944595336914062, -0.014553070068359375, -0.008161544799804688, -0.00177001953125, 0.0046215057373046875, 0.011013031005859375, 0.017404556274414062, 0.02379608154296875, 0.030187606811523438, 0.036579132080078125, 0.04297065734863281, 0.0493621826171875, 0.05575370788574219, 0.062145233154296875, 0.06853675842285156, 0.07492828369140625, 0.08131980895996094, 0.08771133422851562, 0.09410285949707031, 0.100494384765625, 0.10688591003417969, 0.11327743530273438, 0.11966896057128906, 0.12606048583984375, 0.13245201110839844, 0.13884353637695312, 0.1452350616455078, 0.1516265869140625, 0.1580181121826172, 0.16440963745117188, 0.17080116271972656, 0.17719268798828125, 0.18358421325683594, 0.18997573852539062, 0.1963672637939453, 0.2027587890625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 1.0, 9.0, 13.0, 17.0, 14.0, 21.0, 32.0, 27.0, 28.0, 47.0, 62.0, 57.0, 64.0, 75.0, 72.0, 74.0, 50.0, 47.0, 72.0, 40.0, 44.0, 29.0, 26.0, 20.0, 21.0, 15.0, 10.0, 6.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.203369140625, -0.19536209106445312, -0.18735504150390625, -0.17934799194335938, -0.1713409423828125, -0.16333389282226562, -0.15532684326171875, -0.14731979370117188, -0.139312744140625, -0.13130569458007812, -0.12329864501953125, -0.11529159545898438, -0.1072845458984375, -0.09927749633789062, -0.09127044677734375, -0.08326339721679688, -0.07525634765625, -0.06724929809570312, -0.05924224853515625, -0.051235198974609375, -0.0432281494140625, -0.035221099853515625, -0.02721405029296875, -0.019207000732421875, -0.011199951171875, -0.003192901611328125, 0.00481414794921875, 0.012821197509765625, 0.0208282470703125, 0.028835296630859375, 0.03684234619140625, 0.044849395751953125, 0.0528564453125, 0.060863494873046875, 0.06887054443359375, 0.07687759399414062, 0.0848846435546875, 0.09289169311523438, 0.10089874267578125, 0.10890579223632812, 0.116912841796875, 0.12491989135742188, 0.13292694091796875, 0.14093399047851562, 0.1489410400390625, 0.15694808959960938, 0.16495513916015625, 0.17296218872070312, 0.18096923828125, 0.18897628784179688, 0.19698333740234375, 0.20499038696289062, 0.2129974365234375, 0.22100448608398438, 0.22901153564453125, 0.23701858520507812, 0.245025634765625, 0.2530326843261719, 0.26103973388671875, 0.2690467834472656, 0.2770538330078125, 0.2850608825683594, 0.29306793212890625, 0.3010749816894531, 0.30908203125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 10.0, 11.0, 13.0, 27.0, 36.0, 74.0, 130.0, 243.0, 544.0, 1428.0, 6617.0, 78117.0, 3743166.0, 346954.0, 13349.0, 2199.0, 719.0, 260.0, 155.0, 89.0, 48.0, 23.0, 17.0, 9.0, 11.0, 8.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.43212890625, -0.4165191650390625, -0.400909423828125, -0.3852996826171875, -0.36968994140625, -0.3540802001953125, -0.338470458984375, -0.3228607177734375, -0.3072509765625, -0.2916412353515625, -0.276031494140625, -0.2604217529296875, -0.24481201171875, -0.2292022705078125, -0.213592529296875, -0.1979827880859375, -0.182373046875, -0.1667633056640625, -0.151153564453125, -0.1355438232421875, -0.11993408203125, -0.1043243408203125, -0.088714599609375, -0.0731048583984375, -0.0574951171875, -0.0418853759765625, -0.026275634765625, -0.0106658935546875, 0.00494384765625, 0.0205535888671875, 0.036163330078125, 0.0517730712890625, 0.0673828125, 0.0829925537109375, 0.098602294921875, 0.1142120361328125, 0.12982177734375, 0.1454315185546875, 0.161041259765625, 0.1766510009765625, 0.1922607421875, 0.2078704833984375, 0.223480224609375, 0.2390899658203125, 0.25469970703125, 0.2703094482421875, 0.285919189453125, 0.3015289306640625, 0.317138671875, 0.3327484130859375, 0.348358154296875, 0.3639678955078125, 0.37957763671875, 0.3951873779296875, 0.410797119140625, 0.4264068603515625, 0.4420166015625, 0.4576263427734375, 0.473236083984375, 0.4888458251953125, 0.50445556640625, 0.5200653076171875, 0.535675048828125, 0.5512847900390625, 0.56689453125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 2.0, 6.0, 12.0, 5.0, 16.0, 21.0, 32.0, 42.0, 61.0, 118.0, 179.0, 325.0, 558.0, 700.0, 738.0, 501.0, 310.0, 167.0, 88.0, 70.0, 40.0, 25.0, 27.0, 12.0, 4.0, 5.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.393798828125, -0.38146209716796875, -0.3691253662109375, -0.35678863525390625, -0.344451904296875, -0.33211517333984375, -0.3197784423828125, -0.30744171142578125, -0.29510498046875, -0.28276824951171875, -0.2704315185546875, -0.25809478759765625, -0.245758056640625, -0.23342132568359375, -0.2210845947265625, -0.20874786376953125, -0.1964111328125, -0.18407440185546875, -0.1717376708984375, -0.15940093994140625, -0.147064208984375, -0.13472747802734375, -0.1223907470703125, -0.11005401611328125, -0.09771728515625, -0.08538055419921875, -0.0730438232421875, -0.06070709228515625, -0.048370361328125, -0.03603363037109375, -0.0236968994140625, -0.01136016845703125, 0.0009765625, 0.01331329345703125, 0.0256500244140625, 0.03798675537109375, 0.050323486328125, 0.06266021728515625, 0.0749969482421875, 0.08733367919921875, 0.09967041015625, 0.11200714111328125, 0.1243438720703125, 0.13668060302734375, 0.149017333984375, 0.16135406494140625, 0.1736907958984375, 0.18602752685546875, 0.1983642578125, 0.21070098876953125, 0.2230377197265625, 0.23537445068359375, 0.247711181640625, 0.26004791259765625, 0.2723846435546875, 0.28472137451171875, 0.29705810546875, 0.30939483642578125, 0.3217315673828125, 0.33406829833984375, 0.346405029296875, 0.35874176025390625, 0.3710784912109375, 0.38341522216796875, 0.395751953125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 8.0, 20.0, 29.0, 79.0, 180.0, 250.0, 244.0, 113.0, 38.0, 21.0, 11.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.871633529663086, -5.746171951293945, -5.620710372924805, -5.495249271392822, -5.369787693023682, -5.244326114654541, -5.1188645362854, -4.993403434753418, -4.867941856384277, -4.742480278015137, -4.617018699645996, -4.491557598114014, -4.366096019744873, -4.240634441375732, -4.115172863006592, -3.9897115230560303, -3.8642499446868896, -3.738788366317749, -3.6133270263671875, -3.487865447998047, -3.3624041080474854, -3.2369425296783447, -3.111481189727783, -2.9860196113586426, -2.860558032989502, -2.7350964546203613, -2.6096351146698, -2.484173536300659, -2.3587121963500977, -2.233250617980957, -2.1077890396118164, -1.9823276996612549, -1.8568665981292725, -1.7314051389694214, -1.6059436798095703, -1.4804821014404297, -1.3550207614898682, -1.2295591831207275, -1.1040977239608765, -0.9786362648010254, -0.8531748056411743, -0.7277133464813232, -0.6022518873214722, -0.4767903685569763, -0.35132890939712524, -0.22586745023727417, -0.10040593147277832, 0.025055527687072754, 0.15051698684692383, 0.2759784460067749, 0.40143993496894836, 0.5269014239311218, 0.6523628830909729, 0.777824342250824, 0.9032858610153198, 1.028747320175171, 1.154208779335022, 1.279670238494873, 1.4051316976547241, 1.5305931568145752, 1.6560547351837158, 1.7815160751342773, 1.906977653503418, 2.0324392318725586, 2.15790057182312]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 5.0, 6.0, 6.0, 7.0, 17.0, 12.0, 15.0, 11.0, 26.0, 27.0, 24.0, 27.0, 45.0, 38.0, 36.0, 40.0, 54.0, 57.0, 54.0, 57.0, 57.0, 37.0, 48.0, 43.0, 39.0, 32.0, 21.0, 26.0, 16.0, 26.0, 19.0, 14.0, 15.0, 10.0, 10.0, 12.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.664239764213562, -1.614546537399292, -1.564853310585022, -1.515160083770752, -1.465466856956482, -1.415773630142212, -1.366080403327942, -1.3163871765136719, -1.2666939496994019, -1.2170007228851318, -1.1673074960708618, -1.1176142692565918, -1.0679210424423218, -1.0182278156280518, -0.9685345888137817, -0.9188413619995117, -0.8691480755805969, -0.8194548487663269, -0.7697616219520569, -0.7200683951377869, -0.6703751683235168, -0.6206819415092468, -0.570988655090332, -0.521295428276062, -0.4716022312641144, -0.42190900444984436, -0.37221577763557434, -0.32252252101898193, -0.2728292942047119, -0.2231360822916031, -0.17344284057617188, -0.12374961376190186, -0.07405638694763184, -0.024363156408071518, 0.0253300741314888, 0.07502330839633942, 0.12471653521060944, 0.17440976202487946, 0.22410300374031067, 0.2737962305545807, 0.3234894573688507, 0.3731826841831207, 0.42287591099739075, 0.47256916761398315, 0.5222623944282532, 0.5719556212425232, 0.6216488480567932, 0.6713420748710632, 0.7210353016853333, 0.7707285284996033, 0.8204217553138733, 0.8701149821281433, 0.9198082089424133, 0.9695014357566833, 1.0191947221755981, 1.0688879489898682, 1.1185811758041382, 1.1682744026184082, 1.2179676294326782, 1.2676608562469482, 1.3173540830612183, 1.3670473098754883, 1.4167405366897583, 1.4664337635040283, 1.5161269903182983]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 5.0, 9.0, 11.0, 21.0, 33.0, 51.0, 77.0, 143.0, 240.0, 478.0, 861.0, 1828.0, 4058.0, 10379.0, 33465.0, 149784.0, 547650.0, 228858.0, 47517.0, 13533.0, 5055.0, 2190.0, 1070.0, 540.0, 288.0, 156.0, 114.0, 52.0, 31.0, 21.0, 15.0, 9.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3125, -0.3019523620605469, -0.29140472412109375, -0.2808570861816406, -0.2703094482421875, -0.2597618103027344, -0.24921417236328125, -0.23866653442382812, -0.228118896484375, -0.21757125854492188, -0.20702362060546875, -0.19647598266601562, -0.1859283447265625, -0.17538070678710938, -0.16483306884765625, -0.15428543090820312, -0.14373779296875, -0.13319015502929688, -0.12264251708984375, -0.11209487915039062, -0.1015472412109375, -0.09099960327148438, -0.08045196533203125, -0.06990432739257812, -0.059356689453125, -0.048809051513671875, -0.03826141357421875, -0.027713775634765625, -0.0171661376953125, -0.006618499755859375, 0.00392913818359375, 0.014476776123046875, 0.0250244140625, 0.035572052001953125, 0.04611968994140625, 0.056667327880859375, 0.0672149658203125, 0.07776260375976562, 0.08831024169921875, 0.09885787963867188, 0.109405517578125, 0.11995315551757812, 0.13050079345703125, 0.14104843139648438, 0.1515960693359375, 0.16214370727539062, 0.17269134521484375, 0.18323898315429688, 0.19378662109375, 0.20433425903320312, 0.21488189697265625, 0.22542953491210938, 0.2359771728515625, 0.24652481079101562, 0.25707244873046875, 0.2676200866699219, 0.278167724609375, 0.2887153625488281, 0.29926300048828125, 0.3098106384277344, 0.3203582763671875, 0.3309059143066406, 0.34145355224609375, 0.3520011901855469, 0.362548828125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 7.0, 10.0, 27.0, 19.0, 10.0, 29.0, 31.0, 29.0, 49.0, 59.0, 66.0, 71.0, 68.0, 58.0, 54.0, 61.0, 66.0, 48.0, 49.0, 30.0, 41.0, 28.0, 32.0, 21.0, 10.0, 7.0, 10.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2044677734375, -0.1964244842529297, -0.18838119506835938, -0.18033790588378906, -0.17229461669921875, -0.16425132751464844, -0.15620803833007812, -0.1481647491455078, -0.1401214599609375, -0.1320781707763672, -0.12403488159179688, -0.11599159240722656, -0.10794830322265625, -0.09990501403808594, -0.09186172485351562, -0.08381843566894531, -0.075775146484375, -0.06773185729980469, -0.059688568115234375, -0.05164527893066406, -0.04360198974609375, -0.03555870056152344, -0.027515411376953125, -0.019472122192382812, -0.0114288330078125, -0.0033855438232421875, 0.004657745361328125, 0.012701034545898438, 0.02074432373046875, 0.028787612915039062, 0.036830902099609375, 0.04487419128417969, 0.05291748046875, 0.06096076965332031, 0.06900405883789062, 0.07704734802246094, 0.08509063720703125, 0.09313392639160156, 0.10117721557617188, 0.10922050476074219, 0.1172637939453125, 0.1253070831298828, 0.13335037231445312, 0.14139366149902344, 0.14943695068359375, 0.15748023986816406, 0.16552352905273438, 0.1735668182373047, 0.181610107421875, 0.1896533966064453, 0.19769668579101562, 0.20573997497558594, 0.21378326416015625, 0.22182655334472656, 0.22986984252929688, 0.2379131317138672, 0.2459564208984375, 0.2539997100830078, 0.2620429992675781, 0.27008628845214844, 0.27812957763671875, 0.28617286682128906, 0.2942161560058594, 0.3022594451904297, 0.310302734375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 5.0, 8.0, 9.0, 13.0, 16.0, 34.0, 24.0, 44.0, 60.0, 80.0, 84.0, 121.0, 173.0, 249.0, 325.0, 551.0, 872.0, 1541.0, 4059.0, 27822.0, 785126.0, 208547.0, 12377.0, 2801.0, 1247.0, 739.0, 468.0, 326.0, 207.0, 157.0, 110.0, 102.0, 63.0, 54.0, 27.0, 33.0, 19.0, 10.0, 18.0, 9.0, 10.0, 8.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.55126953125, -0.5339508056640625, -0.516632080078125, -0.4993133544921875, -0.48199462890625, -0.4646759033203125, -0.447357177734375, -0.4300384521484375, -0.4127197265625, -0.3954010009765625, -0.378082275390625, -0.3607635498046875, -0.34344482421875, -0.3261260986328125, -0.308807373046875, -0.2914886474609375, -0.274169921875, -0.2568511962890625, -0.239532470703125, -0.2222137451171875, -0.20489501953125, -0.1875762939453125, -0.170257568359375, -0.1529388427734375, -0.1356201171875, -0.1183013916015625, -0.100982666015625, -0.0836639404296875, -0.06634521484375, -0.0490264892578125, -0.031707763671875, -0.0143890380859375, 0.0029296875, 0.0202484130859375, 0.037567138671875, 0.0548858642578125, 0.07220458984375, 0.0895233154296875, 0.106842041015625, 0.1241607666015625, 0.1414794921875, 0.1587982177734375, 0.176116943359375, 0.1934356689453125, 0.21075439453125, 0.2280731201171875, 0.245391845703125, 0.2627105712890625, 0.280029296875, 0.2973480224609375, 0.314666748046875, 0.3319854736328125, 0.34930419921875, 0.3666229248046875, 0.383941650390625, 0.4012603759765625, 0.4185791015625, 0.4358978271484375, 0.453216552734375, 0.4705352783203125, 0.48785400390625, 0.5051727294921875, 0.522491455078125, 0.5398101806640625, 0.55712890625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 3.0, 5.0, 3.0, 3.0, 8.0, 9.0, 13.0, 18.0, 13.0, 22.0, 22.0, 21.0, 26.0, 34.0, 35.0, 48.0, 55.0, 39.0, 45.0, 49.0, 48.0, 41.0, 51.0, 42.0, 54.0, 39.0, 37.0, 34.0, 28.0, 25.0, 24.0, 17.0, 9.0, 16.0, 12.0, 14.0, 14.0, 5.0, 3.0, 5.0, 3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.548828125, -0.5295791625976562, -0.5103302001953125, -0.49108123779296875, -0.471832275390625, -0.45258331298828125, -0.4333343505859375, -0.41408538818359375, -0.39483642578125, -0.37558746337890625, -0.3563385009765625, -0.33708953857421875, -0.317840576171875, -0.29859161376953125, -0.2793426513671875, -0.26009368896484375, -0.2408447265625, -0.22159576416015625, -0.2023468017578125, -0.18309783935546875, -0.163848876953125, -0.14459991455078125, -0.1253509521484375, -0.10610198974609375, -0.08685302734375, -0.06760406494140625, -0.0483551025390625, -0.02910614013671875, -0.009857177734375, 0.00939178466796875, 0.0286407470703125, 0.04788970947265625, 0.067138671875, 0.08638763427734375, 0.1056365966796875, 0.12488555908203125, 0.144134521484375, 0.16338348388671875, 0.1826324462890625, 0.20188140869140625, 0.22113037109375, 0.24037933349609375, 0.2596282958984375, 0.27887725830078125, 0.298126220703125, 0.31737518310546875, 0.3366241455078125, 0.35587310791015625, 0.3751220703125, 0.39437103271484375, 0.4136199951171875, 0.43286895751953125, 0.452117919921875, 0.47136688232421875, 0.4906158447265625, 0.5098648071289062, 0.52911376953125, 0.5483627319335938, 0.5676116943359375, 0.5868606567382812, 0.606109619140625, 0.6253585815429688, 0.6446075439453125, 0.6638565063476562, 0.68310546875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 8.0, 6.0, 9.0, 11.0, 22.0, 28.0, 42.0, 98.0, 157.0, 340.0, 1118.0, 5878.0, 98221.0, 915068.0, 23655.0, 2667.0, 652.0, 232.0, 130.0, 71.0, 55.0, 28.0, 21.0, 8.0, 9.0, 5.0, 9.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23583984375, -0.229156494140625, -0.22247314453125, -0.215789794921875, -0.2091064453125, -0.202423095703125, -0.19573974609375, -0.189056396484375, -0.182373046875, -0.175689697265625, -0.16900634765625, -0.162322998046875, -0.1556396484375, -0.148956298828125, -0.14227294921875, -0.135589599609375, -0.12890625, -0.122222900390625, -0.11553955078125, -0.108856201171875, -0.1021728515625, -0.095489501953125, -0.08880615234375, -0.082122802734375, -0.075439453125, -0.068756103515625, -0.06207275390625, -0.055389404296875, -0.0487060546875, -0.042022705078125, -0.03533935546875, -0.028656005859375, -0.02197265625, -0.015289306640625, -0.00860595703125, -0.001922607421875, 0.0047607421875, 0.011444091796875, 0.01812744140625, 0.024810791015625, 0.031494140625, 0.038177490234375, 0.04486083984375, 0.051544189453125, 0.0582275390625, 0.064910888671875, 0.07159423828125, 0.078277587890625, 0.0849609375, 0.091644287109375, 0.09832763671875, 0.105010986328125, 0.1116943359375, 0.118377685546875, 0.12506103515625, 0.131744384765625, 0.138427734375, 0.145111083984375, 0.15179443359375, 0.158477783203125, 0.1651611328125, 0.171844482421875, 0.17852783203125, 0.185211181640625, 0.19189453125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 8.0, 8.0, 14.0, 11.0, 28.0, 36.0, 51.0, 84.0, 98.0, 145.0, 119.0, 122.0, 79.0, 56.0, 44.0, 17.0, 11.0, 13.0, 6.0, 10.0, 5.0, 4.0, 3.0, 5.0, 8.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.104873657226562e-05, -6.913114339113235e-05, -6.721355020999908e-05, -6.529595702886581e-05, -6.337836384773254e-05, -6.146077066659927e-05, -5.9543177485466003e-05, -5.762558430433273e-05, -5.570799112319946e-05, -5.379039794206619e-05, -5.187280476093292e-05, -4.995521157979965e-05, -4.803761839866638e-05, -4.612002521753311e-05, -4.420243203639984e-05, -4.228483885526657e-05, -4.03672456741333e-05, -3.844965249300003e-05, -3.653205931186676e-05, -3.461446613073349e-05, -3.269687294960022e-05, -3.077927976846695e-05, -2.886168658733368e-05, -2.694409340620041e-05, -2.502650022506714e-05, -2.310890704393387e-05, -2.1191313862800598e-05, -1.9273720681667328e-05, -1.7356127500534058e-05, -1.5438534319400787e-05, -1.3520941138267517e-05, -1.1603347957134247e-05, -9.685754776000977e-06, -7.768161594867706e-06, -5.850568413734436e-06, -3.932975232601166e-06, -2.0153820514678955e-06, -9.778887033462524e-08, 1.819804310798645e-06, 3.7373974919319153e-06, 5.6549906730651855e-06, 7.572583854198456e-06, 9.490177035331726e-06, 1.1407770216464996e-05, 1.3325363397598267e-05, 1.5242956578731537e-05, 1.7160549759864807e-05, 1.9078142940998077e-05, 2.0995736122131348e-05, 2.2913329303264618e-05, 2.4830922484397888e-05, 2.674851566553116e-05, 2.866610884666443e-05, 3.05837020277977e-05, 3.250129520893097e-05, 3.441888839006424e-05, 3.633648157119751e-05, 3.825407475233078e-05, 4.017166793346405e-05, 4.208926111459732e-05, 4.400685429573059e-05, 4.592444747686386e-05, 4.784204065799713e-05, 4.97596338391304e-05, 5.167722702026367e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 8.0, 10.0, 6.0, 11.0, 28.0, 36.0, 47.0, 69.0, 92.0, 153.0, 206.0, 374.0, 722.0, 1586.0, 4441.0, 19073.0, 146880.0, 790390.0, 67681.0, 11080.0, 3056.0, 1168.0, 549.0, 335.0, 187.0, 125.0, 65.0, 50.0, 36.0, 32.0, 30.0, 10.0, 7.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11065673828125, -0.10723400115966797, -0.10381126403808594, -0.1003885269165039, -0.09696578979492188, -0.09354305267333984, -0.09012031555175781, -0.08669757843017578, -0.08327484130859375, -0.07985210418701172, -0.07642936706542969, -0.07300662994384766, -0.06958389282226562, -0.0661611557006836, -0.06273841857910156, -0.05931568145751953, -0.0558929443359375, -0.05247020721435547, -0.04904747009277344, -0.045624732971191406, -0.042201995849609375, -0.038779258728027344, -0.03535652160644531, -0.03193378448486328, -0.02851104736328125, -0.02508831024169922, -0.021665573120117188, -0.018242835998535156, -0.014820098876953125, -0.011397361755371094, -0.007974624633789062, -0.004551887512207031, -0.001129150390625, 0.0022935867309570312, 0.0057163238525390625, 0.009139060974121094, 0.012561798095703125, 0.015984535217285156, 0.019407272338867188, 0.02283000946044922, 0.02625274658203125, 0.02967548370361328, 0.03309822082519531, 0.036520957946777344, 0.039943695068359375, 0.043366432189941406, 0.04678916931152344, 0.05021190643310547, 0.0536346435546875, 0.05705738067626953, 0.06048011779785156, 0.0639028549194336, 0.06732559204101562, 0.07074832916259766, 0.07417106628417969, 0.07759380340576172, 0.08101654052734375, 0.08443927764892578, 0.08786201477050781, 0.09128475189208984, 0.09470748901367188, 0.0981302261352539, 0.10155296325683594, 0.10497570037841797, 0.1083984375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 6.0, 5.0, 6.0, 5.0, 9.0, 14.0, 16.0, 18.0, 20.0, 20.0, 33.0, 47.0, 41.0, 52.0, 68.0, 65.0, 97.0, 80.0, 66.0, 47.0, 57.0, 31.0, 24.0, 23.0, 20.0, 22.0, 18.0, 16.0, 10.0, 12.0, 8.0, 5.0, 3.0, 3.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0806884765625, -0.07828521728515625, -0.0758819580078125, -0.07347869873046875, -0.071075439453125, -0.06867218017578125, -0.0662689208984375, -0.06386566162109375, -0.06146240234375, -0.05905914306640625, -0.0566558837890625, -0.05425262451171875, -0.051849365234375, -0.04944610595703125, -0.0470428466796875, -0.04463958740234375, -0.042236328125, -0.03983306884765625, -0.0374298095703125, -0.03502655029296875, -0.032623291015625, -0.03022003173828125, -0.0278167724609375, -0.02541351318359375, -0.02301025390625, -0.02060699462890625, -0.0182037353515625, -0.01580047607421875, -0.013397216796875, -0.01099395751953125, -0.0085906982421875, -0.00618743896484375, -0.0037841796875, -0.00138092041015625, 0.0010223388671875, 0.00342559814453125, 0.005828857421875, 0.00823211669921875, 0.0106353759765625, 0.01303863525390625, 0.01544189453125, 0.01784515380859375, 0.0202484130859375, 0.02265167236328125, 0.025054931640625, 0.02745819091796875, 0.0298614501953125, 0.03226470947265625, 0.03466796875, 0.03707122802734375, 0.0394744873046875, 0.04187774658203125, 0.044281005859375, 0.04668426513671875, 0.0490875244140625, 0.05149078369140625, 0.05389404296875, 0.05629730224609375, 0.0587005615234375, 0.06110382080078125, 0.063507080078125, 0.06591033935546875, 0.0683135986328125, 0.07071685791015625, 0.0731201171875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 24.0, 108.0, 595.0, 231.0, 30.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1179704666137695, -6.862144470214844, -6.606318473815918, -6.350492477416992, -6.094666481018066, -5.838840484619141, -5.583014488220215, -5.327188491821289, -5.071362495422363, -4.8155364990234375, -4.559710502624512, -4.303884506225586, -4.04805850982666, -3.7922325134277344, -3.5364065170288086, -3.280580520629883, -3.024754524230957, -2.7689285278320312, -2.5131025314331055, -2.2572765350341797, -2.001450538635254, -1.7456245422363281, -1.4897985458374023, -1.2339725494384766, -0.9781465530395508, -0.722320556640625, -0.4664945602416992, -0.21066856384277344, 0.045157432556152344, 0.3009834289550781, 0.5568094253540039, 0.8126354217529297, 1.0684623718261719, 1.3242883682250977, 1.5801143646240234, 1.8359403610229492, 2.091766357421875, 2.347592353820801, 2.6034183502197266, 2.8592443466186523, 3.115070343017578, 3.370896339416504, 3.6267223358154297, 3.8825483322143555, 4.138374328613281, 4.394200325012207, 4.650026321411133, 4.905852317810059, 5.161678314208984, 5.41750431060791, 5.673330307006836, 5.929156303405762, 6.1849822998046875, 6.440808296203613, 6.696634292602539, 6.952460289001465, 7.208286285400391, 7.464112281799316, 7.719938278198242, 7.975764274597168, 8.231590270996094, 8.48741626739502, 8.743242263793945, 8.999068260192871, 9.254894256591797]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 7.0, 5.0, 8.0, 12.0, 9.0, 12.0, 13.0, 14.0, 20.0, 18.0, 22.0, 30.0, 19.0, 24.0, 30.0, 24.0, 45.0, 110.0, 163.0, 83.0, 38.0, 23.0, 29.0, 27.0, 21.0, 25.0, 24.0, 22.0, 22.0, 15.0, 16.0, 10.0, 6.0, 9.0, 8.0, 3.0, 5.0, 6.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.0402026176452637, -1.9682003259658813, -1.896198034286499, -1.8241957426071167, -1.7521934509277344, -1.6801910400390625, -1.6081887483596802, -1.5361864566802979, -1.4641841650009155, -1.3921818733215332, -1.3201795816421509, -1.2481772899627686, -1.1761748790740967, -1.104172706604004, -1.032170295715332, -0.9601680040359497, -0.8881657123565674, -0.8161634206771851, -0.7441611289978027, -0.6721587777137756, -0.6001564860343933, -0.528154194355011, -0.4561518728733063, -0.38414955139160156, -0.31214725971221924, -0.24014495313167572, -0.1681426465511322, -0.09614033997058868, -0.024138033390045166, 0.04786425828933716, 0.11986657977104187, 0.19186890125274658, 0.2638711929321289, 0.33587348461151123, 0.40787580609321594, 0.47987812757492065, 0.551880419254303, 0.6238827109336853, 0.6958850622177124, 0.7678873538970947, 0.839889645576477, 0.9118919372558594, 0.9838942289352417, 1.055896520614624, 1.127898931503296, 1.1999011039733887, 1.2719035148620605, 1.3439058065414429, 1.4159080982208252, 1.4879103899002075, 1.5599126815795898, 1.6319149732589722, 1.7039172649383545, 1.7759196758270264, 1.8479219675064087, 1.919924259185791, 1.9919265508651733, 2.0639288425445557, 2.1359312534332275, 2.2079334259033203, 2.279935836791992, 2.351938009262085, 2.423940420150757, 2.4959425926208496, 2.5679450035095215]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 8.0, 4.0, 8.0, 15.0, 20.0, 28.0, 49.0, 76.0, 92.0, 151.0, 255.0, 377.0, 681.0, 1230.0, 2382.0, 5082.0, 12733.0, 49112.0, 277720.0, 1187424.0, 1828594.0, 661232.0, 123972.0, 26615.0, 8745.0, 3593.0, 1797.0, 941.0, 507.0, 275.0, 222.0, 122.0, 76.0, 44.0, 29.0, 20.0, 15.0, 13.0, 7.0, 9.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21826171875, -0.21128273010253906, -0.20430374145507812, -0.1973247528076172, -0.19034576416015625, -0.1833667755126953, -0.17638778686523438, -0.16940879821777344, -0.1624298095703125, -0.15545082092285156, -0.14847183227539062, -0.1414928436279297, -0.13451385498046875, -0.1275348663330078, -0.12055587768554688, -0.11357688903808594, -0.106597900390625, -0.09961891174316406, -0.09263992309570312, -0.08566093444824219, -0.07868194580078125, -0.07170295715332031, -0.06472396850585938, -0.05774497985839844, -0.0507659912109375, -0.04378700256347656, -0.036808013916015625, -0.029829025268554688, -0.02285003662109375, -0.015871047973632812, -0.008892059326171875, -0.0019130706787109375, 0.00506591796875, 0.012044906616210938, 0.019023895263671875, 0.026002883911132812, 0.03298187255859375, 0.03996086120605469, 0.046939849853515625, 0.05391883850097656, 0.0608978271484375, 0.06787681579589844, 0.07485580444335938, 0.08183479309082031, 0.08881378173828125, 0.09579277038574219, 0.10277175903320312, 0.10975074768066406, 0.116729736328125, 0.12370872497558594, 0.13068771362304688, 0.1376667022705078, 0.14464569091796875, 0.1516246795654297, 0.15860366821289062, 0.16558265686035156, 0.1725616455078125, 0.17954063415527344, 0.18651962280273438, 0.1934986114501953, 0.20047760009765625, 0.2074565887451172, 0.21443557739257812, 0.22141456604003906, 0.2283935546875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 6.0, 5.0, 11.0, 20.0, 16.0, 28.0, 34.0, 39.0, 59.0, 45.0, 67.0, 66.0, 64.0, 69.0, 73.0, 61.0, 44.0, 53.0, 52.0, 33.0, 32.0, 32.0, 26.0, 20.0, 15.0, 9.0, 10.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2041015625, -0.19610595703125, -0.1881103515625, -0.18011474609375, -0.172119140625, -0.16412353515625, -0.1561279296875, -0.14813232421875, -0.14013671875, -0.13214111328125, -0.1241455078125, -0.11614990234375, -0.108154296875, -0.10015869140625, -0.0921630859375, -0.08416748046875, -0.076171875, -0.06817626953125, -0.0601806640625, -0.05218505859375, -0.044189453125, -0.03619384765625, -0.0281982421875, -0.02020263671875, -0.01220703125, -0.00421142578125, 0.0037841796875, 0.01177978515625, 0.019775390625, 0.02777099609375, 0.0357666015625, 0.04376220703125, 0.0517578125, 0.05975341796875, 0.0677490234375, 0.07574462890625, 0.083740234375, 0.09173583984375, 0.0997314453125, 0.10772705078125, 0.11572265625, 0.12371826171875, 0.1317138671875, 0.13970947265625, 0.147705078125, 0.15570068359375, 0.1636962890625, 0.17169189453125, 0.1796875, 0.18768310546875, 0.1956787109375, 0.20367431640625, 0.211669921875, 0.21966552734375, 0.2276611328125, 0.23565673828125, 0.24365234375, 0.25164794921875, 0.2596435546875, 0.26763916015625, 0.275634765625, 0.28363037109375, 0.2916259765625, 0.29962158203125, 0.3076171875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 7.0, 8.0, 7.0, 9.0, 23.0, 40.0, 33.0, 69.0, 83.0, 140.0, 258.0, 394.0, 736.0, 1533.0, 4139.0, 18929.0, 889736.0, 3242241.0, 28174.0, 4574.0, 1423.0, 705.0, 369.0, 227.0, 125.0, 86.0, 55.0, 33.0, 31.0, 25.0, 10.0, 9.0, 8.0, 7.0, 5.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.74853515625, -0.7236709594726562, -0.6988067626953125, -0.6739425659179688, -0.649078369140625, -0.6242141723632812, -0.5993499755859375, -0.5744857788085938, -0.54962158203125, -0.5247573852539062, -0.4998931884765625, -0.47502899169921875, -0.450164794921875, -0.42530059814453125, -0.4004364013671875, -0.37557220458984375, -0.3507080078125, -0.32584381103515625, -0.3009796142578125, -0.27611541748046875, -0.251251220703125, -0.22638702392578125, -0.2015228271484375, -0.17665863037109375, -0.15179443359375, -0.12693023681640625, -0.1020660400390625, -0.07720184326171875, -0.052337646484375, -0.02747344970703125, -0.0026092529296875, 0.02225494384765625, 0.047119140625, 0.07198333740234375, 0.0968475341796875, 0.12171173095703125, 0.146575927734375, 0.17144012451171875, 0.1963043212890625, 0.22116851806640625, 0.24603271484375, 0.27089691162109375, 0.2957611083984375, 0.32062530517578125, 0.345489501953125, 0.37035369873046875, 0.3952178955078125, 0.42008209228515625, 0.4449462890625, 0.46981048583984375, 0.4946746826171875, 0.5195388793945312, 0.544403076171875, 0.5692672729492188, 0.5941314697265625, 0.6189956665039062, 0.64385986328125, 0.6687240600585938, 0.6935882568359375, 0.7184524536132812, 0.743316650390625, 0.7681808471679688, 0.7930450439453125, 0.8179092407226562, 0.8427734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 3.0, 6.0, 7.0, 8.0, 11.0, 12.0, 25.0, 26.0, 32.0, 52.0, 76.0, 116.0, 143.0, 231.0, 374.0, 556.0, 682.0, 631.0, 407.0, 238.0, 145.0, 113.0, 69.0, 28.0, 27.0, 16.0, 15.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.7333984375, -0.7138290405273438, -0.6942596435546875, -0.6746902465820312, -0.655120849609375, -0.6355514526367188, -0.6159820556640625, -0.5964126586914062, -0.57684326171875, -0.5572738647460938, -0.5377044677734375, -0.5181350708007812, -0.498565673828125, -0.47899627685546875, -0.4594268798828125, -0.43985748291015625, -0.4202880859375, -0.40071868896484375, -0.3811492919921875, -0.36157989501953125, -0.342010498046875, -0.32244110107421875, -0.3028717041015625, -0.28330230712890625, -0.26373291015625, -0.24416351318359375, -0.2245941162109375, -0.20502471923828125, -0.185455322265625, -0.16588592529296875, -0.1463165283203125, -0.12674713134765625, -0.107177734375, -0.08760833740234375, -0.0680389404296875, -0.04846954345703125, -0.028900146484375, -0.00933074951171875, 0.0102386474609375, 0.02980804443359375, 0.04937744140625, 0.06894683837890625, 0.0885162353515625, 0.10808563232421875, 0.127655029296875, 0.14722442626953125, 0.1667938232421875, 0.18636322021484375, 0.2059326171875, 0.22550201416015625, 0.2450714111328125, 0.26464080810546875, 0.284210205078125, 0.30377960205078125, 0.3233489990234375, 0.34291839599609375, 0.36248779296875, 0.38205718994140625, 0.4016265869140625, 0.42119598388671875, 0.440765380859375, 0.46033477783203125, 0.4799041748046875, 0.49947357177734375, 0.51904296875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 8.0, 9.0, 33.0, 61.0, 221.0, 432.0, 178.0, 50.0, 7.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-25.28878402709961, -24.83358383178711, -24.37838363647461, -23.923181533813477, -23.467981338500977, -23.012781143188477, -22.557579040527344, -22.102378845214844, -21.647178649902344, -21.191978454589844, -20.736778259277344, -20.28157615661621, -19.82637596130371, -19.37117576599121, -18.915973663330078, -18.460773468017578, -18.005573272705078, -17.550373077392578, -17.095172882080078, -16.639970779418945, -16.184770584106445, -15.729570388793945, -15.274369239807129, -14.819168090820312, -14.363967895507812, -13.908767700195312, -13.453566551208496, -12.99836540222168, -12.54316520690918, -12.08796501159668, -11.632763862609863, -11.177562713623047, -10.722362518310547, -10.267162322998047, -9.81196117401123, -9.356760025024414, -8.901559829711914, -8.446359634399414, -7.991158485412598, -7.5359578132629395, -7.080757141113281, -6.625556468963623, -6.170355796813965, -5.715155124664307, -5.259954452514648, -4.80475378036499, -4.349553108215332, -3.894352436065674, -3.4391515254974365, -2.9839508533477783, -2.52875018119812, -2.073549509048462, -1.6183488368988037, -1.1631481647491455, -0.7079474925994873, -0.2527468204498291, 0.2024538516998291, 0.6576545238494873, 1.1128551959991455, 1.5680558681488037, 2.023256540298462, 2.47845721244812, 2.9336578845977783, 3.3888585567474365, 3.8440592288970947]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 8.0, 7.0, 6.0, 29.0, 27.0, 32.0, 55.0, 78.0, 91.0, 115.0, 120.0, 113.0, 101.0, 71.0, 56.0, 37.0, 22.0, 10.0, 16.0, 8.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.560724258422852, -8.33340835571289, -8.106093406677246, -7.878777503967285, -7.651461601257324, -7.4241461753845215, -7.196830749511719, -6.969514846801758, -6.742198944091797, -6.514883518218994, -6.287567615509033, -6.0602521896362305, -5.8329362869262695, -5.605620861053467, -5.378305435180664, -5.150989532470703, -4.9236741065979, -4.696358680725098, -4.469042778015137, -4.241727352142334, -4.014411449432373, -3.7870960235595703, -3.5597803592681885, -3.3324646949768066, -3.105149030685425, -2.877833366394043, -2.650517702102661, -2.4232020378112793, -2.1958866119384766, -1.9685708284378052, -1.741255283355713, -1.513939619064331, -1.2866239547729492, -1.0593082904815674, -0.8319926857948303, -0.6046770811080933, -0.3773614168167114, -0.1500457525253296, 0.0772697925567627, 0.30458545684814453, 0.5319011211395264, 0.7592167854309082, 0.9865323901176453, 1.2138479948043823, 1.4411636590957642, 1.668479323387146, 1.8957948684692383, 2.12311053276062, 2.350426197052002, 2.577741861343384, 2.8050575256347656, 3.0323729515075684, 3.2596888542175293, 3.487004280090332, 3.714319944381714, 3.9416356086730957, 4.168951034545898, 4.396266460418701, 4.623582363128662, 4.850897789001465, 5.078213691711426, 5.3055291175842285, 5.532844543457031, 5.760160446166992, 5.987476348876953]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 6.0, 10.0, 6.0, 7.0, 17.0, 28.0, 36.0, 42.0, 62.0, 134.0, 312.0, 779.0, 2406.0, 8840.0, 49230.0, 716536.0, 237999.0, 24144.0, 5323.0, 1557.0, 526.0, 234.0, 119.0, 61.0, 34.0, 25.0, 19.0, 14.0, 7.0, 9.0, 7.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.472900390625, -0.45891571044921875, -0.4449310302734375, -0.43094635009765625, -0.416961669921875, -0.40297698974609375, -0.3889923095703125, -0.37500762939453125, -0.36102294921875, -0.34703826904296875, -0.3330535888671875, -0.31906890869140625, -0.305084228515625, -0.29109954833984375, -0.2771148681640625, -0.26313018798828125, -0.2491455078125, -0.23516082763671875, -0.2211761474609375, -0.20719146728515625, -0.193206787109375, -0.17922210693359375, -0.1652374267578125, -0.15125274658203125, -0.13726806640625, -0.12328338623046875, -0.1092987060546875, -0.09531402587890625, -0.081329345703125, -0.06734466552734375, -0.0533599853515625, -0.03937530517578125, -0.025390625, -0.01140594482421875, 0.0025787353515625, 0.01656341552734375, 0.030548095703125, 0.04453277587890625, 0.0585174560546875, 0.07250213623046875, 0.08648681640625, 0.10047149658203125, 0.1144561767578125, 0.12844085693359375, 0.142425537109375, 0.15641021728515625, 0.1703948974609375, 0.18437957763671875, 0.1983642578125, 0.21234893798828125, 0.2263336181640625, 0.24031829833984375, 0.254302978515625, 0.26828765869140625, 0.2822723388671875, 0.29625701904296875, 0.31024169921875, 0.32422637939453125, 0.3382110595703125, 0.35219573974609375, 0.366180419921875, 0.38016510009765625, 0.3941497802734375, 0.40813446044921875, 0.422119140625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 14.0, 21.0, 37.0, 59.0, 98.0, 113.0, 123.0, 125.0, 118.0, 99.0, 64.0, 58.0, 38.0, 14.0, 10.0, 5.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78271484375, -0.7641830444335938, -0.7456512451171875, -0.7271194458007812, -0.708587646484375, -0.6900558471679688, -0.6715240478515625, -0.6529922485351562, -0.63446044921875, -0.6159286499023438, -0.5973968505859375, -0.5788650512695312, -0.560333251953125, -0.5418014526367188, -0.5232696533203125, -0.5047378540039062, -0.4862060546875, -0.46767425537109375, -0.4491424560546875, -0.43061065673828125, -0.412078857421875, -0.39354705810546875, -0.3750152587890625, -0.35648345947265625, -0.33795166015625, -0.31941986083984375, -0.3008880615234375, -0.28235626220703125, -0.263824462890625, -0.24529266357421875, -0.2267608642578125, -0.20822906494140625, -0.189697265625, -0.17116546630859375, -0.1526336669921875, -0.13410186767578125, -0.115570068359375, -0.09703826904296875, -0.0785064697265625, -0.05997467041015625, -0.04144287109375, -0.02291107177734375, -0.0043792724609375, 0.01415252685546875, 0.032684326171875, 0.05121612548828125, 0.0697479248046875, 0.08827972412109375, 0.1068115234375, 0.12534332275390625, 0.1438751220703125, 0.16240692138671875, 0.180938720703125, 0.19947052001953125, 0.2180023193359375, 0.23653411865234375, 0.25506591796875, 0.27359771728515625, 0.2921295166015625, 0.31066131591796875, 0.329193115234375, 0.34772491455078125, 0.3662567138671875, 0.38478851318359375, 0.4033203125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 6.0, 16.0, 18.0, 30.0, 56.0, 76.0, 151.0, 240.0, 518.0, 1360.0, 6928.0, 341472.0, 687974.0, 7173.0, 1340.0, 556.0, 245.0, 142.0, 82.0, 66.0, 39.0, 26.0, 9.0, 13.0, 12.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.599609375, -0.5796279907226562, -0.5596466064453125, -0.5396652221679688, -0.519683837890625, -0.49970245361328125, -0.4797210693359375, -0.45973968505859375, -0.43975830078125, -0.41977691650390625, -0.3997955322265625, -0.37981414794921875, -0.359832763671875, -0.33985137939453125, -0.3198699951171875, -0.29988861083984375, -0.2799072265625, -0.25992584228515625, -0.2399444580078125, -0.21996307373046875, -0.199981689453125, -0.18000030517578125, -0.1600189208984375, -0.14003753662109375, -0.12005615234375, -0.10007476806640625, -0.0800933837890625, -0.06011199951171875, -0.040130615234375, -0.02014923095703125, -0.0001678466796875, 0.01981353759765625, 0.039794921875, 0.05977630615234375, 0.0797576904296875, 0.09973907470703125, 0.119720458984375, 0.13970184326171875, 0.1596832275390625, 0.17966461181640625, 0.19964599609375, 0.21962738037109375, 0.2396087646484375, 0.25959014892578125, 0.279571533203125, 0.29955291748046875, 0.3195343017578125, 0.33951568603515625, 0.3594970703125, 0.37947845458984375, 0.3994598388671875, 0.41944122314453125, 0.439422607421875, 0.45940399169921875, 0.4793853759765625, 0.49936676025390625, 0.51934814453125, 0.5393295288085938, 0.5593109130859375, 0.5792922973632812, 0.599273681640625, 0.6192550659179688, 0.6392364501953125, 0.6592178344726562, 0.67919921875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 7.0, 6.0, 9.0, 13.0, 10.0, 12.0, 19.0, 19.0, 30.0, 21.0, 52.0, 46.0, 71.0, 87.0, 95.0, 88.0, 74.0, 57.0, 46.0, 40.0, 42.0, 34.0, 24.0, 14.0, 23.0, 15.0, 10.0, 6.0, 11.0, 7.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0966796875, -1.0644149780273438, -1.0321502685546875, -0.9998855590820312, -0.967620849609375, -0.9353561401367188, -0.9030914306640625, -0.8708267211914062, -0.83856201171875, -0.8062973022460938, -0.7740325927734375, -0.7417678833007812, -0.709503173828125, -0.6772384643554688, -0.6449737548828125, -0.6127090454101562, -0.5804443359375, -0.5481796264648438, -0.5159149169921875, -0.48365020751953125, -0.451385498046875, -0.41912078857421875, -0.3868560791015625, -0.35459136962890625, -0.32232666015625, -0.29006195068359375, -0.2577972412109375, -0.22553253173828125, -0.193267822265625, -0.16100311279296875, -0.1287384033203125, -0.09647369384765625, -0.064208984375, -0.03194427490234375, 0.0003204345703125, 0.03258514404296875, 0.064849853515625, 0.09711456298828125, 0.1293792724609375, 0.16164398193359375, 0.19390869140625, 0.22617340087890625, 0.2584381103515625, 0.29070281982421875, 0.322967529296875, 0.35523223876953125, 0.3874969482421875, 0.41976165771484375, 0.4520263671875, 0.48429107666015625, 0.5165557861328125, 0.5488204956054688, 0.581085205078125, 0.6133499145507812, 0.6456146240234375, 0.6778793334960938, 0.71014404296875, 0.7424087524414062, 0.7746734619140625, 0.8069381713867188, 0.839202880859375, 0.8714675903320312, 0.9037322998046875, 0.9359970092773438, 0.96826171875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 6.0, 10.0, 9.0, 8.0, 11.0, 9.0, 13.0, 27.0, 34.0, 58.0, 94.0, 195.0, 397.0, 824.0, 2592.0, 11199.0, 112698.0, 887798.0, 25612.0, 4581.0, 1274.0, 496.0, 254.0, 118.0, 67.0, 48.0, 33.0, 28.0, 21.0, 11.0, 10.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.07623291015625, -0.0737905502319336, -0.07134819030761719, -0.06890583038330078, -0.06646347045898438, -0.06402111053466797, -0.06157875061035156, -0.059136390686035156, -0.05669403076171875, -0.054251670837402344, -0.05180931091308594, -0.04936695098876953, -0.046924591064453125, -0.04448223114013672, -0.04203987121582031, -0.039597511291503906, -0.0371551513671875, -0.034712791442871094, -0.03227043151855469, -0.02982807159423828, -0.027385711669921875, -0.02494335174560547, -0.022500991821289062, -0.020058631896972656, -0.01761627197265625, -0.015173912048339844, -0.012731552124023438, -0.010289192199707031, -0.007846832275390625, -0.005404472351074219, -0.0029621124267578125, -0.0005197525024414062, 0.001922607421875, 0.004364967346191406, 0.0068073272705078125, 0.009249687194824219, 0.011692047119140625, 0.014134407043457031, 0.016576766967773438, 0.019019126892089844, 0.02146148681640625, 0.023903846740722656, 0.026346206665039062, 0.02878856658935547, 0.031230926513671875, 0.03367328643798828, 0.03611564636230469, 0.038558006286621094, 0.0410003662109375, 0.043442726135253906, 0.04588508605957031, 0.04832744598388672, 0.050769805908203125, 0.05321216583251953, 0.05565452575683594, 0.058096885681152344, 0.06053924560546875, 0.06298160552978516, 0.06542396545410156, 0.06786632537841797, 0.07030868530273438, 0.07275104522705078, 0.07519340515136719, 0.0776357650756836, 0.080078125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 2.0, 4.0, 2.0, 4.0, 4.0, 2.0, 6.0, 2.0, 5.0, 4.0, 5.0, 18.0, 12.0, 15.0, 19.0, 27.0, 24.0, 34.0, 37.0, 34.0, 59.0, 69.0, 76.0, 55.0, 73.0, 57.0, 56.0, 52.0, 40.0, 37.0, 32.0, 25.0, 26.0, 13.0, 18.0, 6.0, 4.0, 6.0, 10.0, 5.0, 6.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0], "bins": [-2.9981136322021484e-05, -2.916250377893448e-05, -2.8343871235847473e-05, -2.7525238692760468e-05, -2.6706606149673462e-05, -2.5887973606586456e-05, -2.506934106349945e-05, -2.4250708520412445e-05, -2.343207597732544e-05, -2.2613443434238434e-05, -2.1794810891151428e-05, -2.0976178348064423e-05, -2.0157545804977417e-05, -1.933891326189041e-05, -1.8520280718803406e-05, -1.77016481757164e-05, -1.6883015632629395e-05, -1.606438308954239e-05, -1.5245750546455383e-05, -1.4427118003368378e-05, -1.3608485460281372e-05, -1.2789852917194366e-05, -1.197122037410736e-05, -1.1152587831020355e-05, -1.033395528793335e-05, -9.515322744846344e-06, -8.696690201759338e-06, -7.878057658672333e-06, -7.059425115585327e-06, -6.2407925724983215e-06, -5.422160029411316e-06, -4.60352748632431e-06, -3.7848949432373047e-06, -2.966262400150299e-06, -2.1476298570632935e-06, -1.3289973139762878e-06, -5.103647708892822e-07, 3.082677721977234e-07, 1.126900315284729e-06, 1.9455328583717346e-06, 2.7641654014587402e-06, 3.582797944545746e-06, 4.4014304876327515e-06, 5.220063030719757e-06, 6.038695573806763e-06, 6.857328116893768e-06, 7.675960659980774e-06, 8.49459320306778e-06, 9.313225746154785e-06, 1.013185828924179e-05, 1.0950490832328796e-05, 1.1769123375415802e-05, 1.2587755918502808e-05, 1.3406388461589813e-05, 1.4225021004676819e-05, 1.5043653547763824e-05, 1.586228609085083e-05, 1.6680918633937836e-05, 1.749955117702484e-05, 1.8318183720111847e-05, 1.9136816263198853e-05, 1.9955448806285858e-05, 2.0774081349372864e-05, 2.159271389245987e-05, 2.2411346435546875e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 7.0, 4.0, 10.0, 13.0, 11.0, 24.0, 27.0, 45.0, 73.0, 92.0, 99.0, 171.0, 315.0, 482.0, 818.0, 1430.0, 2653.0, 5172.0, 11522.0, 29715.0, 129760.0, 769622.0, 60892.0, 19032.0, 7876.0, 3832.0, 1965.0, 1100.0, 635.0, 379.0, 271.0, 164.0, 103.0, 71.0, 48.0, 38.0, 19.0, 22.0, 9.0, 9.0, 4.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0345458984375, -0.03344154357910156, -0.032337188720703125, -0.031232833862304688, -0.03012847900390625, -0.029024124145507812, -0.027919769287109375, -0.026815414428710938, -0.0257110595703125, -0.024606704711914062, -0.023502349853515625, -0.022397994995117188, -0.02129364013671875, -0.020189285278320312, -0.019084930419921875, -0.017980575561523438, -0.016876220703125, -0.015771865844726562, -0.014667510986328125, -0.013563156127929688, -0.01245880126953125, -0.011354446411132812, -0.010250091552734375, -0.009145736694335938, -0.0080413818359375, -0.0069370269775390625, -0.005832672119140625, -0.0047283172607421875, -0.00362396240234375, -0.0025196075439453125, -0.001415252685546875, -0.0003108978271484375, 0.00079345703125, 0.0018978118896484375, 0.003002166748046875, 0.0041065216064453125, 0.00521087646484375, 0.0063152313232421875, 0.007419586181640625, 0.008523941040039062, 0.0096282958984375, 0.010732650756835938, 0.011837005615234375, 0.012941360473632812, 0.01404571533203125, 0.015150070190429688, 0.016254425048828125, 0.017358779907226562, 0.018463134765625, 0.019567489624023438, 0.020671844482421875, 0.021776199340820312, 0.02288055419921875, 0.023984909057617188, 0.025089263916015625, 0.026193618774414062, 0.0272979736328125, 0.028402328491210938, 0.029506683349609375, 0.030611038208007812, 0.03171539306640625, 0.03281974792480469, 0.033924102783203125, 0.03502845764160156, 0.0361328125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 5.0, 2.0, 2.0, 4.0, 5.0, 8.0, 7.0, 6.0, 12.0, 12.0, 13.0, 18.0, 16.0, 31.0, 36.0, 49.0, 64.0, 78.0, 111.0, 127.0, 95.0, 63.0, 48.0, 27.0, 23.0, 26.0, 18.0, 17.0, 11.0, 10.0, 15.0, 9.0, 6.0, 2.0, 5.0, 3.0, 3.0, 3.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.06610107421875, -0.06426668167114258, -0.062432289123535156, -0.060597896575927734, -0.05876350402832031, -0.05692911148071289, -0.05509471893310547, -0.05326032638549805, -0.051425933837890625, -0.0495915412902832, -0.04775714874267578, -0.04592275619506836, -0.04408836364746094, -0.042253971099853516, -0.040419578552246094, -0.03858518600463867, -0.03675079345703125, -0.03491640090942383, -0.033082008361816406, -0.031247615814208984, -0.029413223266601562, -0.02757883071899414, -0.02574443817138672, -0.023910045623779297, -0.022075653076171875, -0.020241260528564453, -0.01840686798095703, -0.01657247543334961, -0.014738082885742188, -0.012903690338134766, -0.011069297790527344, -0.009234905242919922, -0.0074005126953125, -0.005566120147705078, -0.0037317276000976562, -0.0018973350524902344, -6.29425048828125e-05, 0.0017714500427246094, 0.0036058425903320312, 0.005440235137939453, 0.007274627685546875, 0.009109020233154297, 0.010943412780761719, 0.01277780532836914, 0.014612197875976562, 0.016446590423583984, 0.018280982971191406, 0.020115375518798828, 0.02194976806640625, 0.023784160614013672, 0.025618553161621094, 0.027452945709228516, 0.029287338256835938, 0.03112173080444336, 0.03295612335205078, 0.0347905158996582, 0.036624908447265625, 0.03845930099487305, 0.04029369354248047, 0.04212808609008789, 0.04396247863769531, 0.045796871185302734, 0.047631263732910156, 0.04946565628051758, 0.051300048828125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 10.0, 24.0, 27.0, 54.0, 146.0, 478.0, 98.0, 59.0, 30.0, 22.0, 13.0, 12.0, 6.0, 8.0, 6.0, 1.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4051713943481445, -1.3128323554992676, -1.2204933166503906, -1.1281542778015137, -1.0358152389526367, -0.9434762001037598, -0.8511371612548828, -0.7587981224060059, -0.6664590835571289, -0.574120044708252, -0.481781005859375, -0.38944196701049805, -0.2971029281616211, -0.20476388931274414, -0.11242485046386719, -0.020085811614990234, 0.07225322723388672, 0.16459226608276367, 0.2569313049316406, 0.3492703437805176, 0.44160938262939453, 0.5339484214782715, 0.6262874603271484, 0.7186264991760254, 0.8109655380249023, 0.9033045768737793, 0.9956436157226562, 1.0879826545715332, 1.1803216934204102, 1.272660732269287, 1.364999771118164, 1.457338809967041, 1.549677848815918, 1.642016887664795, 1.7343559265136719, 1.8266949653625488, 1.9190340042114258, 2.0113730430603027, 2.1037120819091797, 2.1960511207580566, 2.2883901596069336, 2.3807291984558105, 2.4730682373046875, 2.5654072761535645, 2.6577463150024414, 2.7500853538513184, 2.8424243927001953, 2.9347634315490723, 3.027102470397949, 3.119441509246826, 3.211780548095703, 3.30411958694458, 3.396458625793457, 3.488797664642334, 3.581136703491211, 3.673475742340088, 3.765814781188965, 3.858153820037842, 3.9504928588867188, 4.042831897735596, 4.135170936584473, 4.22750997543335, 4.319849014282227, 4.4121880531311035, 4.5045270919799805]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 8.0, 2.0, 6.0, 11.0, 8.0, 8.0, 15.0, 17.0, 17.0, 26.0, 25.0, 30.0, 39.0, 40.0, 168.0, 303.0, 46.0, 37.0, 33.0, 14.0, 28.0, 20.0, 11.0, 13.0, 19.0, 8.0, 5.0, 8.0, 7.0, 6.0, 5.0, 5.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.8578991889953613, -2.7718162536621094, -2.6857330799102783, -2.5996501445770264, -2.5135669708251953, -2.4274840354919434, -2.3414011001586914, -2.2553181648254395, -2.1692349910736084, -2.0831520557403564, -1.9970688819885254, -1.9109859466552734, -1.824902892112732, -1.7388198375701904, -1.6527369022369385, -1.566653847694397, -1.4805707931518555, -1.394487738609314, -1.3084046840667725, -1.2223217487335205, -1.136238694190979, -1.0501556396484375, -0.9640726447105408, -0.877989649772644, -0.7919065952301025, -0.705823540687561, -0.6197405457496643, -0.5336575508117676, -0.4475744962692261, -0.36149147152900696, -0.27540844678878784, -0.1893254518508911, -0.10324215888977051, -0.01715913414955139, 0.06892389059066772, 0.15500691533088684, 0.24108994007110596, 0.3271729648113251, 0.4132559895515442, 0.4993389844894409, 0.5854220390319824, 0.6715050935745239, 0.7575880885124207, 0.8436710834503174, 0.9297541379928589, 1.0158371925354004, 1.1019201278686523, 1.1880031824111938, 1.2740862369537354, 1.3601692914962769, 1.4462523460388184, 1.5323352813720703, 1.6184183359146118, 1.7045013904571533, 1.7905843257904053, 1.8766673803329468, 1.9627504348754883, 2.0488333702087402, 2.1349165439605713, 2.2209994792938232, 2.3070826530456543, 2.3931655883789062, 2.479248523712158, 2.56533145904541, 2.651414632797241]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 5.0, 2.0, 10.0, 10.0, 9.0, 9.0, 25.0, 23.0, 25.0, 26.0, 47.0, 47.0, 59.0, 261.0, 147.0, 55.0, 37.0, 34.0, 29.0, 26.0, 30.0, 25.0, 21.0, 10.0, 6.0, 7.0, 4.0, 5.0, 0.0, 3.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.296630859375, -0.2883739471435547, -0.2801170349121094, -0.27186012268066406, -0.26360321044921875, -0.25534629821777344, -0.24708938598632812, -0.2388324737548828, -0.2305755615234375, -0.2223186492919922, -0.21406173706054688, -0.20580482482910156, -0.19754791259765625, -0.18929100036621094, -0.18103408813476562, -0.1727771759033203, -0.164520263671875, -0.1562633514404297, -0.14800643920898438, -0.13974952697753906, -0.13149261474609375, -0.12323570251464844, -0.11497879028320312, -0.10672187805175781, -0.0984649658203125, -0.09020805358886719, -0.08195114135742188, -0.07369422912597656, -0.06543731689453125, -0.05718040466308594, -0.048923492431640625, -0.04066658020019531, -0.03240966796875, -0.024152755737304688, -0.015895843505859375, -0.0076389312744140625, 0.00061798095703125, 0.008874893188476562, 0.017131805419921875, 0.025388717651367188, 0.0336456298828125, 0.04190254211425781, 0.050159454345703125, 0.05841636657714844, 0.06667327880859375, 0.07493019104003906, 0.08318710327148438, 0.09144401550292969, 0.099700927734375, 0.10795783996582031, 0.11621475219726562, 0.12447166442871094, 0.13272857666015625, 0.14098548889160156, 0.14924240112304688, 0.1574993133544922, 0.1657562255859375, 0.1740131378173828, 0.18227005004882812, 0.19052696228027344, 0.19878387451171875, 0.20704078674316406, 0.21529769897460938, 0.2235546112060547, 0.2318115234375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 8.0, 4.0, 0.0, 0.0, 11.0, 2.0, 1.0, 1.0, 5.0, 13.0, 11.0, 34.0, 40.0, 58.0, 121.0, 533.0, 7728.0, 8375851.0, 3450.0, 464.0, 106.0, 45.0, 23.0, 17.0, 24.0, 13.0, 3.0, 5.0, 12.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0], "bins": [-4.04733943939209, -3.904789686203003, -3.762239933013916, -3.619690179824829, -3.477140426635742, -3.3345906734466553, -3.1920409202575684, -3.0494911670684814, -2.9069414138793945, -2.7643916606903076, -2.6218419075012207, -2.479292154312134, -2.336742401123047, -2.19419264793396, -2.051642894744873, -1.9090931415557861, -1.7665433883666992, -1.6239936351776123, -1.4814438819885254, -1.3388941287994385, -1.1963443756103516, -1.0537946224212646, -0.9112448692321777, -0.7686951160430908, -0.6261453628540039, -0.483595609664917, -0.3410458564758301, -0.19849610328674316, -0.05594635009765625, 0.08660340309143066, 0.22915315628051758, 0.3717029094696045, 0.5142531394958496, 0.6568028926849365, 0.7993526458740234, 0.9419023990631104, 1.0844521522521973, 1.2270019054412842, 1.369551658630371, 1.512101411819458, 1.654651165008545, 1.7972009181976318, 1.9397506713867188, 2.0823004245758057, 2.2248501777648926, 2.3673999309539795, 2.5099496841430664, 2.6524994373321533, 2.7950491905212402, 2.937598943710327, 3.080148696899414, 3.222698450088501, 3.365248203277588, 3.507797956466675, 3.6503477096557617, 3.7928974628448486, 3.9354472160339355, 4.077997207641602, 4.220546722412109, 4.363096237182617, 4.505646228790283, 4.648196220397949, 4.790745735168457, 4.933295249938965, 5.075845241546631]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 4.0, 3.0, 4.0, 4.0, 8.0, 4.0, 3.0, 5.0, 4.0, 3.0, 2.0, 5.0, 4.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.315582275390625, -2.2522382736206055, -2.188894033432007, -2.1255500316619873, -2.0622057914733887, -1.9988617897033691, -1.9355177879333496, -1.8721736669540405, -1.8088295459747314, -1.7454854249954224, -1.6821413040161133, -1.6187973022460938, -1.5554531812667847, -1.4921090602874756, -1.428765058517456, -1.365420937538147, -1.302076816558838, -1.2387326955795288, -1.1753885746002197, -1.1120445728302002, -1.0487004518508911, -0.985356330871582, -0.9220122694969177, -0.8586682081222534, -0.7953240871429443, -0.7319799661636353, -0.668635904788971, -0.6052918434143066, -0.5419477224349976, -0.47860363125801086, -0.41525954008102417, -0.3519154489040375, -0.2885715961456299, -0.2252275049686432, -0.1618834137916565, -0.0985393226146698, -0.035195231437683105, 0.02814885973930359, 0.09149295091629028, 0.15483704209327698, 0.21818113327026367, 0.28152522444725037, 0.34486931562423706, 0.40821340680122375, 0.47155749797821045, 0.5349016189575195, 0.5982456803321838, 0.6615897417068481, 0.7249338626861572, 0.7882779836654663, 0.8516220450401306, 0.9149661064147949, 0.978310227394104, 1.041654348373413, 1.1049983501434326, 1.1683424711227417, 1.2316865921020508, 1.2950307130813599, 1.358374834060669, 1.4217188358306885, 1.4850629568099976, 1.5484070777893066, 1.6117510795593262, 1.6750952005386353, 1.7384393215179443]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 8.0, 4.0, 4.0, 8.0, 4.0, 6.0, 12.0, 21.0, 31.0, 36.0, 49.0, 64.0, 101.0, 180.0, 290.0, 558.0, 1624.0, 6994.0, 43752.0, 289248.0, 154532.0, 20601.0, 3944.0, 1093.0, 465.0, 239.0, 142.0, 78.0, 55.0, 37.0, 24.0, 19.0, 15.0, 9.0, 3.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.484375, -2.40625, -2.328125, -2.25, -2.171875, -2.09375, -2.015625, -1.9375, -1.859375, -1.78125, -1.703125, -1.625, -1.546875, -1.46875, -1.390625, -1.3125, -1.234375, -1.15625, -1.078125, -1.0, -0.921875, -0.84375, -0.765625, -0.6875, -0.609375, -0.53125, -0.453125, -0.375, -0.296875, -0.21875, -0.140625, -0.0625, 0.015625, 0.09375, 0.171875, 0.25, 0.328125, 0.40625, 0.484375, 0.5625, 0.640625, 0.71875, 0.796875, 0.875, 0.953125, 1.03125, 1.109375, 1.1875, 1.265625, 1.34375, 1.421875, 1.5, 1.578125, 1.65625, 1.734375, 1.8125, 1.890625, 1.96875, 2.046875, 2.125, 2.203125, 2.28125, 2.359375, 2.4375, 2.515625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 18.0, 20.0, 28.0, 51.0, 75.0, 123.0, 159.0, 154.0, 127.0, 95.0, 55.0, 45.0, 25.0, 17.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81396484375, -0.7945938110351562, -0.7752227783203125, -0.7558517456054688, -0.736480712890625, -0.7171096801757812, -0.6977386474609375, -0.6783676147460938, -0.65899658203125, -0.6396255493164062, -0.6202545166015625, -0.6008834838867188, -0.581512451171875, -0.5621414184570312, -0.5427703857421875, -0.5233993530273438, -0.5040283203125, -0.48465728759765625, -0.4652862548828125, -0.44591522216796875, -0.426544189453125, -0.40717315673828125, -0.3878021240234375, -0.36843109130859375, -0.34906005859375, -0.32968902587890625, -0.3103179931640625, -0.29094696044921875, -0.271575927734375, -0.25220489501953125, -0.2328338623046875, -0.21346282958984375, -0.194091796875, -0.17472076416015625, -0.1553497314453125, -0.13597869873046875, -0.116607666015625, -0.09723663330078125, -0.0778656005859375, -0.05849456787109375, -0.03912353515625, -0.01975250244140625, -0.0003814697265625, 0.01898956298828125, 0.038360595703125, 0.05773162841796875, 0.0771026611328125, 0.09647369384765625, 0.1158447265625, 0.13521575927734375, 0.1545867919921875, 0.17395782470703125, 0.193328857421875, 0.21269989013671875, 0.2320709228515625, 0.25144195556640625, 0.27081298828125, 0.29018402099609375, 0.3095550537109375, 0.32892608642578125, 0.348297119140625, 0.36766815185546875, 0.3870391845703125, 0.40641021728515625, 0.42578125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 4.0, 2.0, 9.0, 8.0, 18.0, 27.0, 60.0, 80.0, 76.0, 71.0, 58.0, 22.0, 12.0, 11.0, 5.0, 3.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.408954620361328, -2.3510591983795166, -2.293164014816284, -2.2352685928344727, -2.177373170852661, -2.1194777488708496, -2.061582565307617, -2.0036871433258057, -1.9457917213439941, -1.8878964185714722, -1.8300009965896606, -1.7721056938171387, -1.7142102718353271, -1.6563149690628052, -1.5984196662902832, -1.5405242443084717, -1.4826289415359497, -1.4247336387634277, -1.3668382167816162, -1.3089429140090942, -1.2510474920272827, -1.1931521892547607, -1.1352567672729492, -1.0773614645004272, -1.0194661617279053, -0.9615707993507385, -0.9036754369735718, -0.8457801342010498, -0.7878847122192383, -0.7299894094467163, -0.6720940470695496, -0.6141986846923828, -0.5563031435012817, -0.498407781124115, -0.44051241874694824, -0.3826170861721039, -0.32472172379493713, -0.2668263614177704, -0.20893102884292603, -0.15103566646575928, -0.09314030408859253, -0.03524494916200638, 0.022650405764579773, 0.08054575324058533, 0.13844111561775208, 0.19633647799491882, 0.2542318105697632, 0.31212717294692993, 0.3700225353240967, 0.4279178977012634, 0.4858132600784302, 0.5437085628509521, 0.6016039848327637, 0.6594992876052856, 0.7173946499824524, 0.7752900123596191, 0.8331853747367859, 0.8910807371139526, 0.9489760994911194, 1.0068714618682861, 1.064766764640808, 1.1226621866226196, 1.1805574893951416, 1.2384529113769531, 1.296348214149475]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 4.0, 9.0, 5.0, 33.0, 72.0, 124.0, 91.0, 62.0, 30.0, 14.0, 12.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.102263927459717, -2.031590700149536, -1.960917353630066, -1.8902440071105957, -1.819570779800415, -1.7488974332809448, -1.6782240867614746, -1.607550859451294, -1.5368775129318237, -1.4662041664123535, -1.3955309391021729, -1.3248575925827026, -1.2541842460632324, -1.1835110187530518, -1.1128376722335815, -1.0421643257141113, -0.9714910984039307, -0.9008178114891052, -0.8301445245742798, -0.7594711780548096, -0.6887978911399841, -0.6181246042251587, -0.5474512577056885, -0.47677797079086304, -0.4061046838760376, -0.33543139696121216, -0.26475808024406433, -0.1940847784280777, -0.12341147661209106, -0.052738189697265625, 0.017935127019882202, 0.08860844373703003, 0.15928173065185547, 0.2299550324678421, 0.30062833428382874, 0.37130165100097656, 0.441974937915802, 0.5126482248306274, 0.5833215713500977, 0.6539948582649231, 0.7246681451797485, 0.795341432094574, 0.8660147190093994, 0.9366880655288696, 1.0073614120483398, 1.0780346393585205, 1.1487079858779907, 1.219381332397461, 1.2900545597076416, 1.3607279062271118, 1.4314011335372925, 1.5020744800567627, 1.5727477073669434, 1.6434210538864136, 1.7140944004058838, 1.7847676277160645, 1.8554409742355347, 1.9261143207550049, 1.9967875480651855, 2.067460775375366, 2.138134241104126, 2.2088074684143066, 2.2794806957244873, 2.350154161453247, 2.4208273887634277]}, "eval/loss": 4.14947509765625, "eval/wer": 2.392959143197144, "eval/runtime": 957.1338, "eval/samples_per_second": 2.76, "eval/steps_per_second": 0.231, "train/train_runtime": 5681.1629, "train/train_samples_per_second": 5.023, "train/train_steps_per_second": 0.105, "train/total_flos": 0.0, "train/train_loss": 4.265389429599749, "_wandb": {"runtime": 6994}}