diff --git "a/wandb/run-20220504_142129-w4rlzz90/files/wandb-summary.json" "b/wandb/run-20220504_142129-w4rlzz90/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220504_142129-w4rlzz90/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 2.8303, "train/learning_rate": 0.00012137730873866748, "train/epoch": 0.15, "train/global_step": 500, "_runtime": 4820, "_timestamp": 1651678909, "_step": 500, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 59.0, 839.0, 112.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-14.895102500915527, -14.636402130126953, -14.377700805664062, -14.119000434875488, -13.860299110412598, -13.601598739624023, -13.342897415161133, -13.084197044372559, -12.825496673583984, -12.56679630279541, -12.30809497833252, -12.049394607543945, -11.790693283081055, -11.53199291229248, -11.27329158782959, -11.014591217041016, -10.755889892578125, -10.49718952178955, -10.23848819732666, -9.979787826538086, -9.721086502075195, -9.462386131286621, -9.20368480682373, -8.944984436035156, -8.686283111572266, -8.427582740783691, -8.1688814163208, -7.910180568695068, -7.651479721069336, -7.392779350280762, -7.134078502655029, -6.875377655029297, -6.6166768074035645, -6.357975959777832, -6.0992751121521, -5.840574264526367, -5.581873893737793, -5.323172569274902, -5.064472198486328, -4.805771350860596, -4.547070503234863, -4.288369655609131, -4.029668807983398, -3.770968198776245, -3.5122673511505127, -3.2535665035247803, -2.994865894317627, -2.7361650466918945, -2.477464199066162, -2.2187633514404297, -1.9600626230239868, -1.701361894607544, -1.4426610469818115, -1.183960199356079, -0.9252594709396362, -0.6665587425231934, -0.4078577756881714, -0.14915698766708374, 0.1095438003540039, 0.36824458837509155, 0.6269453763961792, 0.8856462240219116, 1.1443469524383545, 1.4030476808547974, 1.6617485284805298]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 6.0, 8.0, 13.0, 13.0, 18.0, 21.0, 29.0, 31.0, 35.0, 46.0, 67.0, 44.0, 71.0, 64.0, 66.0, 68.0, 70.0, 61.0, 49.0, 43.0, 48.0, 30.0, 27.0, 21.0, 20.0, 10.0, 9.0, 5.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4242651462554932, -1.3700642585754395, -1.3158632516860962, -1.2616623640060425, -1.2074613571166992, -1.1532604694366455, -1.0990594625473022, -1.0448585748672485, -0.9906575679779053, -0.9364566206932068, -0.8822556734085083, -0.8280547261238098, -0.7738537788391113, -0.7196528911590576, -0.6654518842697144, -0.6112509965896606, -0.5570500493049622, -0.5028491020202637, -0.4486481547355652, -0.3944472074508667, -0.3402462601661682, -0.2860453426837921, -0.23184439539909363, -0.17764344811439514, -0.12344250082969666, -0.06924155354499817, -0.01504061371088028, 0.03916032612323761, 0.0933612734079361, 0.1475622057914734, 0.20176315307617188, 0.25596410036087036, 0.31016504764556885, 0.36436599493026733, 0.4185669422149658, 0.4727678894996643, 0.5269688367843628, 0.5811697244644165, 0.6353707313537598, 0.6895716190338135, 0.7437726259231567, 0.7979735732078552, 0.8521745204925537, 0.9063754677772522, 0.9605764150619507, 1.0147773027420044, 1.0689783096313477, 1.1231791973114014, 1.177380084991455, 1.2315809726715088, 1.285781979560852, 1.3399828672409058, 1.394183874130249, 1.4483847618103027, 1.502585768699646, 1.5567866563796997, 1.610987663269043, 1.6651885509490967, 1.71938955783844, 1.7735904455184937, 1.827791452407837, 1.8819923400878906, 1.9361933469772339, 1.9903942346572876, 2.044595241546631]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 12.0, 13.0, 16.0, 15.0, 19.0, 50.0, 67.0, 114.0, 183.0, 318.0, 866.0, 4378.0, 9313.0, 84022.0, 2442563.0, 1588548.0, 55537.0, 5187.0, 1417.0, 625.0, 333.0, 188.0, 136.0, 71.0, 69.0, 46.0, 25.0, 28.0, 23.0, 16.0, 16.0, 9.0, 12.0, 7.0, 2.0, 3.0, 5.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.7578125, -2.655364990234375, -2.55291748046875, -2.450469970703125, -2.3480224609375, -2.245574951171875, -2.14312744140625, -2.040679931640625, -1.938232421875, -1.835784912109375, -1.73333740234375, -1.630889892578125, -1.5284423828125, -1.425994873046875, -1.32354736328125, -1.221099853515625, -1.11865234375, -1.016204833984375, -0.91375732421875, -0.811309814453125, -0.7088623046875, -0.606414794921875, -0.50396728515625, -0.401519775390625, -0.299072265625, -0.196624755859375, -0.09417724609375, 0.008270263671875, 0.1107177734375, 0.213165283203125, 0.31561279296875, 0.418060302734375, 0.5205078125, 0.622955322265625, 0.72540283203125, 0.827850341796875, 0.9302978515625, 1.032745361328125, 1.13519287109375, 1.237640380859375, 1.340087890625, 1.442535400390625, 1.54498291015625, 1.647430419921875, 1.7498779296875, 1.852325439453125, 1.95477294921875, 2.057220458984375, 2.15966796875, 2.262115478515625, 2.36456298828125, 2.467010498046875, 2.5694580078125, 2.671905517578125, 2.77435302734375, 2.876800537109375, 2.979248046875, 3.081695556640625, 3.18414306640625, 3.286590576171875, 3.3890380859375, 3.491485595703125, 3.59393310546875, 3.696380615234375, 3.798828125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 4.0, 7.0, 11.0, 10.0, 9.0, 22.0, 30.0, 32.0, 42.0, 42.0, 59.0, 61.0, 63.0, 72.0, 60.0, 76.0, 70.0, 64.0, 53.0, 59.0, 37.0, 34.0, 22.0, 20.0, 14.0, 9.0, 8.0, 4.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.4794921875, -1.4236907958984375, -1.367889404296875, -1.3120880126953125, -1.25628662109375, -1.2004852294921875, -1.144683837890625, -1.0888824462890625, -1.0330810546875, -0.9772796630859375, -0.921478271484375, -0.8656768798828125, -0.80987548828125, -0.7540740966796875, -0.698272705078125, -0.6424713134765625, -0.586669921875, -0.5308685302734375, -0.475067138671875, -0.4192657470703125, -0.36346435546875, -0.3076629638671875, -0.251861572265625, -0.1960601806640625, -0.1402587890625, -0.0844573974609375, -0.028656005859375, 0.0271453857421875, 0.08294677734375, 0.1387481689453125, 0.194549560546875, 0.2503509521484375, 0.30615234375, 0.3619537353515625, 0.417755126953125, 0.4735565185546875, 0.52935791015625, 0.5851593017578125, 0.640960693359375, 0.6967620849609375, 0.7525634765625, 0.8083648681640625, 0.864166259765625, 0.9199676513671875, 0.97576904296875, 1.0315704345703125, 1.087371826171875, 1.1431732177734375, 1.198974609375, 1.2547760009765625, 1.310577392578125, 1.3663787841796875, 1.42218017578125, 1.4779815673828125, 1.533782958984375, 1.5895843505859375, 1.6453857421875, 1.7011871337890625, 1.756988525390625, 1.8127899169921875, 1.86859130859375, 1.9243927001953125, 1.980194091796875, 2.0359954833984375, 2.091796875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 8.0, 16.0, 55.0, 358.0, 4193496.0, 285.0, 49.0, 10.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-149.25, -144.3515625, -139.453125, -134.5546875, -129.65625, -124.7578125, -119.859375, -114.9609375, -110.0625, -105.1640625, -100.265625, -95.3671875, -90.46875, -85.5703125, -80.671875, -75.7734375, -70.875, -65.9765625, -61.078125, -56.1796875, -51.28125, -46.3828125, -41.484375, -36.5859375, -31.6875, -26.7890625, -21.890625, -16.9921875, -12.09375, -7.1953125, -2.296875, 2.6015625, 7.5, 12.3984375, 17.296875, 22.1953125, 27.09375, 31.9921875, 36.890625, 41.7890625, 46.6875, 51.5859375, 56.484375, 61.3828125, 66.28125, 71.1796875, 76.078125, 80.9765625, 85.875, 90.7734375, 95.671875, 100.5703125, 105.46875, 110.3671875, 115.265625, 120.1640625, 125.0625, 129.9609375, 134.859375, 139.7578125, 144.65625, 149.5546875, 154.453125, 159.3515625, 164.25]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 7.0, 15.0, 58.0, 319.0, 3326.0, 271.0, 64.0, 10.0, 2.0, 8.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.01171875, -2.912872314453125, -2.81402587890625, -2.715179443359375, -2.6163330078125, -2.517486572265625, -2.41864013671875, -2.319793701171875, -2.220947265625, -2.122100830078125, -2.02325439453125, -1.924407958984375, -1.8255615234375, -1.726715087890625, -1.62786865234375, -1.529022216796875, -1.43017578125, -1.331329345703125, -1.23248291015625, -1.133636474609375, -1.0347900390625, -0.935943603515625, -0.83709716796875, -0.738250732421875, -0.639404296875, -0.540557861328125, -0.44171142578125, -0.342864990234375, -0.2440185546875, -0.145172119140625, -0.04632568359375, 0.052520751953125, 0.1513671875, 0.250213623046875, 0.34906005859375, 0.447906494140625, 0.5467529296875, 0.645599365234375, 0.74444580078125, 0.843292236328125, 0.942138671875, 1.040985107421875, 1.13983154296875, 1.238677978515625, 1.3375244140625, 1.436370849609375, 1.53521728515625, 1.634063720703125, 1.73291015625, 1.831756591796875, 1.93060302734375, 2.029449462890625, 2.1282958984375, 2.227142333984375, 2.32598876953125, 2.424835205078125, 2.523681640625, 2.622528076171875, 2.72137451171875, 2.820220947265625, 2.9190673828125, 3.017913818359375, 3.11676025390625, 3.215606689453125, 3.314453125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 3.0, 5.0, 2.0, 5.0, 6.0, 19.0, 13.0, 21.0, 38.0, 43.0, 50.0, 60.0, 77.0, 75.0, 113.0, 103.0, 81.0, 55.0, 52.0, 50.0, 36.0, 25.0, 16.0, 14.0, 8.0, 4.0, 4.0, 5.0, 2.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.349200963973999, -2.286876916885376, -2.224552869796753, -2.162229061126709, -2.099905014038086, -2.037580966949463, -1.9752569198608398, -1.9129328727722168, -1.8506089448928833, -1.7882848978042603, -1.7259609699249268, -1.6636369228363037, -1.6013128757476807, -1.5389889478683472, -1.4766649007797241, -1.4143409729003906, -1.3520169258117676, -1.2896928787231445, -1.227368950843811, -1.165044903755188, -1.1027209758758545, -1.0403969287872314, -0.9780728816986084, -0.9157488942146301, -0.8534249067306519, -0.7911009192466736, -0.7287769317626953, -0.6664528846740723, -0.604128897190094, -0.5418049097061157, -0.47948089241981506, -0.4171568751335144, -0.3548327684402466, -0.2925087809562683, -0.23018476366996765, -0.16786076128482819, -0.10553675889968872, -0.04321277141571045, 0.01911124587059021, 0.08143526315689087, 0.14375925064086914, 0.2060832530260086, 0.26840725541114807, 0.33073127269744873, 0.393055260181427, 0.4553792476654053, 0.5177032947540283, 0.5800272822380066, 0.6423512697219849, 0.7046752572059631, 0.7669992446899414, 0.8293232917785645, 0.8916472792625427, 0.953971266746521, 1.016295313835144, 1.0786192417144775, 1.1409432888031006, 1.2032673358917236, 1.2655912637710571, 1.3279153108596802, 1.3902392387390137, 1.4525632858276367, 1.5148873329162598, 1.5772113800048828, 1.6395353078842163]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 2.0, 1.0, 4.0, 5.0, 1.0, 5.0, 10.0, 13.0, 14.0, 13.0, 11.0, 16.0, 16.0, 25.0, 18.0, 30.0, 20.0, 36.0, 23.0, 43.0, 44.0, 48.0, 41.0, 34.0, 37.0, 38.0, 39.0, 24.0, 28.0, 32.0, 28.0, 36.0, 31.0, 29.0, 28.0, 29.0, 16.0, 22.0, 17.0, 16.0, 18.0, 12.0, 11.0, 8.0, 10.0, 9.0, 4.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4210435152053833, -1.3709176778793335, -1.3207918405532837, -1.2706660032272339, -1.2205400466918945, -1.1704142093658447, -1.120288372039795, -1.0701625347137451, -1.0200366973876953, -0.9699108600616455, -0.9197850227355957, -0.8696591258049011, -0.8195332884788513, -0.7694074511528015, -0.7192815542221069, -0.6691557168960571, -0.6190298795700073, -0.5689040422439575, -0.5187782049179077, -0.46865230798721313, -0.41852647066116333, -0.3684006333351135, -0.31827476620674133, -0.26814889907836914, -0.21802306175231934, -0.16789720952510834, -0.11777135729789734, -0.06764550507068634, -0.017519652843475342, 0.03260618448257446, 0.08273205161094666, 0.13285791873931885, 0.18298375606536865, 0.23310960829257965, 0.28323546051979065, 0.33336132764816284, 0.38348716497421265, 0.43361300230026245, 0.48373886942863464, 0.5338647365570068, 0.5839905738830566, 0.6341164112091064, 0.6842422485351562, 0.7343681454658508, 0.7844939827919006, 0.8346198201179504, 0.884745717048645, 0.9348715543746948, 0.9849973917007446, 1.0351232290267944, 1.0852490663528442, 1.135374903678894, 1.1855008602142334, 1.2356266975402832, 1.285752534866333, 1.3358783721923828, 1.3860042095184326, 1.4361300468444824, 1.4862558841705322, 1.536381721496582, 1.5865075588226318, 1.6366333961486816, 1.686759352684021, 1.7368851900100708, 1.7870110273361206]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 8.0, 4.0, 13.0, 14.0, 18.0, 21.0, 31.0, 48.0, 61.0, 86.0, 100.0, 135.0, 154.0, 242.0, 308.0, 468.0, 781.0, 1251.0, 2314.0, 4688.0, 10109.0, 24569.0, 67123.0, 208998.0, 425506.0, 195254.0, 63088.0, 23258.0, 9490.0, 4533.0, 2236.0, 1239.0, 750.0, 463.0, 295.0, 221.0, 165.0, 120.0, 79.0, 88.0, 68.0, 42.0, 29.0, 31.0, 15.0, 15.0, 12.0, 9.0, 8.0, 2.0, 0.0, 3.0, 0.0, 3.0], "bins": [-0.4326171875, -0.42006683349609375, -0.4075164794921875, -0.39496612548828125, -0.382415771484375, -0.36986541748046875, -0.3573150634765625, -0.34476470947265625, -0.33221435546875, -0.31966400146484375, -0.3071136474609375, -0.29456329345703125, -0.282012939453125, -0.26946258544921875, -0.2569122314453125, -0.24436187744140625, -0.2318115234375, -0.21926116943359375, -0.2067108154296875, -0.19416046142578125, -0.181610107421875, -0.16905975341796875, -0.1565093994140625, -0.14395904541015625, -0.13140869140625, -0.11885833740234375, -0.1063079833984375, -0.09375762939453125, -0.081207275390625, -0.06865692138671875, -0.0561065673828125, -0.04355621337890625, -0.031005859375, -0.01845550537109375, -0.0059051513671875, 0.00664520263671875, 0.019195556640625, 0.03174591064453125, 0.0442962646484375, 0.05684661865234375, 0.06939697265625, 0.08194732666015625, 0.0944976806640625, 0.10704803466796875, 0.119598388671875, 0.13214874267578125, 0.1446990966796875, 0.15724945068359375, 0.1697998046875, 0.18235015869140625, 0.1949005126953125, 0.20745086669921875, 0.220001220703125, 0.23255157470703125, 0.2451019287109375, 0.25765228271484375, 0.27020263671875, 0.28275299072265625, 0.2953033447265625, 0.30785369873046875, 0.320404052734375, 0.33295440673828125, 0.3455047607421875, 0.35805511474609375, 0.37060546875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 7.0, 7.0, 7.0, 12.0, 13.0, 12.0, 13.0, 20.0, 14.0, 30.0, 29.0, 34.0, 35.0, 39.0, 49.0, 39.0, 55.0, 47.0, 48.0, 42.0, 46.0, 34.0, 37.0, 33.0, 32.0, 33.0, 30.0, 31.0, 36.0, 24.0, 16.0, 14.0, 15.0, 8.0, 12.0, 8.0, 6.0, 7.0, 4.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2587890625, -1.2148284912109375, -1.170867919921875, -1.1269073486328125, -1.08294677734375, -1.0389862060546875, -0.995025634765625, -0.9510650634765625, -0.9071044921875, -0.8631439208984375, -0.819183349609375, -0.7752227783203125, -0.73126220703125, -0.6873016357421875, -0.643341064453125, -0.5993804931640625, -0.555419921875, -0.5114593505859375, -0.467498779296875, -0.4235382080078125, -0.37957763671875, -0.3356170654296875, -0.291656494140625, -0.2476959228515625, -0.2037353515625, -0.1597747802734375, -0.115814208984375, -0.0718536376953125, -0.02789306640625, 0.0160675048828125, 0.060028076171875, 0.1039886474609375, 0.14794921875, 0.1919097900390625, 0.235870361328125, 0.2798309326171875, 0.32379150390625, 0.3677520751953125, 0.411712646484375, 0.4556732177734375, 0.4996337890625, 0.5435943603515625, 0.587554931640625, 0.6315155029296875, 0.67547607421875, 0.7194366455078125, 0.763397216796875, 0.8073577880859375, 0.851318359375, 0.8952789306640625, 0.939239501953125, 0.9832000732421875, 1.02716064453125, 1.0711212158203125, 1.115081787109375, 1.1590423583984375, 1.2030029296875, 1.2469635009765625, 1.290924072265625, 1.3348846435546875, 1.37884521484375, 1.4228057861328125, 1.466766357421875, 1.5107269287109375, 1.5546875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 19.0, 28.0, 45.0, 92.0, 130.0, 246.0, 420.0, 690.0, 1219.0, 2527.0, 4838.0, 9635.0, 18916.0, 38165.0, 77054.0, 149746.0, 241409.0, 229206.0, 136121.0, 68887.0, 34308.0, 16886.0, 8512.0, 4358.0, 2270.0, 1311.0, 694.0, 357.0, 217.0, 97.0, 55.0, 38.0, 23.0, 9.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.155029296875, -0.15032005310058594, -0.14561080932617188, -0.1409015655517578, -0.13619232177734375, -0.1314830780029297, -0.12677383422851562, -0.12206459045410156, -0.1173553466796875, -0.11264610290527344, -0.10793685913085938, -0.10322761535644531, -0.09851837158203125, -0.09380912780761719, -0.08909988403320312, -0.08439064025878906, -0.079681396484375, -0.07497215270996094, -0.07026290893554688, -0.06555366516113281, -0.06084442138671875, -0.05613517761230469, -0.051425933837890625, -0.04671669006347656, -0.0420074462890625, -0.03729820251464844, -0.032588958740234375, -0.027879714965820312, -0.02317047119140625, -0.018461227416992188, -0.013751983642578125, -0.009042739868164062, -0.00433349609375, 0.0003757476806640625, 0.005084991455078125, 0.009794235229492188, 0.01450347900390625, 0.019212722778320312, 0.023921966552734375, 0.028631210327148438, 0.0333404541015625, 0.03804969787597656, 0.042758941650390625, 0.04746818542480469, 0.05217742919921875, 0.05688667297363281, 0.061595916748046875, 0.06630516052246094, 0.071014404296875, 0.07572364807128906, 0.08043289184570312, 0.08514213562011719, 0.08985137939453125, 0.09456062316894531, 0.09926986694335938, 0.10397911071777344, 0.1086883544921875, 0.11339759826660156, 0.11810684204101562, 0.12281608581542969, 0.12752532958984375, 0.1322345733642578, 0.13694381713867188, 0.14165306091308594, 0.1463623046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 4.0, 9.0, 9.0, 9.0, 14.0, 11.0, 20.0, 15.0, 24.0, 22.0, 27.0, 16.0, 27.0, 26.0, 28.0, 37.0, 39.0, 34.0, 37.0, 51.0, 41.0, 48.0, 38.0, 46.0, 40.0, 38.0, 19.0, 45.0, 26.0, 30.0, 29.0, 29.0, 18.0, 21.0, 8.0, 12.0, 13.0, 8.0, 6.0, 5.0, 6.0, 4.0, 5.0, 2.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.142578125, -2.0782470703125, -2.013916015625, -1.9495849609375, -1.88525390625, -1.8209228515625, -1.756591796875, -1.6922607421875, -1.6279296875, -1.5635986328125, -1.499267578125, -1.4349365234375, -1.37060546875, -1.3062744140625, -1.241943359375, -1.1776123046875, -1.11328125, -1.0489501953125, -0.984619140625, -0.9202880859375, -0.85595703125, -0.7916259765625, -0.727294921875, -0.6629638671875, -0.5986328125, -0.5343017578125, -0.469970703125, -0.4056396484375, -0.34130859375, -0.2769775390625, -0.212646484375, -0.1483154296875, -0.083984375, -0.0196533203125, 0.044677734375, 0.1090087890625, 0.17333984375, 0.2376708984375, 0.302001953125, 0.3663330078125, 0.4306640625, 0.4949951171875, 0.559326171875, 0.6236572265625, 0.68798828125, 0.7523193359375, 0.816650390625, 0.8809814453125, 0.9453125, 1.0096435546875, 1.073974609375, 1.1383056640625, 1.20263671875, 1.2669677734375, 1.331298828125, 1.3956298828125, 1.4599609375, 1.5242919921875, 1.588623046875, 1.6529541015625, 1.71728515625, 1.7816162109375, 1.845947265625, 1.9102783203125, 1.974609375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 6.0, 13.0, 16.0, 23.0, 34.0, 48.0, 63.0, 124.0, 185.0, 373.0, 679.0, 1318.0, 2813.0, 6534.0, 16884.0, 54510.0, 213185.0, 467915.0, 201953.0, 53188.0, 16759.0, 6378.0, 2763.0, 1300.0, 647.0, 334.0, 195.0, 93.0, 70.0, 44.0, 28.0, 24.0, 12.0, 10.0, 4.0, 10.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0257110595703125, -0.024965286254882812, -0.024219512939453125, -0.023473739624023438, -0.02272796630859375, -0.021982192993164062, -0.021236419677734375, -0.020490646362304688, -0.019744873046875, -0.018999099731445312, -0.018253326416015625, -0.017507553100585938, -0.01676177978515625, -0.016016006469726562, -0.015270233154296875, -0.014524459838867188, -0.0137786865234375, -0.013032913208007812, -0.012287139892578125, -0.011541366577148438, -0.01079559326171875, -0.010049819946289062, -0.009304046630859375, -0.008558273315429688, -0.0078125, -0.0070667266845703125, -0.006320953369140625, -0.0055751800537109375, -0.00482940673828125, -0.0040836334228515625, -0.003337860107421875, -0.0025920867919921875, -0.0018463134765625, -0.0011005401611328125, -0.000354766845703125, 0.0003910064697265625, 0.00113677978515625, 0.0018825531005859375, 0.002628326416015625, 0.0033740997314453125, 0.004119873046875, 0.0048656463623046875, 0.005611419677734375, 0.0063571929931640625, 0.00710296630859375, 0.007848739624023438, 0.008594512939453125, 0.009340286254882812, 0.0100860595703125, 0.010831832885742188, 0.011577606201171875, 0.012323379516601562, 0.01306915283203125, 0.013814926147460938, 0.014560699462890625, 0.015306472778320312, 0.01605224609375, 0.016798019409179688, 0.017543792724609375, 0.018289566040039062, 0.01903533935546875, 0.019781112670898438, 0.020526885986328125, 0.021272659301757812, 0.0220184326171875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 6.0, 5.0, 10.0, 13.0, 23.0, 30.0, 31.0, 51.0, 54.0, 88.0, 98.0, 130.0, 117.0, 96.0, 64.0, 57.0, 34.0, 32.0, 18.0, 17.0, 4.0, 4.0, 5.0, 3.0, 4.0, 2.0, 6.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.184246063232422e-05, -4.0271319448947906e-05, -3.8700178265571594e-05, -3.712903708219528e-05, -3.555789589881897e-05, -3.398675471544266e-05, -3.2415613532066345e-05, -3.084447234869003e-05, -2.927333116531372e-05, -2.770218998193741e-05, -2.6131048798561096e-05, -2.4559907615184784e-05, -2.298876643180847e-05, -2.141762524843216e-05, -1.9846484065055847e-05, -1.8275342881679535e-05, -1.6704201698303223e-05, -1.513306051492691e-05, -1.3561919331550598e-05, -1.1990778148174286e-05, -1.0419636964797974e-05, -8.848495781421661e-06, -7.277354598045349e-06, -5.706213414669037e-06, -4.135072231292725e-06, -2.5639310479164124e-06, -9.927898645401e-07, 5.783513188362122e-07, 2.1494925022125244e-06, 3.7206336855888367e-06, 5.291774868965149e-06, 6.862916052341461e-06, 8.434057235717773e-06, 1.0005198419094086e-05, 1.1576339602470398e-05, 1.314748078584671e-05, 1.4718621969223022e-05, 1.6289763152599335e-05, 1.7860904335975647e-05, 1.943204551935196e-05, 2.100318670272827e-05, 2.2574327886104584e-05, 2.4145469069480896e-05, 2.5716610252857208e-05, 2.728775143623352e-05, 2.8858892619609833e-05, 3.0430033802986145e-05, 3.200117498636246e-05, 3.357231616973877e-05, 3.514345735311508e-05, 3.6714598536491394e-05, 3.8285739719867706e-05, 3.985688090324402e-05, 4.142802208662033e-05, 4.299916326999664e-05, 4.4570304453372955e-05, 4.614144563674927e-05, 4.771258682012558e-05, 4.928372800350189e-05, 5.0854869186878204e-05, 5.2426010370254517e-05, 5.399715155363083e-05, 5.556829273700714e-05, 5.713943392038345e-05, 5.8710575103759766e-05]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 3.0, 6.0, 6.0, 14.0, 17.0, 22.0, 34.0, 65.0, 103.0, 227.0, 1908.0, 1014257.0, 30997.0, 476.0, 149.0, 85.0, 51.0, 43.0, 27.0, 19.0, 12.0, 5.0, 3.0, 5.0, 6.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1923828125, -0.18519210815429688, -0.17800140380859375, -0.17081069946289062, -0.1636199951171875, -0.15642929077148438, -0.14923858642578125, -0.14204788208007812, -0.134857177734375, -0.12766647338867188, -0.12047576904296875, -0.11328506469726562, -0.1060943603515625, -0.09890365600585938, -0.09171295166015625, -0.08452224731445312, -0.07733154296875, -0.07014083862304688, -0.06295013427734375, -0.055759429931640625, -0.0485687255859375, -0.041378021240234375, -0.03418731689453125, -0.026996612548828125, -0.019805908203125, -0.012615203857421875, -0.00542449951171875, 0.001766204833984375, 0.0089569091796875, 0.016147613525390625, 0.02333831787109375, 0.030529022216796875, 0.0377197265625, 0.044910430908203125, 0.05210113525390625, 0.059291839599609375, 0.0664825439453125, 0.07367324829101562, 0.08086395263671875, 0.08805465698242188, 0.095245361328125, 0.10243606567382812, 0.10962677001953125, 0.11681747436523438, 0.1240081787109375, 0.13119888305664062, 0.13838958740234375, 0.14558029174804688, 0.15277099609375, 0.15996170043945312, 0.16715240478515625, 0.17434310913085938, 0.1815338134765625, 0.18872451782226562, 0.19591522216796875, 0.20310592651367188, 0.210296630859375, 0.21748733520507812, 0.22467803955078125, 0.23186874389648438, 0.2390594482421875, 0.24625015258789062, 0.25344085693359375, 0.2606315612792969, 0.267822265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 5.0, 4.0, 10.0, 17.0, 17.0, 27.0, 37.0, 54.0, 82.0, 89.0, 112.0, 129.0, 94.0, 69.0, 56.0, 54.0, 32.0, 35.0, 17.0, 18.0, 5.0, 7.0, 6.0, 6.0, 6.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0118255615234375, -0.011375904083251953, -0.010926246643066406, -0.01047658920288086, -0.010026931762695312, -0.009577274322509766, -0.009127616882324219, -0.008677959442138672, -0.008228302001953125, -0.007778644561767578, -0.007328987121582031, -0.006879329681396484, -0.0064296722412109375, -0.005980014801025391, -0.005530357360839844, -0.005080699920654297, -0.00463104248046875, -0.004181385040283203, -0.0037317276000976562, -0.0032820701599121094, -0.0028324127197265625, -0.0023827552795410156, -0.0019330978393554688, -0.0014834403991699219, -0.001033782958984375, -0.0005841255187988281, -0.00013446807861328125, 0.0003151893615722656, 0.0007648468017578125, 0.0012145042419433594, 0.0016641616821289062, 0.002113819122314453, 0.0025634765625, 0.003013134002685547, 0.0034627914428710938, 0.003912448883056641, 0.0043621063232421875, 0.004811763763427734, 0.005261421203613281, 0.005711078643798828, 0.006160736083984375, 0.006610393524169922, 0.007060050964355469, 0.007509708404541016, 0.007959365844726562, 0.00840902328491211, 0.008858680725097656, 0.009308338165283203, 0.00975799560546875, 0.010207653045654297, 0.010657310485839844, 0.01110696792602539, 0.011556625366210938, 0.012006282806396484, 0.012455940246582031, 0.012905597686767578, 0.013355255126953125, 0.013804912567138672, 0.014254570007324219, 0.014704227447509766, 0.015153884887695312, 0.01560354232788086, 0.016053199768066406, 0.016502857208251953, 0.0169525146484375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 10.0, 10.0, 20.0, 27.0, 64.0, 79.0, 107.0, 164.0, 172.0, 125.0, 77.0, 55.0, 38.0, 21.0, 15.0, 8.0, 6.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.978070616722107, -1.8959063291549683, -1.81374192237854, -1.7315776348114014, -1.6494132280349731, -1.5672489404678345, -1.4850845336914062, -1.4029202461242676, -1.320755958557129, -1.2385916709899902, -1.156427264213562, -1.0742629766464233, -0.9920985698699951, -0.9099342823028564, -0.827769935131073, -0.7456055879592896, -0.6634411811828613, -0.5812768340110779, -0.49911248683929443, -0.4169481694698334, -0.3347838222980499, -0.2526194751262665, -0.17045515775680542, -0.08829081058502197, -0.006126463413238525, 0.07603787630796432, 0.15820221602916718, 0.24036654829978943, 0.3225308954715729, 0.4046952426433563, 0.4868595600128174, 0.5690239071846008, 0.6511881351470947, 0.7333524823188782, 0.8155168294906616, 0.8976811170578003, 0.9798455238342285, 1.0620098114013672, 1.1441740989685059, 1.226338505744934, 1.3085029125213623, 1.390667200088501, 1.4728316068649292, 1.5549958944320679, 1.637160301208496, 1.7193245887756348, 1.8014888763427734, 1.8836532831192017, 1.9658175706863403, 2.0479819774627686, 2.1301462650299072, 2.212310552597046, 2.2944748401641846, 2.3766393661499023, 2.458803653717041, 2.5409679412841797, 2.6231322288513184, 2.705296516418457, 2.7874608039855957, 2.8696253299713135, 2.951789617538452, 3.033953905105591, 3.1161181926727295, 3.1982827186584473, 3.280447006225586]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 4.0, 9.0, 19.0, 17.0, 19.0, 28.0, 24.0, 32.0, 33.0, 57.0, 43.0, 66.0, 66.0, 59.0, 58.0, 50.0, 48.0, 46.0, 46.0, 47.0, 43.0, 37.0, 28.0, 23.0, 24.0, 16.0, 15.0, 9.0, 6.0, 15.0, 5.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0632197856903076, -2.0095162391662598, -1.9558128118515015, -1.9021093845367432, -1.8484058380126953, -1.794702410697937, -1.7409989833831787, -1.6872954368591309, -1.633591890335083, -1.5798884630203247, -1.5261849164962769, -1.4724814891815186, -1.4187779426574707, -1.3650745153427124, -1.311371088027954, -1.2576675415039062, -1.203964114189148, -1.1502606868743896, -1.0965571403503418, -1.0428537130355835, -0.9891501665115356, -0.9354467391967773, -0.8817432522773743, -0.8280397653579712, -0.7743362784385681, -0.720632791519165, -0.666929304599762, -0.6132258176803589, -0.5595223903656006, -0.5058188438415527, -0.45211541652679443, -0.39841192960739136, -0.34470832347869873, -0.29100483655929565, -0.23730136454105377, -0.1835978925228119, -0.1298944056034088, -0.07619091868400574, -0.02248746156692505, 0.031216025352478027, 0.0849195122718811, 0.13862299919128418, 0.19232647120952606, 0.24602994322776794, 0.299733430147171, 0.3534369170665741, 0.4071403741836548, 0.46084386110305786, 0.5145473480224609, 0.568250834941864, 0.6219543218612671, 0.6756577491760254, 0.7293612957000732, 0.7830647230148315, 0.8367682099342346, 0.8904716968536377, 0.9441751837730408, 0.9978786706924438, 1.0515820980072021, 1.10528564453125, 1.1589890718460083, 1.2126926183700562, 1.2663960456848145, 1.3200995922088623, 1.3738030195236206]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 6.0, 11.0, 18.0, 24.0, 30.0, 35.0, 64.0, 95.0, 119.0, 213.0, 265.0, 442.0, 642.0, 949.0, 1509.0, 2261.0, 3634.0, 5761.0, 9616.0, 16035.0, 28324.0, 54287.0, 124303.0, 389690.0, 234703.0, 81185.0, 39518.0, 21467.0, 12450.0, 7555.0, 4660.0, 3006.0, 1871.0, 1213.0, 870.0, 586.0, 335.0, 250.0, 174.0, 100.0, 79.0, 66.0, 36.0, 25.0, 24.0, 17.0, 7.0, 16.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.26953125, -1.228271484375, -1.18701171875, -1.145751953125, -1.1044921875, -1.063232421875, -1.02197265625, -0.980712890625, -0.939453125, -0.898193359375, -0.85693359375, -0.815673828125, -0.7744140625, -0.733154296875, -0.69189453125, -0.650634765625, -0.609375, -0.568115234375, -0.52685546875, -0.485595703125, -0.4443359375, -0.403076171875, -0.36181640625, -0.320556640625, -0.279296875, -0.238037109375, -0.19677734375, -0.155517578125, -0.1142578125, -0.072998046875, -0.03173828125, 0.009521484375, 0.05078125, 0.092041015625, 0.13330078125, 0.174560546875, 0.2158203125, 0.257080078125, 0.29833984375, 0.339599609375, 0.380859375, 0.422119140625, 0.46337890625, 0.504638671875, 0.5458984375, 0.587158203125, 0.62841796875, 0.669677734375, 0.7109375, 0.752197265625, 0.79345703125, 0.834716796875, 0.8759765625, 0.917236328125, 0.95849609375, 0.999755859375, 1.041015625, 1.082275390625, 1.12353515625, 1.164794921875, 1.2060546875, 1.247314453125, 1.28857421875, 1.329833984375, 1.37109375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 5.0, 7.0, 5.0, 9.0, 9.0, 6.0, 16.0, 14.0, 20.0, 22.0, 20.0, 27.0, 16.0, 27.0, 22.0, 35.0, 27.0, 30.0, 31.0, 31.0, 46.0, 41.0, 37.0, 30.0, 43.0, 37.0, 39.0, 34.0, 37.0, 33.0, 28.0, 34.0, 30.0, 27.0, 24.0, 9.0, 16.0, 8.0, 12.0, 15.0, 11.0, 7.0, 3.0, 3.0, 3.0, 4.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0], "bins": [-15.4765625, -15.026123046875, -14.57568359375, -14.125244140625, -13.6748046875, -13.224365234375, -12.77392578125, -12.323486328125, -11.873046875, -11.422607421875, -10.97216796875, -10.521728515625, -10.0712890625, -9.620849609375, -9.17041015625, -8.719970703125, -8.26953125, -7.819091796875, -7.36865234375, -6.918212890625, -6.4677734375, -6.017333984375, -5.56689453125, -5.116455078125, -4.666015625, -4.215576171875, -3.76513671875, -3.314697265625, -2.8642578125, -2.413818359375, -1.96337890625, -1.512939453125, -1.0625, -0.612060546875, -0.16162109375, 0.288818359375, 0.7392578125, 1.189697265625, 1.64013671875, 2.090576171875, 2.541015625, 2.991455078125, 3.44189453125, 3.892333984375, 4.3427734375, 4.793212890625, 5.24365234375, 5.694091796875, 6.14453125, 6.594970703125, 7.04541015625, 7.495849609375, 7.9462890625, 8.396728515625, 8.84716796875, 9.297607421875, 9.748046875, 10.198486328125, 10.64892578125, 11.099365234375, 11.5498046875, 12.000244140625, 12.45068359375, 12.901123046875, 13.3515625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 5.0, 5.0, 6.0, 3.0, 5.0, 3.0, 2.0, 5.0, 14.0, 18.0, 20.0, 21.0, 25.0, 31.0, 50.0, 69.0, 76.0, 118.0, 152.0, 308.0, 530.0, 2843.0, 269060.0, 769758.0, 3948.0, 623.0, 268.0, 156.0, 113.0, 74.0, 62.0, 33.0, 29.0, 30.0, 25.0, 14.0, 11.0, 13.0, 12.0, 6.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-12.46875, -12.123046875, -11.77734375, -11.431640625, -11.0859375, -10.740234375, -10.39453125, -10.048828125, -9.703125, -9.357421875, -9.01171875, -8.666015625, -8.3203125, -7.974609375, -7.62890625, -7.283203125, -6.9375, -6.591796875, -6.24609375, -5.900390625, -5.5546875, -5.208984375, -4.86328125, -4.517578125, -4.171875, -3.826171875, -3.48046875, -3.134765625, -2.7890625, -2.443359375, -2.09765625, -1.751953125, -1.40625, -1.060546875, -0.71484375, -0.369140625, -0.0234375, 0.322265625, 0.66796875, 1.013671875, 1.359375, 1.705078125, 2.05078125, 2.396484375, 2.7421875, 3.087890625, 3.43359375, 3.779296875, 4.125, 4.470703125, 4.81640625, 5.162109375, 5.5078125, 5.853515625, 6.19921875, 6.544921875, 6.890625, 7.236328125, 7.58203125, 7.927734375, 8.2734375, 8.619140625, 8.96484375, 9.310546875, 9.65625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 1.0, 3.0, 5.0, 1.0, 4.0, 6.0, 11.0, 17.0, 18.0, 13.0, 29.0, 22.0, 23.0, 35.0, 36.0, 38.0, 43.0, 42.0, 49.0, 46.0, 40.0, 57.0, 43.0, 50.0, 50.0, 43.0, 42.0, 33.0, 27.0, 25.0, 28.0, 19.0, 21.0, 13.0, 12.0, 8.0, 8.0, 6.0, 3.0, 8.0, 7.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 4.0], "bins": [-18.1875, -17.6856689453125, -17.183837890625, -16.6820068359375, -16.18017578125, -15.6783447265625, -15.176513671875, -14.6746826171875, -14.1728515625, -13.6710205078125, -13.169189453125, -12.6673583984375, -12.16552734375, -11.6636962890625, -11.161865234375, -10.6600341796875, -10.158203125, -9.6563720703125, -9.154541015625, -8.6527099609375, -8.15087890625, -7.6490478515625, -7.147216796875, -6.6453857421875, -6.1435546875, -5.6417236328125, -5.139892578125, -4.6380615234375, -4.13623046875, -3.6343994140625, -3.132568359375, -2.6307373046875, -2.12890625, -1.6270751953125, -1.125244140625, -0.6234130859375, -0.12158203125, 0.3802490234375, 0.882080078125, 1.3839111328125, 1.8857421875, 2.3875732421875, 2.889404296875, 3.3912353515625, 3.89306640625, 4.3948974609375, 4.896728515625, 5.3985595703125, 5.900390625, 6.4022216796875, 6.904052734375, 7.4058837890625, 7.90771484375, 8.4095458984375, 8.911376953125, 9.4132080078125, 9.9150390625, 10.4168701171875, 10.918701171875, 11.4205322265625, 11.92236328125, 12.4241943359375, 12.926025390625, 13.4278564453125, 13.9296875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 12.0, 15.0, 14.0, 20.0, 40.0, 96.0, 221.0, 1866.0, 935632.0, 109086.0, 1184.0, 197.0, 72.0, 32.0, 19.0, 12.0, 9.0, 12.0, 8.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7080078125, -0.6918869018554688, -0.6757659912109375, -0.6596450805664062, -0.643524169921875, -0.6274032592773438, -0.6112823486328125, -0.5951614379882812, -0.57904052734375, -0.5629196166992188, -0.5467987060546875, -0.5306777954101562, -0.514556884765625, -0.49843597412109375, -0.4823150634765625, -0.46619415283203125, -0.4500732421875, -0.43395233154296875, -0.4178314208984375, -0.40171051025390625, -0.385589599609375, -0.36946868896484375, -0.3533477783203125, -0.33722686767578125, -0.32110595703125, -0.30498504638671875, -0.2888641357421875, -0.27274322509765625, -0.256622314453125, -0.24050140380859375, -0.2243804931640625, -0.20825958251953125, -0.192138671875, -0.17601776123046875, -0.1598968505859375, -0.14377593994140625, -0.127655029296875, -0.11153411865234375, -0.0954132080078125, -0.07929229736328125, -0.06317138671875, -0.04705047607421875, -0.0309295654296875, -0.01480865478515625, 0.001312255859375, 0.01743316650390625, 0.0335540771484375, 0.04967498779296875, 0.0657958984375, 0.08191680908203125, 0.0980377197265625, 0.11415863037109375, 0.130279541015625, 0.14640045166015625, 0.1625213623046875, 0.17864227294921875, 0.19476318359375, 0.21088409423828125, 0.2270050048828125, 0.24312591552734375, 0.259246826171875, 0.27536773681640625, 0.2914886474609375, 0.30760955810546875, 0.32373046875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 1.0, 6.0, 3.0, 4.0, 6.0, 6.0, 8.0, 15.0, 19.0, 27.0, 42.0, 58.0, 127.0, 198.0, 197.0, 105.0, 53.0, 29.0, 19.0, 17.0, 11.0, 9.0, 8.0, 4.0, 5.0, 2.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-3.695487976074219e-05, -3.5954639315605164e-05, -3.495439887046814e-05, -3.3954158425331116e-05, -3.295391798019409e-05, -3.195367753505707e-05, -3.0953437089920044e-05, -2.995319664478302e-05, -2.8952956199645996e-05, -2.7952715754508972e-05, -2.6952475309371948e-05, -2.5952234864234924e-05, -2.49519944190979e-05, -2.3951753973960876e-05, -2.2951513528823853e-05, -2.195127308368683e-05, -2.0951032638549805e-05, -1.995079219341278e-05, -1.8950551748275757e-05, -1.7950311303138733e-05, -1.695007085800171e-05, -1.5949830412864685e-05, -1.4949589967727661e-05, -1.3949349522590637e-05, -1.2949109077453613e-05, -1.194886863231659e-05, -1.0948628187179565e-05, -9.948387742042542e-06, -8.948147296905518e-06, -7.947906851768494e-06, -6.94766640663147e-06, -5.947425961494446e-06, -4.947185516357422e-06, -3.946945071220398e-06, -2.946704626083374e-06, -1.94646418094635e-06, -9.462237358093262e-07, 5.4016709327697754e-08, 1.0542571544647217e-06, 2.0544975996017456e-06, 3.0547380447387695e-06, 4.0549784898757935e-06, 5.055218935012817e-06, 6.055459380149841e-06, 7.055699825286865e-06, 8.05594027042389e-06, 9.056180715560913e-06, 1.0056421160697937e-05, 1.1056661605834961e-05, 1.2056902050971985e-05, 1.3057142496109009e-05, 1.4057382941246033e-05, 1.5057623386383057e-05, 1.605786383152008e-05, 1.7058104276657104e-05, 1.805834472179413e-05, 1.9058585166931152e-05, 2.0058825612068176e-05, 2.10590660572052e-05, 2.2059306502342224e-05, 2.3059546947479248e-05, 2.4059787392616272e-05, 2.5060027837753296e-05, 2.606026828289032e-05, 2.7060508728027344e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 9.0, 10.0, 7.0, 15.0, 17.0, 22.0, 39.0, 58.0, 139.0, 460.0, 2561.0, 42840.0, 986861.0, 13563.0, 1362.0, 298.0, 109.0, 58.0, 36.0, 16.0, 13.0, 13.0, 14.0, 12.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.221923828125, -0.21349716186523438, -0.20507049560546875, -0.19664382934570312, -0.1882171630859375, -0.17979049682617188, -0.17136383056640625, -0.16293716430664062, -0.154510498046875, -0.14608383178710938, -0.13765716552734375, -0.12923049926757812, -0.1208038330078125, -0.11237716674804688, -0.10395050048828125, -0.09552383422851562, -0.08709716796875, -0.07867050170898438, -0.07024383544921875, -0.061817169189453125, -0.0533905029296875, -0.044963836669921875, -0.03653717041015625, -0.028110504150390625, -0.019683837890625, -0.011257171630859375, -0.00283050537109375, 0.005596160888671875, 0.0140228271484375, 0.022449493408203125, 0.03087615966796875, 0.039302825927734375, 0.0477294921875, 0.056156158447265625, 0.06458282470703125, 0.07300949096679688, 0.0814361572265625, 0.08986282348632812, 0.09828948974609375, 0.10671615600585938, 0.115142822265625, 0.12356948852539062, 0.13199615478515625, 0.14042282104492188, 0.1488494873046875, 0.15727615356445312, 0.16570281982421875, 0.17412948608398438, 0.18255615234375, 0.19098281860351562, 0.19940948486328125, 0.20783615112304688, 0.2162628173828125, 0.22468948364257812, 0.23311614990234375, 0.24154281616210938, 0.249969482421875, 0.2583961486816406, 0.26682281494140625, 0.2752494812011719, 0.2836761474609375, 0.2921028137207031, 0.30052947998046875, 0.3089561462402344, 0.3173828125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 5.0, 9.0, 7.0, 7.0, 9.0, 15.0, 17.0, 24.0, 47.0, 71.0, 138.0, 217.0, 167.0, 71.0, 60.0, 38.0, 24.0, 14.0, 14.0, 8.0, 11.0, 9.0, 8.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0341796875, -0.03294181823730469, -0.031703948974609375, -0.030466079711914062, -0.02922821044921875, -0.027990341186523438, -0.026752471923828125, -0.025514602661132812, -0.0242767333984375, -0.023038864135742188, -0.021800994873046875, -0.020563125610351562, -0.01932525634765625, -0.018087387084960938, -0.016849517822265625, -0.015611648559570312, -0.014373779296875, -0.013135910034179688, -0.011898040771484375, -0.010660171508789062, -0.00942230224609375, -0.008184432983398438, -0.006946563720703125, -0.0057086944580078125, -0.0044708251953125, -0.0032329559326171875, -0.001995086669921875, -0.0007572174072265625, 0.00048065185546875, 0.0017185211181640625, 0.002956390380859375, 0.0041942596435546875, 0.00543212890625, 0.0066699981689453125, 0.007907867431640625, 0.009145736694335938, 0.01038360595703125, 0.011621475219726562, 0.012859344482421875, 0.014097213745117188, 0.0153350830078125, 0.016572952270507812, 0.017810821533203125, 0.019048690795898438, 0.02028656005859375, 0.021524429321289062, 0.022762298583984375, 0.024000167846679688, 0.025238037109375, 0.026475906372070312, 0.027713775634765625, 0.028951644897460938, 0.03018951416015625, 0.03142738342285156, 0.032665252685546875, 0.03390312194824219, 0.0351409912109375, 0.03637886047363281, 0.037616729736328125, 0.03885459899902344, 0.04009246826171875, 0.04133033752441406, 0.042568206787109375, 0.04380607604980469, 0.0450439453125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 16.0, 21.0, 73.0, 145.0, 279.0, 255.0, 134.0, 56.0, 24.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.879417419433594, -11.655167579650879, -11.430917739868164, -11.20666790008545, -10.982418060302734, -10.75816822052002, -10.533918380737305, -10.309669494628906, -10.085418701171875, -9.86116886138916, -9.636919021606445, -9.41266918182373, -9.188419342041016, -8.9641695022583, -8.739919662475586, -8.515670776367188, -8.291420936584473, -8.067171096801758, -7.842921257019043, -7.618671417236328, -7.394421577453613, -7.170171737670898, -6.945922374725342, -6.721672534942627, -6.497422695159912, -6.273172855377197, -6.048923015594482, -5.824673175811768, -5.600423812866211, -5.376173973083496, -5.151924133300781, -4.927674293518066, -4.70342493057251, -4.479175090789795, -4.25492525100708, -4.030675411224365, -3.8064258098602295, -3.5821759700775146, -3.357926368713379, -3.133676528930664, -2.909426689147949, -2.6851768493652344, -2.4609270095825195, -2.236677408218384, -2.012427568435669, -1.788177728652954, -1.5639280080795288, -1.3396782875061035, -1.1154284477233887, -0.8911786675453186, -0.6669288873672485, -0.44267910718917847, -0.2184293270111084, 0.005820512771606445, 0.23007023334503174, 0.45431995391845703, 0.6785697937011719, 0.9028195738792419, 1.127069354057312, 1.3513190746307373, 1.5755689144134521, 1.799818754196167, 2.0240683555603027, 2.2483181953430176, 2.4725680351257324]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 8.0, 5.0, 15.0, 12.0, 10.0, 16.0, 17.0, 18.0, 29.0, 22.0, 26.0, 28.0, 39.0, 37.0, 40.0, 51.0, 41.0, 43.0, 44.0, 38.0, 48.0, 47.0, 35.0, 37.0, 42.0, 38.0, 32.0, 24.0, 26.0, 35.0, 22.0, 15.0, 9.0, 11.0, 6.0, 9.0, 7.0, 5.0, 2.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-18.74412727355957, -18.15521240234375, -17.56629753112793, -16.977380752563477, -16.388465881347656, -15.799551010131836, -15.210636138916016, -14.621720314025879, -14.032804489135742, -13.443889617919922, -12.854973793029785, -12.266058921813965, -11.677143096923828, -11.088228225708008, -10.499313354492188, -9.91039752960205, -9.32148265838623, -8.73256778717041, -8.143651962280273, -7.554737091064453, -6.965821266174316, -6.376906394958496, -5.787991046905518, -5.199075698852539, -4.6101603507995605, -4.021245002746582, -3.4323296546936035, -2.843414545059204, -2.2544991970062256, -1.665583848953247, -1.0766687393188477, -0.48775339126586914, 0.10116195678710938, 0.6900772452354431, 1.2789925336837769, 1.8679077625274658, 2.4568231105804443, 3.045738458633423, 3.6346535682678223, 4.223568916320801, 4.812484264373779, 5.401399612426758, 5.990314960479736, 6.579230308532715, 7.168145179748535, 7.757061004638672, 8.345975875854492, 8.934890747070312, 9.52380657196045, 10.11272144317627, 10.701637268066406, 11.290552139282227, 11.879467964172363, 12.468382835388184, 13.05729866027832, 13.64621353149414, 14.235128402709961, 14.824043273925781, 15.412959098815918, 16.001874923706055, 16.590789794921875, 17.179704666137695, 17.768619537353516, 18.35753631591797, 18.94645118713379]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 4.0, 10.0, 7.0, 11.0, 9.0, 10.0, 12.0, 11.0, 23.0, 29.0, 31.0, 43.0, 57.0, 77.0, 136.0, 197.0, 465.0, 6323.0, 4159070.0, 26352.0, 612.0, 292.0, 121.0, 75.0, 72.0, 40.0, 23.0, 26.0, 28.0, 18.0, 26.0, 18.0, 8.0, 6.0, 8.0, 5.0, 1.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.125, -9.8045654296875, -9.484130859375, -9.1636962890625, -8.84326171875, -8.5228271484375, -8.202392578125, -7.8819580078125, -7.5615234375, -7.2410888671875, -6.920654296875, -6.6002197265625, -6.27978515625, -5.9593505859375, -5.638916015625, -5.3184814453125, -4.998046875, -4.6776123046875, -4.357177734375, -4.0367431640625, -3.71630859375, -3.3958740234375, -3.075439453125, -2.7550048828125, -2.4345703125, -2.1141357421875, -1.793701171875, -1.4732666015625, -1.15283203125, -0.8323974609375, -0.511962890625, -0.1915283203125, 0.12890625, 0.4493408203125, 0.769775390625, 1.0902099609375, 1.41064453125, 1.7310791015625, 2.051513671875, 2.3719482421875, 2.6923828125, 3.0128173828125, 3.333251953125, 3.6536865234375, 3.97412109375, 4.2945556640625, 4.614990234375, 4.9354248046875, 5.255859375, 5.5762939453125, 5.896728515625, 6.2171630859375, 6.53759765625, 6.8580322265625, 7.178466796875, 7.4989013671875, 7.8193359375, 8.1397705078125, 8.460205078125, 8.7806396484375, 9.10107421875, 9.4215087890625, 9.741943359375, 10.0623779296875, 10.3828125]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 2.0, 5.0, 12.0, 17.0, 16.0, 24.0, 26.0, 34.0, 27.0, 38.0, 53.0, 63.0, 66.0, 78.0, 75.0, 66.0, 72.0, 50.0, 54.0, 54.0, 28.0, 38.0, 21.0, 29.0, 12.0, 13.0, 15.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.75390625, -2.6903076171875, -2.626708984375, -2.5631103515625, -2.49951171875, -2.4359130859375, -2.372314453125, -2.3087158203125, -2.2451171875, -2.1815185546875, -2.117919921875, -2.0543212890625, -1.99072265625, -1.9271240234375, -1.863525390625, -1.7999267578125, -1.736328125, -1.6727294921875, -1.609130859375, -1.5455322265625, -1.48193359375, -1.4183349609375, -1.354736328125, -1.2911376953125, -1.2275390625, -1.1639404296875, -1.100341796875, -1.0367431640625, -0.97314453125, -0.9095458984375, -0.845947265625, -0.7823486328125, -0.71875, -0.6551513671875, -0.591552734375, -0.5279541015625, -0.46435546875, -0.4007568359375, -0.337158203125, -0.2735595703125, -0.2099609375, -0.1463623046875, -0.082763671875, -0.0191650390625, 0.04443359375, 0.1080322265625, 0.171630859375, 0.2352294921875, 0.298828125, 0.3624267578125, 0.426025390625, 0.4896240234375, 0.55322265625, 0.6168212890625, 0.680419921875, 0.7440185546875, 0.8076171875, 0.8712158203125, 0.934814453125, 0.9984130859375, 1.06201171875, 1.1256103515625, 1.189208984375, 1.2528076171875, 1.31640625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 6.0, 21.0, 4194065.0, 185.0, 8.0, 6.0, 5.0], "bins": [-1152.0, -1132.744140625, -1113.48828125, -1094.232421875, -1074.9765625, -1055.720703125, -1036.46484375, -1017.208984375, -997.953125, -978.697265625, -959.44140625, -940.185546875, -920.9296875, -901.673828125, -882.41796875, -863.162109375, -843.90625, -824.650390625, -805.39453125, -786.138671875, -766.8828125, -747.626953125, -728.37109375, -709.115234375, -689.859375, -670.603515625, -651.34765625, -632.091796875, -612.8359375, -593.580078125, -574.32421875, -555.068359375, -535.8125, -516.556640625, -497.30078125, -478.044921875, -458.7890625, -439.533203125, -420.27734375, -401.021484375, -381.765625, -362.509765625, -343.25390625, -323.998046875, -304.7421875, -285.486328125, -266.23046875, -246.974609375, -227.71875, -208.462890625, -189.20703125, -169.951171875, -150.6953125, -131.439453125, -112.18359375, -92.927734375, -73.671875, -54.416015625, -35.16015625, -15.904296875, 3.3515625, 22.607421875, 41.86328125, 61.119140625, 80.375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 4.0, 27.0, 427.0, 3424.0, 173.0, 19.0, 7.0, 2.0, 0.0, 1.0], "bins": [-6.66015625, -6.544013977050781, -6.4278717041015625, -6.311729431152344, -6.195587158203125, -6.079444885253906, -5.9633026123046875, -5.847160339355469, -5.73101806640625, -5.614875793457031, -5.4987335205078125, -5.382591247558594, -5.266448974609375, -5.150306701660156, -5.0341644287109375, -4.918022155761719, -4.8018798828125, -4.685737609863281, -4.5695953369140625, -4.453453063964844, -4.337310791015625, -4.221168518066406, -4.1050262451171875, -3.9888839721679688, -3.87274169921875, -3.7565994262695312, -3.6404571533203125, -3.5243148803710938, -3.408172607421875, -3.2920303344726562, -3.1758880615234375, -3.0597457885742188, -2.943603515625, -2.8274612426757812, -2.7113189697265625, -2.5951766967773438, -2.479034423828125, -2.3628921508789062, -2.2467498779296875, -2.1306076049804688, -2.01446533203125, -1.8983230590820312, -1.7821807861328125, -1.6660385131835938, -1.549896240234375, -1.4337539672851562, -1.3176116943359375, -1.2014694213867188, -1.0853271484375, -0.9691848754882812, -0.8530426025390625, -0.7369003295898438, -0.620758056640625, -0.5046157836914062, -0.3884735107421875, -0.27233123779296875, -0.15618896484375, -0.04004669189453125, 0.0760955810546875, 0.19223785400390625, 0.308380126953125, 0.42452239990234375, 0.5406646728515625, 0.6568069458007812, 0.77294921875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 6.0, 25.0, 26.0, 46.0, 79.0, 114.0, 126.0, 132.0, 137.0, 115.0, 63.0, 42.0, 33.0, 20.0, 7.0, 6.0, 4.0, 6.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2193613052368164, -2.1383421421051025, -2.0573229789733887, -1.9763039350509644, -1.89528489112854, -1.8142657279968262, -1.7332465648651123, -1.6522274017333984, -1.5712083578109741, -1.4901891946792603, -1.409170150756836, -1.328150987625122, -1.2471318244934082, -1.1661127805709839, -1.08509361743927, -1.0040745735168457, -0.9230554103851318, -0.8420363068580627, -0.7610172033309937, -0.6799980401992798, -0.5989789366722107, -0.5179598331451416, -0.4369406998157501, -0.35592156648635864, -0.27490246295928955, -0.19388334453105927, -0.11286422610282898, -0.031845107674598694, 0.04917401075363159, 0.13019311428070068, 0.21121224761009216, 0.29223138093948364, 0.37325072288513184, 0.4542698264122009, 0.53528892993927, 0.6163080930709839, 0.697327196598053, 0.7783463001251221, 0.8593654632568359, 0.940384566783905, 1.0214036703109741, 1.102422833442688, 1.1834418773651123, 1.2644610404968262, 1.34548020362854, 1.4264992475509644, 1.5075184106826782, 1.5885374546051025, 1.6695566177368164, 1.7505757808685303, 1.8315948247909546, 1.9126139879226685, 1.9936330318450928, 2.0746521949768066, 2.1556713581085205, 2.2366905212402344, 2.317709445953369, 2.398728609085083, 2.479747772216797, 2.5607666969299316, 2.6417858600616455, 2.7228050231933594, 2.8038241863250732, 2.884843349456787, 2.965862512588501]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 8.0, 9.0, 18.0, 16.0, 25.0, 38.0, 46.0, 50.0, 44.0, 55.0, 76.0, 83.0, 72.0, 73.0, 62.0, 40.0, 59.0, 40.0, 48.0, 32.0, 34.0, 23.0, 14.0, 20.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.874143123626709, -3.7888190746307373, -3.7034947872161865, -3.618170738220215, -3.532846689224243, -3.4475226402282715, -3.3621983528137207, -3.276874303817749, -3.1915502548217773, -3.1062262058258057, -3.020901918411255, -2.935577869415283, -2.8502538204193115, -2.76492977142334, -2.679605484008789, -2.5942814350128174, -2.5089571475982666, -2.423633098602295, -2.338308811187744, -2.2529847621917725, -2.167660713195801, -2.08233642578125, -1.9970123767852783, -1.9116883277893066, -1.8263641595840454, -1.7410399913787842, -1.6557159423828125, -1.5703917741775513, -1.48506760597229, -1.3997435569763184, -1.3144193887710571, -1.229095220565796, -1.1437710523605347, -1.0584468841552734, -0.9731228351593018, -0.8877986669540405, -0.8024745583534241, -0.7171504497528076, -0.6318262815475464, -0.5465021729469299, -0.4611780643463135, -0.375853955745697, -0.2905298173427582, -0.20520567893981934, -0.11988157033920288, -0.034557461738586426, 0.050766706466674805, 0.13609081506729126, 0.22141492366790771, 0.30673903226852417, 0.392063170671463, 0.47738730907440186, 0.5627114176750183, 0.6480355262756348, 0.733359694480896, 0.8186838030815125, 0.9040079116821289, 0.9893320202827454, 1.0746561288833618, 1.159980297088623, 1.2453043460845947, 1.330628514289856, 1.4159526824951172, 1.5012767314910889, 1.58660089969635]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 1.0, 4.0, 3.0, 0.0, 7.0, 6.0, 7.0, 4.0, 10.0, 16.0, 47.0, 94.0, 157.0, 390.0, 990.0, 2680.0, 10952.0, 297918.0, 711072.0, 18652.0, 3296.0, 1320.0, 501.0, 206.0, 82.0, 66.0, 31.0, 12.0, 3.0, 3.0, 8.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3466796875, -1.30938720703125, -1.2720947265625, -1.23480224609375, -1.197509765625, -1.16021728515625, -1.1229248046875, -1.08563232421875, -1.04833984375, -1.01104736328125, -0.9737548828125, -0.93646240234375, -0.899169921875, -0.86187744140625, -0.8245849609375, -0.78729248046875, -0.75, -0.71270751953125, -0.6754150390625, -0.63812255859375, -0.600830078125, -0.56353759765625, -0.5262451171875, -0.48895263671875, -0.45166015625, -0.41436767578125, -0.3770751953125, -0.33978271484375, -0.302490234375, -0.26519775390625, -0.2279052734375, -0.19061279296875, -0.1533203125, -0.11602783203125, -0.0787353515625, -0.04144287109375, -0.004150390625, 0.03314208984375, 0.0704345703125, 0.10772705078125, 0.14501953125, 0.18231201171875, 0.2196044921875, 0.25689697265625, 0.294189453125, 0.33148193359375, 0.3687744140625, 0.40606689453125, 0.443359375, 0.48065185546875, 0.5179443359375, 0.55523681640625, 0.592529296875, 0.62982177734375, 0.6671142578125, 0.70440673828125, 0.74169921875, 0.77899169921875, 0.8162841796875, 0.85357666015625, 0.890869140625, 0.92816162109375, 0.9654541015625, 1.00274658203125, 1.0400390625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 13.0, 13.0, 23.0, 27.0, 45.0, 47.0, 62.0, 66.0, 83.0, 103.0, 90.0, 83.0, 76.0, 70.0, 50.0, 46.0, 38.0, 29.0, 16.0, 12.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.162109375, -3.0905914306640625, -3.019073486328125, -2.9475555419921875, -2.87603759765625, -2.8045196533203125, -2.733001708984375, -2.6614837646484375, -2.5899658203125, -2.5184478759765625, -2.446929931640625, -2.3754119873046875, -2.30389404296875, -2.2323760986328125, -2.160858154296875, -2.0893402099609375, -2.017822265625, -1.9463043212890625, -1.874786376953125, -1.8032684326171875, -1.73175048828125, -1.6602325439453125, -1.588714599609375, -1.5171966552734375, -1.4456787109375, -1.3741607666015625, -1.302642822265625, -1.2311248779296875, -1.15960693359375, -1.0880889892578125, -1.016571044921875, -0.9450531005859375, -0.87353515625, -0.8020172119140625, -0.730499267578125, -0.6589813232421875, -0.58746337890625, -0.5159454345703125, -0.444427490234375, -0.3729095458984375, -0.3013916015625, -0.2298736572265625, -0.158355712890625, -0.0868377685546875, -0.01531982421875, 0.0561981201171875, 0.127716064453125, 0.1992340087890625, 0.270751953125, 0.3422698974609375, 0.413787841796875, 0.4853057861328125, 0.55682373046875, 0.6283416748046875, 0.699859619140625, 0.7713775634765625, 0.8428955078125, 0.9144134521484375, 0.985931396484375, 1.0574493408203125, 1.12896728515625, 1.2004852294921875, 1.272003173828125, 1.3435211181640625, 1.4150390625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 10.0, 16.0, 17.0, 26.0, 49.0, 66.0, 91.0, 171.0, 270.0, 366.0, 620.0, 983.0, 1587.0, 2423.0, 3959.0, 6317.0, 10351.0, 17701.0, 29827.0, 52797.0, 94929.0, 160883.0, 216669.0, 184323.0, 113020.0, 62799.0, 35585.0, 20685.0, 12152.0, 7370.0, 4623.0, 2881.0, 1748.0, 1169.0, 769.0, 464.0, 289.0, 184.0, 118.0, 79.0, 59.0, 37.0, 17.0, 19.0, 5.0, 6.0, 12.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.091552734375, -0.08846569061279297, -0.08537864685058594, -0.0822916030883789, -0.07920455932617188, -0.07611751556396484, -0.07303047180175781, -0.06994342803955078, -0.06685638427734375, -0.06376934051513672, -0.06068229675292969, -0.057595252990722656, -0.054508209228515625, -0.051421165466308594, -0.04833412170410156, -0.04524707794189453, -0.0421600341796875, -0.03907299041748047, -0.03598594665527344, -0.032898902893066406, -0.029811859130859375, -0.026724815368652344, -0.023637771606445312, -0.02055072784423828, -0.01746368408203125, -0.014376640319824219, -0.011289596557617188, -0.008202552795410156, -0.005115509033203125, -0.0020284652709960938, 0.0010585784912109375, 0.004145622253417969, 0.007232666015625, 0.010319709777832031, 0.013406753540039062, 0.016493797302246094, 0.019580841064453125, 0.022667884826660156, 0.025754928588867188, 0.02884197235107422, 0.03192901611328125, 0.03501605987548828, 0.03810310363769531, 0.041190147399902344, 0.044277191162109375, 0.047364234924316406, 0.05045127868652344, 0.05353832244873047, 0.0566253662109375, 0.05971240997314453, 0.06279945373535156, 0.0658864974975586, 0.06897354125976562, 0.07206058502197266, 0.07514762878417969, 0.07823467254638672, 0.08132171630859375, 0.08440876007080078, 0.08749580383300781, 0.09058284759521484, 0.09366989135742188, 0.0967569351196289, 0.09984397888183594, 0.10293102264404297, 0.10601806640625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 3.0, 7.0, 4.0, 7.0, 7.0, 4.0, 7.0, 25.0, 20.0, 16.0, 21.0, 19.0, 27.0, 17.0, 27.0, 34.0, 30.0, 49.0, 49.0, 52.0, 44.0, 44.0, 46.0, 48.0, 41.0, 40.0, 34.0, 41.0, 29.0, 31.0, 28.0, 27.0, 25.0, 23.0, 11.0, 15.0, 10.0, 5.0, 7.0, 9.0, 6.0, 7.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.06640625, -2.0072479248046875, -1.948089599609375, -1.8889312744140625, -1.82977294921875, -1.7706146240234375, -1.711456298828125, -1.6522979736328125, -1.5931396484375, -1.5339813232421875, -1.474822998046875, -1.4156646728515625, -1.35650634765625, -1.2973480224609375, -1.238189697265625, -1.1790313720703125, -1.119873046875, -1.0607147216796875, -1.001556396484375, -0.9423980712890625, -0.88323974609375, -0.8240814208984375, -0.764923095703125, -0.7057647705078125, -0.6466064453125, -0.5874481201171875, -0.528289794921875, -0.4691314697265625, -0.40997314453125, -0.3508148193359375, -0.291656494140625, -0.2324981689453125, -0.17333984375, -0.1141815185546875, -0.055023193359375, 0.0041351318359375, 0.06329345703125, 0.1224517822265625, 0.181610107421875, 0.2407684326171875, 0.2999267578125, 0.3590850830078125, 0.418243408203125, 0.4774017333984375, 0.53656005859375, 0.5957183837890625, 0.654876708984375, 0.7140350341796875, 0.773193359375, 0.8323516845703125, 0.891510009765625, 0.9506683349609375, 1.00982666015625, 1.0689849853515625, 1.128143310546875, 1.1873016357421875, 1.2464599609375, 1.3056182861328125, 1.364776611328125, 1.4239349365234375, 1.48309326171875, 1.5422515869140625, 1.601409912109375, 1.6605682373046875, 1.7197265625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 8.0, 6.0, 8.0, 16.0, 9.0, 18.0, 18.0, 31.0, 40.0, 86.0, 117.0, 206.0, 386.0, 697.0, 1530.0, 3358.0, 8228.0, 22344.0, 77690.0, 354284.0, 433845.0, 101261.0, 27010.0, 9611.0, 3974.0, 1801.0, 884.0, 420.0, 222.0, 128.0, 95.0, 63.0, 47.0, 39.0, 20.0, 22.0, 14.0, 7.0, 9.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0230560302734375, -0.022379636764526367, -0.021703243255615234, -0.0210268497467041, -0.02035045623779297, -0.019674062728881836, -0.018997669219970703, -0.01832127571105957, -0.017644882202148438, -0.016968488693237305, -0.016292095184326172, -0.015615701675415039, -0.014939308166503906, -0.014262914657592773, -0.01358652114868164, -0.012910127639770508, -0.012233734130859375, -0.011557340621948242, -0.01088094711303711, -0.010204553604125977, -0.009528160095214844, -0.008851766586303711, -0.008175373077392578, -0.007498979568481445, -0.0068225860595703125, -0.00614619255065918, -0.005469799041748047, -0.004793405532836914, -0.004117012023925781, -0.0034406185150146484, -0.0027642250061035156, -0.002087831497192383, -0.00141143798828125, -0.0007350444793701172, -5.8650970458984375e-05, 0.0006177425384521484, 0.0012941360473632812, 0.001970529556274414, 0.002646923065185547, 0.0033233165740966797, 0.0039997100830078125, 0.004676103591918945, 0.005352497100830078, 0.006028890609741211, 0.006705284118652344, 0.0073816776275634766, 0.00805807113647461, 0.008734464645385742, 0.009410858154296875, 0.010087251663208008, 0.01076364517211914, 0.011440038681030273, 0.012116432189941406, 0.012792825698852539, 0.013469219207763672, 0.014145612716674805, 0.014822006225585938, 0.01549839973449707, 0.016174793243408203, 0.016851186752319336, 0.01752758026123047, 0.0182039737701416, 0.018880367279052734, 0.019556760787963867, 0.020233154296875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 7.0, 7.0, 5.0, 11.0, 11.0, 19.0, 20.0, 30.0, 48.0, 64.0, 43.0, 92.0, 84.0, 82.0, 92.0, 80.0, 83.0, 55.0, 37.0, 26.0, 25.0, 12.0, 17.0, 12.0, 7.0, 5.0, 1.0, 8.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9206275939941406e-05, -2.8141774237155914e-05, -2.7077272534370422e-05, -2.601277083158493e-05, -2.494826912879944e-05, -2.3883767426013947e-05, -2.2819265723228455e-05, -2.1754764020442963e-05, -2.069026231765747e-05, -1.962576061487198e-05, -1.8561258912086487e-05, -1.7496757209300995e-05, -1.6432255506515503e-05, -1.536775380373001e-05, -1.4303252100944519e-05, -1.3238750398159027e-05, -1.2174248695373535e-05, -1.1109746992588043e-05, -1.0045245289802551e-05, -8.98074358701706e-06, -7.916241884231567e-06, -6.8517401814460754e-06, -5.7872384786605835e-06, -4.7227367758750916e-06, -3.6582350730895996e-06, -2.5937333703041077e-06, -1.5292316675186157e-06, -4.647299647331238e-07, 5.997717380523682e-07, 1.6642734408378601e-06, 2.728775143623352e-06, 3.793276846408844e-06, 4.857778549194336e-06, 5.922280251979828e-06, 6.98678195476532e-06, 8.051283657550812e-06, 9.115785360336304e-06, 1.0180287063121796e-05, 1.1244788765907288e-05, 1.230929046869278e-05, 1.3373792171478271e-05, 1.4438293874263763e-05, 1.5502795577049255e-05, 1.6567297279834747e-05, 1.763179898262024e-05, 1.869630068540573e-05, 1.9760802388191223e-05, 2.0825304090976715e-05, 2.1889805793762207e-05, 2.29543074965477e-05, 2.401880919933319e-05, 2.5083310902118683e-05, 2.6147812604904175e-05, 2.7212314307689667e-05, 2.827681601047516e-05, 2.934131771326065e-05, 3.0405819416046143e-05, 3.1470321118831635e-05, 3.2534822821617126e-05, 3.359932452440262e-05, 3.466382622718811e-05, 3.57283279299736e-05, 3.6792829632759094e-05, 3.7857331335544586e-05, 3.892183303833008e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 2.0, 7.0, 4.0, 12.0, 9.0, 11.0, 21.0, 36.0, 25.0, 48.0, 68.0, 128.0, 444.0, 77746.0, 968593.0, 937.0, 166.0, 77.0, 51.0, 46.0, 24.0, 24.0, 15.0, 11.0, 10.0, 9.0, 5.0, 5.0, 5.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1656494140625, -0.16015243530273438, -0.15465545654296875, -0.14915847778320312, -0.1436614990234375, -0.13816452026367188, -0.13266754150390625, -0.12717056274414062, -0.121673583984375, -0.11617660522460938, -0.11067962646484375, -0.10518264770507812, -0.0996856689453125, -0.09418869018554688, -0.08869171142578125, -0.08319473266601562, -0.07769775390625, -0.07220077514648438, -0.06670379638671875, -0.061206817626953125, -0.0557098388671875, -0.050212860107421875, -0.04471588134765625, -0.039218902587890625, -0.033721923828125, -0.028224945068359375, -0.02272796630859375, -0.017230987548828125, -0.0117340087890625, -0.006237030029296875, -0.00074005126953125, 0.004756927490234375, 0.01025390625, 0.015750885009765625, 0.02124786376953125, 0.026744842529296875, 0.0322418212890625, 0.037738800048828125, 0.04323577880859375, 0.048732757568359375, 0.054229736328125, 0.059726715087890625, 0.06522369384765625, 0.07072067260742188, 0.0762176513671875, 0.08171463012695312, 0.08721160888671875, 0.09270858764648438, 0.09820556640625, 0.10370254516601562, 0.10919952392578125, 0.11469650268554688, 0.1201934814453125, 0.12569046020507812, 0.13118743896484375, 0.13668441772460938, 0.142181396484375, 0.14767837524414062, 0.15317535400390625, 0.15867233276367188, 0.1641693115234375, 0.16966629028320312, 0.17516326904296875, 0.18066024780273438, 0.1861572265625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 4.0, 6.0, 13.0, 17.0, 28.0, 37.0, 52.0, 48.0, 76.0, 109.0, 109.0, 115.0, 106.0, 70.0, 50.0, 53.0, 27.0, 21.0, 20.0, 7.0, 12.0, 4.0, 1.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0104522705078125, -0.01012265682220459, -0.00979304313659668, -0.00946342945098877, -0.00913381576538086, -0.00880420207977295, -0.008474588394165039, -0.008144974708557129, -0.007815361022949219, -0.007485747337341309, -0.0071561336517333984, -0.006826519966125488, -0.006496906280517578, -0.006167292594909668, -0.005837678909301758, -0.005508065223693848, -0.0051784515380859375, -0.004848837852478027, -0.004519224166870117, -0.004189610481262207, -0.003859996795654297, -0.0035303831100463867, -0.0032007694244384766, -0.0028711557388305664, -0.0025415420532226562, -0.002211928367614746, -0.001882314682006836, -0.0015527009963989258, -0.0012230873107910156, -0.0008934736251831055, -0.0005638599395751953, -0.00023424625396728516, 9.5367431640625e-05, 0.00042498111724853516, 0.0007545948028564453, 0.0010842084884643555, 0.0014138221740722656, 0.0017434358596801758, 0.002073049545288086, 0.002402663230895996, 0.0027322769165039062, 0.0030618906021118164, 0.0033915042877197266, 0.0037211179733276367, 0.004050731658935547, 0.004380345344543457, 0.004709959030151367, 0.005039572715759277, 0.0053691864013671875, 0.005698800086975098, 0.006028413772583008, 0.006358027458190918, 0.006687641143798828, 0.007017254829406738, 0.0073468685150146484, 0.007676482200622559, 0.008006095886230469, 0.008335709571838379, 0.008665323257446289, 0.0089949369430542, 0.00932455062866211, 0.00965416431427002, 0.00998377799987793, 0.01031339168548584, 0.01064300537109375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 6.0, 2.0, 7.0, 29.0, 103.0, 304.0, 357.0, 139.0, 44.0, 12.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.545940399169922, -2.4200143814086914, -2.29408860206604, -2.1681625843048096, -2.042236804962158, -1.9163107872009277, -1.7903847694396973, -1.6644588708877563, -1.5385329723358154, -1.4126070737838745, -1.2866811752319336, -1.1607551574707031, -1.0348292589187622, -0.9089033603668213, -0.7829774022102356, -0.6570514440536499, -0.531125545501709, -0.4051996171474457, -0.2792736887931824, -0.15334776043891907, -0.02742183208465576, 0.09850406646728516, 0.22443002462387085, 0.35035598278045654, 0.47628188133239746, 0.6022077798843384, 0.7281337380409241, 0.8540596961975098, 0.9799855947494507, 1.1059114933013916, 1.231837511062622, 1.357763409614563, 1.483689785003662, 1.609615683555603, 1.735541582107544, 1.8614675998687744, 1.9873934984207153, 2.1133193969726562, 2.2392454147338867, 2.365171432495117, 2.4910972118377686, 2.617023229598999, 2.7429490089416504, 2.868875026702881, 2.9948010444641113, 3.1207268238067627, 3.246652841567993, 3.3725786209106445, 3.498504638671875, 3.6244306564331055, 3.750356435775757, 3.8762824535369873, 4.002208232879639, 4.128134250640869, 4.2540602684021, 4.37998628616333, 4.505911827087402, 4.631837844848633, 4.757763862609863, 4.8836894035339355, 5.009615421295166, 5.1355414390563965, 5.261467456817627, 5.387393474578857, 5.513319492340088]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 8.0, 8.0, 16.0, 24.0, 27.0, 44.0, 51.0, 57.0, 62.0, 97.0, 89.0, 92.0, 81.0, 56.0, 61.0, 51.0, 56.0, 42.0, 26.0, 22.0, 15.0, 10.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.8317196369171143, -2.769137144088745, -2.706554651260376, -2.643972158432007, -2.5813896656036377, -2.5188071727752686, -2.4562246799468994, -2.3936424255371094, -2.3310599327087402, -2.268477439880371, -2.205894947052002, -2.143312454223633, -2.0807299613952637, -2.0181474685668945, -1.955565094947815, -1.8929826021194458, -1.830399990081787, -1.767817497253418, -1.7052350044250488, -1.6426525115966797, -1.5800700187683105, -1.5174875259399414, -1.4549051523208618, -1.3923226594924927, -1.3297401666641235, -1.2671576738357544, -1.2045751810073853, -1.1419926881790161, -1.0794103145599365, -1.0168278217315674, -0.9542453289031982, -0.8916628360748291, -0.8290802240371704, -0.7664977312088013, -0.7039152383804321, -0.6413328051567078, -0.5787503123283386, -0.5161678194999695, -0.45358535647392273, -0.391002893447876, -0.32842040061950684, -0.2658379077911377, -0.20325544476509094, -0.140672966837883, -0.07809048891067505, -0.015507996082305908, 0.047074466943740845, 0.1096569299697876, 0.17223942279815674, 0.23482190072536469, 0.29740437865257263, 0.3599868416786194, 0.4225693345069885, 0.48515182733535767, 0.547734260559082, 0.6103167533874512, 0.6728992462158203, 0.7354817390441895, 0.7980642318725586, 0.860646665096283, 0.9232291579246521, 0.9858116507530212, 1.0483940839767456, 1.1109765768051147, 1.1735590696334839]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 7.0, 7.0, 11.0, 13.0, 20.0, 22.0, 38.0, 44.0, 77.0, 113.0, 241.0, 354.0, 692.0, 1418.0, 3148.0, 7849.0, 23477.0, 99347.0, 660264.0, 194817.0, 36992.0, 11485.0, 4224.0, 1799.0, 903.0, 484.0, 252.0, 139.0, 106.0, 52.0, 48.0, 18.0, 26.0, 12.0, 14.0, 10.0, 3.0, 6.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-2.173828125, -2.1072998046875, -2.040771484375, -1.9742431640625, -1.90771484375, -1.8411865234375, -1.774658203125, -1.7081298828125, -1.6416015625, -1.5750732421875, -1.508544921875, -1.4420166015625, -1.37548828125, -1.3089599609375, -1.242431640625, -1.1759033203125, -1.109375, -1.0428466796875, -0.976318359375, -0.9097900390625, -0.84326171875, -0.7767333984375, -0.710205078125, -0.6436767578125, -0.5771484375, -0.5106201171875, -0.444091796875, -0.3775634765625, -0.31103515625, -0.2445068359375, -0.177978515625, -0.1114501953125, -0.044921875, 0.0216064453125, 0.088134765625, 0.1546630859375, 0.22119140625, 0.2877197265625, 0.354248046875, 0.4207763671875, 0.4873046875, 0.5538330078125, 0.620361328125, 0.6868896484375, 0.75341796875, 0.8199462890625, 0.886474609375, 0.9530029296875, 1.01953125, 1.0860595703125, 1.152587890625, 1.2191162109375, 1.28564453125, 1.3521728515625, 1.418701171875, 1.4852294921875, 1.5517578125, 1.6182861328125, 1.684814453125, 1.7513427734375, 1.81787109375, 1.8843994140625, 1.950927734375, 2.0174560546875, 2.083984375]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 4.0, 7.0, 7.0, 13.0, 27.0, 26.0, 46.0, 36.0, 53.0, 81.0, 83.0, 102.0, 89.0, 87.0, 67.0, 71.0, 59.0, 47.0, 37.0, 24.0, 19.0, 12.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.734375, -15.274658203125, -14.81494140625, -14.355224609375, -13.8955078125, -13.435791015625, -12.97607421875, -12.516357421875, -12.056640625, -11.596923828125, -11.13720703125, -10.677490234375, -10.2177734375, -9.758056640625, -9.29833984375, -8.838623046875, -8.37890625, -7.919189453125, -7.45947265625, -6.999755859375, -6.5400390625, -6.080322265625, -5.62060546875, -5.160888671875, -4.701171875, -4.241455078125, -3.78173828125, -3.322021484375, -2.8623046875, -2.402587890625, -1.94287109375, -1.483154296875, -1.0234375, -0.563720703125, -0.10400390625, 0.355712890625, 0.8154296875, 1.275146484375, 1.73486328125, 2.194580078125, 2.654296875, 3.114013671875, 3.57373046875, 4.033447265625, 4.4931640625, 4.952880859375, 5.41259765625, 5.872314453125, 6.33203125, 6.791748046875, 7.25146484375, 7.711181640625, 8.1708984375, 8.630615234375, 9.09033203125, 9.550048828125, 10.009765625, 10.469482421875, 10.92919921875, 11.388916015625, 11.8486328125, 12.308349609375, 12.76806640625, 13.227783203125, 13.6875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 6.0, 6.0, 4.0, 10.0, 9.0, 19.0, 23.0, 25.0, 45.0, 59.0, 77.0, 109.0, 1116.0, 1046433.0, 252.0, 105.0, 68.0, 55.0, 37.0, 32.0, 17.0, 15.0, 7.0, 8.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-48.9375, -47.51123046875, -46.0849609375, -44.65869140625, -43.232421875, -41.80615234375, -40.3798828125, -38.95361328125, -37.52734375, -36.10107421875, -34.6748046875, -33.24853515625, -31.822265625, -30.39599609375, -28.9697265625, -27.54345703125, -26.1171875, -24.69091796875, -23.2646484375, -21.83837890625, -20.412109375, -18.98583984375, -17.5595703125, -16.13330078125, -14.70703125, -13.28076171875, -11.8544921875, -10.42822265625, -9.001953125, -7.57568359375, -6.1494140625, -4.72314453125, -3.296875, -1.87060546875, -0.4443359375, 0.98193359375, 2.408203125, 3.83447265625, 5.2607421875, 6.68701171875, 8.11328125, 9.53955078125, 10.9658203125, 12.39208984375, 13.818359375, 15.24462890625, 16.6708984375, 18.09716796875, 19.5234375, 20.94970703125, 22.3759765625, 23.80224609375, 25.228515625, 26.65478515625, 28.0810546875, 29.50732421875, 30.93359375, 32.35986328125, 33.7861328125, 35.21240234375, 36.638671875, 38.06494140625, 39.4912109375, 40.91748046875, 42.34375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 6.0, 7.0, 3.0, 10.0, 9.0, 20.0, 22.0, 28.0, 45.0, 57.0, 72.0, 84.0, 97.0, 111.0, 96.0, 81.0, 63.0, 57.0, 38.0, 33.0, 16.0, 15.0, 7.0, 9.0, 6.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.5625, -18.991943359375, -18.42138671875, -17.850830078125, -17.2802734375, -16.709716796875, -16.13916015625, -15.568603515625, -14.998046875, -14.427490234375, -13.85693359375, -13.286376953125, -12.7158203125, -12.145263671875, -11.57470703125, -11.004150390625, -10.43359375, -9.863037109375, -9.29248046875, -8.721923828125, -8.1513671875, -7.580810546875, -7.01025390625, -6.439697265625, -5.869140625, -5.298583984375, -4.72802734375, -4.157470703125, -3.5869140625, -3.016357421875, -2.44580078125, -1.875244140625, -1.3046875, -0.734130859375, -0.16357421875, 0.406982421875, 0.9775390625, 1.548095703125, 2.11865234375, 2.689208984375, 3.259765625, 3.830322265625, 4.40087890625, 4.971435546875, 5.5419921875, 6.112548828125, 6.68310546875, 7.253662109375, 7.82421875, 8.394775390625, 8.96533203125, 9.535888671875, 10.1064453125, 10.677001953125, 11.24755859375, 11.818115234375, 12.388671875, 12.959228515625, 13.52978515625, 14.100341796875, 14.6708984375, 15.241455078125, 15.81201171875, 16.382568359375, 16.953125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 7.0, 11.0, 5.0, 15.0, 20.0, 51.0, 73.0, 164.0, 433.0, 2562.0, 148773.0, 890879.0, 4547.0, 586.0, 198.0, 102.0, 37.0, 34.0, 22.0, 9.0, 14.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81103515625, -0.7891769409179688, -0.7673187255859375, -0.7454605102539062, -0.723602294921875, -0.7017440795898438, -0.6798858642578125, -0.6580276489257812, -0.63616943359375, -0.6143112182617188, -0.5924530029296875, -0.5705947875976562, -0.548736572265625, -0.5268783569335938, -0.5050201416015625, -0.48316192626953125, -0.4613037109375, -0.43944549560546875, -0.4175872802734375, -0.39572906494140625, -0.373870849609375, -0.35201263427734375, -0.3301544189453125, -0.30829620361328125, -0.28643798828125, -0.26457977294921875, -0.2427215576171875, -0.22086334228515625, -0.199005126953125, -0.17714691162109375, -0.1552886962890625, -0.13343048095703125, -0.111572265625, -0.08971405029296875, -0.0678558349609375, -0.04599761962890625, -0.024139404296875, -0.00228118896484375, 0.0195770263671875, 0.04143524169921875, 0.06329345703125, 0.08515167236328125, 0.1070098876953125, 0.12886810302734375, 0.150726318359375, 0.17258453369140625, 0.1944427490234375, 0.21630096435546875, 0.2381591796875, 0.26001739501953125, 0.2818756103515625, 0.30373382568359375, 0.325592041015625, 0.34745025634765625, 0.3693084716796875, 0.39116668701171875, 0.41302490234375, 0.43488311767578125, 0.4567413330078125, 0.47859954833984375, 0.500457763671875, 0.5223159790039062, 0.5441741943359375, 0.5660324096679688, 0.587890625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 6.0, 8.0, 10.0, 18.0, 24.0, 49.0, 108.0, 333.0, 189.0, 103.0, 33.0, 29.0, 16.0, 10.0, 5.0, 10.0, 2.0, 6.0, 3.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-9.66191291809082e-05, -9.367614984512329e-05, -9.073317050933838e-05, -8.779019117355347e-05, -8.484721183776855e-05, -8.190423250198364e-05, -7.896125316619873e-05, -7.601827383041382e-05, -7.30752944946289e-05, -7.0132315158844e-05, -6.718933582305908e-05, -6.424635648727417e-05, -6.130337715148926e-05, -5.8360397815704346e-05, -5.5417418479919434e-05, -5.247443914413452e-05, -4.953145980834961e-05, -4.65884804725647e-05, -4.3645501136779785e-05, -4.070252180099487e-05, -3.775954246520996e-05, -3.481656312942505e-05, -3.187358379364014e-05, -2.8930604457855225e-05, -2.5987625122070312e-05, -2.30446457862854e-05, -2.0101666450500488e-05, -1.7158687114715576e-05, -1.4215707778930664e-05, -1.1272728443145752e-05, -8.32974910736084e-06, -5.386769771575928e-06, -2.4437904357910156e-06, 4.991888999938965e-07, 3.4421682357788086e-06, 6.385147571563721e-06, 9.328126907348633e-06, 1.2271106243133545e-05, 1.5214085578918457e-05, 1.815706491470337e-05, 2.110004425048828e-05, 2.4043023586273193e-05, 2.6986002922058105e-05, 2.9928982257843018e-05, 3.287196159362793e-05, 3.581494092941284e-05, 3.8757920265197754e-05, 4.1700899600982666e-05, 4.464387893676758e-05, 4.758685827255249e-05, 5.05298376083374e-05, 5.3472816944122314e-05, 5.6415796279907227e-05, 5.935877561569214e-05, 6.230175495147705e-05, 6.524473428726196e-05, 6.818771362304688e-05, 7.113069295883179e-05, 7.40736722946167e-05, 7.701665163040161e-05, 7.995963096618652e-05, 8.290261030197144e-05, 8.584558963775635e-05, 8.878856897354126e-05, 9.173154830932617e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 8.0, 8.0, 14.0, 20.0, 34.0, 45.0, 53.0, 145.0, 333.0, 904.0, 5352.0, 129962.0, 897971.0, 11364.0, 1508.0, 391.0, 180.0, 100.0, 64.0, 37.0, 18.0, 15.0, 13.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52197265625, -0.505218505859375, -0.48846435546875, -0.471710205078125, -0.4549560546875, -0.438201904296875, -0.42144775390625, -0.404693603515625, -0.387939453125, -0.371185302734375, -0.35443115234375, -0.337677001953125, -0.3209228515625, -0.304168701171875, -0.28741455078125, -0.270660400390625, -0.25390625, -0.237152099609375, -0.22039794921875, -0.203643798828125, -0.1868896484375, -0.170135498046875, -0.15338134765625, -0.136627197265625, -0.119873046875, -0.103118896484375, -0.08636474609375, -0.069610595703125, -0.0528564453125, -0.036102294921875, -0.01934814453125, -0.002593994140625, 0.01416015625, 0.030914306640625, 0.04766845703125, 0.064422607421875, 0.0811767578125, 0.097930908203125, 0.11468505859375, 0.131439208984375, 0.148193359375, 0.164947509765625, 0.18170166015625, 0.198455810546875, 0.2152099609375, 0.231964111328125, 0.24871826171875, 0.265472412109375, 0.2822265625, 0.298980712890625, 0.31573486328125, 0.332489013671875, 0.3492431640625, 0.365997314453125, 0.38275146484375, 0.399505615234375, 0.416259765625, 0.433013916015625, 0.44976806640625, 0.466522216796875, 0.4832763671875, 0.500030517578125, 0.51678466796875, 0.533538818359375, 0.55029296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 13.0, 7.0, 14.0, 15.0, 19.0, 29.0, 36.0, 49.0, 85.0, 146.0, 239.0, 94.0, 73.0, 55.0, 39.0, 17.0, 16.0, 14.0, 11.0, 8.0, 4.0, 8.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06890869140625, -0.06593704223632812, -0.06296539306640625, -0.059993743896484375, -0.0570220947265625, -0.054050445556640625, -0.05107879638671875, -0.048107147216796875, -0.045135498046875, -0.042163848876953125, -0.03919219970703125, -0.036220550537109375, -0.0332489013671875, -0.030277252197265625, -0.02730560302734375, -0.024333953857421875, -0.0213623046875, -0.018390655517578125, -0.01541900634765625, -0.012447357177734375, -0.0094757080078125, -0.006504058837890625, -0.00353240966796875, -0.000560760498046875, 0.002410888671875, 0.005382537841796875, 0.00835418701171875, 0.011325836181640625, 0.0142974853515625, 0.017269134521484375, 0.02024078369140625, 0.023212432861328125, 0.02618408203125, 0.029155731201171875, 0.03212738037109375, 0.035099029541015625, 0.0380706787109375, 0.041042327880859375, 0.04401397705078125, 0.046985626220703125, 0.049957275390625, 0.052928924560546875, 0.05590057373046875, 0.058872222900390625, 0.0618438720703125, 0.06481552124023438, 0.06778717041015625, 0.07075881958007812, 0.07373046875, 0.07670211791992188, 0.07967376708984375, 0.08264541625976562, 0.0856170654296875, 0.08858871459960938, 0.09156036376953125, 0.09453201293945312, 0.097503662109375, 0.10047531127929688, 0.10344696044921875, 0.10641860961914062, 0.1093902587890625, 0.11236190795898438, 0.11533355712890625, 0.11830520629882812, 0.12127685546875]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [6.0, 972.0, 44.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3044328689575195, -0.9227868318557739, 0.4588592052459717, 1.8405051231384277, 3.222151279449463, 4.603797435760498, 5.985443115234375, 7.36708927154541, 8.748735427856445, 10.13038158416748, 11.512027740478516, 12.893672943115234, 14.275320053100586, 15.656965255737305, 17.038612365722656, 18.420257568359375, 19.801902770996094, 21.183547973632812, 22.565195083618164, 23.946840286254883, 25.328487396240234, 26.710132598876953, 28.091777801513672, 29.473424911499023, 30.855072021484375, 32.236717224121094, 33.61836242675781, 35.0000114440918, 36.381656646728516, 37.763301849365234, 39.14494705200195, 40.52659606933594, 41.90823745727539, 43.28988265991211, 44.67152786254883, 46.05317687988281, 47.43482208251953, 48.81646728515625, 50.19811248779297, 51.57975769042969, 52.96140670776367, 54.34305191040039, 55.72469711303711, 57.106346130371094, 58.48799133300781, 59.86963653564453, 61.25128173828125, 62.63292694091797, 64.01457214355469, 65.3962173461914, 66.77786254882812, 68.15950775146484, 69.54115295410156, 70.92280578613281, 72.30445098876953, 73.68609619140625, 75.06774139404297, 76.44938659667969, 77.8310317993164, 79.21267700195312, 80.59432220458984, 81.9759750366211, 83.35762023925781, 84.73926544189453, 86.12091064453125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 8.0, 9.0, 8.0, 7.0, 9.0, 7.0, 20.0, 17.0, 12.0, 22.0, 34.0, 23.0, 43.0, 27.0, 39.0, 37.0, 35.0, 48.0, 36.0, 57.0, 43.0, 59.0, 46.0, 39.0, 42.0, 37.0, 32.0, 34.0, 24.0, 12.0, 26.0, 17.0, 16.0, 11.0, 13.0, 11.0, 16.0, 6.0, 5.0, 4.0, 2.0, 1.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-11.732352256774902, -11.355462074279785, -10.978571891784668, -10.60168170928955, -10.224791526794434, -9.847901344299316, -9.471010208129883, -9.094120025634766, -8.717229843139648, -8.340339660644531, -7.963449478149414, -7.586559295654297, -7.20966911315918, -6.8327789306640625, -6.455888271331787, -6.07899808883667, -5.702108383178711, -5.325218200683594, -4.948328018188477, -4.571437835693359, -4.194547653198242, -3.817657232284546, -3.4407668113708496, -3.0638766288757324, -2.6869864463806152, -2.310096263885498, -1.9332059621810913, -1.5563156604766846, -1.1794254779815674, -0.8025352954864502, -0.4256448745727539, -0.04875469207763672, 0.3281364440917969, 0.7050266861915588, 1.0819169282913208, 1.4588072299957275, 1.8356974124908447, 2.212587594985962, 2.589478015899658, 2.9663681983947754, 3.3432583808898926, 3.7201485633850098, 4.097038745880127, 4.473929405212402, 4.8508195877075195, 5.227709770202637, 5.604599952697754, 5.981490135192871, 6.358380317687988, 6.7352705001831055, 7.112160682678223, 7.48905086517334, 7.865941047668457, 8.242831230163574, 8.619722366333008, 8.996612548828125, 9.373502731323242, 9.75039291381836, 10.127283096313477, 10.504173278808594, 10.881063461303711, 11.257953643798828, 11.634843826293945, 12.011734008789062, 12.38862419128418]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 9.0, 13.0, 15.0, 14.0, 25.0, 28.0, 33.0, 45.0, 75.0, 80.0, 95.0, 9809.0, 4182750.0, 914.0, 84.0, 65.0, 54.0, 42.0, 28.0, 25.0, 21.0, 20.0, 20.0, 8.0, 7.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5546875, -9.0853271484375, -8.615966796875, -8.1466064453125, -7.67724609375, -7.2078857421875, -6.738525390625, -6.2691650390625, -5.7998046875, -5.3304443359375, -4.861083984375, -4.3917236328125, -3.92236328125, -3.4530029296875, -2.983642578125, -2.5142822265625, -2.044921875, -1.5755615234375, -1.106201171875, -0.6368408203125, -0.16748046875, 0.3018798828125, 0.771240234375, 1.2406005859375, 1.7099609375, 2.1793212890625, 2.648681640625, 3.1180419921875, 3.58740234375, 4.0567626953125, 4.526123046875, 4.9954833984375, 5.46484375, 5.9342041015625, 6.403564453125, 6.8729248046875, 7.34228515625, 7.8116455078125, 8.281005859375, 8.7503662109375, 9.2197265625, 9.6890869140625, 10.158447265625, 10.6278076171875, 11.09716796875, 11.5665283203125, 12.035888671875, 12.5052490234375, 12.974609375, 13.4439697265625, 13.913330078125, 14.3826904296875, 14.85205078125, 15.3214111328125, 15.790771484375, 16.2601318359375, 16.7294921875, 17.1988525390625, 17.668212890625, 18.1375732421875, 18.60693359375, 19.0762939453125, 19.545654296875, 20.0150146484375, 20.484375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 9.0, 16.0, 17.0, 21.0, 37.0, 56.0, 60.0, 82.0, 82.0, 83.0, 94.0, 92.0, 76.0, 72.0, 47.0, 49.0, 33.0, 20.0, 19.0, 16.0, 9.0, 3.0, 8.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9384765625, -1.882080078125, -1.82568359375, -1.769287109375, -1.712890625, -1.656494140625, -1.60009765625, -1.543701171875, -1.4873046875, -1.430908203125, -1.37451171875, -1.318115234375, -1.26171875, -1.205322265625, -1.14892578125, -1.092529296875, -1.0361328125, -0.979736328125, -0.92333984375, -0.866943359375, -0.810546875, -0.754150390625, -0.69775390625, -0.641357421875, -0.5849609375, -0.528564453125, -0.47216796875, -0.415771484375, -0.359375, -0.302978515625, -0.24658203125, -0.190185546875, -0.1337890625, -0.077392578125, -0.02099609375, 0.035400390625, 0.091796875, 0.148193359375, 0.20458984375, 0.260986328125, 0.3173828125, 0.373779296875, 0.43017578125, 0.486572265625, 0.54296875, 0.599365234375, 0.65576171875, 0.712158203125, 0.7685546875, 0.824951171875, 0.88134765625, 0.937744140625, 0.994140625, 1.050537109375, 1.10693359375, 1.163330078125, 1.2197265625, 1.276123046875, 1.33251953125, 1.388916015625, 1.4453125, 1.501708984375, 1.55810546875, 1.614501953125, 1.6708984375]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 8.0, 14.0, 21.0, 29.0, 46.0, 77.0, 125.0, 221.0, 368.0, 1300.0, 4190828.0, 519.0, 267.0, 164.0, 104.0, 64.0, 36.0, 24.0, 12.0, 11.0, 11.0, 5.0, 2.0, 2.0, 3.0, 1.0, 8.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.1875, -29.95458984375, -28.7216796875, -27.48876953125, -26.255859375, -25.02294921875, -23.7900390625, -22.55712890625, -21.32421875, -20.09130859375, -18.8583984375, -17.62548828125, -16.392578125, -15.15966796875, -13.9267578125, -12.69384765625, -11.4609375, -10.22802734375, -8.9951171875, -7.76220703125, -6.529296875, -5.29638671875, -4.0634765625, -2.83056640625, -1.59765625, -0.36474609375, 0.8681640625, 2.10107421875, 3.333984375, 4.56689453125, 5.7998046875, 7.03271484375, 8.265625, 9.49853515625, 10.7314453125, 11.96435546875, 13.197265625, 14.43017578125, 15.6630859375, 16.89599609375, 18.12890625, 19.36181640625, 20.5947265625, 21.82763671875, 23.060546875, 24.29345703125, 25.5263671875, 26.75927734375, 27.9921875, 29.22509765625, 30.4580078125, 31.69091796875, 32.923828125, 34.15673828125, 35.3896484375, 36.62255859375, 37.85546875, 39.08837890625, 40.3212890625, 41.55419921875, 42.787109375, 44.02001953125, 45.2529296875, 46.48583984375, 47.71875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 1.0, 5.0, 8.0, 9.0, 12.0, 21.0, 26.0, 44.0, 51.0, 99.0, 169.0, 316.0, 590.0, 748.0, 739.0, 520.0, 299.0, 154.0, 82.0, 58.0, 27.0, 26.0, 16.0, 14.0, 14.0, 5.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.67138671875, -0.6549797058105469, -0.6385726928710938, -0.6221656799316406, -0.6057586669921875, -0.5893516540527344, -0.5729446411132812, -0.5565376281738281, -0.540130615234375, -0.5237236022949219, -0.5073165893554688, -0.4909095764160156, -0.4745025634765625, -0.4580955505371094, -0.44168853759765625, -0.4252815246582031, -0.40887451171875, -0.3924674987792969, -0.37606048583984375, -0.3596534729003906, -0.3432464599609375, -0.3268394470214844, -0.31043243408203125, -0.2940254211425781, -0.277618408203125, -0.2612113952636719, -0.24480438232421875, -0.22839736938476562, -0.2119903564453125, -0.19558334350585938, -0.17917633056640625, -0.16276931762695312, -0.1463623046875, -0.12995529174804688, -0.11354827880859375, -0.09714126586914062, -0.0807342529296875, -0.06432723999023438, -0.04792022705078125, -0.031513214111328125, -0.015106201171875, 0.001300811767578125, 0.01770782470703125, 0.034114837646484375, 0.0505218505859375, 0.06692886352539062, 0.08333587646484375, 0.09974288940429688, 0.11614990234375, 0.13255691528320312, 0.14896392822265625, 0.16537094116210938, 0.1817779541015625, 0.19818496704101562, 0.21459197998046875, 0.23099899291992188, 0.247406005859375, 0.2638130187988281, 0.28022003173828125, 0.2966270446777344, 0.3130340576171875, 0.3294410705566406, 0.34584808349609375, 0.3622550964355469, 0.378662109375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 17.0, 12.0, 22.0, 26.0, 39.0, 52.0, 83.0, 107.0, 149.0, 127.0, 113.0, 72.0, 63.0, 44.0, 31.0, 17.0, 6.0, 3.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.536605954170227, -1.4837275743484497, -1.4308491945266724, -1.377970814704895, -1.3250924348831177, -1.2722140550613403, -1.219335675239563, -1.1664572954177856, -1.1135789155960083, -1.060700535774231, -1.0078221559524536, -0.9549437761306763, -0.9020653963088989, -0.8491870164871216, -0.7963086366653442, -0.7434302568435669, -0.6905518174171448, -0.6376734375953674, -0.5847950577735901, -0.5319166779518127, -0.4790382981300354, -0.42615988850593567, -0.3732815086841583, -0.320403128862381, -0.26752474904060364, -0.2146463692188263, -0.16176798939704895, -0.10888959467411041, -0.05601121485233307, -0.0031328201293945312, 0.04974555969238281, 0.10262393951416016, 0.1555023193359375, 0.20838069915771484, 0.2612590789794922, 0.31413745880126953, 0.3670158386230469, 0.4198942482471466, 0.47277262806892395, 0.5256509780883789, 0.5785293579101562, 0.6314077377319336, 0.6842861175537109, 0.7371644973754883, 0.7900428771972656, 0.842921257019043, 0.8957996368408203, 0.9486780166625977, 1.001556396484375, 1.0544347763061523, 1.1073131561279297, 1.160191535949707, 1.2130699157714844, 1.2659482955932617, 1.318826675415039, 1.3717050552368164, 1.4245835542678833, 1.4774619340896606, 1.530340313911438, 1.5832186937332153, 1.6360970735549927, 1.68897545337677, 1.7418538331985474, 1.7947322130203247, 1.847610592842102]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 11.0, 18.0, 12.0, 15.0, 24.0, 32.0, 42.0, 45.0, 42.0, 51.0, 61.0, 62.0, 71.0, 61.0, 66.0, 53.0, 51.0, 53.0, 43.0, 31.0, 33.0, 29.0, 22.0, 19.0, 13.0, 11.0, 6.0, 9.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.6558738946914673, -1.6129295825958252, -1.569985270500183, -1.527040958404541, -1.4840967655181885, -1.4411524534225464, -1.3982081413269043, -1.3552638292312622, -1.3123195171356201, -1.269375205039978, -1.226430892944336, -1.1834865808486938, -1.1405422687530518, -1.0975980758666992, -1.0546537637710571, -1.011709451675415, -0.968765139579773, -0.9258208274841309, -0.8828765153884888, -0.8399322628974915, -0.7969879508018494, -0.7540436387062073, -0.71109938621521, -0.6681550741195679, -0.6252107620239258, -0.5822664499282837, -0.5393221378326416, -0.4963778853416443, -0.4534335732460022, -0.4104892611503601, -0.3675449788570404, -0.3246006965637207, -0.28165650367736816, -0.23871220648288727, -0.19576790928840637, -0.15282361209392548, -0.10987931489944458, -0.06693501770496368, -0.023990720510482788, 0.018953561782836914, 0.061897873878479004, 0.1048421710729599, 0.1477864682674408, 0.1907307654619217, 0.2336750626564026, 0.2766193747520447, 0.3195636570453644, 0.3625079393386841, 0.40545225143432617, 0.44839656352996826, 0.49134084582328796, 0.5342851281166077, 0.5772294402122498, 0.6201737523078918, 0.6631180047988892, 0.7060623168945312, 0.7490066289901733, 0.7919509410858154, 0.8348952531814575, 0.8778395056724548, 0.9207838177680969, 0.963728129863739, 1.0066723823547363, 1.0496166944503784, 1.0925610065460205]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 6.0, 6.0, 12.0, 6.0, 18.0, 34.0, 36.0, 66.0, 97.0, 183.0, 328.0, 607.0, 1138.0, 2090.0, 4380.0, 12949.0, 102359.0, 784358.0, 116398.0, 14240.0, 4466.0, 2173.0, 1166.0, 601.0, 363.0, 187.0, 100.0, 65.0, 35.0, 26.0, 26.0, 6.0, 7.0, 11.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.396240234375, -0.3832588195800781, -0.37027740478515625, -0.3572959899902344, -0.3443145751953125, -0.3313331604003906, -0.31835174560546875, -0.3053703308105469, -0.292388916015625, -0.2794075012207031, -0.26642608642578125, -0.2534446716308594, -0.2404632568359375, -0.22748184204101562, -0.21450042724609375, -0.20151901245117188, -0.18853759765625, -0.17555618286132812, -0.16257476806640625, -0.14959335327148438, -0.1366119384765625, -0.12363052368164062, -0.11064910888671875, -0.09766769409179688, -0.084686279296875, -0.07170486450195312, -0.05872344970703125, -0.045742034912109375, -0.0327606201171875, -0.019779205322265625, -0.00679779052734375, 0.006183624267578125, 0.0191650390625, 0.032146453857421875, 0.04512786865234375, 0.058109283447265625, 0.0710906982421875, 0.08407211303710938, 0.09705352783203125, 0.11003494262695312, 0.123016357421875, 0.13599777221679688, 0.14897918701171875, 0.16196060180664062, 0.1749420166015625, 0.18792343139648438, 0.20090484619140625, 0.21388626098632812, 0.22686767578125, 0.23984909057617188, 0.25283050537109375, 0.2658119201660156, 0.2787933349609375, 0.2917747497558594, 0.30475616455078125, 0.3177375793457031, 0.330718994140625, 0.3437004089355469, 0.35668182373046875, 0.3696632385253906, 0.3826446533203125, 0.3956260681152344, 0.40860748291015625, 0.4215888977050781, 0.4345703125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 4.0, 17.0, 16.0, 12.0, 29.0, 33.0, 33.0, 43.0, 56.0, 50.0, 62.0, 73.0, 77.0, 61.0, 75.0, 66.0, 60.0, 46.0, 37.0, 37.0, 28.0, 27.0, 12.0, 16.0, 14.0, 7.0, 5.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1015625, -1.070892333984375, -1.04022216796875, -1.009552001953125, -0.9788818359375, -0.948211669921875, -0.91754150390625, -0.886871337890625, -0.856201171875, -0.825531005859375, -0.79486083984375, -0.764190673828125, -0.7335205078125, -0.702850341796875, -0.67218017578125, -0.641510009765625, -0.61083984375, -0.580169677734375, -0.54949951171875, -0.518829345703125, -0.4881591796875, -0.457489013671875, -0.42681884765625, -0.396148681640625, -0.365478515625, -0.334808349609375, -0.30413818359375, -0.273468017578125, -0.2427978515625, -0.212127685546875, -0.18145751953125, -0.150787353515625, -0.1201171875, -0.089447021484375, -0.05877685546875, -0.028106689453125, 0.0025634765625, 0.033233642578125, 0.06390380859375, 0.094573974609375, 0.125244140625, 0.155914306640625, 0.18658447265625, 0.217254638671875, 0.2479248046875, 0.278594970703125, 0.30926513671875, 0.339935302734375, 0.37060546875, 0.401275634765625, 0.43194580078125, 0.462615966796875, 0.4932861328125, 0.523956298828125, 0.55462646484375, 0.585296630859375, 0.615966796875, 0.646636962890625, 0.67730712890625, 0.707977294921875, 0.7386474609375, 0.769317626953125, 0.79998779296875, 0.830657958984375, 0.861328125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 4.0, 9.0, 10.0, 22.0, 26.0, 43.0, 77.0, 91.0, 169.0, 296.0, 501.0, 978.0, 2062.0, 4175.0, 9915.0, 23412.0, 57465.0, 145814.0, 303933.0, 283311.0, 128391.0, 51045.0, 20472.0, 8667.0, 3870.0, 1818.0, 879.0, 440.0, 262.0, 140.0, 101.0, 63.0, 33.0, 22.0, 14.0, 11.0, 10.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1029052734375, -0.09987258911132812, -0.09683990478515625, -0.09380722045898438, -0.0907745361328125, -0.08774185180664062, -0.08470916748046875, -0.08167648315429688, -0.078643798828125, -0.07561111450195312, -0.07257843017578125, -0.06954574584960938, -0.0665130615234375, -0.06348037719726562, -0.06044769287109375, -0.057415008544921875, -0.05438232421875, -0.051349639892578125, -0.04831695556640625, -0.045284271240234375, -0.0422515869140625, -0.039218902587890625, -0.03618621826171875, -0.033153533935546875, -0.030120849609375, -0.027088165283203125, -0.02405548095703125, -0.021022796630859375, -0.0179901123046875, -0.014957427978515625, -0.01192474365234375, -0.008892059326171875, -0.005859375, -0.002826690673828125, 0.00020599365234375, 0.003238677978515625, 0.0062713623046875, 0.009304046630859375, 0.01233673095703125, 0.015369415283203125, 0.018402099609375, 0.021434783935546875, 0.02446746826171875, 0.027500152587890625, 0.0305328369140625, 0.033565521240234375, 0.03659820556640625, 0.039630889892578125, 0.04266357421875, 0.045696258544921875, 0.04872894287109375, 0.051761627197265625, 0.0547943115234375, 0.057826995849609375, 0.06085968017578125, 0.06389236450195312, 0.066925048828125, 0.06995773315429688, 0.07299041748046875, 0.07602310180664062, 0.0790557861328125, 0.08208847045898438, 0.08512115478515625, 0.08815383911132812, 0.0911865234375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 6.0, 5.0, 8.0, 9.0, 18.0, 19.0, 30.0, 31.0, 34.0, 49.0, 47.0, 48.0, 65.0, 48.0, 59.0, 57.0, 50.0, 47.0, 51.0, 52.0, 47.0, 46.0, 39.0, 32.0, 30.0, 13.0, 15.0, 10.0, 14.0, 11.0, 6.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.365234375, -1.3192901611328125, -1.273345947265625, -1.2274017333984375, -1.18145751953125, -1.1355133056640625, -1.089569091796875, -1.0436248779296875, -0.9976806640625, -0.9517364501953125, -0.905792236328125, -0.8598480224609375, -0.81390380859375, -0.7679595947265625, -0.722015380859375, -0.6760711669921875, -0.630126953125, -0.5841827392578125, -0.538238525390625, -0.4922943115234375, -0.44635009765625, -0.4004058837890625, -0.354461669921875, -0.3085174560546875, -0.2625732421875, -0.2166290283203125, -0.170684814453125, -0.1247406005859375, -0.07879638671875, -0.0328521728515625, 0.013092041015625, 0.0590362548828125, 0.10498046875, 0.1509246826171875, 0.196868896484375, 0.2428131103515625, 0.28875732421875, 0.3347015380859375, 0.380645751953125, 0.4265899658203125, 0.4725341796875, 0.5184783935546875, 0.564422607421875, 0.6103668212890625, 0.65631103515625, 0.7022552490234375, 0.748199462890625, 0.7941436767578125, 0.840087890625, 0.8860321044921875, 0.931976318359375, 0.9779205322265625, 1.02386474609375, 1.0698089599609375, 1.115753173828125, 1.1616973876953125, 1.2076416015625, 1.2535858154296875, 1.299530029296875, 1.3454742431640625, 1.39141845703125, 1.4373626708984375, 1.483306884765625, 1.5292510986328125, 1.5751953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 8.0, 4.0, 10.0, 14.0, 30.0, 38.0, 44.0, 76.0, 147.0, 226.0, 428.0, 847.0, 1952.0, 4661.0, 13284.0, 54412.0, 339269.0, 511267.0, 90541.0, 19837.0, 6236.0, 2622.0, 1187.0, 640.0, 303.0, 175.0, 102.0, 66.0, 37.0, 26.0, 17.0, 18.0, 12.0, 6.0, 1.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0176239013671875, -0.017019271850585938, -0.016414642333984375, -0.015810012817382812, -0.01520538330078125, -0.014600753784179688, -0.013996124267578125, -0.013391494750976562, -0.012786865234375, -0.012182235717773438, -0.011577606201171875, -0.010972976684570312, -0.01036834716796875, -0.009763717651367188, -0.009159088134765625, -0.008554458618164062, -0.0079498291015625, -0.0073451995849609375, -0.006740570068359375, -0.0061359405517578125, -0.00553131103515625, -0.0049266815185546875, -0.004322052001953125, -0.0037174224853515625, -0.00311279296875, -0.0025081634521484375, -0.001903533935546875, -0.0012989044189453125, -0.00069427490234375, -8.96453857421875e-05, 0.000514984130859375, 0.0011196136474609375, 0.0017242431640625, 0.0023288726806640625, 0.002933502197265625, 0.0035381317138671875, 0.00414276123046875, 0.0047473907470703125, 0.005352020263671875, 0.0059566497802734375, 0.006561279296875, 0.0071659088134765625, 0.007770538330078125, 0.008375167846679688, 0.00897979736328125, 0.009584426879882812, 0.010189056396484375, 0.010793685913085938, 0.0113983154296875, 0.012002944946289062, 0.012607574462890625, 0.013212203979492188, 0.01381683349609375, 0.014421463012695312, 0.015026092529296875, 0.015630722045898438, 0.0162353515625, 0.016839981079101562, 0.017444610595703125, 0.018049240112304688, 0.01865386962890625, 0.019258499145507812, 0.019863128662109375, 0.020467758178710938, 0.0210723876953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 8.0, 8.0, 17.0, 27.0, 32.0, 39.0, 62.0, 80.0, 104.0, 113.0, 130.0, 105.0, 77.0, 62.0, 34.0, 36.0, 17.0, 7.0, 13.0, 9.0, 3.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8967857360839844e-05, -2.7962960302829742e-05, -2.695806324481964e-05, -2.595316618680954e-05, -2.494826912879944e-05, -2.3943372070789337e-05, -2.2938475012779236e-05, -2.1933577954769135e-05, -2.0928680896759033e-05, -1.9923783838748932e-05, -1.891888678073883e-05, -1.791398972272873e-05, -1.6909092664718628e-05, -1.5904195606708527e-05, -1.4899298548698425e-05, -1.3894401490688324e-05, -1.2889504432678223e-05, -1.1884607374668121e-05, -1.087971031665802e-05, -9.874813258647919e-06, -8.869916200637817e-06, -7.865019142627716e-06, -6.860122084617615e-06, -5.8552250266075134e-06, -4.850327968597412e-06, -3.845430910587311e-06, -2.8405338525772095e-06, -1.8356367945671082e-06, -8.307397365570068e-07, 1.7415732145309448e-07, 1.1790543794631958e-06, 2.183951437473297e-06, 3.1888484954833984e-06, 4.1937455534935e-06, 5.198642611503601e-06, 6.203539669513702e-06, 7.208436727523804e-06, 8.213333785533905e-06, 9.218230843544006e-06, 1.0223127901554108e-05, 1.1228024959564209e-05, 1.223292201757431e-05, 1.3237819075584412e-05, 1.4242716133594513e-05, 1.5247613191604614e-05, 1.6252510249614716e-05, 1.7257407307624817e-05, 1.8262304365634918e-05, 1.926720142364502e-05, 2.027209848165512e-05, 2.1276995539665222e-05, 2.2281892597675323e-05, 2.3286789655685425e-05, 2.4291686713695526e-05, 2.5296583771705627e-05, 2.630148082971573e-05, 2.730637788772583e-05, 2.831127494573593e-05, 2.9316172003746033e-05, 3.0321069061756134e-05, 3.1325966119766235e-05, 3.233086317777634e-05, 3.333576023578644e-05, 3.434065729379654e-05, 3.534555435180664e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 6.0, 15.0, 9.0, 10.0, 20.0, 30.0, 56.0, 124.0, 765.0, 1045549.0, 1647.0, 136.0, 67.0, 34.0, 28.0, 10.0, 15.0, 9.0, 10.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.138916015625, -0.13451576232910156, -0.13011550903320312, -0.1257152557373047, -0.12131500244140625, -0.11691474914550781, -0.11251449584960938, -0.10811424255371094, -0.1037139892578125, -0.09931373596191406, -0.09491348266601562, -0.09051322937011719, -0.08611297607421875, -0.08171272277832031, -0.07731246948242188, -0.07291221618652344, -0.068511962890625, -0.06411170959472656, -0.059711456298828125, -0.05531120300292969, -0.05091094970703125, -0.04651069641113281, -0.042110443115234375, -0.03771018981933594, -0.0333099365234375, -0.028909683227539062, -0.024509429931640625, -0.020109176635742188, -0.01570892333984375, -0.011308670043945312, -0.006908416748046875, -0.0025081634521484375, 0.00189208984375, 0.0062923431396484375, 0.010692596435546875, 0.015092849731445312, 0.01949310302734375, 0.023893356323242188, 0.028293609619140625, 0.03269386291503906, 0.0370941162109375, 0.04149436950683594, 0.045894622802734375, 0.05029487609863281, 0.05469512939453125, 0.05909538269042969, 0.06349563598632812, 0.06789588928222656, 0.072296142578125, 0.07669639587402344, 0.08109664916992188, 0.08549690246582031, 0.08989715576171875, 0.09429740905761719, 0.09869766235351562, 0.10309791564941406, 0.1074981689453125, 0.11189842224121094, 0.11629867553710938, 0.12069892883300781, 0.12509918212890625, 0.1294994354248047, 0.13389968872070312, 0.13829994201660156, 0.1427001953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 5.0, 11.0, 14.0, 20.0, 24.0, 29.0, 45.0, 69.0, 104.0, 121.0, 132.0, 115.0, 76.0, 62.0, 51.0, 30.0, 28.0, 15.0, 9.0, 10.0, 9.0, 3.0, 2.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005886077880859375, -0.005692720413208008, -0.005499362945556641, -0.0053060054779052734, -0.005112648010253906, -0.004919290542602539, -0.004725933074951172, -0.004532575607299805, -0.0043392181396484375, -0.00414586067199707, -0.003952503204345703, -0.003759145736694336, -0.0035657882690429688, -0.0033724308013916016, -0.0031790733337402344, -0.002985715866088867, -0.0027923583984375, -0.002599000930786133, -0.0024056434631347656, -0.0022122859954833984, -0.0020189285278320312, -0.001825571060180664, -0.0016322135925292969, -0.0014388561248779297, -0.0012454986572265625, -0.0010521411895751953, -0.0008587837219238281, -0.0006654262542724609, -0.00047206878662109375, -0.00027871131896972656, -8.535385131835938e-05, 0.00010800361633300781, 0.000301361083984375, 0.0004947185516357422, 0.0006880760192871094, 0.0008814334869384766, 0.0010747909545898438, 0.001268148422241211, 0.0014615058898925781, 0.0016548633575439453, 0.0018482208251953125, 0.0020415782928466797, 0.002234935760498047, 0.002428293228149414, 0.0026216506958007812, 0.0028150081634521484, 0.0030083656311035156, 0.003201723098754883, 0.00339508056640625, 0.003588438034057617, 0.0037817955017089844, 0.0039751529693603516, 0.004168510437011719, 0.004361867904663086, 0.004555225372314453, 0.00474858283996582, 0.0049419403076171875, 0.005135297775268555, 0.005328655242919922, 0.005522012710571289, 0.005715370178222656, 0.0059087276458740234, 0.006102085113525391, 0.006295442581176758, 0.006488800048828125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 14.0, 21.0, 28.0, 62.0, 100.0, 161.0, 218.0, 166.0, 98.0, 76.0, 25.0, 15.0, 7.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.863788902759552, -0.8171229362487793, -0.7704570293426514, -0.7237911224365234, -0.6771251559257507, -0.630459189414978, -0.5837932825088501, -0.5371273756027222, -0.49046140909194946, -0.44379547238349915, -0.39712953567504883, -0.3504635989665985, -0.3037976622581482, -0.2571317255496979, -0.21046578884124756, -0.16379985213279724, -0.11713391542434692, -0.0704679787158966, -0.02380204200744629, 0.02286389470100403, 0.06952983140945435, 0.11619576811790466, 0.16286170482635498, 0.2095276415348053, 0.2561935782432556, 0.30285951495170593, 0.34952545166015625, 0.39619138836860657, 0.4428573250770569, 0.4895232617855072, 0.5361891984939575, 0.5828551054000854, 0.6295211315155029, 0.6761870384216309, 0.7228530049324036, 0.7695189714431763, 0.8161848783493042, 0.8628507852554321, 0.9095167517662048, 0.9561827182769775, 1.0028486251831055, 1.0495145320892334, 1.0961804389953613, 1.1428464651107788, 1.1895123720169067, 1.2361782789230347, 1.2828443050384521, 1.32951021194458, 1.376176118850708, 1.422842025756836, 1.4695079326629639, 1.5161739587783813, 1.5628398656845093, 1.6095057725906372, 1.6561717987060547, 1.7028377056121826, 1.7495036125183105, 1.7961695194244385, 1.8428354263305664, 1.8895014524459839, 1.9361673593521118, 1.9828332662582397, 2.0294992923736572, 2.076165199279785, 2.122831106185913]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 11.0, 14.0, 12.0, 13.0, 15.0, 31.0, 32.0, 37.0, 49.0, 48.0, 59.0, 72.0, 66.0, 71.0, 70.0, 62.0, 55.0, 53.0, 43.0, 39.0, 34.0, 23.0, 27.0, 19.0, 13.0, 12.0, 3.0, 8.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.0241647958755493, -0.9969033002853394, -0.9696418642997742, -0.9423803687095642, -0.915118932723999, -0.8878574371337891, -0.8605959415435791, -0.8333345055580139, -0.8060730695724487, -0.7788115739822388, -0.7515501379966736, -0.7242886424064636, -0.6970272064208984, -0.6697657108306885, -0.6425042152404785, -0.6152427792549133, -0.5879812836647034, -0.5607197880744934, -0.5334583520889282, -0.5061968564987183, -0.4789354205131531, -0.4516739249229431, -0.42441245913505554, -0.39715099334716797, -0.3698895275592804, -0.3426280617713928, -0.31536659598350525, -0.2881051301956177, -0.2608436346054077, -0.23358218371868134, -0.20632070302963257, -0.179059237241745, -0.15179777145385742, -0.12453630566596985, -0.09727483242750168, -0.07001335918903351, -0.042751893401145935, -0.015490427613258362, 0.011771053075790405, 0.03903251886367798, 0.06629398465156555, 0.09355545043945312, 0.1208169236779213, 0.14807839691638947, 0.17533986270427704, 0.2026013284921646, 0.22986280918121338, 0.25712427496910095, 0.2843857407569885, 0.3116472065448761, 0.33890867233276367, 0.36617016792297363, 0.3934316039085388, 0.4206930994987488, 0.44795456528663635, 0.4752160310745239, 0.5024775266647339, 0.5297390222549438, 0.557000458240509, 0.584261953830719, 0.6115233898162842, 0.6387848854064941, 0.6660463809967041, 0.6933078169822693, 0.7205692529678345]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 1.0, 6.0, 10.0, 8.0, 13.0, 21.0, 24.0, 37.0, 82.0, 139.0, 208.0, 320.0, 541.0, 1024.0, 1910.0, 4697.0, 14413.0, 60355.0, 434540.0, 445381.0, 61050.0, 14501.0, 4833.0, 2024.0, 993.0, 549.0, 318.0, 202.0, 105.0, 84.0, 52.0, 36.0, 21.0, 20.0, 7.0, 8.0, 7.0, 5.0, 0.0, 4.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3955078125, -0.38275146484375, -0.3699951171875, -0.35723876953125, -0.344482421875, -0.33172607421875, -0.3189697265625, -0.30621337890625, -0.29345703125, -0.28070068359375, -0.2679443359375, -0.25518798828125, -0.242431640625, -0.22967529296875, -0.2169189453125, -0.20416259765625, -0.19140625, -0.17864990234375, -0.1658935546875, -0.15313720703125, -0.140380859375, -0.12762451171875, -0.1148681640625, -0.10211181640625, -0.08935546875, -0.07659912109375, -0.0638427734375, -0.05108642578125, -0.038330078125, -0.02557373046875, -0.0128173828125, -6.103515625e-05, 0.0126953125, 0.02545166015625, 0.0382080078125, 0.05096435546875, 0.063720703125, 0.07647705078125, 0.0892333984375, 0.10198974609375, 0.11474609375, 0.12750244140625, 0.1402587890625, 0.15301513671875, 0.165771484375, 0.17852783203125, 0.1912841796875, 0.20404052734375, 0.216796875, 0.22955322265625, 0.2423095703125, 0.25506591796875, 0.267822265625, 0.28057861328125, 0.2933349609375, 0.30609130859375, 0.31884765625, 0.33160400390625, 0.3443603515625, 0.35711669921875, 0.369873046875, 0.38262939453125, 0.3953857421875, 0.40814208984375, 0.4208984375]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 8.0, 18.0, 11.0, 20.0, 27.0, 29.0, 33.0, 38.0, 55.0, 61.0, 57.0, 74.0, 61.0, 58.0, 63.0, 65.0, 49.0, 53.0, 46.0, 25.0, 34.0, 29.0, 17.0, 17.0, 15.0, 9.0, 5.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.34375, -4.238006591796875, -4.13226318359375, -4.026519775390625, -3.9207763671875, -3.815032958984375, -3.70928955078125, -3.603546142578125, -3.497802734375, -3.392059326171875, -3.28631591796875, -3.180572509765625, -3.0748291015625, -2.969085693359375, -2.86334228515625, -2.757598876953125, -2.65185546875, -2.546112060546875, -2.44036865234375, -2.334625244140625, -2.2288818359375, -2.123138427734375, -2.01739501953125, -1.911651611328125, -1.805908203125, -1.700164794921875, -1.59442138671875, -1.488677978515625, -1.3829345703125, -1.277191162109375, -1.17144775390625, -1.065704345703125, -0.9599609375, -0.854217529296875, -0.74847412109375, -0.642730712890625, -0.5369873046875, -0.431243896484375, -0.32550048828125, -0.219757080078125, -0.114013671875, -0.008270263671875, 0.09747314453125, 0.203216552734375, 0.3089599609375, 0.414703369140625, 0.52044677734375, 0.626190185546875, 0.73193359375, 0.837677001953125, 0.94342041015625, 1.049163818359375, 1.1549072265625, 1.260650634765625, 1.36639404296875, 1.472137451171875, 1.577880859375, 1.683624267578125, 1.78936767578125, 1.895111083984375, 2.0008544921875, 2.106597900390625, 2.21234130859375, 2.318084716796875, 2.423828125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 5.0, 8.0, 7.0, 9.0, 10.0, 12.0, 13.0, 22.0, 21.0, 11.0, 16.0, 39.0, 23.0, 28.0, 42.0, 43.0, 39.0, 50.0, 152.0, 1046342.0, 1204.0, 35.0, 61.0, 37.0, 29.0, 41.0, 37.0, 38.0, 20.0, 26.0, 16.0, 17.0, 17.0, 17.0, 12.0, 9.0, 12.0, 12.0, 9.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.625, -11.27001953125, -10.9150390625, -10.56005859375, -10.205078125, -9.85009765625, -9.4951171875, -9.14013671875, -8.78515625, -8.43017578125, -8.0751953125, -7.72021484375, -7.365234375, -7.01025390625, -6.6552734375, -6.30029296875, -5.9453125, -5.59033203125, -5.2353515625, -4.88037109375, -4.525390625, -4.17041015625, -3.8154296875, -3.46044921875, -3.10546875, -2.75048828125, -2.3955078125, -2.04052734375, -1.685546875, -1.33056640625, -0.9755859375, -0.62060546875, -0.265625, 0.08935546875, 0.4443359375, 0.79931640625, 1.154296875, 1.50927734375, 1.8642578125, 2.21923828125, 2.57421875, 2.92919921875, 3.2841796875, 3.63916015625, 3.994140625, 4.34912109375, 4.7041015625, 5.05908203125, 5.4140625, 5.76904296875, 6.1240234375, 6.47900390625, 6.833984375, 7.18896484375, 7.5439453125, 7.89892578125, 8.25390625, 8.60888671875, 8.9638671875, 9.31884765625, 9.673828125, 10.02880859375, 10.3837890625, 10.73876953125, 11.09375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 8.0, 8.0, 6.0, 7.0, 12.0, 14.0, 12.0, 21.0, 17.0, 18.0, 19.0, 36.0, 24.0, 26.0, 49.0, 35.0, 39.0, 48.0, 48.0, 62.0, 44.0, 33.0, 57.0, 37.0, 32.0, 45.0, 31.0, 36.0, 20.0, 25.0, 15.0, 18.0, 19.0, 13.0, 11.0, 14.0, 13.0, 9.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.498046875, -2.42144775390625, -2.3448486328125, -2.26824951171875, -2.191650390625, -2.11505126953125, -2.0384521484375, -1.96185302734375, -1.88525390625, -1.80865478515625, -1.7320556640625, -1.65545654296875, -1.578857421875, -1.50225830078125, -1.4256591796875, -1.34906005859375, -1.2724609375, -1.19586181640625, -1.1192626953125, -1.04266357421875, -0.966064453125, -0.88946533203125, -0.8128662109375, -0.73626708984375, -0.65966796875, -0.58306884765625, -0.5064697265625, -0.42987060546875, -0.353271484375, -0.27667236328125, -0.2000732421875, -0.12347412109375, -0.046875, 0.02972412109375, 0.1063232421875, 0.18292236328125, 0.259521484375, 0.33612060546875, 0.4127197265625, 0.48931884765625, 0.56591796875, 0.64251708984375, 0.7191162109375, 0.79571533203125, 0.872314453125, 0.94891357421875, 1.0255126953125, 1.10211181640625, 1.1787109375, 1.25531005859375, 1.3319091796875, 1.40850830078125, 1.485107421875, 1.56170654296875, 1.6383056640625, 1.71490478515625, 1.79150390625, 1.86810302734375, 1.9447021484375, 2.02130126953125, 2.097900390625, 2.17449951171875, 2.2510986328125, 2.32769775390625, 2.404296875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 6.0, 10.0, 16.0, 28.0, 15.0, 29.0, 53.0, 96.0, 227.0, 594.0, 2198.0, 11296.0, 138658.0, 865893.0, 23938.0, 3936.0, 926.0, 296.0, 118.0, 74.0, 40.0, 30.0, 11.0, 15.0, 8.0, 8.0, 5.0, 5.0, 8.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2030029296875, -0.1968860626220703, -0.19076919555664062, -0.18465232849121094, -0.17853546142578125, -0.17241859436035156, -0.16630172729492188, -0.1601848602294922, -0.1540679931640625, -0.1479511260986328, -0.14183425903320312, -0.13571739196777344, -0.12960052490234375, -0.12348365783691406, -0.11736679077148438, -0.11124992370605469, -0.105133056640625, -0.09901618957519531, -0.09289932250976562, -0.08678245544433594, -0.08066558837890625, -0.07454872131347656, -0.06843185424804688, -0.06231498718261719, -0.0561981201171875, -0.05008125305175781, -0.043964385986328125, -0.03784751892089844, -0.03173065185546875, -0.025613784790039062, -0.019496917724609375, -0.013380050659179688, -0.00726318359375, -0.0011463165283203125, 0.004970550537109375, 0.011087417602539062, 0.01720428466796875, 0.023321151733398438, 0.029438018798828125, 0.03555488586425781, 0.0416717529296875, 0.04778861999511719, 0.053905487060546875, 0.06002235412597656, 0.06613922119140625, 0.07225608825683594, 0.07837295532226562, 0.08448982238769531, 0.090606689453125, 0.09672355651855469, 0.10284042358398438, 0.10895729064941406, 0.11507415771484375, 0.12119102478027344, 0.12730789184570312, 0.1334247589111328, 0.1395416259765625, 0.1456584930419922, 0.15177536010742188, 0.15789222717285156, 0.16400909423828125, 0.17012596130371094, 0.17624282836914062, 0.1823596954345703, 0.1884765625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 9.0, 6.0, 10.0, 14.0, 16.0, 36.0, 63.0, 196.0, 375.0, 120.0, 51.0, 27.0, 18.0, 7.0, 6.0, 2.0, 6.0, 9.0, 4.0, 2.0, 3.0, 4.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.765655517578125e-05, -2.693384885787964e-05, -2.6211142539978027e-05, -2.5488436222076416e-05, -2.4765729904174805e-05, -2.4043023586273193e-05, -2.3320317268371582e-05, -2.259761095046997e-05, -2.187490463256836e-05, -2.1152198314666748e-05, -2.0429491996765137e-05, -1.9706785678863525e-05, -1.8984079360961914e-05, -1.8261373043060303e-05, -1.753866672515869e-05, -1.681596040725708e-05, -1.609325408935547e-05, -1.5370547771453857e-05, -1.4647841453552246e-05, -1.3925135135650635e-05, -1.3202428817749023e-05, -1.2479722499847412e-05, -1.17570161819458e-05, -1.103430986404419e-05, -1.0311603546142578e-05, -9.588897228240967e-06, -8.866190910339355e-06, -8.143484592437744e-06, -7.420778274536133e-06, -6.6980719566345215e-06, -5.97536563873291e-06, -5.252659320831299e-06, -4.5299530029296875e-06, -3.807246685028076e-06, -3.084540367126465e-06, -2.3618340492248535e-06, -1.6391277313232422e-06, -9.164214134216309e-07, -1.9371509552001953e-07, 5.289912223815918e-07, 1.2516975402832031e-06, 1.9744038581848145e-06, 2.6971101760864258e-06, 3.419816493988037e-06, 4.1425228118896484e-06, 4.86522912979126e-06, 5.587935447692871e-06, 6.310641765594482e-06, 7.033348083496094e-06, 7.756054401397705e-06, 8.478760719299316e-06, 9.201467037200928e-06, 9.924173355102539e-06, 1.064687967300415e-05, 1.1369585990905762e-05, 1.2092292308807373e-05, 1.2814998626708984e-05, 1.3537704944610596e-05, 1.4260411262512207e-05, 1.4983117580413818e-05, 1.570582389831543e-05, 1.642853021621704e-05, 1.7151236534118652e-05, 1.7873942852020264e-05, 1.8596649169921875e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 2.0, 2.0, 4.0, 6.0, 3.0, 5.0, 9.0, 13.0, 13.0, 29.0, 33.0, 50.0, 82.0, 154.0, 318.0, 595.0, 1326.0, 3044.0, 8440.0, 31655.0, 431447.0, 523643.0, 32792.0, 8899.0, 3306.0, 1342.0, 625.0, 301.0, 157.0, 109.0, 45.0, 38.0, 12.0, 12.0, 10.0, 9.0, 3.0, 7.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1275634765625, -0.12357902526855469, -0.11959457397460938, -0.11561012268066406, -0.11162567138671875, -0.10764122009277344, -0.10365676879882812, -0.09967231750488281, -0.0956878662109375, -0.09170341491699219, -0.08771896362304688, -0.08373451232910156, -0.07975006103515625, -0.07576560974121094, -0.07178115844726562, -0.06779670715332031, -0.063812255859375, -0.05982780456542969, -0.055843353271484375, -0.05185890197753906, -0.04787445068359375, -0.04388999938964844, -0.039905548095703125, -0.03592109680175781, -0.0319366455078125, -0.027952194213867188, -0.023967742919921875, -0.019983291625976562, -0.01599884033203125, -0.012014389038085938, -0.008029937744140625, -0.0040454864501953125, -6.103515625e-05, 0.0039234161376953125, 0.007907867431640625, 0.011892318725585938, 0.01587677001953125, 0.019861221313476562, 0.023845672607421875, 0.027830123901367188, 0.0318145751953125, 0.03579902648925781, 0.039783477783203125, 0.04376792907714844, 0.04775238037109375, 0.05173683166503906, 0.055721282958984375, 0.05970573425292969, 0.063690185546875, 0.06767463684082031, 0.07165908813476562, 0.07564353942871094, 0.07962799072265625, 0.08361244201660156, 0.08759689331054688, 0.09158134460449219, 0.0955657958984375, 0.09955024719238281, 0.10353469848632812, 0.10751914978027344, 0.11150360107421875, 0.11548805236816406, 0.11947250366210938, 0.12345695495605469, 0.12744140625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 4.0, 5.0, 10.0, 10.0, 9.0, 12.0, 22.0, 25.0, 30.0, 43.0, 65.0, 180.0, 263.0, 111.0, 54.0, 34.0, 23.0, 22.0, 14.0, 12.0, 8.0, 5.0, 4.0, 6.0, 5.0, 3.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.04339599609375, -0.042093753814697266, -0.04079151153564453, -0.0394892692565918, -0.03818702697753906, -0.03688478469848633, -0.035582542419433594, -0.03428030014038086, -0.032978057861328125, -0.03167581558227539, -0.030373573303222656, -0.029071331024169922, -0.027769088745117188, -0.026466846466064453, -0.02516460418701172, -0.023862361907958984, -0.02256011962890625, -0.021257877349853516, -0.01995563507080078, -0.018653392791748047, -0.017351150512695312, -0.016048908233642578, -0.014746665954589844, -0.01344442367553711, -0.012142181396484375, -0.01083993911743164, -0.009537696838378906, -0.008235454559326172, -0.0069332122802734375, -0.005630970001220703, -0.004328727722167969, -0.0030264854431152344, -0.0017242431640625, -0.0004220008850097656, 0.0008802413940429688, 0.002182483673095703, 0.0034847259521484375, 0.004786968231201172, 0.006089210510253906, 0.007391452789306641, 0.008693695068359375, 0.00999593734741211, 0.011298179626464844, 0.012600421905517578, 0.013902664184570312, 0.015204906463623047, 0.01650714874267578, 0.017809391021728516, 0.01911163330078125, 0.020413875579833984, 0.02171611785888672, 0.023018360137939453, 0.024320602416992188, 0.025622844696044922, 0.026925086975097656, 0.02822732925415039, 0.029529571533203125, 0.03083181381225586, 0.032134056091308594, 0.03343629837036133, 0.03473854064941406, 0.0360407829284668, 0.03734302520751953, 0.038645267486572266, 0.039947509765625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 11.0, 21.0, 57.0, 148.0, 344.0, 262.0, 127.0, 26.0, 13.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4022542238235474, -1.2432342767715454, -1.084214448928833, -0.925194501876831, -0.7661745548248291, -0.6071546077728271, -0.44813472032546997, -0.2891148328781128, -0.13009488582611084, 0.028925031423568726, 0.1879449486732483, 0.34696486592292786, 0.5059847831726074, 0.6650047302246094, 0.8240246176719666, 0.9830445051193237, 1.1420644521713257, 1.3010843992233276, 1.46010422706604, 1.619124174118042, 1.778144121170044, 1.937164068222046, 2.096184015274048, 2.2552037239074707, 2.4142236709594727, 2.5732436180114746, 2.7322635650634766, 2.8912835121154785, 3.0503034591674805, 3.2093234062194824, 3.3683431148529053, 3.5273630619049072, 3.6863832473754883, 3.8454031944274902, 4.004423141479492, 4.163443088531494, 4.322463035583496, 4.481482982635498, 4.6405029296875, 4.799522399902344, 4.958542823791504, 5.117562770843506, 5.276582717895508, 5.43560266494751, 5.594622611999512, 5.753642559051514, 5.912662506103516, 6.071681976318359, 6.230701923370361, 6.389721870422363, 6.548741817474365, 6.707761764526367, 6.866781711578369, 7.025801658630371, 7.184821605682373, 7.343841552734375, 7.502861022949219, 7.661880970001221, 7.820900917053223, 7.979920864105225, 8.138940811157227, 8.29796028137207, 8.45698070526123, 8.616000175476074, 8.775020599365234]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 9.0, 3.0, 9.0, 10.0, 18.0, 16.0, 20.0, 23.0, 30.0, 35.0, 32.0, 46.0, 39.0, 51.0, 50.0, 55.0, 50.0, 45.0, 53.0, 51.0, 43.0, 37.0, 29.0, 34.0, 44.0, 28.0, 32.0, 26.0, 20.0, 18.0, 5.0, 8.0, 10.0, 7.0, 3.0, 6.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.359638690948486, -4.236175060272217, -4.112711429595947, -3.9892477989196777, -3.8657844066619873, -3.7423207759857178, -3.6188571453094482, -3.4953935146331787, -3.3719301223754883, -3.2484664916992188, -3.125002861022949, -3.0015392303466797, -2.8780758380889893, -2.7546122074127197, -2.63114857673645, -2.5076849460601807, -2.384221315383911, -2.2607576847076416, -2.137294054031372, -2.0138306617736816, -1.890367031097412, -1.7669034004211426, -1.643439769744873, -1.5199761390686035, -1.3965126276016235, -1.273048996925354, -1.149585485458374, -1.0261218547821045, -0.9026582837104797, -0.779194712638855, -0.6557310819625854, -0.5322675108909607, -0.40880393981933594, -0.2853403687477112, -0.16187676787376404, -0.038413166999816895, 0.08505040407180786, 0.20851397514343262, 0.33197760581970215, 0.4554411768913269, 0.5789047479629517, 0.7023683190345764, 0.8258318901062012, 0.9492955207824707, 1.0727591514587402, 1.1962226629257202, 1.3196862936019897, 1.4431498050689697, 1.5666134357452393, 1.6900770664215088, 1.8135405778884888, 1.9370042085647583, 2.0604677200317383, 2.183931350708008, 2.3073949813842773, 2.430858612060547, 2.5543222427368164, 2.677785873413086, 2.8012495040893555, 2.924713134765625, 3.0481765270233154, 3.171640157699585, 3.2951037883758545, 3.418567419052124, 3.5420308113098145]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 4.0, 4.0, 8.0, 11.0, 9.0, 15.0, 19.0, 31.0, 44.0, 45.0, 91.0, 138.0, 239.0, 411.0, 931.0, 2344.0, 9193.0, 61619.0, 1948612.0, 2084997.0, 68394.0, 11057.0, 3667.0, 1273.0, 464.0, 252.0, 123.0, 82.0, 64.0, 32.0, 39.0, 16.0, 12.0, 13.0, 10.0, 5.0, 6.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0859375, -2.0246124267578125, -1.963287353515625, -1.9019622802734375, -1.84063720703125, -1.7793121337890625, -1.717987060546875, -1.6566619873046875, -1.5953369140625, -1.5340118408203125, -1.472686767578125, -1.4113616943359375, -1.35003662109375, -1.2887115478515625, -1.227386474609375, -1.1660614013671875, -1.104736328125, -1.0434112548828125, -0.982086181640625, -0.9207611083984375, -0.85943603515625, -0.7981109619140625, -0.736785888671875, -0.6754608154296875, -0.6141357421875, -0.5528106689453125, -0.491485595703125, -0.4301605224609375, -0.36883544921875, -0.3075103759765625, -0.246185302734375, -0.1848602294921875, -0.12353515625, -0.0622100830078125, -0.000885009765625, 0.0604400634765625, 0.12176513671875, 0.1830902099609375, 0.244415283203125, 0.3057403564453125, 0.3670654296875, 0.4283905029296875, 0.489715576171875, 0.5510406494140625, 0.61236572265625, 0.6736907958984375, 0.735015869140625, 0.7963409423828125, 0.857666015625, 0.9189910888671875, 0.980316162109375, 1.0416412353515625, 1.10296630859375, 1.1642913818359375, 1.225616455078125, 1.2869415283203125, 1.3482666015625, 1.4095916748046875, 1.470916748046875, 1.5322418212890625, 1.59356689453125, 1.6548919677734375, 1.716217041015625, 1.7775421142578125, 1.8388671875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 9.0, 16.0, 14.0, 20.0, 30.0, 43.0, 48.0, 85.0, 92.0, 94.0, 105.0, 99.0, 93.0, 70.0, 66.0, 43.0, 27.0, 17.0, 16.0, 7.0, 9.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7109375, -1.6696319580078125, -1.628326416015625, -1.5870208740234375, -1.54571533203125, -1.5044097900390625, -1.463104248046875, -1.4217987060546875, -1.3804931640625, -1.3391876220703125, -1.297882080078125, -1.2565765380859375, -1.21527099609375, -1.1739654541015625, -1.132659912109375, -1.0913543701171875, -1.050048828125, -1.0087432861328125, -0.967437744140625, -0.9261322021484375, -0.88482666015625, -0.8435211181640625, -0.802215576171875, -0.7609100341796875, -0.7196044921875, -0.6782989501953125, -0.636993408203125, -0.5956878662109375, -0.55438232421875, -0.5130767822265625, -0.471771240234375, -0.4304656982421875, -0.38916015625, -0.3478546142578125, -0.306549072265625, -0.2652435302734375, -0.22393798828125, -0.1826324462890625, -0.141326904296875, -0.1000213623046875, -0.0587158203125, -0.0174102783203125, 0.023895263671875, 0.0652008056640625, 0.10650634765625, 0.1478118896484375, 0.189117431640625, 0.2304229736328125, 0.271728515625, 0.3130340576171875, 0.354339599609375, 0.3956451416015625, 0.43695068359375, 0.4782562255859375, 0.519561767578125, 0.5608673095703125, 0.6021728515625, 0.6434783935546875, 0.684783935546875, 0.7260894775390625, 0.76739501953125, 0.8087005615234375, 0.850006103515625, 0.8913116455078125, 0.9326171875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 4.0, 6.0, 2.0, 5.0, 11.0, 13.0, 21.0, 29.0, 53.0, 111.0, 209.0, 639.0, 3405.0, 77881.0, 4064693.0, 43795.0, 2589.0, 420.0, 177.0, 77.0, 46.0, 27.0, 20.0, 12.0, 16.0, 8.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.841796875, -3.733367919921875, -3.62493896484375, -3.516510009765625, -3.4080810546875, -3.299652099609375, -3.19122314453125, -3.082794189453125, -2.974365234375, -2.865936279296875, -2.75750732421875, -2.649078369140625, -2.5406494140625, -2.432220458984375, -2.32379150390625, -2.215362548828125, -2.10693359375, -1.998504638671875, -1.89007568359375, -1.781646728515625, -1.6732177734375, -1.564788818359375, -1.45635986328125, -1.347930908203125, -1.239501953125, -1.131072998046875, -1.02264404296875, -0.914215087890625, -0.8057861328125, -0.697357177734375, -0.58892822265625, -0.480499267578125, -0.3720703125, -0.263641357421875, -0.15521240234375, -0.046783447265625, 0.0616455078125, 0.170074462890625, 0.27850341796875, 0.386932373046875, 0.495361328125, 0.603790283203125, 0.71221923828125, 0.820648193359375, 0.9290771484375, 1.037506103515625, 1.14593505859375, 1.254364013671875, 1.36279296875, 1.471221923828125, 1.57965087890625, 1.688079833984375, 1.7965087890625, 1.904937744140625, 2.01336669921875, 2.121795654296875, 2.230224609375, 2.338653564453125, 2.44708251953125, 2.555511474609375, 2.6639404296875, 2.772369384765625, 2.88079833984375, 2.989227294921875, 3.09765625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 8.0, 9.0, 12.0, 12.0, 23.0, 21.0, 20.0, 42.0, 63.0, 87.0, 153.0, 302.0, 658.0, 895.0, 755.0, 419.0, 210.0, 126.0, 70.0, 56.0, 42.0, 28.0, 24.0, 16.0, 6.0, 6.0, 2.0, 4.0, 0.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.398681640625, -0.3848114013671875, -0.370941162109375, -0.3570709228515625, -0.34320068359375, -0.3293304443359375, -0.315460205078125, -0.3015899658203125, -0.2877197265625, -0.2738494873046875, -0.259979248046875, -0.2461090087890625, -0.23223876953125, -0.2183685302734375, -0.204498291015625, -0.1906280517578125, -0.1767578125, -0.1628875732421875, -0.149017333984375, -0.1351470947265625, -0.12127685546875, -0.1074066162109375, -0.093536376953125, -0.0796661376953125, -0.0657958984375, -0.0519256591796875, -0.038055419921875, -0.0241851806640625, -0.01031494140625, 0.0035552978515625, 0.017425537109375, 0.0312957763671875, 0.045166015625, 0.0590362548828125, 0.072906494140625, 0.0867767333984375, 0.10064697265625, 0.1145172119140625, 0.128387451171875, 0.1422576904296875, 0.1561279296875, 0.1699981689453125, 0.183868408203125, 0.1977386474609375, 0.21160888671875, 0.2254791259765625, 0.239349365234375, 0.2532196044921875, 0.26708984375, 0.2809600830078125, 0.294830322265625, 0.3087005615234375, 0.32257080078125, 0.3364410400390625, 0.350311279296875, 0.3641815185546875, 0.3780517578125, 0.3919219970703125, 0.405792236328125, 0.4196624755859375, 0.43353271484375, 0.4474029541015625, 0.461273193359375, 0.4751434326171875, 0.489013671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 3.0, 6.0, 16.0, 8.0, 13.0, 21.0, 24.0, 39.0, 56.0, 75.0, 83.0, 82.0, 90.0, 116.0, 95.0, 63.0, 65.0, 40.0, 36.0, 17.0, 13.0, 15.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2112107276916504, -1.1741975545883179, -1.1371842622756958, -1.1001710891723633, -1.0631577968597412, -1.0261446237564087, -0.9891313314437866, -0.9521181583404541, -0.915104866027832, -0.8780916333198547, -0.8410784006118774, -0.8040651679039001, -0.7670519351959229, -0.7300387024879456, -0.6930254697799683, -0.6560122966766357, -0.6189990639686584, -0.5819858312606812, -0.5449725985527039, -0.5079593658447266, -0.47094613313674927, -0.433932900428772, -0.39691969752311707, -0.35990646481513977, -0.3228932321071625, -0.2858799993991852, -0.24886676669120789, -0.21185354888439178, -0.1748403161764145, -0.1378270834684372, -0.1008138656616211, -0.0638006329536438, -0.026787400245666504, 0.010225828737020493, 0.04723905771970749, 0.08425228297710419, 0.12126551568508148, 0.15827874839305878, 0.19529196619987488, 0.23230519890785217, 0.26931843161582947, 0.30633166432380676, 0.34334489703178406, 0.38035809993743896, 0.41737133264541626, 0.45438456535339355, 0.49139779806137085, 0.5284110307693481, 0.5654242634773254, 0.6024374961853027, 0.63945072889328, 0.6764639616012573, 0.7134771943092346, 0.7504904270172119, 0.7875036001205444, 0.8245168924331665, 0.861530065536499, 0.8985432982444763, 0.9355565309524536, 0.9725697636604309, 1.0095829963684082, 1.0465961694717407, 1.0836094617843628, 1.1206226348876953, 1.1576359272003174]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 6.0, 3.0, 4.0, 10.0, 15.0, 13.0, 19.0, 24.0, 41.0, 23.0, 42.0, 46.0, 51.0, 53.0, 51.0, 59.0, 50.0, 64.0, 58.0, 61.0, 61.0, 45.0, 44.0, 33.0, 27.0, 25.0, 15.0, 19.0, 10.0, 11.0, 5.0, 4.0, 8.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.091112494468689, -1.061570405960083, -1.0320284366607666, -1.0024863481521606, -0.9729443192481995, -0.9434022903442383, -0.9138602018356323, -0.8843181729316711, -0.85477614402771, -0.8252341151237488, -0.7956920266151428, -0.7661499977111816, -0.7366079688072205, -0.7070659399032593, -0.6775238513946533, -0.6479818224906921, -0.6184397339820862, -0.588897705078125, -0.559355616569519, -0.5298135876655579, -0.5002715587615967, -0.4707295000553131, -0.44118744134902954, -0.41164541244506836, -0.3821033537387848, -0.3525612950325012, -0.32301926612854004, -0.29347720742225647, -0.2639351487159729, -0.23439311981201172, -0.20485106110572815, -0.17530901730060577, -0.1457669734954834, -0.11622492969036102, -0.08668287843465805, -0.05714082717895508, -0.027598783373832703, 0.0019432604312896729, 0.03148531913757324, 0.06102736294269562, 0.090569406747818, 0.12011145055294037, 0.14965349435806274, 0.1791955530643463, 0.2087375968694687, 0.23827964067459106, 0.26782169938087463, 0.2973637580871582, 0.3269057869911194, 0.35644784569740295, 0.38598987460136414, 0.4155319333076477, 0.4450739622116089, 0.47461602091789246, 0.504158079624176, 0.5337001085281372, 0.5632421970367432, 0.5927842259407043, 0.6223263144493103, 0.6518683433532715, 0.6814103722572327, 0.7109524011611938, 0.7404944896697998, 0.770036518573761, 0.7995785474777222]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 6.0, 6.0, 9.0, 14.0, 7.0, 16.0, 34.0, 43.0, 70.0, 82.0, 177.0, 303.0, 667.0, 1371.0, 3416.0, 14312.0, 171179.0, 781384.0, 62628.0, 8147.0, 2471.0, 1088.0, 487.0, 256.0, 120.0, 85.0, 50.0, 36.0, 28.0, 21.0, 12.0, 7.0, 5.0, 2.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3466796875, -0.33739280700683594, -0.3281059265136719, -0.3188190460205078, -0.30953216552734375, -0.3002452850341797, -0.2909584045410156, -0.28167152404785156, -0.2723846435546875, -0.26309776306152344, -0.2538108825683594, -0.2445240020751953, -0.23523712158203125, -0.2259502410888672, -0.21666336059570312, -0.20737648010253906, -0.198089599609375, -0.18880271911621094, -0.17951583862304688, -0.1702289581298828, -0.16094207763671875, -0.1516551971435547, -0.14236831665039062, -0.13308143615722656, -0.1237945556640625, -0.11450767517089844, -0.10522079467773438, -0.09593391418457031, -0.08664703369140625, -0.07736015319824219, -0.06807327270507812, -0.05878639221191406, -0.04949951171875, -0.04021263122558594, -0.030925750732421875, -0.021638870239257812, -0.01235198974609375, -0.0030651092529296875, 0.006221771240234375, 0.015508651733398438, 0.0247955322265625, 0.03408241271972656, 0.043369293212890625, 0.05265617370605469, 0.06194305419921875, 0.07122993469238281, 0.08051681518554688, 0.08980369567871094, 0.099090576171875, 0.10837745666503906, 0.11766433715820312, 0.1269512176513672, 0.13623809814453125, 0.1455249786376953, 0.15481185913085938, 0.16409873962402344, 0.1733856201171875, 0.18267250061035156, 0.19195938110351562, 0.2012462615966797, 0.21053314208984375, 0.2198200225830078, 0.22910690307617188, 0.23839378356933594, 0.2476806640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 3.0, 10.0, 15.0, 18.0, 23.0, 34.0, 63.0, 58.0, 77.0, 84.0, 91.0, 90.0, 84.0, 83.0, 84.0, 56.0, 37.0, 30.0, 16.0, 18.0, 9.0, 6.0, 4.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0263671875, -1.0001296997070312, -0.9738922119140625, -0.9476547241210938, -0.921417236328125, -0.8951797485351562, -0.8689422607421875, -0.8427047729492188, -0.81646728515625, -0.7902297973632812, -0.7639923095703125, -0.7377548217773438, -0.711517333984375, -0.6852798461914062, -0.6590423583984375, -0.6328048706054688, -0.6065673828125, -0.5803298950195312, -0.5540924072265625, -0.5278549194335938, -0.501617431640625, -0.47537994384765625, -0.4491424560546875, -0.42290496826171875, -0.39666748046875, -0.37042999267578125, -0.3441925048828125, -0.31795501708984375, -0.291717529296875, -0.26548004150390625, -0.2392425537109375, -0.21300506591796875, -0.186767578125, -0.16053009033203125, -0.1342926025390625, -0.10805511474609375, -0.081817626953125, -0.05558013916015625, -0.0293426513671875, -0.00310516357421875, 0.02313232421875, 0.04936981201171875, 0.0756072998046875, 0.10184478759765625, 0.128082275390625, 0.15431976318359375, 0.1805572509765625, 0.20679473876953125, 0.2330322265625, 0.25926971435546875, 0.2855072021484375, 0.31174468994140625, 0.337982177734375, 0.36421966552734375, 0.3904571533203125, 0.41669464111328125, 0.44293212890625, 0.46916961669921875, 0.4954071044921875, 0.5216445922851562, 0.547882080078125, 0.5741195678710938, 0.6003570556640625, 0.6265945434570312, 0.65283203125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 10.0, 8.0, 12.0, 11.0, 31.0, 38.0, 75.0, 90.0, 140.0, 207.0, 296.0, 493.0, 749.0, 1161.0, 1793.0, 2654.0, 4394.0, 7768.0, 13453.0, 23533.0, 43366.0, 79572.0, 142170.0, 210013.0, 207164.0, 136720.0, 76055.0, 41467.0, 22937.0, 12653.0, 7525.0, 4411.0, 2707.0, 1703.0, 1120.0, 673.0, 467.0, 284.0, 200.0, 147.0, 90.0, 65.0, 44.0, 26.0, 22.0, 18.0, 8.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.042266845703125, -0.040944576263427734, -0.03962230682373047, -0.0383000373840332, -0.03697776794433594, -0.03565549850463867, -0.034333229064941406, -0.03301095962524414, -0.031688690185546875, -0.03036642074584961, -0.029044151306152344, -0.027721881866455078, -0.026399612426757812, -0.025077342987060547, -0.02375507354736328, -0.022432804107666016, -0.02111053466796875, -0.019788265228271484, -0.01846599578857422, -0.017143726348876953, -0.015821456909179688, -0.014499187469482422, -0.013176918029785156, -0.01185464859008789, -0.010532379150390625, -0.00921010971069336, -0.007887840270996094, -0.006565570831298828, -0.0052433013916015625, -0.003921031951904297, -0.0025987625122070312, -0.0012764930725097656, 4.57763671875e-05, 0.0013680458068847656, 0.0026903152465820312, 0.004012584686279297, 0.0053348541259765625, 0.006657123565673828, 0.007979393005371094, 0.00930166244506836, 0.010623931884765625, 0.01194620132446289, 0.013268470764160156, 0.014590740203857422, 0.015913009643554688, 0.017235279083251953, 0.01855754852294922, 0.019879817962646484, 0.02120208740234375, 0.022524356842041016, 0.02384662628173828, 0.025168895721435547, 0.026491165161132812, 0.027813434600830078, 0.029135704040527344, 0.03045797348022461, 0.031780242919921875, 0.03310251235961914, 0.034424781799316406, 0.03574705123901367, 0.03706932067871094, 0.0383915901184082, 0.03971385955810547, 0.041036128997802734, 0.0423583984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 14.0, 16.0, 19.0, 15.0, 19.0, 29.0, 38.0, 35.0, 43.0, 49.0, 58.0, 39.0, 52.0, 50.0, 45.0, 36.0, 46.0, 60.0, 58.0, 39.0, 25.0, 28.0, 21.0, 27.0, 23.0, 19.0, 10.0, 15.0, 6.0, 6.0, 6.0, 10.0, 6.0, 7.0, 5.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.9033203125, -0.87750244140625, -0.8516845703125, -0.82586669921875, -0.800048828125, -0.77423095703125, -0.7484130859375, -0.72259521484375, -0.69677734375, -0.67095947265625, -0.6451416015625, -0.61932373046875, -0.593505859375, -0.56768798828125, -0.5418701171875, -0.51605224609375, -0.490234375, -0.46441650390625, -0.4385986328125, -0.41278076171875, -0.386962890625, -0.36114501953125, -0.3353271484375, -0.30950927734375, -0.28369140625, -0.25787353515625, -0.2320556640625, -0.20623779296875, -0.180419921875, -0.15460205078125, -0.1287841796875, -0.10296630859375, -0.0771484375, -0.05133056640625, -0.0255126953125, 0.00030517578125, 0.026123046875, 0.05194091796875, 0.0777587890625, 0.10357666015625, 0.12939453125, 0.15521240234375, 0.1810302734375, 0.20684814453125, 0.232666015625, 0.25848388671875, 0.2843017578125, 0.31011962890625, 0.3359375, 0.36175537109375, 0.3875732421875, 0.41339111328125, 0.439208984375, 0.46502685546875, 0.4908447265625, 0.51666259765625, 0.54248046875, 0.56829833984375, 0.5941162109375, 0.61993408203125, 0.645751953125, 0.67156982421875, 0.6973876953125, 0.72320556640625, 0.7490234375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 10.0, 15.0, 18.0, 26.0, 34.0, 50.0, 73.0, 94.0, 163.0, 246.0, 366.0, 676.0, 1246.0, 2650.0, 5778.0, 14672.0, 40308.0, 124197.0, 322647.0, 333566.0, 131100.0, 43132.0, 15387.0, 6170.0, 2672.0, 1387.0, 666.0, 410.0, 268.0, 151.0, 103.0, 72.0, 45.0, 40.0, 27.0, 23.0, 20.0, 8.0, 12.0, 7.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0080718994140625, -0.007819890975952148, -0.007567882537841797, -0.007315874099731445, -0.007063865661621094, -0.006811857223510742, -0.006559848785400391, -0.006307840347290039, -0.0060558319091796875, -0.005803823471069336, -0.005551815032958984, -0.005299806594848633, -0.005047798156738281, -0.00479578971862793, -0.004543781280517578, -0.0042917728424072266, -0.004039764404296875, -0.0037877559661865234, -0.003535747528076172, -0.0032837390899658203, -0.0030317306518554688, -0.002779722213745117, -0.0025277137756347656, -0.002275705337524414, -0.0020236968994140625, -0.001771688461303711, -0.0015196800231933594, -0.0012676715850830078, -0.0010156631469726562, -0.0007636547088623047, -0.0005116462707519531, -0.00025963783264160156, -7.62939453125e-06, 0.00024437904357910156, 0.0004963874816894531, 0.0007483959197998047, 0.0010004043579101562, 0.0012524127960205078, 0.0015044212341308594, 0.001756429672241211, 0.0020084381103515625, 0.002260446548461914, 0.0025124549865722656, 0.002764463424682617, 0.0030164718627929688, 0.0032684803009033203, 0.003520488739013672, 0.0037724971771240234, 0.004024505615234375, 0.0042765140533447266, 0.004528522491455078, 0.00478053092956543, 0.005032539367675781, 0.005284547805786133, 0.005536556243896484, 0.005788564682006836, 0.0060405731201171875, 0.006292581558227539, 0.006544589996337891, 0.006796598434448242, 0.007048606872558594, 0.007300615310668945, 0.007552623748779297, 0.0078046321868896484, 0.008056640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 4.0, 8.0, 4.0, 14.0, 12.0, 23.0, 54.0, 66.0, 87.0, 146.0, 147.0, 155.0, 88.0, 78.0, 48.0, 23.0, 19.0, 15.0, 6.0, 3.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.753734588623047e-05, -2.660602331161499e-05, -2.5674700736999512e-05, -2.4743378162384033e-05, -2.3812055587768555e-05, -2.2880733013153076e-05, -2.1949410438537598e-05, -2.101808786392212e-05, -2.008676528930664e-05, -1.9155442714691162e-05, -1.8224120140075684e-05, -1.7292797565460205e-05, -1.6361474990844727e-05, -1.5430152416229248e-05, -1.449882984161377e-05, -1.3567507266998291e-05, -1.2636184692382812e-05, -1.1704862117767334e-05, -1.0773539543151855e-05, -9.842216968536377e-06, -8.910894393920898e-06, -7.97957181930542e-06, -7.048249244689941e-06, -6.116926670074463e-06, -5.185604095458984e-06, -4.254281520843506e-06, -3.3229589462280273e-06, -2.391636371612549e-06, -1.4603137969970703e-06, -5.289912223815918e-07, 4.023313522338867e-07, 1.3336539268493652e-06, 2.2649765014648438e-06, 3.1962990760803223e-06, 4.127621650695801e-06, 5.058944225311279e-06, 5.990266799926758e-06, 6.921589374542236e-06, 7.852911949157715e-06, 8.784234523773193e-06, 9.715557098388672e-06, 1.064687967300415e-05, 1.1578202247619629e-05, 1.2509524822235107e-05, 1.3440847396850586e-05, 1.4372169971466064e-05, 1.5303492546081543e-05, 1.623481512069702e-05, 1.71661376953125e-05, 1.809746026992798e-05, 1.9028782844543457e-05, 1.9960105419158936e-05, 2.0891427993774414e-05, 2.1822750568389893e-05, 2.275407314300537e-05, 2.368539571762085e-05, 2.4616718292236328e-05, 2.5548040866851807e-05, 2.6479363441467285e-05, 2.7410686016082764e-05, 2.8342008590698242e-05, 2.927333116531372e-05, 3.02046537399292e-05, 3.113597631454468e-05, 3.2067298889160156e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 12.0, 11.0, 11.0, 13.0, 21.0, 43.0, 45.0, 95.0, 159.0, 295.0, 933.0, 3656.0, 20649.0, 207140.0, 709369.0, 91404.0, 11186.0, 2273.0, 672.0, 225.0, 99.0, 68.0, 45.0, 30.0, 36.0, 12.0, 11.0, 12.0, 12.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0167388916015625, -0.016187191009521484, -0.01563549041748047, -0.015083789825439453, -0.014532089233398438, -0.013980388641357422, -0.013428688049316406, -0.01287698745727539, -0.012325286865234375, -0.01177358627319336, -0.011221885681152344, -0.010670185089111328, -0.010118484497070312, -0.009566783905029297, -0.009015083312988281, -0.008463382720947266, -0.00791168212890625, -0.007359981536865234, -0.006808280944824219, -0.006256580352783203, -0.0057048797607421875, -0.005153179168701172, -0.004601478576660156, -0.004049777984619141, -0.003498077392578125, -0.0029463768005371094, -0.0023946762084960938, -0.0018429756164550781, -0.0012912750244140625, -0.0007395744323730469, -0.00018787384033203125, 0.0003638267517089844, 0.00091552734375, 0.0014672279357910156, 0.0020189285278320312, 0.002570629119873047, 0.0031223297119140625, 0.003674030303955078, 0.004225730895996094, 0.004777431488037109, 0.005329132080078125, 0.005880832672119141, 0.006432533264160156, 0.006984233856201172, 0.0075359344482421875, 0.008087635040283203, 0.008639335632324219, 0.009191036224365234, 0.00974273681640625, 0.010294437408447266, 0.010846138000488281, 0.011397838592529297, 0.011949539184570312, 0.012501239776611328, 0.013052940368652344, 0.01360464096069336, 0.014156341552734375, 0.01470804214477539, 0.015259742736816406, 0.015811443328857422, 0.016363143920898438, 0.016914844512939453, 0.01746654510498047, 0.018018245697021484, 0.0185699462890625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 5.0, 4.0, 2.0, 4.0, 9.0, 4.0, 12.0, 15.0, 17.0, 12.0, 18.0, 24.0, 43.0, 39.0, 48.0, 55.0, 74.0, 72.0, 79.0, 51.0, 72.0, 62.0, 61.0, 46.0, 27.0, 33.0, 28.0, 15.0, 22.0, 6.0, 10.0, 7.0, 7.0, 1.0, 3.0, 6.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022602081298828125, -0.0021872520446777344, -0.0021142959594726562, -0.002041339874267578, -0.0019683837890625, -0.0018954277038574219, -0.0018224716186523438, -0.0017495155334472656, -0.0016765594482421875, -0.0016036033630371094, -0.0015306472778320312, -0.0014576911926269531, -0.001384735107421875, -0.0013117790222167969, -0.0012388229370117188, -0.0011658668518066406, -0.0010929107666015625, -0.0010199546813964844, -0.0009469985961914062, -0.0008740425109863281, -0.00080108642578125, -0.0007281303405761719, -0.0006551742553710938, -0.0005822181701660156, -0.0005092620849609375, -0.0004363059997558594, -0.00036334991455078125, -0.0002903938293457031, -0.000217437744140625, -0.00014448165893554688, -7.152557373046875e-05, 1.430511474609375e-06, 7.43865966796875e-05, 0.00014734268188476562, 0.00022029876708984375, 0.0002932548522949219, 0.0003662109375, 0.0004391670227050781, 0.0005121231079101562, 0.0005850791931152344, 0.0006580352783203125, 0.0007309913635253906, 0.0008039474487304688, 0.0008769035339355469, 0.000949859619140625, 0.0010228157043457031, 0.0010957717895507812, 0.0011687278747558594, 0.0012416839599609375, 0.0013146400451660156, 0.0013875961303710938, 0.0014605522155761719, 0.00153350830078125, 0.0016064643859863281, 0.0016794204711914062, 0.0017523765563964844, 0.0018253326416015625, 0.0018982887268066406, 0.0019712448120117188, 0.002044200897216797, 0.002117156982421875, 0.002190113067626953, 0.0022630691528320312, 0.0023360252380371094, 0.0024089813232421875]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 5.0, 4.0, 6.0, 14.0, 18.0, 15.0, 19.0, 38.0, 54.0, 78.0, 101.0, 102.0, 116.0, 106.0, 108.0, 70.0, 39.0, 42.0, 17.0, 21.0, 8.0, 4.0, 4.0, 3.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6917679309844971, -0.6682189106941223, -0.6446698904037476, -0.6211209297180176, -0.5975719094276428, -0.5740228891372681, -0.5504738688468933, -0.5269248485565186, -0.5033758878707886, -0.4798268675804138, -0.45627787709236145, -0.4327288568019867, -0.4091798663139343, -0.38563084602355957, -0.3620818257331848, -0.33853280544281006, -0.3149837851524353, -0.29143476486206055, -0.2678857743740082, -0.24433675408363342, -0.22078774869441986, -0.1972387433052063, -0.17368972301483154, -0.15014071762561798, -0.12659171223640442, -0.10304270684719086, -0.0794936940073967, -0.05594468116760254, -0.03239567577838898, -0.008846670389175415, 0.01470234990119934, 0.0382513552904129, 0.061800360679626465, 0.08534936606884003, 0.10889837890863419, 0.13244739174842834, 0.1559963971376419, 0.17954540252685547, 0.20309442281723022, 0.2266434282064438, 0.25019243359565735, 0.2737414538860321, 0.2972904443740845, 0.32083946466445923, 0.344388484954834, 0.36793747544288635, 0.3914864957332611, 0.4150354862213135, 0.43858450651168823, 0.462133526802063, 0.48568251729011536, 0.5092315673828125, 0.5327805280685425, 0.5563295483589172, 0.579878568649292, 0.6034275889396667, 0.6269766092300415, 0.6505256295204163, 0.674074649810791, 0.697623610496521, 0.7211726307868958, 0.7447216510772705, 0.7682706713676453, 0.79181969165802, 0.81536865234375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 6.0, 4.0, 14.0, 14.0, 19.0, 31.0, 49.0, 50.0, 61.0, 74.0, 72.0, 84.0, 83.0, 85.0, 95.0, 71.0, 51.0, 40.0, 26.0, 29.0, 16.0, 10.0, 8.0, 5.0, 7.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.9727823734283447, -0.9490792155265808, -0.9253759980201721, -0.9016728401184082, -0.8779696822166443, -0.8542665243148804, -0.8305633068084717, -0.8068601489067078, -0.7831569910049438, -0.7594538331031799, -0.7357506155967712, -0.7120474576950073, -0.6883442997932434, -0.6646411418914795, -0.6409379243850708, -0.6172347664833069, -0.593531608581543, -0.569828450679779, -0.5461252331733704, -0.5224220752716064, -0.49871891736984253, -0.4750157296657562, -0.4513125419616699, -0.427609384059906, -0.4039061665534973, -0.380202978849411, -0.3564998209476471, -0.3327966332435608, -0.3090934753417969, -0.28539028763771057, -0.26168709993362427, -0.23798394203186035, -0.21428078413009644, -0.19057761132717133, -0.16687443852424622, -0.1431712508201599, -0.1194680854678154, -0.09576491266489029, -0.07206173241138458, -0.04835855960845947, -0.024655386805534363, -0.0009522121399641037, 0.022750962525606155, 0.046454139053821564, 0.07015731185674667, 0.09386048465967178, 0.11756366491317749, 0.1412668377161026, 0.1649700105190277, 0.18867318332195282, 0.21237635612487793, 0.23607954382896423, 0.25978270173072815, 0.28348588943481445, 0.30718904733657837, 0.3308922350406647, 0.354595422744751, 0.3782986104488373, 0.4020017683506012, 0.4257049560546875, 0.4494081139564514, 0.4731113016605377, 0.496814489364624, 0.5205176472663879, 0.5442208051681519]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 1.0, 5.0, 6.0, 5.0, 9.0, 16.0, 24.0, 23.0, 51.0, 57.0, 122.0, 192.0, 368.0, 683.0, 1430.0, 3301.0, 8545.0, 28071.0, 199182.0, 688051.0, 89583.0, 17812.0, 6226.0, 2441.0, 1075.0, 529.0, 278.0, 166.0, 100.0, 63.0, 33.0, 25.0, 21.0, 15.0, 14.0, 5.0, 8.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.60009765625, -0.58209228515625, -0.5640869140625, -0.54608154296875, -0.528076171875, -0.51007080078125, -0.4920654296875, -0.47406005859375, -0.4560546875, -0.43804931640625, -0.4200439453125, -0.40203857421875, -0.384033203125, -0.36602783203125, -0.3480224609375, -0.33001708984375, -0.31201171875, -0.29400634765625, -0.2760009765625, -0.25799560546875, -0.239990234375, -0.22198486328125, -0.2039794921875, -0.18597412109375, -0.16796875, -0.14996337890625, -0.1319580078125, -0.11395263671875, -0.095947265625, -0.07794189453125, -0.0599365234375, -0.04193115234375, -0.02392578125, -0.00592041015625, 0.0120849609375, 0.03009033203125, 0.048095703125, 0.06610107421875, 0.0841064453125, 0.10211181640625, 0.1201171875, 0.13812255859375, 0.1561279296875, 0.17413330078125, 0.192138671875, 0.21014404296875, 0.2281494140625, 0.24615478515625, 0.26416015625, 0.28216552734375, 0.3001708984375, 0.31817626953125, 0.336181640625, 0.35418701171875, 0.3721923828125, 0.39019775390625, 0.408203125, 0.42620849609375, 0.4442138671875, 0.46221923828125, 0.480224609375, 0.49822998046875, 0.5162353515625, 0.53424072265625, 0.55224609375]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 10.0, 8.0, 14.0, 18.0, 19.0, 31.0, 41.0, 49.0, 56.0, 77.0, 63.0, 69.0, 66.0, 81.0, 99.0, 70.0, 59.0, 47.0, 36.0, 23.0, 23.0, 12.0, 10.0, 7.0, 5.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6591796875, -1.6122589111328125, -1.565338134765625, -1.5184173583984375, -1.47149658203125, -1.4245758056640625, -1.377655029296875, -1.3307342529296875, -1.2838134765625, -1.2368927001953125, -1.189971923828125, -1.1430511474609375, -1.09613037109375, -1.0492095947265625, -1.002288818359375, -0.9553680419921875, -0.908447265625, -0.8615264892578125, -0.814605712890625, -0.7676849365234375, -0.72076416015625, -0.6738433837890625, -0.626922607421875, -0.5800018310546875, -0.5330810546875, -0.4861602783203125, -0.439239501953125, -0.3923187255859375, -0.34539794921875, -0.2984771728515625, -0.251556396484375, -0.2046356201171875, -0.15771484375, -0.1107940673828125, -0.063873291015625, -0.0169525146484375, 0.02996826171875, 0.0768890380859375, 0.123809814453125, 0.1707305908203125, 0.2176513671875, 0.2645721435546875, 0.311492919921875, 0.3584136962890625, 0.40533447265625, 0.4522552490234375, 0.499176025390625, 0.5460968017578125, 0.593017578125, 0.6399383544921875, 0.686859130859375, 0.7337799072265625, 0.78070068359375, 0.8276214599609375, 0.874542236328125, 0.9214630126953125, 0.9683837890625, 1.0153045654296875, 1.062225341796875, 1.1091461181640625, 1.15606689453125, 1.2029876708984375, 1.249908447265625, 1.2968292236328125, 1.34375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 3.0, 8.0, 4.0, 7.0, 8.0, 8.0, 8.0, 12.0, 13.0, 12.0, 15.0, 19.0, 28.0, 23.0, 38.0, 45.0, 30.0, 52.0, 67.0, 95.0, 319.0, 3303.0, 916965.0, 125206.0, 1578.0, 224.0, 77.0, 51.0, 58.0, 33.0, 43.0, 20.0, 32.0, 31.0, 14.0, 15.0, 15.0, 14.0, 7.0, 10.0, 9.0, 5.0, 6.0, 5.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.419921875, -2.33892822265625, -2.2579345703125, -2.17694091796875, -2.095947265625, -2.01495361328125, -1.9339599609375, -1.85296630859375, -1.77197265625, -1.69097900390625, -1.6099853515625, -1.52899169921875, -1.447998046875, -1.36700439453125, -1.2860107421875, -1.20501708984375, -1.1240234375, -1.04302978515625, -0.9620361328125, -0.88104248046875, -0.800048828125, -0.71905517578125, -0.6380615234375, -0.55706787109375, -0.47607421875, -0.39508056640625, -0.3140869140625, -0.23309326171875, -0.152099609375, -0.07110595703125, 0.0098876953125, 0.09088134765625, 0.171875, 0.25286865234375, 0.3338623046875, 0.41485595703125, 0.495849609375, 0.57684326171875, 0.6578369140625, 0.73883056640625, 0.81982421875, 0.90081787109375, 0.9818115234375, 1.06280517578125, 1.143798828125, 1.22479248046875, 1.3057861328125, 1.38677978515625, 1.4677734375, 1.54876708984375, 1.6297607421875, 1.71075439453125, 1.791748046875, 1.87274169921875, 1.9537353515625, 2.03472900390625, 2.11572265625, 2.19671630859375, 2.2777099609375, 2.35870361328125, 2.439697265625, 2.52069091796875, 2.6016845703125, 2.68267822265625, 2.763671875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 7.0, 8.0, 4.0, 4.0, 11.0, 4.0, 4.0, 10.0, 12.0, 7.0, 13.0, 18.0, 11.0, 26.0, 20.0, 28.0, 33.0, 34.0, 37.0, 24.0, 43.0, 45.0, 47.0, 35.0, 44.0, 42.0, 38.0, 34.0, 38.0, 44.0, 29.0, 33.0, 36.0, 24.0, 23.0, 25.0, 16.0, 12.0, 18.0, 13.0, 9.0, 9.0, 4.0, 6.0, 9.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.6923828125, -0.6690826416015625, -0.645782470703125, -0.6224822998046875, -0.59918212890625, -0.5758819580078125, -0.552581787109375, -0.5292816162109375, -0.5059814453125, -0.4826812744140625, -0.459381103515625, -0.4360809326171875, -0.41278076171875, -0.3894805908203125, -0.366180419921875, -0.3428802490234375, -0.319580078125, -0.2962799072265625, -0.272979736328125, -0.2496795654296875, -0.22637939453125, -0.2030792236328125, -0.179779052734375, -0.1564788818359375, -0.1331787109375, -0.1098785400390625, -0.086578369140625, -0.0632781982421875, -0.03997802734375, -0.0166778564453125, 0.006622314453125, 0.0299224853515625, 0.05322265625, 0.0765228271484375, 0.099822998046875, 0.1231231689453125, 0.14642333984375, 0.1697235107421875, 0.193023681640625, 0.2163238525390625, 0.2396240234375, 0.2629241943359375, 0.286224365234375, 0.3095245361328125, 0.33282470703125, 0.3561248779296875, 0.379425048828125, 0.4027252197265625, 0.426025390625, 0.4493255615234375, 0.472625732421875, 0.4959259033203125, 0.51922607421875, 0.5425262451171875, 0.565826416015625, 0.5891265869140625, 0.6124267578125, 0.6357269287109375, 0.659027099609375, 0.6823272705078125, 0.70562744140625, 0.7289276123046875, 0.752227783203125, 0.7755279541015625, 0.798828125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 13.0, 10.0, 14.0, 15.0, 32.0, 38.0, 59.0, 100.0, 155.0, 286.0, 570.0, 1339.0, 3377.0, 11624.0, 72783.0, 812577.0, 122261.0, 15965.0, 4212.0, 1569.0, 706.0, 335.0, 180.0, 96.0, 68.0, 45.0, 40.0, 19.0, 13.0, 11.0, 8.0, 9.0, 2.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1397705078125, -0.13561058044433594, -0.13145065307617188, -0.1272907257080078, -0.12313079833984375, -0.11897087097167969, -0.11481094360351562, -0.11065101623535156, -0.1064910888671875, -0.10233116149902344, -0.09817123413085938, -0.09401130676269531, -0.08985137939453125, -0.08569145202636719, -0.08153152465820312, -0.07737159729003906, -0.073211669921875, -0.06905174255371094, -0.06489181518554688, -0.06073188781738281, -0.05657196044921875, -0.05241203308105469, -0.048252105712890625, -0.04409217834472656, -0.0399322509765625, -0.03577232360839844, -0.031612396240234375, -0.027452468872070312, -0.02329254150390625, -0.019132614135742188, -0.014972686767578125, -0.010812759399414062, -0.00665283203125, -0.0024929046630859375, 0.001667022705078125, 0.0058269500732421875, 0.00998687744140625, 0.014146804809570312, 0.018306732177734375, 0.022466659545898438, 0.0266265869140625, 0.030786514282226562, 0.034946441650390625, 0.03910636901855469, 0.04326629638671875, 0.04742622375488281, 0.051586151123046875, 0.05574607849121094, 0.059906005859375, 0.06406593322753906, 0.06822586059570312, 0.07238578796386719, 0.07654571533203125, 0.08070564270019531, 0.08486557006835938, 0.08902549743652344, 0.0931854248046875, 0.09734535217285156, 0.10150527954101562, 0.10566520690917969, 0.10982513427734375, 0.11398506164550781, 0.11814498901367188, 0.12230491638183594, 0.12646484375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 6.0, 3.0, 13.0, 11.0, 15.0, 20.0, 42.0, 87.0, 89.0, 163.0, 166.0, 143.0, 84.0, 53.0, 26.0, 21.0, 20.0, 11.0, 5.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5556812286376953e-05, -1.4913268387317657e-05, -1.4269724488258362e-05, -1.3626180589199066e-05, -1.298263669013977e-05, -1.2339092791080475e-05, -1.169554889202118e-05, -1.1052004992961884e-05, -1.0408461093902588e-05, -9.764917194843292e-06, -9.121373295783997e-06, -8.477829396724701e-06, -7.834285497665405e-06, -7.19074159860611e-06, -6.547197699546814e-06, -5.903653800487518e-06, -5.260109901428223e-06, -4.616566002368927e-06, -3.973022103309631e-06, -3.3294782042503357e-06, -2.68593430519104e-06, -2.0423904061317444e-06, -1.3988465070724487e-06, -7.553026080131531e-07, -1.1175870895385742e-07, 5.317851901054382e-07, 1.1753290891647339e-06, 1.8188729882240295e-06, 2.462416887283325e-06, 3.105960786342621e-06, 3.7495046854019165e-06, 4.393048584461212e-06, 5.036592483520508e-06, 5.6801363825798035e-06, 6.323680281639099e-06, 6.967224180698395e-06, 7.6107680797576904e-06, 8.254311978816986e-06, 8.897855877876282e-06, 9.541399776935577e-06, 1.0184943675994873e-05, 1.0828487575054169e-05, 1.1472031474113464e-05, 1.211557537317276e-05, 1.2759119272232056e-05, 1.3402663171291351e-05, 1.4046207070350647e-05, 1.4689750969409943e-05, 1.5333294868469238e-05, 1.5976838767528534e-05, 1.662038266658783e-05, 1.7263926565647125e-05, 1.790747046470642e-05, 1.8551014363765717e-05, 1.9194558262825012e-05, 1.9838102161884308e-05, 2.0481646060943604e-05, 2.11251899600029e-05, 2.1768733859062195e-05, 2.241227775812149e-05, 2.3055821657180786e-05, 2.3699365556240082e-05, 2.4342909455299377e-05, 2.4986453354358673e-05, 2.562999725341797e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 6.0, 5.0, 13.0, 17.0, 25.0, 36.0, 31.0, 61.0, 80.0, 148.0, 238.0, 442.0, 941.0, 2027.0, 4976.0, 14191.0, 53821.0, 573896.0, 339506.0, 39314.0, 11252.0, 4022.0, 1686.0, 778.0, 410.0, 239.0, 123.0, 76.0, 60.0, 33.0, 23.0, 23.0, 16.0, 9.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.1295166015625, -0.12590885162353516, -0.12230110168457031, -0.11869335174560547, -0.11508560180664062, -0.11147785186767578, -0.10787010192871094, -0.1042623519897461, -0.10065460205078125, -0.0970468521118164, -0.09343910217285156, -0.08983135223388672, -0.08622360229492188, -0.08261585235595703, -0.07900810241699219, -0.07540035247802734, -0.0717926025390625, -0.06818485260009766, -0.06457710266113281, -0.06096935272216797, -0.057361602783203125, -0.05375385284423828, -0.05014610290527344, -0.046538352966308594, -0.04293060302734375, -0.039322853088378906, -0.03571510314941406, -0.03210735321044922, -0.028499603271484375, -0.02489185333251953, -0.021284103393554688, -0.017676353454589844, -0.014068603515625, -0.010460853576660156, -0.0068531036376953125, -0.0032453536987304688, 0.000362396240234375, 0.003970146179199219, 0.0075778961181640625, 0.011185646057128906, 0.01479339599609375, 0.018401145935058594, 0.022008895874023438, 0.02561664581298828, 0.029224395751953125, 0.03283214569091797, 0.03643989562988281, 0.040047645568847656, 0.0436553955078125, 0.047263145446777344, 0.05087089538574219, 0.05447864532470703, 0.058086395263671875, 0.06169414520263672, 0.06530189514160156, 0.0689096450805664, 0.07251739501953125, 0.0761251449584961, 0.07973289489746094, 0.08334064483642578, 0.08694839477539062, 0.09055614471435547, 0.09416389465332031, 0.09777164459228516, 0.10137939453125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 6.0, 5.0, 11.0, 7.0, 7.0, 11.0, 5.0, 12.0, 18.0, 23.0, 30.0, 20.0, 59.0, 72.0, 109.0, 114.0, 112.0, 96.0, 67.0, 56.0, 37.0, 21.0, 26.0, 14.0, 10.0, 10.0, 9.0, 10.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037445068359375, -0.03610658645629883, -0.034768104553222656, -0.033429622650146484, -0.03209114074707031, -0.03075265884399414, -0.02941417694091797, -0.028075695037841797, -0.026737213134765625, -0.025398731231689453, -0.02406024932861328, -0.02272176742553711, -0.021383285522460938, -0.020044803619384766, -0.018706321716308594, -0.017367839813232422, -0.01602935791015625, -0.014690876007080078, -0.013352394104003906, -0.012013912200927734, -0.010675430297851562, -0.00933694839477539, -0.007998466491699219, -0.006659984588623047, -0.005321502685546875, -0.003983020782470703, -0.0026445388793945312, -0.0013060569763183594, 3.24249267578125e-05, 0.0013709068298339844, 0.0027093887329101562, 0.004047870635986328, 0.0053863525390625, 0.006724834442138672, 0.008063316345214844, 0.009401798248291016, 0.010740280151367188, 0.01207876205444336, 0.013417243957519531, 0.014755725860595703, 0.016094207763671875, 0.017432689666748047, 0.01877117156982422, 0.02010965347290039, 0.021448135375976562, 0.022786617279052734, 0.024125099182128906, 0.025463581085205078, 0.02680206298828125, 0.028140544891357422, 0.029479026794433594, 0.030817508697509766, 0.03215599060058594, 0.03349447250366211, 0.03483295440673828, 0.03617143630981445, 0.037509918212890625, 0.0388484001159668, 0.04018688201904297, 0.04152536392211914, 0.04286384582519531, 0.044202327728271484, 0.045540809631347656, 0.04687929153442383, 0.0482177734375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 26.0, 52.0, 150.0, 317.0, 289.0, 112.0, 33.0, 11.0, 6.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3494338989257812, -1.2125208377838135, -1.0756076574325562, -0.9386945366859436, -0.801781415939331, -0.6648682951927185, -0.527955174446106, -0.3910420536994934, -0.25412893295288086, -0.11721581220626831, 0.01969730854034424, 0.1566104292869568, 0.29352355003356934, 0.4304366707801819, 0.5673497915267944, 0.704262912273407, 0.8411760330200195, 0.9780891537666321, 1.1150022745132446, 1.251915454864502, 1.3888285160064697, 1.5257415771484375, 1.6626547574996948, 1.7995679378509521, 1.93648099899292, 2.0733940601348877, 2.2103071212768555, 2.3472204208374023, 2.48413348197937, 2.621046543121338, 2.7579598426818848, 2.8948729038238525, 3.031785488128662, 3.16869854927063, 3.3056116104125977, 3.4425249099731445, 3.5794379711151123, 3.71635103225708, 3.853264331817627, 3.9901773929595947, 4.1270904541015625, 4.264003753662109, 4.400916576385498, 4.537829875946045, 4.674742698669434, 4.8116559982299805, 4.948569297790527, 5.085482120513916, 5.222395420074463, 5.35930871963501, 5.496221542358398, 5.633134841918945, 5.770048141479492, 5.906960964202881, 6.043874263763428, 6.180787086486816, 6.317700386047363, 6.45461368560791, 6.591526508331299, 6.728439807891846, 6.865352630615234, 7.002265930175781, 7.139179229736328, 7.276092052459717, 7.413005352020264]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 8.0, 11.0, 9.0, 15.0, 14.0, 21.0, 23.0, 25.0, 28.0, 27.0, 38.0, 44.0, 49.0, 48.0, 52.0, 63.0, 76.0, 48.0, 34.0, 48.0, 50.0, 41.0, 47.0, 35.0, 29.0, 23.0, 27.0, 12.0, 18.0, 9.0, 5.0, 10.0, 7.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9454090595245361, -1.888095736503601, -1.830782413482666, -1.773469090461731, -1.716155767440796, -1.6588423252105713, -1.6015290021896362, -1.5442156791687012, -1.4869023561477661, -1.429589033126831, -1.372275710105896, -1.314962387084961, -1.2576489448547363, -1.2003357410430908, -1.1430222988128662, -1.0857089757919312, -1.028395652770996, -0.971082329750061, -0.913769006729126, -0.8564556241035461, -0.7991423010826111, -0.741828978061676, -0.6845155954360962, -0.6272022724151611, -0.5698889493942261, -0.512575626373291, -0.45526227355003357, -0.3979489207267761, -0.34063559770584106, -0.283322274684906, -0.22600892186164856, -0.1686955690383911, -0.11138224601745605, -0.0540689080953598, 0.00324442982673645, 0.0605577677488327, 0.11787110567092896, 0.175184428691864, 0.23249778151512146, 0.2898111343383789, 0.34712445735931396, 0.404437780380249, 0.46175113320350647, 0.5190644860267639, 0.576377809047699, 0.633691132068634, 0.6910045146942139, 0.7483178377151489, 0.805631160736084, 0.862944483757019, 0.9202578067779541, 0.9775711894035339, 1.0348844528198242, 1.0921978950500488, 1.1495112180709839, 1.206824541091919, 1.264137864112854, 1.321451187133789, 1.3787645101547241, 1.4360778331756592, 1.4933912754058838, 1.5507044792175293, 1.608017921447754, 1.665331244468689, 1.722644567489624]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 3.0, 8.0, 0.0, 5.0, 12.0, 8.0, 8.0, 17.0, 22.0, 17.0, 20.0, 33.0, 41.0, 52.0, 96.0, 158.0, 286.0, 520.0, 1110.0, 2589.0, 6581.0, 21521.0, 116430.0, 1303183.0, 2414450.0, 270307.0, 37038.0, 11814.0, 4627.0, 1724.0, 684.0, 347.0, 183.0, 115.0, 71.0, 48.0, 34.0, 24.0, 24.0, 11.0, 13.0, 7.0, 7.0, 9.0, 3.0, 6.0, 2.0, 2.0, 6.0, 3.0, 5.0, 2.0, 3.0, 1.0], "bins": [-1.2548828125, -1.218170166015625, -1.18145751953125, -1.144744873046875, -1.1080322265625, -1.071319580078125, -1.03460693359375, -0.997894287109375, -0.961181640625, -0.924468994140625, -0.88775634765625, -0.851043701171875, -0.8143310546875, -0.777618408203125, -0.74090576171875, -0.704193115234375, -0.66748046875, -0.630767822265625, -0.59405517578125, -0.557342529296875, -0.5206298828125, -0.483917236328125, -0.44720458984375, -0.410491943359375, -0.373779296875, -0.337066650390625, -0.30035400390625, -0.263641357421875, -0.2269287109375, -0.190216064453125, -0.15350341796875, -0.116790771484375, -0.080078125, -0.043365478515625, -0.00665283203125, 0.030059814453125, 0.0667724609375, 0.103485107421875, 0.14019775390625, 0.176910400390625, 0.213623046875, 0.250335693359375, 0.28704833984375, 0.323760986328125, 0.3604736328125, 0.397186279296875, 0.43389892578125, 0.470611572265625, 0.50732421875, 0.544036865234375, 0.58074951171875, 0.617462158203125, 0.6541748046875, 0.690887451171875, 0.72760009765625, 0.764312744140625, 0.801025390625, 0.837738037109375, 0.87445068359375, 0.911163330078125, 0.9478759765625, 0.984588623046875, 1.02130126953125, 1.058013916015625, 1.0947265625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 5.0, 7.0, 7.0, 20.0, 24.0, 26.0, 45.0, 39.0, 55.0, 60.0, 71.0, 76.0, 66.0, 87.0, 88.0, 70.0, 55.0, 45.0, 35.0, 27.0, 28.0, 16.0, 17.0, 11.0, 8.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.1669921875, -1.1375656127929688, -1.1081390380859375, -1.0787124633789062, -1.049285888671875, -1.0198593139648438, -0.9904327392578125, -0.9610061645507812, -0.93157958984375, -0.9021530151367188, -0.8727264404296875, -0.8432998657226562, -0.813873291015625, -0.7844467163085938, -0.7550201416015625, -0.7255935668945312, -0.6961669921875, -0.6667404174804688, -0.6373138427734375, -0.6078872680664062, -0.578460693359375, -0.5490341186523438, -0.5196075439453125, -0.49018096923828125, -0.46075439453125, -0.43132781982421875, -0.4019012451171875, -0.37247467041015625, -0.343048095703125, -0.31362152099609375, -0.2841949462890625, -0.25476837158203125, -0.225341796875, -0.19591522216796875, -0.1664886474609375, -0.13706207275390625, -0.107635498046875, -0.07820892333984375, -0.0487823486328125, -0.01935577392578125, 0.01007080078125, 0.03949737548828125, 0.0689239501953125, 0.09835052490234375, 0.127777099609375, 0.15720367431640625, 0.1866302490234375, 0.21605682373046875, 0.2454833984375, 0.27490997314453125, 0.3043365478515625, 0.33376312255859375, 0.363189697265625, 0.39261627197265625, 0.4220428466796875, 0.45146942138671875, 0.48089599609375, 0.5103225708007812, 0.5397491455078125, 0.5691757202148438, 0.598602294921875, 0.6280288696289062, 0.6574554443359375, 0.6868820190429688, 0.71630859375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 4.0, 5.0, 6.0, 7.0, 11.0, 10.0, 13.0, 11.0, 27.0, 25.0, 26.0, 47.0, 70.0, 123.0, 262.0, 1982.0, 2943232.0, 1246091.0, 1695.0, 250.0, 114.0, 75.0, 43.0, 33.0, 27.0, 12.0, 14.0, 13.0, 11.0, 7.0, 5.0, 8.0, 7.0, 2.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.87890625, -5.7108154296875, -5.542724609375, -5.3746337890625, -5.20654296875, -5.0384521484375, -4.870361328125, -4.7022705078125, -4.5341796875, -4.3660888671875, -4.197998046875, -4.0299072265625, -3.86181640625, -3.6937255859375, -3.525634765625, -3.3575439453125, -3.189453125, -3.0213623046875, -2.853271484375, -2.6851806640625, -2.51708984375, -2.3489990234375, -2.180908203125, -2.0128173828125, -1.8447265625, -1.6766357421875, -1.508544921875, -1.3404541015625, -1.17236328125, -1.0042724609375, -0.836181640625, -0.6680908203125, -0.5, -0.3319091796875, -0.163818359375, 0.0042724609375, 0.17236328125, 0.3404541015625, 0.508544921875, 0.6766357421875, 0.8447265625, 1.0128173828125, 1.180908203125, 1.3489990234375, 1.51708984375, 1.6851806640625, 1.853271484375, 2.0213623046875, 2.189453125, 2.3575439453125, 2.525634765625, 2.6937255859375, 2.86181640625, 3.0299072265625, 3.197998046875, 3.3660888671875, 3.5341796875, 3.7022705078125, 3.870361328125, 4.0384521484375, 4.20654296875, 4.3746337890625, 4.542724609375, 4.7108154296875, 4.87890625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 5.0, 11.0, 9.0, 18.0, 15.0, 32.0, 42.0, 56.0, 72.0, 116.0, 188.0, 349.0, 573.0, 770.0, 711.0, 384.0, 262.0, 145.0, 99.0, 55.0, 33.0, 36.0, 32.0, 20.0, 14.0, 4.0, 4.0, 7.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.32373046875, -0.3128318786621094, -0.30193328857421875, -0.2910346984863281, -0.2801361083984375, -0.2692375183105469, -0.25833892822265625, -0.24744033813476562, -0.236541748046875, -0.22564315795898438, -0.21474456787109375, -0.20384597778320312, -0.1929473876953125, -0.18204879760742188, -0.17115020751953125, -0.16025161743164062, -0.14935302734375, -0.13845443725585938, -0.12755584716796875, -0.11665725708007812, -0.1057586669921875, -0.09486007690429688, -0.08396148681640625, -0.07306289672851562, -0.062164306640625, -0.051265716552734375, -0.04036712646484375, -0.029468536376953125, -0.0185699462890625, -0.007671356201171875, 0.00322723388671875, 0.014125823974609375, 0.0250244140625, 0.035923004150390625, 0.04682159423828125, 0.057720184326171875, 0.0686187744140625, 0.07951736450195312, 0.09041595458984375, 0.10131454467773438, 0.112213134765625, 0.12311172485351562, 0.13401031494140625, 0.14490890502929688, 0.1558074951171875, 0.16670608520507812, 0.17760467529296875, 0.18850326538085938, 0.19940185546875, 0.21030044555664062, 0.22119903564453125, 0.23209762573242188, 0.2429962158203125, 0.2538948059082031, 0.26479339599609375, 0.2756919860839844, 0.286590576171875, 0.2974891662597656, 0.30838775634765625, 0.3192863464355469, 0.3301849365234375, 0.3410835266113281, 0.35198211669921875, 0.3628807067871094, 0.373779296875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 5.0, 9.0, 24.0, 18.0, 30.0, 21.0, 64.0, 80.0, 116.0, 118.0, 120.0, 88.0, 73.0, 77.0, 53.0, 39.0, 25.0, 13.0, 5.0, 6.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4201632738113403, -1.3819478750228882, -1.3437325954437256, -1.3055171966552734, -1.2673017978668213, -1.2290863990783691, -1.1908711194992065, -1.1526557207107544, -1.1144404411315918, -1.0762250423431396, -1.038009762763977, -0.9997943639755249, -0.9615789651870728, -0.9233636260032654, -0.885148286819458, -0.8469328880310059, -0.8087174892425537, -0.7705021500587463, -0.7322867512702942, -0.6940714120864868, -0.6558560132980347, -0.6176406741142273, -0.5794253349304199, -0.5412099361419678, -0.5029945969581604, -0.46477922797203064, -0.4265638589859009, -0.3883485198020935, -0.35013315081596375, -0.311917781829834, -0.2737024426460266, -0.23548707365989685, -0.19727158546447754, -0.15905621647834778, -0.12084086239337921, -0.08262550085783005, -0.044410139322280884, -0.006194770336151123, 0.032020583748817444, 0.07023593783378601, 0.10845130681991577, 0.14666667580604553, 0.1848820298910141, 0.22309738397598267, 0.2613127529621124, 0.2995281219482422, 0.33774346113204956, 0.3759588301181793, 0.4141741991043091, 0.45238956809043884, 0.4906049370765686, 0.528820276260376, 0.5670356750488281, 0.6052510142326355, 0.6434663534164429, 0.681681752204895, 0.7198970913887024, 0.7581124305725098, 0.7963278293609619, 0.8345431685447693, 0.8727585077285767, 0.9109739065170288, 0.9491892457008362, 0.9874045848846436, 1.0256199836730957]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 0.0, 2.0, 6.0, 15.0, 6.0, 11.0, 17.0, 21.0, 26.0, 22.0, 29.0, 47.0, 46.0, 44.0, 50.0, 54.0, 58.0, 64.0, 49.0, 60.0, 46.0, 56.0, 48.0, 43.0, 41.0, 27.0, 30.0, 12.0, 21.0, 15.0, 7.0, 7.0, 13.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8640813827514648, -0.8385818600654602, -0.8130823969841003, -0.7875828742980957, -0.7620833516120911, -0.7365838885307312, -0.7110843658447266, -0.6855849027633667, -0.6600853800773621, -0.6345858573913574, -0.6090863943099976, -0.5835868716239929, -0.5580873489379883, -0.5325878858566284, -0.5070883631706238, -0.48158887028694153, -0.4560893476009369, -0.43058985471725464, -0.40509033203125, -0.37959083914756775, -0.3540913462638855, -0.32859182357788086, -0.3030923306941986, -0.27759283781051636, -0.2520933151245117, -0.22659380733966827, -0.20109431445598602, -0.17559480667114258, -0.15009531378746033, -0.12459580600261688, -0.09909629821777344, -0.07359680533409119, -0.048097312450408936, -0.02259781025350094, 0.0029016919434070587, 0.028401196002960205, 0.05390069633722305, 0.0794001966714859, 0.10489970445632935, 0.1303991973400116, 0.15589870512485504, 0.1813982129096985, 0.20689770579338074, 0.23239721357822418, 0.2578967213630676, 0.2833962142467499, 0.30889570713043213, 0.33439522981643677, 0.359894722700119, 0.38539421558380127, 0.4108937382698059, 0.43639323115348816, 0.4618927240371704, 0.48739224672317505, 0.5128917694091797, 0.5383912324905396, 0.5638907551765442, 0.5893902778625488, 0.6148897409439087, 0.6403892636299133, 0.665888786315918, 0.6913882493972778, 0.7168877720832825, 0.7423872947692871, 0.767886757850647]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 10.0, 5.0, 11.0, 13.0, 26.0, 40.0, 82.0, 131.0, 197.0, 432.0, 981.0, 2987.0, 13319.0, 110216.0, 755237.0, 143403.0, 15890.0, 3426.0, 1164.0, 441.0, 223.0, 130.0, 76.0, 39.0, 28.0, 17.0, 11.0, 6.0, 6.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23486328125, -0.2276477813720703, -0.22043228149414062, -0.21321678161621094, -0.20600128173828125, -0.19878578186035156, -0.19157028198242188, -0.1843547821044922, -0.1771392822265625, -0.1699237823486328, -0.16270828247070312, -0.15549278259277344, -0.14827728271484375, -0.14106178283691406, -0.13384628295898438, -0.1266307830810547, -0.119415283203125, -0.11219978332519531, -0.10498428344726562, -0.09776878356933594, -0.09055328369140625, -0.08333778381347656, -0.07612228393554688, -0.06890678405761719, -0.0616912841796875, -0.05447578430175781, -0.047260284423828125, -0.04004478454589844, -0.03282928466796875, -0.025613784790039062, -0.018398284912109375, -0.011182785034179688, -0.00396728515625, 0.0032482147216796875, 0.010463714599609375, 0.017679214477539062, 0.02489471435546875, 0.03211021423339844, 0.039325714111328125, 0.04654121398925781, 0.0537567138671875, 0.06097221374511719, 0.06818771362304688, 0.07540321350097656, 0.08261871337890625, 0.08983421325683594, 0.09704971313476562, 0.10426521301269531, 0.111480712890625, 0.11869621276855469, 0.12591171264648438, 0.13312721252441406, 0.14034271240234375, 0.14755821228027344, 0.15477371215820312, 0.1619892120361328, 0.1692047119140625, 0.1764202117919922, 0.18363571166992188, 0.19085121154785156, 0.19806671142578125, 0.20528221130371094, 0.21249771118164062, 0.2197132110595703, 0.2269287109375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 8.0, 12.0, 14.0, 17.0, 24.0, 33.0, 58.0, 70.0, 83.0, 90.0, 89.0, 95.0, 77.0, 94.0, 59.0, 61.0, 47.0, 21.0, 13.0, 18.0, 5.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.951171875, -0.9260787963867188, -0.9009857177734375, -0.8758926391601562, -0.850799560546875, -0.8257064819335938, -0.8006134033203125, -0.7755203247070312, -0.75042724609375, -0.7253341674804688, -0.7002410888671875, -0.6751480102539062, -0.650054931640625, -0.6249618530273438, -0.5998687744140625, -0.5747756958007812, -0.5496826171875, -0.5245895385742188, -0.4994964599609375, -0.47440338134765625, -0.449310302734375, -0.42421722412109375, -0.3991241455078125, -0.37403106689453125, -0.34893798828125, -0.32384490966796875, -0.2987518310546875, -0.27365875244140625, -0.248565673828125, -0.22347259521484375, -0.1983795166015625, -0.17328643798828125, -0.148193359375, -0.12310028076171875, -0.0980072021484375, -0.07291412353515625, -0.047821044921875, -0.02272796630859375, 0.0023651123046875, 0.02745819091796875, 0.05255126953125, 0.07764434814453125, 0.1027374267578125, 0.12783050537109375, 0.152923583984375, 0.17801666259765625, 0.2031097412109375, 0.22820281982421875, 0.2532958984375, 0.27838897705078125, 0.3034820556640625, 0.32857513427734375, 0.353668212890625, 0.37876129150390625, 0.4038543701171875, 0.42894744873046875, 0.45404052734375, 0.47913360595703125, 0.5042266845703125, 0.5293197631835938, 0.554412841796875, 0.5795059204101562, 0.6045989990234375, 0.6296920776367188, 0.65478515625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 7.0, 4.0, 11.0, 17.0, 28.0, 22.0, 43.0, 57.0, 102.0, 165.0, 265.0, 379.0, 638.0, 1148.0, 1892.0, 3610.0, 6433.0, 11724.0, 22584.0, 44480.0, 89358.0, 174980.0, 256202.0, 207116.0, 112092.0, 55268.0, 27712.0, 14433.0, 7780.0, 4184.0, 2388.0, 1342.0, 766.0, 504.0, 270.0, 173.0, 132.0, 76.0, 52.0, 30.0, 30.0, 25.0, 7.0, 12.0, 7.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.048248291015625, -0.04672431945800781, -0.045200347900390625, -0.04367637634277344, -0.04215240478515625, -0.04062843322753906, -0.039104461669921875, -0.03758049011230469, -0.0360565185546875, -0.03453254699707031, -0.033008575439453125, -0.03148460388183594, -0.02996063232421875, -0.028436660766601562, -0.026912689208984375, -0.025388717651367188, -0.02386474609375, -0.022340774536132812, -0.020816802978515625, -0.019292831420898438, -0.01776885986328125, -0.016244888305664062, -0.014720916748046875, -0.013196945190429688, -0.0116729736328125, -0.010149002075195312, -0.008625030517578125, -0.0071010589599609375, -0.00557708740234375, -0.0040531158447265625, -0.002529144287109375, -0.0010051727294921875, 0.000518798828125, 0.0020427703857421875, 0.003566741943359375, 0.0050907135009765625, 0.00661468505859375, 0.008138656616210938, 0.009662628173828125, 0.011186599731445312, 0.0127105712890625, 0.014234542846679688, 0.015758514404296875, 0.017282485961914062, 0.01880645751953125, 0.020330429077148438, 0.021854400634765625, 0.023378372192382812, 0.02490234375, 0.026426315307617188, 0.027950286865234375, 0.029474258422851562, 0.03099822998046875, 0.03252220153808594, 0.034046173095703125, 0.03557014465332031, 0.0370941162109375, 0.03861808776855469, 0.040142059326171875, 0.04166603088378906, 0.04319000244140625, 0.04471397399902344, 0.046237945556640625, 0.04776191711425781, 0.049285888671875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 10.0, 9.0, 14.0, 13.0, 13.0, 26.0, 30.0, 34.0, 36.0, 29.0, 56.0, 60.0, 49.0, 50.0, 54.0, 66.0, 65.0, 46.0, 40.0, 56.0, 39.0, 29.0, 39.0, 29.0, 21.0, 22.0, 16.0, 12.0, 13.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75439453125, -0.7243270874023438, -0.6942596435546875, -0.6641921997070312, -0.634124755859375, -0.6040573120117188, -0.5739898681640625, -0.5439224243164062, -0.51385498046875, -0.48378753662109375, -0.4537200927734375, -0.42365264892578125, -0.393585205078125, -0.36351776123046875, -0.3334503173828125, -0.30338287353515625, -0.2733154296875, -0.24324798583984375, -0.2131805419921875, -0.18311309814453125, -0.153045654296875, -0.12297821044921875, -0.0929107666015625, -0.06284332275390625, -0.03277587890625, -0.00270843505859375, 0.0273590087890625, 0.05742645263671875, 0.087493896484375, 0.11756134033203125, 0.1476287841796875, 0.17769622802734375, 0.207763671875, 0.23783111572265625, 0.2678985595703125, 0.29796600341796875, 0.328033447265625, 0.35810089111328125, 0.3881683349609375, 0.41823577880859375, 0.44830322265625, 0.47837066650390625, 0.5084381103515625, 0.5385055541992188, 0.568572998046875, 0.5986404418945312, 0.6287078857421875, 0.6587753295898438, 0.6888427734375, 0.7189102172851562, 0.7489776611328125, 0.7790451049804688, 0.809112548828125, 0.8391799926757812, 0.8692474365234375, 0.8993148803710938, 0.92938232421875, 0.9594497680664062, 0.9895172119140625, 1.0195846557617188, 1.049652099609375, 1.0797195434570312, 1.1097869873046875, 1.1398544311523438, 1.169921875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 9.0, 4.0, 10.0, 12.0, 18.0, 17.0, 34.0, 63.0, 101.0, 175.0, 290.0, 589.0, 1078.0, 2161.0, 5547.0, 18465.0, 99502.0, 517587.0, 330488.0, 52801.0, 11807.0, 4024.0, 1747.0, 907.0, 462.0, 277.0, 161.0, 82.0, 48.0, 29.0, 17.0, 13.0, 7.0, 6.0, 8.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01221466064453125, -0.011818408966064453, -0.011422157287597656, -0.01102590560913086, -0.010629653930664062, -0.010233402252197266, -0.009837150573730469, -0.009440898895263672, -0.009044647216796875, -0.008648395538330078, -0.008252143859863281, -0.007855892181396484, -0.0074596405029296875, -0.007063388824462891, -0.006667137145996094, -0.006270885467529297, -0.0058746337890625, -0.005478382110595703, -0.005082130432128906, -0.004685878753662109, -0.0042896270751953125, -0.0038933753967285156, -0.0034971237182617188, -0.003100872039794922, -0.002704620361328125, -0.002308368682861328, -0.0019121170043945312, -0.0015158653259277344, -0.0011196136474609375, -0.0007233619689941406, -0.00032711029052734375, 6.914138793945312e-05, 0.00046539306640625, 0.0008616447448730469, 0.0012578964233398438, 0.0016541481018066406, 0.0020503997802734375, 0.0024466514587402344, 0.0028429031372070312, 0.003239154815673828, 0.003635406494140625, 0.004031658172607422, 0.004427909851074219, 0.004824161529541016, 0.0052204132080078125, 0.005616664886474609, 0.006012916564941406, 0.006409168243408203, 0.006805419921875, 0.007201671600341797, 0.007597923278808594, 0.00799417495727539, 0.008390426635742188, 0.008786678314208984, 0.009182929992675781, 0.009579181671142578, 0.009975433349609375, 0.010371685028076172, 0.010767936706542969, 0.011164188385009766, 0.011560440063476562, 0.01195669174194336, 0.012352943420410156, 0.012749195098876953, 0.01314544677734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 12.0, 11.0, 9.0, 13.0, 23.0, 34.0, 46.0, 59.0, 69.0, 71.0, 91.0, 86.0, 98.0, 80.0, 68.0, 48.0, 32.0, 39.0, 29.0, 14.0, 20.0, 13.0, 6.0, 7.0, 4.0, 1.0, 1.0, 6.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0], "bins": [-2.372264862060547e-05, -2.3150816559791565e-05, -2.257898449897766e-05, -2.2007152438163757e-05, -2.1435320377349854e-05, -2.086348831653595e-05, -2.0291656255722046e-05, -1.9719824194908142e-05, -1.9147992134094238e-05, -1.8576160073280334e-05, -1.800432801246643e-05, -1.7432495951652527e-05, -1.6860663890838623e-05, -1.628883183002472e-05, -1.5716999769210815e-05, -1.5145167708396912e-05, -1.4573335647583008e-05, -1.4001503586769104e-05, -1.34296715259552e-05, -1.2857839465141296e-05, -1.2286007404327393e-05, -1.1714175343513489e-05, -1.1142343282699585e-05, -1.0570511221885681e-05, -9.998679161071777e-06, -9.426847100257874e-06, -8.85501503944397e-06, -8.283182978630066e-06, -7.711350917816162e-06, -7.139518857002258e-06, -6.5676867961883545e-06, -5.995854735374451e-06, -5.424022674560547e-06, -4.852190613746643e-06, -4.280358552932739e-06, -3.7085264921188354e-06, -3.1366944313049316e-06, -2.564862370491028e-06, -1.993030309677124e-06, -1.4211982488632202e-06, -8.493661880493164e-07, -2.775341272354126e-07, 2.942979335784912e-07, 8.66129994392395e-07, 1.4379620552062988e-06, 2.0097941160202026e-06, 2.5816261768341064e-06, 3.1534582376480103e-06, 3.725290298461914e-06, 4.297122359275818e-06, 4.868954420089722e-06, 5.4407864809036255e-06, 6.012618541717529e-06, 6.584450602531433e-06, 7.156282663345337e-06, 7.72811472415924e-06, 8.299946784973145e-06, 8.871778845787048e-06, 9.443610906600952e-06, 1.0015442967414856e-05, 1.058727502822876e-05, 1.1159107089042664e-05, 1.1730939149856567e-05, 1.2302771210670471e-05, 1.2874603271484375e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 0.0, 5.0, 10.0, 7.0, 15.0, 29.0, 45.0, 64.0, 80.0, 204.0, 433.0, 1096.0, 3391.0, 14847.0, 140150.0, 776160.0, 95831.0, 11700.0, 2740.0, 926.0, 366.0, 171.0, 101.0, 64.0, 40.0, 19.0, 17.0, 10.0, 11.0, 5.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0213470458984375, -0.02074456214904785, -0.020142078399658203, -0.019539594650268555, -0.018937110900878906, -0.018334627151489258, -0.01773214340209961, -0.01712965965270996, -0.016527175903320312, -0.015924692153930664, -0.015322208404541016, -0.014719724655151367, -0.014117240905761719, -0.01351475715637207, -0.012912273406982422, -0.012309789657592773, -0.011707305908203125, -0.011104822158813477, -0.010502338409423828, -0.00989985466003418, -0.009297370910644531, -0.008694887161254883, -0.008092403411865234, -0.007489919662475586, -0.0068874359130859375, -0.006284952163696289, -0.005682468414306641, -0.005079984664916992, -0.004477500915527344, -0.0038750171661376953, -0.003272533416748047, -0.0026700496673583984, -0.00206756591796875, -0.0014650821685791016, -0.0008625984191894531, -0.0002601146697998047, 0.00034236907958984375, 0.0009448528289794922, 0.0015473365783691406, 0.002149820327758789, 0.0027523040771484375, 0.003354787826538086, 0.003957271575927734, 0.004559755325317383, 0.005162239074707031, 0.00576472282409668, 0.006367206573486328, 0.0069696903228759766, 0.007572174072265625, 0.008174657821655273, 0.008777141571044922, 0.00937962532043457, 0.009982109069824219, 0.010584592819213867, 0.011187076568603516, 0.011789560317993164, 0.012392044067382812, 0.012994527816772461, 0.01359701156616211, 0.014199495315551758, 0.014801979064941406, 0.015404462814331055, 0.016006946563720703, 0.01660943031311035, 0.0172119140625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 2.0, 1.0, 3.0, 7.0, 15.0, 9.0, 14.0, 16.0, 23.0, 33.0, 40.0, 68.0, 56.0, 88.0, 116.0, 128.0, 113.0, 74.0, 57.0, 41.0, 24.0, 16.0, 9.0, 9.0, 7.0, 6.0, 10.0, 10.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0037593841552734375, -0.003651559352874756, -0.0035437345504760742, -0.0034359097480773926, -0.003328084945678711, -0.0032202601432800293, -0.0031124353408813477, -0.003004610538482666, -0.0028967857360839844, -0.0027889609336853027, -0.002681136131286621, -0.0025733113288879395, -0.002465486526489258, -0.002357661724090576, -0.0022498369216918945, -0.002142012119293213, -0.0020341873168945312, -0.0019263625144958496, -0.001818537712097168, -0.0017107129096984863, -0.0016028881072998047, -0.001495063304901123, -0.0013872385025024414, -0.0012794137001037598, -0.0011715888977050781, -0.0010637640953063965, -0.0009559392929077148, -0.0008481144905090332, -0.0007402896881103516, -0.0006324648857116699, -0.0005246400833129883, -0.00041681528091430664, -0.000308990478515625, -0.00020116567611694336, -9.334087371826172e-05, 1.4483928680419922e-05, 0.00012230873107910156, 0.0002301335334777832, 0.00033795833587646484, 0.0004457831382751465, 0.0005536079406738281, 0.0006614327430725098, 0.0007692575454711914, 0.000877082347869873, 0.0009849071502685547, 0.0010927319526672363, 0.001200556755065918, 0.0013083815574645996, 0.0014162063598632812, 0.0015240311622619629, 0.0016318559646606445, 0.0017396807670593262, 0.0018475055694580078, 0.0019553303718566895, 0.002063155174255371, 0.0021709799766540527, 0.0022788047790527344, 0.002386629581451416, 0.0024944543838500977, 0.0026022791862487793, 0.002710103988647461, 0.0028179287910461426, 0.0029257535934448242, 0.003033578395843506, 0.0031414031982421875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 5.0, 5.0, 5.0, 8.0, 16.0, 18.0, 28.0, 29.0, 40.0, 72.0, 117.0, 116.0, 111.0, 105.0, 84.0, 66.0, 52.0, 57.0, 15.0, 21.0, 11.0, 7.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6574042439460754, -0.6350964307785034, -0.6127886772155762, -0.5904808640480042, -0.5681730508804321, -0.5458652973175049, -0.5235574841499329, -0.5012496709823608, -0.4789418876171112, -0.4566341042518616, -0.43432629108428955, -0.4120185077190399, -0.3897107243537903, -0.36740291118621826, -0.34509512782096863, -0.322787344455719, -0.300479531288147, -0.27817174792289734, -0.2558639347553253, -0.23355615139007568, -0.21124835312366486, -0.18894055485725403, -0.1666327714920044, -0.14432497322559357, -0.12201717495918274, -0.09970937669277191, -0.07740158587694168, -0.05509379506111145, -0.03278599679470062, -0.010478198528289795, 0.011829584836959839, 0.034137383103370667, 0.05644512176513672, 0.07875292003154755, 0.10106071084737778, 0.12336850166320801, 0.14567629992961884, 0.16798409819602966, 0.1902918815612793, 0.21259967982769012, 0.23490747809410095, 0.2572152614593506, 0.2795230746269226, 0.30183085799217224, 0.3241386413574219, 0.3464464545249939, 0.36875423789024353, 0.39106202125549316, 0.4133698344230652, 0.4356776177883148, 0.45798543095588684, 0.4802932143211365, 0.5026010274887085, 0.5249087810516357, 0.5472165942192078, 0.5695244073867798, 0.591832160949707, 0.614139974117279, 0.6364477276802063, 0.6587555408477783, 0.6810633540153503, 0.7033711671829224, 0.7256789207458496, 0.7479867339134216, 0.7702945470809937]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 10.0, 17.0, 18.0, 30.0, 38.0, 51.0, 82.0, 78.0, 71.0, 104.0, 98.0, 78.0, 79.0, 68.0, 56.0, 31.0, 25.0, 20.0, 17.0, 11.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9075912833213806, -0.8842095732688904, -0.8608278632164001, -0.8374460935592651, -0.8140643835067749, -0.7906826734542847, -0.7673009634017944, -0.7439192533493042, -0.720537543296814, -0.6971558332443237, -0.6737741231918335, -0.6503924131393433, -0.6270106434822083, -0.603628933429718, -0.5802472233772278, -0.5568655133247375, -0.5334837436676025, -0.5101020336151123, -0.4867202937602997, -0.46333858370780945, -0.4399568438529968, -0.4165751338005066, -0.39319342374801636, -0.3698117136955261, -0.3464299738407135, -0.32304826378822327, -0.29966652393341064, -0.2762848138809204, -0.2529031038284302, -0.22952136397361755, -0.20613965392112732, -0.1827579289674759, -0.15937620401382446, -0.13599447906017303, -0.1126127615571022, -0.08923104405403137, -0.06584931910037994, -0.042467594146728516, -0.01908588409423828, 0.004295840859413147, 0.027677565813064575, 0.051059287041425705, 0.07444100826978683, 0.09782272577285767, 0.1212044507265091, 0.14458617568016052, 0.16796788573265076, 0.19134961068630219, 0.2147313356399536, 0.23811306059360504, 0.26149478554725647, 0.2848764955997467, 0.3082582354545593, 0.33163994550704956, 0.3550216555595398, 0.37840336561203003, 0.40178510546684265, 0.4251668155193329, 0.4485485553741455, 0.47193026542663574, 0.495311975479126, 0.5186936855316162, 0.5420753955841064, 0.5654571652412415, 0.5888388752937317]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 7.0, 10.0, 19.0, 27.0, 53.0, 132.0, 305.0, 746.0, 2390.0, 11042.0, 96389.0, 828915.0, 94111.0, 10632.0, 2453.0, 772.0, 288.0, 118.0, 60.0, 33.0, 16.0, 11.0, 3.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79150390625, -0.7655487060546875, -0.739593505859375, -0.7136383056640625, -0.68768310546875, -0.6617279052734375, -0.635772705078125, -0.6098175048828125, -0.5838623046875, -0.5579071044921875, -0.531951904296875, -0.5059967041015625, -0.48004150390625, -0.4540863037109375, -0.428131103515625, -0.4021759033203125, -0.376220703125, -0.3502655029296875, -0.324310302734375, -0.2983551025390625, -0.27239990234375, -0.2464447021484375, -0.220489501953125, -0.1945343017578125, -0.1685791015625, -0.1426239013671875, -0.116668701171875, -0.0907135009765625, -0.06475830078125, -0.0388031005859375, -0.012847900390625, 0.0131072998046875, 0.0390625, 0.0650177001953125, 0.090972900390625, 0.1169281005859375, 0.14288330078125, 0.1688385009765625, 0.194793701171875, 0.2207489013671875, 0.2467041015625, 0.2726593017578125, 0.298614501953125, 0.3245697021484375, 0.35052490234375, 0.3764801025390625, 0.402435302734375, 0.4283905029296875, 0.454345703125, 0.4803009033203125, 0.506256103515625, 0.5322113037109375, 0.55816650390625, 0.5841217041015625, 0.610076904296875, 0.6360321044921875, 0.6619873046875, 0.6879425048828125, 0.713897705078125, 0.7398529052734375, 0.76580810546875, 0.7917633056640625, 0.817718505859375, 0.8436737060546875, 0.86962890625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 2.0, 2.0, 7.0, 7.0, 10.0, 9.0, 14.0, 19.0, 38.0, 37.0, 48.0, 59.0, 65.0, 62.0, 67.0, 79.0, 70.0, 84.0, 63.0, 59.0, 37.0, 41.0, 34.0, 26.0, 13.0, 17.0, 11.0, 8.0, 9.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6611328125, -1.6191253662109375, -1.577117919921875, -1.5351104736328125, -1.49310302734375, -1.4510955810546875, -1.409088134765625, -1.3670806884765625, -1.3250732421875, -1.2830657958984375, -1.241058349609375, -1.1990509033203125, -1.15704345703125, -1.1150360107421875, -1.073028564453125, -1.0310211181640625, -0.989013671875, -0.9470062255859375, -0.904998779296875, -0.8629913330078125, -0.82098388671875, -0.7789764404296875, -0.736968994140625, -0.6949615478515625, -0.6529541015625, -0.6109466552734375, -0.568939208984375, -0.5269317626953125, -0.48492431640625, -0.4429168701171875, -0.400909423828125, -0.3589019775390625, -0.31689453125, -0.2748870849609375, -0.232879638671875, -0.1908721923828125, -0.14886474609375, -0.1068572998046875, -0.064849853515625, -0.0228424072265625, 0.0191650390625, 0.0611724853515625, 0.103179931640625, 0.1451873779296875, 0.18719482421875, 0.2292022705078125, 0.271209716796875, 0.3132171630859375, 0.355224609375, 0.3972320556640625, 0.439239501953125, 0.4812469482421875, 0.52325439453125, 0.5652618408203125, 0.607269287109375, 0.6492767333984375, 0.6912841796875, 0.7332916259765625, 0.775299072265625, 0.8173065185546875, 0.85931396484375, 0.9013214111328125, 0.943328857421875, 0.9853363037109375, 1.02734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 5.0, 6.0, 6.0, 11.0, 12.0, 15.0, 23.0, 31.0, 36.0, 58.0, 90.0, 103.0, 153.0, 285.0, 1407.0, 28274.0, 988342.0, 27386.0, 1421.0, 326.0, 142.0, 111.0, 86.0, 44.0, 47.0, 39.0, 21.0, 21.0, 15.0, 15.0, 8.0, 4.0, 4.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8056640625, -1.758758544921875, -1.71185302734375, -1.664947509765625, -1.6180419921875, -1.571136474609375, -1.52423095703125, -1.477325439453125, -1.430419921875, -1.383514404296875, -1.33660888671875, -1.289703369140625, -1.2427978515625, -1.195892333984375, -1.14898681640625, -1.102081298828125, -1.05517578125, -1.008270263671875, -0.96136474609375, -0.914459228515625, -0.8675537109375, -0.820648193359375, -0.77374267578125, -0.726837158203125, -0.679931640625, -0.633026123046875, -0.58612060546875, -0.539215087890625, -0.4923095703125, -0.445404052734375, -0.39849853515625, -0.351593017578125, -0.3046875, -0.257781982421875, -0.21087646484375, -0.163970947265625, -0.1170654296875, -0.070159912109375, -0.02325439453125, 0.023651123046875, 0.070556640625, 0.117462158203125, 0.16436767578125, 0.211273193359375, 0.2581787109375, 0.305084228515625, 0.35198974609375, 0.398895263671875, 0.44580078125, 0.492706298828125, 0.53961181640625, 0.586517333984375, 0.6334228515625, 0.680328369140625, 0.72723388671875, 0.774139404296875, 0.821044921875, 0.867950439453125, 0.91485595703125, 0.961761474609375, 1.0086669921875, 1.055572509765625, 1.10247802734375, 1.149383544921875, 1.1962890625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 6.0, 6.0, 6.0, 12.0, 13.0, 16.0, 29.0, 18.0, 38.0, 33.0, 37.0, 58.0, 37.0, 56.0, 54.0, 46.0, 68.0, 61.0, 56.0, 60.0, 42.0, 44.0, 41.0, 34.0, 27.0, 28.0, 25.0, 13.0, 6.0, 7.0, 11.0, 5.0, 1.0, 5.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.333984375, -1.2986984252929688, -1.2634124755859375, -1.2281265258789062, -1.192840576171875, -1.1575546264648438, -1.1222686767578125, -1.0869827270507812, -1.05169677734375, -1.0164108276367188, -0.9811248779296875, -0.9458389282226562, -0.910552978515625, -0.8752670288085938, -0.8399810791015625, -0.8046951293945312, -0.7694091796875, -0.7341232299804688, -0.6988372802734375, -0.6635513305664062, -0.628265380859375, -0.5929794311523438, -0.5576934814453125, -0.5224075317382812, -0.48712158203125, -0.45183563232421875, -0.4165496826171875, -0.38126373291015625, -0.345977783203125, -0.31069183349609375, -0.2754058837890625, -0.24011993408203125, -0.204833984375, -0.16954803466796875, -0.1342620849609375, -0.09897613525390625, -0.063690185546875, -0.02840423583984375, 0.0068817138671875, 0.04216766357421875, 0.07745361328125, 0.11273956298828125, 0.1480255126953125, 0.18331146240234375, 0.218597412109375, 0.25388336181640625, 0.2891693115234375, 0.32445526123046875, 0.3597412109375, 0.39502716064453125, 0.4303131103515625, 0.46559906005859375, 0.500885009765625, 0.5361709594726562, 0.5714569091796875, 0.6067428588867188, 0.64202880859375, 0.6773147583007812, 0.7126007080078125, 0.7478866577148438, 0.783172607421875, 0.8184585571289062, 0.8537445068359375, 0.8890304565429688, 0.92431640625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 11.0, 19.0, 26.0, 36.0, 73.0, 140.0, 330.0, 796.0, 2012.0, 6710.0, 36910.0, 767116.0, 209741.0, 17813.0, 4252.0, 1439.0, 579.0, 250.0, 120.0, 61.0, 39.0, 21.0, 13.0, 15.0, 1.0, 2.0, 3.0, 2.0, 6.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1651611328125, -0.15876197814941406, -0.15236282348632812, -0.1459636688232422, -0.13956451416015625, -0.1331653594970703, -0.12676620483398438, -0.12036705017089844, -0.1139678955078125, -0.10756874084472656, -0.10116958618164062, -0.09477043151855469, -0.08837127685546875, -0.08197212219238281, -0.07557296752929688, -0.06917381286621094, -0.062774658203125, -0.05637550354003906, -0.049976348876953125, -0.04357719421386719, -0.03717803955078125, -0.030778884887695312, -0.024379730224609375, -0.017980575561523438, -0.0115814208984375, -0.0051822662353515625, 0.001216888427734375, 0.0076160430908203125, 0.01401519775390625, 0.020414352416992188, 0.026813507080078125, 0.03321266174316406, 0.03961181640625, 0.04601097106933594, 0.052410125732421875, 0.05880928039550781, 0.06520843505859375, 0.07160758972167969, 0.07800674438476562, 0.08440589904785156, 0.0908050537109375, 0.09720420837402344, 0.10360336303710938, 0.11000251770019531, 0.11640167236328125, 0.12280082702636719, 0.12919998168945312, 0.13559913635253906, 0.141998291015625, 0.14839744567871094, 0.15479660034179688, 0.1611957550048828, 0.16759490966796875, 0.1739940643310547, 0.18039321899414062, 0.18679237365722656, 0.1931915283203125, 0.19959068298339844, 0.20598983764648438, 0.2123889923095703, 0.21878814697265625, 0.2251873016357422, 0.23158645629882812, 0.23798561096191406, 0.244384765625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 5.0, 2.0, 5.0, 2.0, 7.0, 4.0, 5.0, 7.0, 19.0, 15.0, 15.0, 28.0, 33.0, 72.0, 85.0, 159.0, 163.0, 122.0, 89.0, 48.0, 29.0, 26.0, 25.0, 10.0, 10.0, 2.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1398067474365234e-05, -2.0713545382022858e-05, -2.002902328968048e-05, -1.9344501197338104e-05, -1.8659979104995728e-05, -1.797545701265335e-05, -1.7290934920310974e-05, -1.6606412827968597e-05, -1.592189073562622e-05, -1.5237368643283844e-05, -1.4552846550941467e-05, -1.386832445859909e-05, -1.3183802366256714e-05, -1.2499280273914337e-05, -1.181475818157196e-05, -1.1130236089229584e-05, -1.0445713996887207e-05, -9.76119190454483e-06, -9.076669812202454e-06, -8.392147719860077e-06, -7.7076256275177e-06, -7.0231035351753235e-06, -6.338581442832947e-06, -5.65405935049057e-06, -4.969537258148193e-06, -4.285015165805817e-06, -3.60049307346344e-06, -2.9159709811210632e-06, -2.2314488887786865e-06, -1.5469267964363098e-06, -8.624047040939331e-07, -1.778826117515564e-07, 5.066394805908203e-07, 1.191161572933197e-06, 1.8756836652755737e-06, 2.5602057576179504e-06, 3.244727849960327e-06, 3.929249942302704e-06, 4.6137720346450806e-06, 5.298294126987457e-06, 5.982816219329834e-06, 6.667338311672211e-06, 7.351860404014587e-06, 8.036382496356964e-06, 8.72090458869934e-06, 9.405426681041718e-06, 1.0089948773384094e-05, 1.0774470865726471e-05, 1.1458992958068848e-05, 1.2143515050411224e-05, 1.2828037142753601e-05, 1.3512559235095978e-05, 1.4197081327438354e-05, 1.4881603419780731e-05, 1.5566125512123108e-05, 1.6250647604465485e-05, 1.693516969680786e-05, 1.7619691789150238e-05, 1.8304213881492615e-05, 1.898873597383499e-05, 1.9673258066177368e-05, 2.0357780158519745e-05, 2.104230225086212e-05, 2.1726824343204498e-05, 2.2411346435546875e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 8.0, 5.0, 2.0, 8.0, 9.0, 22.0, 34.0, 44.0, 81.0, 141.0, 276.0, 650.0, 1547.0, 4395.0, 15302.0, 89464.0, 807141.0, 104763.0, 16752.0, 4844.0, 1701.0, 676.0, 317.0, 143.0, 85.0, 51.0, 23.0, 21.0, 18.0, 14.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1827392578125, -0.17655181884765625, -0.1703643798828125, -0.16417694091796875, -0.157989501953125, -0.15180206298828125, -0.1456146240234375, -0.13942718505859375, -0.13323974609375, -0.12705230712890625, -0.1208648681640625, -0.11467742919921875, -0.108489990234375, -0.10230255126953125, -0.0961151123046875, -0.08992767333984375, -0.083740234375, -0.07755279541015625, -0.0713653564453125, -0.06517791748046875, -0.058990478515625, -0.05280303955078125, -0.0466156005859375, -0.04042816162109375, -0.03424072265625, -0.02805328369140625, -0.0218658447265625, -0.01567840576171875, -0.009490966796875, -0.00330352783203125, 0.0028839111328125, 0.00907135009765625, 0.0152587890625, 0.02144622802734375, 0.0276336669921875, 0.03382110595703125, 0.040008544921875, 0.04619598388671875, 0.0523834228515625, 0.05857086181640625, 0.06475830078125, 0.07094573974609375, 0.0771331787109375, 0.08332061767578125, 0.089508056640625, 0.09569549560546875, 0.1018829345703125, 0.10807037353515625, 0.1142578125, 0.12044525146484375, 0.1266326904296875, 0.13282012939453125, 0.139007568359375, 0.14519500732421875, 0.1513824462890625, 0.15756988525390625, 0.16375732421875, 0.16994476318359375, 0.1761322021484375, 0.18231964111328125, 0.188507080078125, 0.19469451904296875, 0.2008819580078125, 0.20706939697265625, 0.2132568359375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 0.0, 3.0, 4.0, 6.0, 10.0, 20.0, 18.0, 51.0, 57.0, 77.0, 159.0, 218.0, 156.0, 82.0, 49.0, 36.0, 13.0, 16.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.11395263671875, -0.11120414733886719, -0.10845565795898438, -0.10570716857910156, -0.10295867919921875, -0.10021018981933594, -0.09746170043945312, -0.09471321105957031, -0.0919647216796875, -0.08921623229980469, -0.08646774291992188, -0.08371925354003906, -0.08097076416015625, -0.07822227478027344, -0.07547378540039062, -0.07272529602050781, -0.069976806640625, -0.06722831726074219, -0.06447982788085938, -0.06173133850097656, -0.05898284912109375, -0.05623435974121094, -0.053485870361328125, -0.05073738098144531, -0.0479888916015625, -0.04524040222167969, -0.042491912841796875, -0.03974342346191406, -0.03699493408203125, -0.03424644470214844, -0.031497955322265625, -0.028749465942382812, -0.0260009765625, -0.023252487182617188, -0.020503997802734375, -0.017755508422851562, -0.01500701904296875, -0.012258529663085938, -0.009510040283203125, -0.0067615509033203125, -0.0040130615234375, -0.0012645721435546875, 0.001483917236328125, 0.0042324066162109375, 0.00698089599609375, 0.009729385375976562, 0.012477874755859375, 0.015226364135742188, 0.017974853515625, 0.020723342895507812, 0.023471832275390625, 0.026220321655273438, 0.02896881103515625, 0.03171730041503906, 0.034465789794921875, 0.03721427917480469, 0.0399627685546875, 0.04271125793457031, 0.045459747314453125, 0.04820823669433594, 0.05095672607421875, 0.05370521545410156, 0.056453704833984375, 0.05920219421386719, 0.06195068359375]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 5.0, 12.0, 19.0, 18.0, 33.0, 53.0, 89.0, 108.0, 143.0, 136.0, 114.0, 85.0, 71.0, 44.0, 26.0, 14.0, 7.0, 8.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.205672025680542, -2.15190052986145, -2.0981292724609375, -2.0443577766418457, -1.990586280822754, -1.9368149042129517, -1.8830435276031494, -1.8292720317840576, -1.7755006551742554, -1.7217292785644531, -1.6679577827453613, -1.614186406135559, -1.5604150295257568, -1.506643533706665, -1.4528721570968628, -1.3991007804870605, -1.3453292846679688, -1.2915579080581665, -1.2377864122390747, -1.1840150356292725, -1.1302435398101807, -1.0764721632003784, -1.0227007865905762, -0.9689293503761292, -0.9151579141616821, -0.8613864779472351, -0.8076150417327881, -0.7538436651229858, -0.7000722289085388, -0.6463007926940918, -0.5925294160842896, -0.5387579798698425, -0.4849865436553955, -0.4312151074409485, -0.37744370102882385, -0.3236722946166992, -0.2699008584022522, -0.21612942218780518, -0.16235801577568054, -0.10858660936355591, -0.05481517314910889, -0.001043751835823059, 0.05272766947746277, 0.1064990907907486, 0.16027051210403442, 0.21404194831848145, 0.2678133547306061, 0.3215847611427307, 0.37535619735717773, 0.42912763357162476, 0.4828990399837494, 0.536670446395874, 0.590441882610321, 0.6442133188247681, 0.6979846954345703, 0.7517561316490173, 0.8055275678634644, 0.8592990040779114, 0.9130704402923584, 0.9668418169021606, 1.020613193511963, 1.0743846893310547, 1.128156065940857, 1.1819274425506592, 1.235698938369751]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 3.0, 5.0, 14.0, 19.0, 25.0, 41.0, 39.0, 49.0, 55.0, 87.0, 90.0, 93.0, 85.0, 93.0, 70.0, 57.0, 65.0, 39.0, 26.0, 21.0, 14.0, 9.0, 2.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-4.637506484985352, -4.538212299346924, -4.438917636871338, -4.33962345123291, -4.240329265594482, -4.1410346031188965, -4.041740417480469, -3.942445993423462, -3.843151569366455, -3.7438571453094482, -3.6445629596710205, -3.5452685356140137, -3.445974111557007, -3.3466796875, -3.2473855018615723, -3.1480910778045654, -3.0487968921661377, -2.949502468109131, -2.850208282470703, -2.7509138584136963, -2.6516194343566895, -2.5523252487182617, -2.453030824661255, -2.353736400604248, -2.2544422149658203, -2.1551477909088135, -2.0558536052703857, -1.956559181213379, -1.857264757156372, -1.7579704523086548, -1.6586761474609375, -1.5593817234039307, -1.4600872993469238, -1.3607929944992065, -1.2614985704421997, -1.1622042655944824, -1.0629098415374756, -0.9636155366897583, -0.864321231842041, -0.765026867389679, -0.6657325029373169, -0.5664381384849548, -0.46714380383491516, -0.3678494691848755, -0.2685551047325134, -0.16926074028015137, -0.06996643543243408, 0.02932792901992798, 0.12862229347229004, 0.2279166430234909, 0.3272109925746918, 0.42650532722473145, 0.5257996916770935, 0.6250940561294556, 0.7243883609771729, 0.8236827254295349, 0.922977089881897, 1.0222713947296143, 1.121565818786621, 1.2208601236343384, 1.3201544284820557, 1.4194488525390625, 1.5187431573867798, 1.618037462234497, 1.717331886291504]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 3.0, 6.0, 13.0, 15.0, 16.0, 27.0, 34.0, 41.0, 70.0, 76.0, 124.0, 209.0, 324.0, 513.0, 843.0, 1353.0, 2515.0, 4793.0, 10938.0, 27806.0, 103144.0, 620026.0, 2141255.0, 1029429.0, 180345.0, 40557.0, 14945.0, 6727.0, 3401.0, 1785.0, 1077.0, 672.0, 405.0, 251.0, 158.0, 114.0, 80.0, 51.0, 39.0, 26.0, 22.0, 16.0, 16.0, 7.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.76611328125, -0.7440109252929688, -0.7219085693359375, -0.6998062133789062, -0.677703857421875, -0.6556015014648438, -0.6334991455078125, -0.6113967895507812, -0.58929443359375, -0.5671920776367188, -0.5450897216796875, -0.5229873657226562, -0.500885009765625, -0.47878265380859375, -0.4566802978515625, -0.43457794189453125, -0.4124755859375, -0.39037322998046875, -0.3682708740234375, -0.34616851806640625, -0.324066162109375, -0.30196380615234375, -0.2798614501953125, -0.25775909423828125, -0.23565673828125, -0.21355438232421875, -0.1914520263671875, -0.16934967041015625, -0.147247314453125, -0.12514495849609375, -0.1030426025390625, -0.08094024658203125, -0.058837890625, -0.03673553466796875, -0.0146331787109375, 0.00746917724609375, 0.029571533203125, 0.05167388916015625, 0.0737762451171875, 0.09587860107421875, 0.11798095703125, 0.14008331298828125, 0.1621856689453125, 0.18428802490234375, 0.206390380859375, 0.22849273681640625, 0.2505950927734375, 0.27269744873046875, 0.2947998046875, 0.31690216064453125, 0.3390045166015625, 0.36110687255859375, 0.383209228515625, 0.40531158447265625, 0.4274139404296875, 0.44951629638671875, 0.47161865234375, 0.49372100830078125, 0.5158233642578125, 0.5379257202148438, 0.560028076171875, 0.5821304321289062, 0.6042327880859375, 0.6263351440429688, 0.6484375]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 5.0, 10.0, 17.0, 16.0, 18.0, 34.0, 26.0, 44.0, 41.0, 54.0, 53.0, 63.0, 64.0, 74.0, 77.0, 60.0, 64.0, 60.0, 48.0, 32.0, 30.0, 32.0, 18.0, 14.0, 13.0, 3.0, 8.0, 5.0, 5.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7939453125, -0.7701644897460938, -0.7463836669921875, -0.7226028442382812, -0.698822021484375, -0.6750411987304688, -0.6512603759765625, -0.6274795532226562, -0.60369873046875, -0.5799179077148438, -0.5561370849609375, -0.5323562622070312, -0.508575439453125, -0.48479461669921875, -0.4610137939453125, -0.43723297119140625, -0.4134521484375, -0.38967132568359375, -0.3658905029296875, -0.34210968017578125, -0.318328857421875, -0.29454803466796875, -0.2707672119140625, -0.24698638916015625, -0.22320556640625, -0.19942474365234375, -0.1756439208984375, -0.15186309814453125, -0.128082275390625, -0.10430145263671875, -0.0805206298828125, -0.05673980712890625, -0.032958984375, -0.00917816162109375, 0.0146026611328125, 0.03838348388671875, 0.062164306640625, 0.08594512939453125, 0.1097259521484375, 0.13350677490234375, 0.15728759765625, 0.18106842041015625, 0.2048492431640625, 0.22863006591796875, 0.252410888671875, 0.27619171142578125, 0.2999725341796875, 0.32375335693359375, 0.3475341796875, 0.37131500244140625, 0.3950958251953125, 0.41887664794921875, 0.442657470703125, 0.46643829345703125, 0.4902191162109375, 0.5139999389648438, 0.53778076171875, 0.5615615844726562, 0.5853424072265625, 0.6091232299804688, 0.632904052734375, 0.6566848754882812, 0.6804656982421875, 0.7042465209960938, 0.72802734375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 6.0, 7.0, 22.0, 42.0, 80.0, 117.0, 272.0, 549.0, 3073.0, 143439.0, 4031487.0, 13169.0, 1239.0, 375.0, 180.0, 85.0, 61.0, 35.0, 20.0, 9.0, 3.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.48046875, -3.372528076171875, -3.26458740234375, -3.156646728515625, -3.0487060546875, -2.940765380859375, -2.83282470703125, -2.724884033203125, -2.616943359375, -2.509002685546875, -2.40106201171875, -2.293121337890625, -2.1851806640625, -2.077239990234375, -1.96929931640625, -1.861358642578125, -1.75341796875, -1.645477294921875, -1.53753662109375, -1.429595947265625, -1.3216552734375, -1.213714599609375, -1.10577392578125, -0.997833251953125, -0.889892578125, -0.781951904296875, -0.67401123046875, -0.566070556640625, -0.4581298828125, -0.350189208984375, -0.24224853515625, -0.134307861328125, -0.0263671875, 0.081573486328125, 0.18951416015625, 0.297454833984375, 0.4053955078125, 0.513336181640625, 0.62127685546875, 0.729217529296875, 0.837158203125, 0.945098876953125, 1.05303955078125, 1.160980224609375, 1.2689208984375, 1.376861572265625, 1.48480224609375, 1.592742919921875, 1.70068359375, 1.808624267578125, 1.91656494140625, 2.024505615234375, 2.1324462890625, 2.240386962890625, 2.34832763671875, 2.456268310546875, 2.564208984375, 2.672149658203125, 2.78009033203125, 2.888031005859375, 2.9959716796875, 3.103912353515625, 3.21185302734375, 3.319793701171875, 3.427734375]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 3.0, 5.0, 6.0, 11.0, 22.0, 26.0, 34.0, 59.0, 93.0, 203.0, 343.0, 806.0, 1086.0, 686.0, 302.0, 140.0, 82.0, 52.0, 35.0, 24.0, 17.0, 13.0, 8.0, 3.0, 5.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5126953125, -0.5000076293945312, -0.4873199462890625, -0.47463226318359375, -0.461944580078125, -0.44925689697265625, -0.4365692138671875, -0.42388153076171875, -0.41119384765625, -0.39850616455078125, -0.3858184814453125, -0.37313079833984375, -0.360443115234375, -0.34775543212890625, -0.3350677490234375, -0.32238006591796875, -0.3096923828125, -0.29700469970703125, -0.2843170166015625, -0.27162933349609375, -0.258941650390625, -0.24625396728515625, -0.2335662841796875, -0.22087860107421875, -0.20819091796875, -0.19550323486328125, -0.1828155517578125, -0.17012786865234375, -0.157440185546875, -0.14475250244140625, -0.1320648193359375, -0.11937713623046875, -0.106689453125, -0.09400177001953125, -0.0813140869140625, -0.06862640380859375, -0.055938720703125, -0.04325103759765625, -0.0305633544921875, -0.01787567138671875, -0.00518798828125, 0.00749969482421875, 0.0201873779296875, 0.03287506103515625, 0.045562744140625, 0.05825042724609375, 0.0709381103515625, 0.08362579345703125, 0.0963134765625, 0.10900115966796875, 0.1216888427734375, 0.13437652587890625, 0.147064208984375, 0.15975189208984375, 0.1724395751953125, 0.18512725830078125, 0.19781494140625, 0.21050262451171875, 0.2231903076171875, 0.23587799072265625, 0.248565673828125, 0.26125335693359375, 0.2739410400390625, 0.28662872314453125, 0.29931640625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 13.0, 12.0, 14.0, 10.0, 23.0, 13.0, 31.0, 32.0, 52.0, 56.0, 70.0, 71.0, 89.0, 91.0, 74.0, 62.0, 55.0, 62.0, 44.0, 21.0, 20.0, 19.0, 12.0, 13.0, 11.0, 3.0, 6.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7963128685951233, -0.7697895765304565, -0.743266224861145, -0.7167429327964783, -0.6902196407318115, -0.6636962890625, -0.6371729969978333, -0.6106497049331665, -0.584126353263855, -0.5576030611991882, -0.5310797095298767, -0.50455641746521, -0.4780330955982208, -0.4515097737312317, -0.42498648166656494, -0.3984631597995758, -0.37193983793258667, -0.34541651606559753, -0.3188931941986084, -0.29236990213394165, -0.2658465802669525, -0.23932325839996338, -0.21279995143413544, -0.1862766444683075, -0.15975332260131836, -0.13323000073432922, -0.10670669376850128, -0.08018337935209274, -0.053660064935684204, -0.02713674306869507, -0.0006134361028671265, 0.025909870862960815, 0.05243319272994995, 0.07895650714635849, 0.10547982156276703, 0.13200312852859497, 0.1585264503955841, 0.18504977226257324, 0.21157307922840118, 0.23809638619422913, 0.26461970806121826, 0.2911430299282074, 0.31766635179519653, 0.3441896438598633, 0.3707129657268524, 0.39723628759384155, 0.4237595796585083, 0.45028290152549744, 0.4768062233924866, 0.5033295154571533, 0.5298528671264648, 0.5563761591911316, 0.5828994512557983, 0.6094228029251099, 0.6359460949897766, 0.6624693870544434, 0.6889927387237549, 0.7155160307884216, 0.7420393824577332, 0.7685626745223999, 0.7950860261917114, 0.8216093182563782, 0.8481326103210449, 0.8746559619903564, 0.9011792540550232]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 4.0, 6.0, 15.0, 19.0, 20.0, 19.0, 34.0, 31.0, 33.0, 47.0, 49.0, 47.0, 64.0, 60.0, 52.0, 55.0, 59.0, 68.0, 53.0, 48.0, 36.0, 27.0, 33.0, 27.0, 24.0, 19.0, 15.0, 14.0, 8.0, 6.0, 3.0, 0.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8162955045700073, -0.7911674976348877, -0.7660394906997681, -0.7409114837646484, -0.7157834768295288, -0.6906554698944092, -0.6655274629592896, -0.6403994560241699, -0.6152714490890503, -0.5901434421539307, -0.565015435218811, -0.5398874282836914, -0.5147594213485718, -0.48963141441345215, -0.4645034074783325, -0.4393754005432129, -0.4142473638057709, -0.38911935687065125, -0.3639913499355316, -0.338863343000412, -0.31373533606529236, -0.28860729932785034, -0.2634792923927307, -0.23835130035877228, -0.21322329342365265, -0.18809528648853302, -0.1629672795534134, -0.13783925771713257, -0.11271125823259354, -0.08758324384689331, -0.06245523691177368, -0.03732722997665405, -0.012199223041534424, 0.012928785756230354, 0.03805679455399513, 0.06318480521440506, 0.08831281214952469, 0.11344082653522491, 0.13856883347034454, 0.16369684040546417, 0.1888248473405838, 0.21395285427570343, 0.23908086121082306, 0.2642088830471039, 0.2893368899822235, 0.31446489691734314, 0.33959290385246277, 0.3647209107875824, 0.389848917722702, 0.41497692465782166, 0.4401049315929413, 0.4652329385280609, 0.49036094546318054, 0.5154889822006226, 0.5406169891357422, 0.5657449960708618, 0.5908730030059814, 0.6160010099411011, 0.6411290168762207, 0.6662570238113403, 0.69138503074646, 0.7165130376815796, 0.7416410446166992, 0.7667690515518188, 0.7918970584869385]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 4.0, 11.0, 18.0, 24.0, 38.0, 60.0, 96.0, 127.0, 184.0, 322.0, 534.0, 1008.0, 1959.0, 4083.0, 9523.0, 24573.0, 73775.0, 264074.0, 440935.0, 152954.0, 45127.0, 16236.0, 6557.0, 2911.0, 1435.0, 810.0, 434.0, 264.0, 157.0, 117.0, 55.0, 37.0, 39.0, 22.0, 13.0, 9.0, 6.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.125244140625, -0.12179279327392578, -0.11834144592285156, -0.11489009857177734, -0.11143875122070312, -0.1079874038696289, -0.10453605651855469, -0.10108470916748047, -0.09763336181640625, -0.09418201446533203, -0.09073066711425781, -0.0872793197631836, -0.08382797241210938, -0.08037662506103516, -0.07692527770996094, -0.07347393035888672, -0.0700225830078125, -0.06657123565673828, -0.06311988830566406, -0.059668540954589844, -0.056217193603515625, -0.052765846252441406, -0.04931449890136719, -0.04586315155029297, -0.04241180419921875, -0.03896045684814453, -0.03550910949707031, -0.032057762145996094, -0.028606414794921875, -0.025155067443847656, -0.021703720092773438, -0.01825237274169922, -0.014801025390625, -0.011349678039550781, -0.007898330688476562, -0.004446983337402344, -0.000995635986328125, 0.0024557113647460938, 0.0059070587158203125, 0.009358406066894531, 0.01280975341796875, 0.01626110076904297, 0.019712448120117188, 0.023163795471191406, 0.026615142822265625, 0.030066490173339844, 0.03351783752441406, 0.03696918487548828, 0.0404205322265625, 0.04387187957763672, 0.04732322692871094, 0.050774574279785156, 0.054225921630859375, 0.057677268981933594, 0.06112861633300781, 0.06457996368408203, 0.06803131103515625, 0.07148265838623047, 0.07493400573730469, 0.0783853530883789, 0.08183670043945312, 0.08528804779052734, 0.08873939514160156, 0.09219074249267578, 0.09564208984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 14.0, 10.0, 19.0, 24.0, 39.0, 39.0, 42.0, 43.0, 67.0, 60.0, 67.0, 60.0, 67.0, 64.0, 58.0, 63.0, 46.0, 38.0, 41.0, 41.0, 16.0, 22.0, 14.0, 12.0, 9.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5380859375, -0.5201797485351562, -0.5022735595703125, -0.48436737060546875, -0.466461181640625, -0.44855499267578125, -0.4306488037109375, -0.41274261474609375, -0.39483642578125, -0.37693023681640625, -0.3590240478515625, -0.34111785888671875, -0.323211669921875, -0.30530548095703125, -0.2873992919921875, -0.26949310302734375, -0.2515869140625, -0.23368072509765625, -0.2157745361328125, -0.19786834716796875, -0.179962158203125, -0.16205596923828125, -0.1441497802734375, -0.12624359130859375, -0.10833740234375, -0.09043121337890625, -0.0725250244140625, -0.05461883544921875, -0.036712646484375, -0.01880645751953125, -0.0009002685546875, 0.01700592041015625, 0.034912109375, 0.05281829833984375, 0.0707244873046875, 0.08863067626953125, 0.106536865234375, 0.12444305419921875, 0.1423492431640625, 0.16025543212890625, 0.17816162109375, 0.19606781005859375, 0.2139739990234375, 0.23188018798828125, 0.249786376953125, 0.26769256591796875, 0.2855987548828125, 0.30350494384765625, 0.3214111328125, 0.33931732177734375, 0.3572235107421875, 0.37512969970703125, 0.393035888671875, 0.41094207763671875, 0.4288482666015625, 0.44675445556640625, 0.46466064453125, 0.48256683349609375, 0.5004730224609375, 0.5183792114257812, 0.536285400390625, 0.5541915893554688, 0.5720977783203125, 0.5900039672851562, 0.60791015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 10.0, 10.0, 10.0, 9.0, 16.0, 23.0, 44.0, 67.0, 100.0, 142.0, 228.0, 389.0, 603.0, 1058.0, 1796.0, 3013.0, 5139.0, 8880.0, 15292.0, 27382.0, 49095.0, 90102.0, 159710.0, 228964.0, 194595.0, 116807.0, 63904.0, 35052.0, 19409.0, 10918.0, 6431.0, 3791.0, 2179.0, 1295.0, 807.0, 483.0, 282.0, 202.0, 128.0, 60.0, 64.0, 26.0, 22.0, 5.0, 3.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.050933837890625, -0.049466609954833984, -0.04799938201904297, -0.04653215408325195, -0.04506492614746094, -0.04359769821166992, -0.042130470275878906, -0.04066324234008789, -0.039196014404296875, -0.03772878646850586, -0.036261558532714844, -0.03479433059692383, -0.03332710266113281, -0.0318598747253418, -0.03039264678955078, -0.028925418853759766, -0.02745819091796875, -0.025990962982177734, -0.02452373504638672, -0.023056507110595703, -0.021589279174804688, -0.020122051239013672, -0.018654823303222656, -0.01718759536743164, -0.015720367431640625, -0.01425313949584961, -0.012785911560058594, -0.011318683624267578, -0.009851455688476562, -0.008384227752685547, -0.006916999816894531, -0.005449771881103516, -0.0039825439453125, -0.0025153160095214844, -0.0010480880737304688, 0.0004191398620605469, 0.0018863677978515625, 0.003353595733642578, 0.004820823669433594, 0.006288051605224609, 0.007755279541015625, 0.00922250747680664, 0.010689735412597656, 0.012156963348388672, 0.013624191284179688, 0.015091419219970703, 0.01655864715576172, 0.018025875091552734, 0.01949310302734375, 0.020960330963134766, 0.02242755889892578, 0.023894786834716797, 0.025362014770507812, 0.026829242706298828, 0.028296470642089844, 0.02976369857788086, 0.031230926513671875, 0.03269815444946289, 0.034165382385253906, 0.03563261032104492, 0.03709983825683594, 0.03856706619262695, 0.04003429412841797, 0.041501522064208984, 0.04296875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 5.0, 3.0, 2.0, 3.0, 8.0, 4.0, 12.0, 14.0, 13.0, 24.0, 15.0, 26.0, 22.0, 25.0, 21.0, 37.0, 34.0, 30.0, 29.0, 53.0, 36.0, 41.0, 40.0, 42.0, 50.0, 44.0, 40.0, 36.0, 42.0, 43.0, 34.0, 26.0, 17.0, 29.0, 16.0, 19.0, 9.0, 14.0, 12.0, 9.0, 6.0, 5.0, 4.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.64208984375, -0.6165008544921875, -0.590911865234375, -0.5653228759765625, -0.53973388671875, -0.5141448974609375, -0.488555908203125, -0.4629669189453125, -0.4373779296875, -0.4117889404296875, -0.386199951171875, -0.3606109619140625, -0.33502197265625, -0.3094329833984375, -0.283843994140625, -0.2582550048828125, -0.232666015625, -0.2070770263671875, -0.181488037109375, -0.1558990478515625, -0.13031005859375, -0.1047210693359375, -0.079132080078125, -0.0535430908203125, -0.0279541015625, -0.0023651123046875, 0.023223876953125, 0.0488128662109375, 0.07440185546875, 0.0999908447265625, 0.125579833984375, 0.1511688232421875, 0.1767578125, 0.2023468017578125, 0.227935791015625, 0.2535247802734375, 0.27911376953125, 0.3047027587890625, 0.330291748046875, 0.3558807373046875, 0.3814697265625, 0.4070587158203125, 0.432647705078125, 0.4582366943359375, 0.48382568359375, 0.5094146728515625, 0.535003662109375, 0.5605926513671875, 0.586181640625, 0.6117706298828125, 0.637359619140625, 0.6629486083984375, 0.68853759765625, 0.7141265869140625, 0.739715576171875, 0.7653045654296875, 0.7908935546875, 0.8164825439453125, 0.842071533203125, 0.8676605224609375, 0.89324951171875, 0.9188385009765625, 0.944427490234375, 0.9700164794921875, 0.99560546875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 14.0, 6.0, 15.0, 26.0, 32.0, 49.0, 76.0, 133.0, 244.0, 458.0, 904.0, 2022.0, 5035.0, 16485.0, 69995.0, 369730.0, 459653.0, 92658.0, 20699.0, 6142.0, 2142.0, 914.0, 482.0, 232.0, 160.0, 65.0, 62.0, 43.0, 21.0, 11.0, 11.0, 16.0, 4.0, 0.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.01458740234375, -0.014159440994262695, -0.01373147964477539, -0.013303518295288086, -0.012875556945800781, -0.012447595596313477, -0.012019634246826172, -0.011591672897338867, -0.011163711547851562, -0.010735750198364258, -0.010307788848876953, -0.009879827499389648, -0.009451866149902344, -0.009023904800415039, -0.008595943450927734, -0.00816798210144043, -0.007740020751953125, -0.00731205940246582, -0.006884098052978516, -0.006456136703491211, -0.006028175354003906, -0.0056002140045166016, -0.005172252655029297, -0.004744291305541992, -0.0043163299560546875, -0.003888368606567383, -0.003460407257080078, -0.0030324459075927734, -0.0026044845581054688, -0.002176523208618164, -0.0017485618591308594, -0.0013206005096435547, -0.00089263916015625, -0.0004646778106689453, -3.6716461181640625e-05, 0.00039124488830566406, 0.0008192062377929688, 0.0012471675872802734, 0.0016751289367675781, 0.002103090286254883, 0.0025310516357421875, 0.002959012985229492, 0.003386974334716797, 0.0038149356842041016, 0.004242897033691406, 0.004670858383178711, 0.005098819732666016, 0.00552678108215332, 0.005954742431640625, 0.00638270378112793, 0.006810665130615234, 0.007238626480102539, 0.007666587829589844, 0.008094549179077148, 0.008522510528564453, 0.008950471878051758, 0.009378433227539062, 0.009806394577026367, 0.010234355926513672, 0.010662317276000977, 0.011090278625488281, 0.011518239974975586, 0.01194620132446289, 0.012374162673950195, 0.0128021240234375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 7.0, 12.0, 13.0, 20.0, 19.0, 20.0, 25.0, 39.0, 52.0, 64.0, 76.0, 73.0, 97.0, 114.0, 65.0, 57.0, 62.0, 52.0, 30.0, 19.0, 16.0, 9.0, 18.0, 14.0, 12.0, 5.0, 2.0, 2.0, 0.0, 1.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.33514404296875e-05, -1.2707896530628204e-05, -1.2064352631568909e-05, -1.1420808732509613e-05, -1.0777264833450317e-05, -1.0133720934391022e-05, -9.490177035331726e-06, -8.84663313627243e-06, -8.203089237213135e-06, -7.559545338153839e-06, -6.9160014390945435e-06, -6.272457540035248e-06, -5.628913640975952e-06, -4.9853697419166565e-06, -4.341825842857361e-06, -3.698281943798065e-06, -3.0547380447387695e-06, -2.411194145679474e-06, -1.7676502466201782e-06, -1.1241063475608826e-06, -4.805624485015869e-07, 1.6298145055770874e-07, 8.065253496170044e-07, 1.4500692486763e-06, 2.0936131477355957e-06, 2.7371570467948914e-06, 3.380700945854187e-06, 4.024244844913483e-06, 4.667788743972778e-06, 5.311332643032074e-06, 5.95487654209137e-06, 6.598420441150665e-06, 7.241964340209961e-06, 7.885508239269257e-06, 8.529052138328552e-06, 9.172596037387848e-06, 9.816139936447144e-06, 1.045968383550644e-05, 1.1103227734565735e-05, 1.174677163362503e-05, 1.2390315532684326e-05, 1.3033859431743622e-05, 1.3677403330802917e-05, 1.4320947229862213e-05, 1.4964491128921509e-05, 1.5608035027980804e-05, 1.62515789270401e-05, 1.6895122826099396e-05, 1.753866672515869e-05, 1.8182210624217987e-05, 1.8825754523277283e-05, 1.946929842233658e-05, 2.0112842321395874e-05, 2.075638622045517e-05, 2.1399930119514465e-05, 2.204347401857376e-05, 2.2687017917633057e-05, 2.3330561816692352e-05, 2.3974105715751648e-05, 2.4617649614810944e-05, 2.526119351387024e-05, 2.5904737412929535e-05, 2.654828131198883e-05, 2.7191825211048126e-05, 2.7835369110107422e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 6.0, 1.0, 6.0, 10.0, 8.0, 12.0, 17.0, 21.0, 50.0, 84.0, 165.0, 499.0, 1960.0, 13504.0, 289697.0, 708602.0, 29236.0, 3474.0, 716.0, 215.0, 107.0, 52.0, 35.0, 20.0, 9.0, 10.0, 2.0, 13.0, 9.0, 2.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0310821533203125, -0.030172109603881836, -0.029262065887451172, -0.028352022171020508, -0.027441978454589844, -0.02653193473815918, -0.025621891021728516, -0.02471184730529785, -0.023801803588867188, -0.022891759872436523, -0.02198171615600586, -0.021071672439575195, -0.02016162872314453, -0.019251585006713867, -0.018341541290283203, -0.01743149757385254, -0.016521453857421875, -0.015611410140991211, -0.014701366424560547, -0.013791322708129883, -0.012881278991699219, -0.011971235275268555, -0.01106119155883789, -0.010151147842407227, -0.009241104125976562, -0.008331060409545898, -0.007421016693115234, -0.00651097297668457, -0.005600929260253906, -0.004690885543823242, -0.003780841827392578, -0.002870798110961914, -0.00196075439453125, -0.001050710678100586, -0.00014066696166992188, 0.0007693767547607422, 0.0016794204711914062, 0.0025894641876220703, 0.0034995079040527344, 0.0044095516204833984, 0.0053195953369140625, 0.0062296390533447266, 0.007139682769775391, 0.008049726486206055, 0.008959770202636719, 0.009869813919067383, 0.010779857635498047, 0.011689901351928711, 0.012599945068359375, 0.013509988784790039, 0.014420032501220703, 0.015330076217651367, 0.01624011993408203, 0.017150163650512695, 0.01806020736694336, 0.018970251083374023, 0.019880294799804688, 0.02079033851623535, 0.021700382232666016, 0.02261042594909668, 0.023520469665527344, 0.024430513381958008, 0.025340557098388672, 0.026250600814819336, 0.02716064453125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 4.0, 3.0, 4.0, 6.0, 10.0, 11.0, 19.0, 26.0, 27.0, 43.0, 50.0, 73.0, 87.0, 82.0, 103.0, 96.0, 82.0, 71.0, 58.0, 44.0, 21.0, 23.0, 22.0, 8.0, 7.0, 5.0, 6.0, 4.0, 4.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.003757476806640625, -0.0036332011222839355, -0.003508925437927246, -0.0033846497535705566, -0.003260374069213867, -0.0031360983848571777, -0.0030118227005004883, -0.002887547016143799, -0.0027632713317871094, -0.00263899564743042, -0.0025147199630737305, -0.002390444278717041, -0.0022661685943603516, -0.002141892910003662, -0.0020176172256469727, -0.0018933415412902832, -0.0017690658569335938, -0.0016447901725769043, -0.0015205144882202148, -0.0013962388038635254, -0.001271963119506836, -0.0011476874351501465, -0.001023411750793457, -0.0008991360664367676, -0.0007748603820800781, -0.0006505846977233887, -0.0005263090133666992, -0.00040203332901000977, -0.0002777576446533203, -0.00015348196029663086, -2.9206275939941406e-05, 9.506940841674805e-05, 0.0002193450927734375, 0.00034362077713012695, 0.0004678964614868164, 0.0005921721458435059, 0.0007164478302001953, 0.0008407235145568848, 0.0009649991989135742, 0.0010892748832702637, 0.0012135505676269531, 0.0013378262519836426, 0.001462101936340332, 0.0015863776206970215, 0.001710653305053711, 0.0018349289894104004, 0.00195920467376709, 0.0020834803581237793, 0.0022077560424804688, 0.002332031726837158, 0.0024563074111938477, 0.002580583095550537, 0.0027048587799072266, 0.002829134464263916, 0.0029534101486206055, 0.003077685832977295, 0.0032019615173339844, 0.003326237201690674, 0.0034505128860473633, 0.0035747885704040527, 0.003699064254760742, 0.0038233399391174316, 0.003947615623474121, 0.0040718913078308105, 0.0041961669921875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 1.0, 0.0, 8.0, 4.0, 8.0, 27.0, 16.0, 16.0, 45.0, 38.0, 63.0, 84.0, 112.0, 106.0, 108.0, 97.0, 76.0, 58.0, 40.0, 28.0, 20.0, 12.0, 10.0, 6.0, 8.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49328410625457764, -0.4715797007083893, -0.44987526535987854, -0.4281708598136902, -0.40646642446517944, -0.3847620189189911, -0.36305761337280273, -0.341353178024292, -0.31964877247810364, -0.2979443669319153, -0.27623993158340454, -0.2545355260372162, -0.23283110558986664, -0.2111266851425171, -0.18942227959632874, -0.1677178591489792, -0.14601343870162964, -0.12430901825428009, -0.10260460525751114, -0.08090019226074219, -0.05919577181339264, -0.03749135136604309, -0.015786945819854736, 0.005917474627494812, 0.02762189507484436, 0.04932631179690361, 0.07103072851896286, 0.09273514151573181, 0.11443956196308136, 0.1361439824104309, 0.15784838795661926, 0.1795528084039688, 0.20125716924667358, 0.22296158969402313, 0.24466601014137268, 0.26637041568756104, 0.2880748510360718, 0.30977925658226013, 0.3314836621284485, 0.35318809747695923, 0.3748925030231476, 0.39659690856933594, 0.4183013439178467, 0.44000574946403503, 0.4617101550102234, 0.48341459035873413, 0.5051189661026001, 0.5268234014511108, 0.5485278367996216, 0.5702322721481323, 0.5919366478919983, 0.613641083240509, 0.6353455185890198, 0.6570498943328857, 0.6787543296813965, 0.7004587650299072, 0.722163200378418, 0.7438676357269287, 0.7655720114707947, 0.7872764468193054, 0.8089808821678162, 0.8306852579116821, 0.8523896932601929, 0.8740941286087036, 0.8957985043525696]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 6.0, 17.0, 18.0, 24.0, 33.0, 34.0, 42.0, 62.0, 47.0, 66.0, 70.0, 64.0, 65.0, 73.0, 76.0, 52.0, 45.0, 46.0, 40.0, 25.0, 25.0, 17.0, 17.0, 10.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6185455322265625, -0.6004334092140198, -0.582321286201477, -0.5642091631889343, -0.5460970401763916, -0.5279848575592041, -0.5098727345466614, -0.49176061153411865, -0.4736484885215759, -0.4555363655090332, -0.4374242424964905, -0.41931208968162537, -0.40119996666908264, -0.3830878436565399, -0.3649756908416748, -0.3468635678291321, -0.32875144481658936, -0.31063932180404663, -0.2925271987915039, -0.2744150459766388, -0.25630292296409607, -0.23819079995155334, -0.22007866203784943, -0.2019665241241455, -0.18385440111160278, -0.16574227809906006, -0.14763014018535614, -0.12951800227165222, -0.1114058792591095, -0.09329374879598618, -0.07518161833286285, -0.057069480419158936, -0.03895735740661621, -0.02084522694349289, -0.002733096480369568, 0.015379033982753754, 0.033491164445877075, 0.0516032949090004, 0.06971542537212372, 0.08782756328582764, 0.10593968629837036, 0.12405181676149368, 0.142163947224617, 0.16027608513832092, 0.17838820815086365, 0.19650033116340637, 0.2146124690771103, 0.2327246069908142, 0.25083673000335693, 0.26894885301589966, 0.2870609760284424, 0.3051731288433075, 0.3232852518558502, 0.34139737486839294, 0.35950952768325806, 0.3776216506958008, 0.3957337737083435, 0.41384589672088623, 0.43195801973342896, 0.45007017254829407, 0.4681822955608368, 0.4862944185733795, 0.5044065713882446, 0.5225186944007874, 0.5406308174133301]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 9.0, 3.0, 5.0, 10.0, 14.0, 10.0, 28.0, 25.0, 49.0, 79.0, 115.0, 195.0, 319.0, 666.0, 1266.0, 2802.0, 7466.0, 26881.0, 212991.0, 701583.0, 71127.0, 14069.0, 4778.0, 1962.0, 939.0, 498.0, 244.0, 150.0, 82.0, 60.0, 39.0, 28.0, 23.0, 17.0, 6.0, 4.0, 6.0, 2.0, 7.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.494140625, -0.47834014892578125, -0.4625396728515625, -0.44673919677734375, -0.430938720703125, -0.41513824462890625, -0.3993377685546875, -0.38353729248046875, -0.36773681640625, -0.35193634033203125, -0.3361358642578125, -0.32033538818359375, -0.304534912109375, -0.28873443603515625, -0.2729339599609375, -0.25713348388671875, -0.2413330078125, -0.22553253173828125, -0.2097320556640625, -0.19393157958984375, -0.178131103515625, -0.16233062744140625, -0.1465301513671875, -0.13072967529296875, -0.11492919921875, -0.09912872314453125, -0.0833282470703125, -0.06752777099609375, -0.051727294921875, -0.03592681884765625, -0.0201263427734375, -0.00432586669921875, 0.011474609375, 0.02727508544921875, 0.0430755615234375, 0.05887603759765625, 0.074676513671875, 0.09047698974609375, 0.1062774658203125, 0.12207794189453125, 0.13787841796875, 0.15367889404296875, 0.1694793701171875, 0.18527984619140625, 0.201080322265625, 0.21688079833984375, 0.2326812744140625, 0.24848175048828125, 0.2642822265625, 0.28008270263671875, 0.2958831787109375, 0.31168365478515625, 0.327484130859375, 0.34328460693359375, 0.3590850830078125, 0.37488555908203125, 0.39068603515625, 0.40648651123046875, 0.4222869873046875, 0.43808746337890625, 0.453887939453125, 0.46968841552734375, 0.4854888916015625, 0.5012893676757812, 0.51708984375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 11.0, 8.0, 20.0, 23.0, 33.0, 38.0, 39.0, 52.0, 71.0, 66.0, 71.0, 76.0, 84.0, 84.0, 64.0, 46.0, 51.0, 42.0, 35.0, 28.0, 19.0, 14.0, 17.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6357421875, -1.5934906005859375, -1.551239013671875, -1.5089874267578125, -1.46673583984375, -1.4244842529296875, -1.382232666015625, -1.3399810791015625, -1.2977294921875, -1.2554779052734375, -1.213226318359375, -1.1709747314453125, -1.12872314453125, -1.0864715576171875, -1.044219970703125, -1.0019683837890625, -0.959716796875, -0.9174652099609375, -0.875213623046875, -0.8329620361328125, -0.79071044921875, -0.7484588623046875, -0.706207275390625, -0.6639556884765625, -0.6217041015625, -0.5794525146484375, -0.537200927734375, -0.4949493408203125, -0.45269775390625, -0.4104461669921875, -0.368194580078125, -0.3259429931640625, -0.28369140625, -0.2414398193359375, -0.199188232421875, -0.1569366455078125, -0.11468505859375, -0.0724334716796875, -0.030181884765625, 0.0120697021484375, 0.0543212890625, 0.0965728759765625, 0.138824462890625, 0.1810760498046875, 0.22332763671875, 0.2655792236328125, 0.307830810546875, 0.3500823974609375, 0.392333984375, 0.4345855712890625, 0.476837158203125, 0.5190887451171875, 0.56134033203125, 0.6035919189453125, 0.645843505859375, 0.6880950927734375, 0.7303466796875, 0.7725982666015625, 0.814849853515625, 0.8571014404296875, 0.89935302734375, 0.9416046142578125, 0.983856201171875, 1.0261077880859375, 1.068359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 0.0, 5.0, 6.0, 12.0, 8.0, 10.0, 12.0, 25.0, 13.0, 25.0, 31.0, 38.0, 36.0, 64.0, 100.0, 171.0, 504.0, 3012.0, 51885.0, 958327.0, 30971.0, 2318.0, 408.0, 177.0, 78.0, 70.0, 53.0, 29.0, 31.0, 33.0, 23.0, 15.0, 18.0, 11.0, 12.0, 12.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1513671875, -1.1179275512695312, -1.0844879150390625, -1.0510482788085938, -1.017608642578125, -0.9841690063476562, -0.9507293701171875, -0.9172897338867188, -0.88385009765625, -0.8504104614257812, -0.8169708251953125, -0.7835311889648438, -0.750091552734375, -0.7166519165039062, -0.6832122802734375, -0.6497726440429688, -0.6163330078125, -0.5828933715820312, -0.5494537353515625, -0.5160140991210938, -0.482574462890625, -0.44913482666015625, -0.4156951904296875, -0.38225555419921875, -0.34881591796875, -0.31537628173828125, -0.2819366455078125, -0.24849700927734375, -0.215057373046875, -0.18161773681640625, -0.1481781005859375, -0.11473846435546875, -0.081298828125, -0.04785919189453125, -0.0144195556640625, 0.01902008056640625, 0.052459716796875, 0.08589935302734375, 0.1193389892578125, 0.15277862548828125, 0.18621826171875, 0.21965789794921875, 0.2530975341796875, 0.28653717041015625, 0.319976806640625, 0.35341644287109375, 0.3868560791015625, 0.42029571533203125, 0.4537353515625, 0.48717498779296875, 0.5206146240234375, 0.5540542602539062, 0.587493896484375, 0.6209335327148438, 0.6543731689453125, 0.6878128051757812, 0.72125244140625, 0.7546920776367188, 0.7881317138671875, 0.8215713500976562, 0.855010986328125, 0.8884506225585938, 0.9218902587890625, 0.9553298950195312, 0.98876953125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 7.0, 10.0, 8.0, 13.0, 19.0, 28.0, 20.0, 21.0, 29.0, 34.0, 55.0, 59.0, 60.0, 52.0, 71.0, 58.0, 66.0, 58.0, 63.0, 46.0, 30.0, 46.0, 30.0, 20.0, 22.0, 25.0, 20.0, 11.0, 8.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.302734375, -1.264373779296875, -1.22601318359375, -1.187652587890625, -1.1492919921875, -1.110931396484375, -1.07257080078125, -1.034210205078125, -0.995849609375, -0.957489013671875, -0.91912841796875, -0.880767822265625, -0.8424072265625, -0.804046630859375, -0.76568603515625, -0.727325439453125, -0.68896484375, -0.650604248046875, -0.61224365234375, -0.573883056640625, -0.5355224609375, -0.497161865234375, -0.45880126953125, -0.420440673828125, -0.382080078125, -0.343719482421875, -0.30535888671875, -0.266998291015625, -0.2286376953125, -0.190277099609375, -0.15191650390625, -0.113555908203125, -0.0751953125, -0.036834716796875, 0.00152587890625, 0.039886474609375, 0.0782470703125, 0.116607666015625, 0.15496826171875, 0.193328857421875, 0.231689453125, 0.270050048828125, 0.30841064453125, 0.346771240234375, 0.3851318359375, 0.423492431640625, 0.46185302734375, 0.500213623046875, 0.53857421875, 0.576934814453125, 0.61529541015625, 0.653656005859375, 0.6920166015625, 0.730377197265625, 0.76873779296875, 0.807098388671875, 0.845458984375, 0.883819580078125, 0.92218017578125, 0.960540771484375, 0.9989013671875, 1.037261962890625, 1.07562255859375, 1.113983154296875, 1.15234375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 2.0, 5.0, 7.0, 14.0, 10.0, 17.0, 18.0, 29.0, 38.0, 54.0, 72.0, 84.0, 129.0, 197.0, 301.0, 493.0, 880.0, 1813.0, 4199.0, 12505.0, 54032.0, 546109.0, 365368.0, 43972.0, 10750.0, 3715.0, 1539.0, 809.0, 472.0, 299.0, 192.0, 127.0, 72.0, 61.0, 46.0, 29.0, 22.0, 17.0, 12.0, 7.0, 15.0, 7.0, 4.0, 2.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.11669921875, -0.1133584976196289, -0.11001777648925781, -0.10667705535888672, -0.10333633422851562, -0.09999561309814453, -0.09665489196777344, -0.09331417083740234, -0.08997344970703125, -0.08663272857666016, -0.08329200744628906, -0.07995128631591797, -0.07661056518554688, -0.07326984405517578, -0.06992912292480469, -0.0665884017944336, -0.0632476806640625, -0.059906959533691406, -0.05656623840332031, -0.05322551727294922, -0.049884796142578125, -0.04654407501220703, -0.04320335388183594, -0.039862632751464844, -0.03652191162109375, -0.033181190490722656, -0.029840469360351562, -0.02649974822998047, -0.023159027099609375, -0.01981830596923828, -0.016477584838867188, -0.013136863708496094, -0.009796142578125, -0.006455421447753906, -0.0031147003173828125, 0.00022602081298828125, 0.003566741943359375, 0.006907463073730469, 0.010248184204101562, 0.013588905334472656, 0.01692962646484375, 0.020270347595214844, 0.023611068725585938, 0.02695178985595703, 0.030292510986328125, 0.03363323211669922, 0.03697395324707031, 0.040314674377441406, 0.0436553955078125, 0.046996116638183594, 0.05033683776855469, 0.05367755889892578, 0.057018280029296875, 0.06035900115966797, 0.06369972229003906, 0.06704044342041016, 0.07038116455078125, 0.07372188568115234, 0.07706260681152344, 0.08040332794189453, 0.08374404907226562, 0.08708477020263672, 0.09042549133300781, 0.0937662124633789, 0.09710693359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 4.0, 7.0, 12.0, 6.0, 7.0, 13.0, 18.0, 27.0, 31.0, 58.0, 102.0, 164.0, 200.0, 139.0, 67.0, 44.0, 34.0, 14.0, 19.0, 13.0, 7.0, 2.0, 6.0, 7.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4185905456542969e-05, -1.3576820492744446e-05, -1.2967735528945923e-05, -1.23586505651474e-05, -1.1749565601348877e-05, -1.1140480637550354e-05, -1.0531395673751831e-05, -9.922310709953308e-06, -9.313225746154785e-06, -8.704140782356262e-06, -8.09505581855774e-06, -7.485970854759216e-06, -6.876885890960693e-06, -6.26780092716217e-06, -5.6587159633636475e-06, -5.0496309995651245e-06, -4.4405460357666016e-06, -3.831461071968079e-06, -3.2223761081695557e-06, -2.6132911443710327e-06, -2.0042061805725098e-06, -1.3951212167739868e-06, -7.860362529754639e-07, -1.7695128917694092e-07, 4.3213367462158203e-07, 1.041218638420105e-06, 1.650303602218628e-06, 2.259388566017151e-06, 2.868473529815674e-06, 3.4775584936141968e-06, 4.08664345741272e-06, 4.695728421211243e-06, 5.304813385009766e-06, 5.9138983488082886e-06, 6.5229833126068115e-06, 7.1320682764053345e-06, 7.741153240203857e-06, 8.35023820400238e-06, 8.959323167800903e-06, 9.568408131599426e-06, 1.017749309539795e-05, 1.0786578059196472e-05, 1.1395663022994995e-05, 1.2004747986793518e-05, 1.2613832950592041e-05, 1.3222917914390564e-05, 1.3832002878189087e-05, 1.444108784198761e-05, 1.5050172805786133e-05, 1.5659257769584656e-05, 1.626834273338318e-05, 1.68774276971817e-05, 1.7486512660980225e-05, 1.8095597624778748e-05, 1.870468258857727e-05, 1.9313767552375793e-05, 1.9922852516174316e-05, 2.053193747997284e-05, 2.1141022443771362e-05, 2.1750107407569885e-05, 2.2359192371368408e-05, 2.296827733516693e-05, 2.3577362298965454e-05, 2.4186447262763977e-05, 2.47955322265625e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 6.0, 5.0, 9.0, 11.0, 11.0, 23.0, 33.0, 38.0, 54.0, 88.0, 120.0, 208.0, 308.0, 538.0, 1052.0, 2233.0, 5288.0, 14835.0, 59662.0, 562311.0, 335759.0, 44798.0, 12453.0, 4423.0, 1940.0, 980.0, 544.0, 291.0, 161.0, 95.0, 80.0, 49.0, 33.0, 31.0, 19.0, 8.0, 5.0, 12.0, 4.0, 8.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.1165771484375, -0.11292362213134766, -0.10927009582519531, -0.10561656951904297, -0.10196304321289062, -0.09830951690673828, -0.09465599060058594, -0.0910024642944336, -0.08734893798828125, -0.0836954116821289, -0.08004188537597656, -0.07638835906982422, -0.07273483276367188, -0.06908130645751953, -0.06542778015136719, -0.061774253845214844, -0.0581207275390625, -0.054467201232910156, -0.05081367492675781, -0.04716014862060547, -0.043506622314453125, -0.03985309600830078, -0.03619956970214844, -0.032546043395996094, -0.02889251708984375, -0.025238990783691406, -0.021585464477539062, -0.01793193817138672, -0.014278411865234375, -0.010624885559082031, -0.0069713592529296875, -0.0033178329467773438, 0.000335693359375, 0.003989219665527344, 0.0076427459716796875, 0.011296272277832031, 0.014949798583984375, 0.01860332489013672, 0.022256851196289062, 0.025910377502441406, 0.02956390380859375, 0.033217430114746094, 0.03687095642089844, 0.04052448272705078, 0.044178009033203125, 0.04783153533935547, 0.05148506164550781, 0.055138587951660156, 0.0587921142578125, 0.062445640563964844, 0.06609916687011719, 0.06975269317626953, 0.07340621948242188, 0.07705974578857422, 0.08071327209472656, 0.0843667984008789, 0.08802032470703125, 0.0916738510131836, 0.09532737731933594, 0.09898090362548828, 0.10263442993164062, 0.10628795623779297, 0.10994148254394531, 0.11359500885009766, 0.11724853515625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 11.0, 10.0, 10.0, 13.0, 15.0, 15.0, 27.0, 34.0, 42.0, 50.0, 74.0, 123.0, 144.0, 123.0, 42.0, 58.0, 36.0, 27.0, 20.0, 27.0, 16.0, 8.0, 9.0, 13.0, 10.0, 4.0, 10.0, 2.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.042755126953125, -0.04130220413208008, -0.039849281311035156, -0.038396358489990234, -0.03694343566894531, -0.03549051284790039, -0.03403759002685547, -0.03258466720581055, -0.031131744384765625, -0.029678821563720703, -0.02822589874267578, -0.02677297592163086, -0.025320053100585938, -0.023867130279541016, -0.022414207458496094, -0.020961284637451172, -0.01950836181640625, -0.018055438995361328, -0.016602516174316406, -0.015149593353271484, -0.013696670532226562, -0.01224374771118164, -0.010790824890136719, -0.009337902069091797, -0.007884979248046875, -0.006432056427001953, -0.004979133605957031, -0.0035262107849121094, -0.0020732879638671875, -0.0006203651428222656, 0.0008325576782226562, 0.002285480499267578, 0.0037384033203125, 0.005191326141357422, 0.006644248962402344, 0.008097171783447266, 0.009550094604492188, 0.01100301742553711, 0.012455940246582031, 0.013908863067626953, 0.015361785888671875, 0.016814708709716797, 0.01826763153076172, 0.01972055435180664, 0.021173477172851562, 0.022626399993896484, 0.024079322814941406, 0.025532245635986328, 0.02698516845703125, 0.028438091278076172, 0.029891014099121094, 0.031343936920166016, 0.03279685974121094, 0.03424978256225586, 0.03570270538330078, 0.0371556282043457, 0.038608551025390625, 0.04006147384643555, 0.04151439666748047, 0.04296731948852539, 0.04442024230957031, 0.045873165130615234, 0.047326087951660156, 0.04877901077270508, 0.05023193359375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 13.0, 19.0, 27.0, 64.0, 64.0, 132.0, 180.0, 166.0, 133.0, 77.0, 51.0, 29.0, 18.0, 11.0, 4.0, 5.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6173129081726074, -1.5500413179397583, -1.4827696084976196, -1.4154980182647705, -1.3482264280319214, -1.2809548377990723, -1.2136831283569336, -1.1464115381240845, -1.0791399478912354, -1.0118683576583862, -0.9445967078208923, -0.8773250579833984, -0.8100534677505493, -0.7427818179130554, -0.6755101680755615, -0.6082385778427124, -0.5409668684005737, -0.4736952483654022, -0.4064236283302307, -0.3391519784927368, -0.2718803584575653, -0.2046087384223938, -0.1373370885848999, -0.0700654685497284, -0.0027938485145568848, 0.06447777897119522, 0.13174940645694733, 0.19902104139328003, 0.26629266142845154, 0.33356428146362305, 0.40083593130111694, 0.46810755133628845, 0.53537917137146, 0.6026508212089539, 0.669922411441803, 0.7371940612792969, 0.804465651512146, 0.8717373013496399, 0.9390089511871338, 1.006280541419983, 1.073552131652832, 1.1408237218856812, 1.2080954313278198, 1.275367021560669, 1.342638611793518, 1.4099102020263672, 1.4771819114685059, 1.544453501701355, 1.6117252111434937, 1.6789968013763428, 1.7462685108184814, 1.8135401010513306, 1.8808116912841797, 1.9480834007263184, 2.015355110168457, 2.0826265811920166, 2.1498982906341553, 2.217170000076294, 2.2844414710998535, 2.351713180541992, 2.418984889984131, 2.4862563610076904, 2.553528070449829, 2.6207997798919678, 2.6880712509155273]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 9.0, 7.0, 7.0, 4.0, 8.0, 11.0, 8.0, 16.0, 18.0, 30.0, 18.0, 16.0, 33.0, 30.0, 28.0, 26.0, 32.0, 38.0, 35.0, 42.0, 36.0, 47.0, 33.0, 49.0, 38.0, 33.0, 43.0, 35.0, 37.0, 40.0, 29.0, 20.0, 24.0, 19.0, 15.0, 16.0, 16.0, 6.0, 8.0, 6.0, 8.0, 7.0, 9.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.5444324016571045, -1.4969345331192017, -1.4494365453720093, -1.4019386768341064, -1.3544408082962036, -1.3069429397583008, -1.2594449520111084, -1.2119470834732056, -1.1644492149353027, -1.1169513463974, -1.0694533586502075, -1.0219554901123047, -0.9744576215744019, -0.9269596934318542, -0.8794617652893066, -0.8319638967514038, -0.7844659090042114, -0.7369679808616638, -0.689470112323761, -0.6419721841812134, -0.5944743156433105, -0.5469763875007629, -0.49947845935821533, -0.4519805610179901, -0.4044826626777649, -0.3569847643375397, -0.30948686599731445, -0.26198893785476685, -0.21449103951454163, -0.1669931411743164, -0.1194952130317688, -0.07199731469154358, -0.02449953556060791, 0.022998370230197906, 0.07049627602100372, 0.11799418926239014, 0.16549208760261536, 0.21298998594284058, 0.2604879140853882, 0.3079858124256134, 0.3554837107658386, 0.40298160910606384, 0.45047950744628906, 0.49797743558883667, 0.5454753637313843, 0.5929732322692871, 0.6404711604118347, 0.6879690885543823, 0.7354669570922852, 0.7829648852348328, 0.8304627537727356, 0.8779606819152832, 0.925458550453186, 0.9729564785957336, 1.0204544067382812, 1.067952275276184, 1.115450143814087, 1.1629480123519897, 1.2104460000991821, 1.257943868637085, 1.3054417371749878, 1.3529396057128906, 1.400437593460083, 1.4479354619979858, 1.4954334497451782]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 5.0, 6.0, 11.0, 11.0, 24.0, 25.0, 42.0, 52.0, 81.0, 137.0, 171.0, 265.0, 439.0, 694.0, 1088.0, 2079.0, 4033.0, 8975.0, 25021.0, 108847.0, 697617.0, 2458609.0, 739449.0, 101680.0, 25443.0, 9438.0, 4507.0, 2285.0, 1195.0, 703.0, 434.0, 296.0, 210.0, 119.0, 94.0, 65.0, 41.0, 25.0, 18.0, 15.0, 9.0, 7.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.79443359375, -0.7714157104492188, -0.7483978271484375, -0.7253799438476562, -0.702362060546875, -0.6793441772460938, -0.6563262939453125, -0.6333084106445312, -0.61029052734375, -0.5872726440429688, -0.5642547607421875, -0.5412368774414062, -0.518218994140625, -0.49520111083984375, -0.4721832275390625, -0.44916534423828125, -0.4261474609375, -0.40312957763671875, -0.3801116943359375, -0.35709381103515625, -0.334075927734375, -0.31105804443359375, -0.2880401611328125, -0.26502227783203125, -0.24200439453125, -0.21898651123046875, -0.1959686279296875, -0.17295074462890625, -0.149932861328125, -0.12691497802734375, -0.1038970947265625, -0.08087921142578125, -0.057861328125, -0.03484344482421875, -0.0118255615234375, 0.01119232177734375, 0.034210205078125, 0.05722808837890625, 0.0802459716796875, 0.10326385498046875, 0.12628173828125, 0.14929962158203125, 0.1723175048828125, 0.19533538818359375, 0.218353271484375, 0.24137115478515625, 0.2643890380859375, 0.28740692138671875, 0.3104248046875, 0.33344268798828125, 0.3564605712890625, 0.37947845458984375, 0.402496337890625, 0.42551422119140625, 0.4485321044921875, 0.47154998779296875, 0.49456787109375, 0.5175857543945312, 0.5406036376953125, 0.5636215209960938, 0.586639404296875, 0.6096572875976562, 0.6326751708984375, 0.6556930541992188, 0.6787109375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 8.0, 11.0, 12.0, 14.0, 25.0, 35.0, 36.0, 49.0, 52.0, 64.0, 74.0, 70.0, 63.0, 81.0, 68.0, 73.0, 65.0, 39.0, 40.0, 28.0, 25.0, 17.0, 15.0, 13.0, 5.0, 11.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9052734375, -0.8805618286132812, -0.8558502197265625, -0.8311386108398438, -0.806427001953125, -0.7817153930664062, -0.7570037841796875, -0.7322921752929688, -0.70758056640625, -0.6828689575195312, -0.6581573486328125, -0.6334457397460938, -0.608734130859375, -0.5840225219726562, -0.5593109130859375, -0.5345993041992188, -0.5098876953125, -0.48517608642578125, -0.4604644775390625, -0.43575286865234375, -0.411041259765625, -0.38632965087890625, -0.3616180419921875, -0.33690643310546875, -0.31219482421875, -0.28748321533203125, -0.2627716064453125, -0.23805999755859375, -0.213348388671875, -0.18863677978515625, -0.1639251708984375, -0.13921356201171875, -0.114501953125, -0.08979034423828125, -0.0650787353515625, -0.04036712646484375, -0.015655517578125, 0.00905609130859375, 0.0337677001953125, 0.05847930908203125, 0.08319091796875, 0.10790252685546875, 0.1326141357421875, 0.15732574462890625, 0.182037353515625, 0.20674896240234375, 0.2314605712890625, 0.25617218017578125, 0.2808837890625, 0.30559539794921875, 0.3303070068359375, 0.35501861572265625, 0.379730224609375, 0.40444183349609375, 0.4291534423828125, 0.45386505126953125, 0.47857666015625, 0.5032882690429688, 0.5279998779296875, 0.5527114868164062, 0.577423095703125, 0.6021347045898438, 0.6268463134765625, 0.6515579223632812, 0.67626953125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 5.0, 4.0, 9.0, 16.0, 21.0, 42.0, 73.0, 151.0, 335.0, 771.0, 2701.0, 13302.0, 268450.0, 3844223.0, 55372.0, 6287.0, 1528.0, 521.0, 209.0, 118.0, 42.0, 24.0, 28.0, 13.0, 10.0, 7.0, 5.0, 8.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.439453125, -1.38470458984375, -1.3299560546875, -1.27520751953125, -1.220458984375, -1.16571044921875, -1.1109619140625, -1.05621337890625, -1.00146484375, -0.94671630859375, -0.8919677734375, -0.83721923828125, -0.782470703125, -0.72772216796875, -0.6729736328125, -0.61822509765625, -0.5634765625, -0.50872802734375, -0.4539794921875, -0.39923095703125, -0.344482421875, -0.28973388671875, -0.2349853515625, -0.18023681640625, -0.12548828125, -0.07073974609375, -0.0159912109375, 0.03875732421875, 0.093505859375, 0.14825439453125, 0.2030029296875, 0.25775146484375, 0.3125, 0.36724853515625, 0.4219970703125, 0.47674560546875, 0.531494140625, 0.58624267578125, 0.6409912109375, 0.69573974609375, 0.75048828125, 0.80523681640625, 0.8599853515625, 0.91473388671875, 0.969482421875, 1.02423095703125, 1.0789794921875, 1.13372802734375, 1.1884765625, 1.24322509765625, 1.2979736328125, 1.35272216796875, 1.407470703125, 1.46221923828125, 1.5169677734375, 1.57171630859375, 1.62646484375, 1.68121337890625, 1.7359619140625, 1.79071044921875, 1.845458984375, 1.90020751953125, 1.9549560546875, 2.00970458984375, 2.064453125]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 7.0, 9.0, 5.0, 17.0, 29.0, 31.0, 60.0, 103.0, 206.0, 511.0, 956.0, 1027.0, 548.0, 251.0, 115.0, 63.0, 42.0, 25.0, 18.0, 10.0, 11.0, 9.0, 5.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.466064453125, -0.4534912109375, -0.44091796875, -0.4283447265625, -0.415771484375, -0.4031982421875, -0.390625, -0.3780517578125, -0.365478515625, -0.3529052734375, -0.34033203125, -0.3277587890625, -0.315185546875, -0.3026123046875, -0.2900390625, -0.2774658203125, -0.264892578125, -0.2523193359375, -0.23974609375, -0.2271728515625, -0.214599609375, -0.2020263671875, -0.189453125, -0.1768798828125, -0.164306640625, -0.1517333984375, -0.13916015625, -0.1265869140625, -0.114013671875, -0.1014404296875, -0.0888671875, -0.0762939453125, -0.063720703125, -0.0511474609375, -0.03857421875, -0.0260009765625, -0.013427734375, -0.0008544921875, 0.01171875, 0.0242919921875, 0.036865234375, 0.0494384765625, 0.06201171875, 0.0745849609375, 0.087158203125, 0.0997314453125, 0.1123046875, 0.1248779296875, 0.137451171875, 0.1500244140625, 0.16259765625, 0.1751708984375, 0.187744140625, 0.2003173828125, 0.212890625, 0.2254638671875, 0.238037109375, 0.2506103515625, 0.26318359375, 0.2757568359375, 0.288330078125, 0.3009033203125, 0.3134765625, 0.3260498046875, 0.338623046875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 11.0, 2.0, 3.0, 5.0, 9.0, 11.0, 20.0, 18.0, 18.0, 30.0, 35.0, 37.0, 73.0, 79.0, 77.0, 69.0, 73.0, 75.0, 81.0, 58.0, 47.0, 47.0, 37.0, 18.0, 21.0, 13.0, 5.0, 10.0, 3.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7154378890991211, -0.6900482773780823, -0.6646586656570435, -0.6392691135406494, -0.6138795018196106, -0.5884898900985718, -0.563100278377533, -0.5377106666564941, -0.5123210549354553, -0.4869314432144165, -0.4615418612957001, -0.43615224957466125, -0.41076263785362244, -0.385373055934906, -0.3599834442138672, -0.33459383249282837, -0.30920425057411194, -0.2838146388530731, -0.2584250569343567, -0.23303544521331787, -0.20764583349227905, -0.18225623667240143, -0.1568666398525238, -0.13147702813148499, -0.10608743131160736, -0.08069782704114914, -0.055308226495981216, -0.029918625950813293, -0.004529021680355072, 0.02086058259010315, 0.046250179409980774, 0.07163979113101959, 0.09702938795089722, 0.12241899222135544, 0.14780859649181366, 0.17319819331169128, 0.1985878050327301, 0.22397740185260773, 0.24936699867248535, 0.27475661039352417, 0.300146222114563, 0.3255358338356018, 0.35092541575431824, 0.37631502747535706, 0.4017046391963959, 0.4270942211151123, 0.4524838328361511, 0.47787344455718994, 0.503262996673584, 0.5286526083946228, 0.5540422201156616, 0.5794317722320557, 0.6048213839530945, 0.6302109956741333, 0.6556006073951721, 0.6809902191162109, 0.7063798308372498, 0.7317694425582886, 0.7571590542793274, 0.7825486660003662, 0.8079382181167603, 0.8333278298377991, 0.8587174415588379, 0.8841070532798767, 0.9094966650009155]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 8.0, 10.0, 10.0, 10.0, 19.0, 28.0, 22.0, 39.0, 30.0, 42.0, 49.0, 33.0, 49.0, 53.0, 66.0, 65.0, 59.0, 59.0, 50.0, 46.0, 54.0, 30.0, 34.0, 30.0, 22.0, 22.0, 15.0, 14.0, 8.0, 5.0, 4.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8351083993911743, -0.8112479448318481, -0.7873875498771667, -0.7635271549224854, -0.7396667003631592, -0.715806245803833, -0.6919458508491516, -0.6680854558944702, -0.644225001335144, -0.6203645467758179, -0.5965041518211365, -0.5726437568664551, -0.5487833023071289, -0.5249228477478027, -0.5010624527931213, -0.47720202803611755, -0.45334160327911377, -0.42948117852211, -0.4056207537651062, -0.3817603290081024, -0.35789990425109863, -0.33403947949409485, -0.31017905473709106, -0.2863186299800873, -0.2624582052230835, -0.2385977804660797, -0.21473735570907593, -0.19087693095207214, -0.16701650619506836, -0.14315608143806458, -0.11929565668106079, -0.095435231924057, -0.07157474756240845, -0.04771432280540466, -0.02385389804840088, 6.5267086029052734e-06, 0.02386695146560669, 0.047727376222610474, 0.07158780097961426, 0.09544822573661804, 0.11930865049362183, 0.1431690752506256, 0.1670295000076294, 0.19088992476463318, 0.21475034952163696, 0.23861077427864075, 0.26247119903564453, 0.2863316237926483, 0.3101920485496521, 0.3340524733066559, 0.35791289806365967, 0.38177332282066345, 0.40563374757766724, 0.429494172334671, 0.4533545970916748, 0.4772150218486786, 0.5010754466056824, 0.5249358415603638, 0.5487962961196899, 0.5726567506790161, 0.5965171456336975, 0.6203775405883789, 0.6442379951477051, 0.6680984497070312, 0.6919588446617126]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 12.0, 5.0, 10.0, 15.0, 25.0, 29.0, 49.0, 81.0, 126.0, 212.0, 391.0, 655.0, 1442.0, 3414.0, 8579.0, 27596.0, 112869.0, 470132.0, 323791.0, 69370.0, 18643.0, 6112.0, 2494.0, 1146.0, 568.0, 301.0, 174.0, 112.0, 79.0, 43.0, 19.0, 20.0, 12.0, 10.0, 8.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.1494140625, -0.1455669403076172, -0.14171981811523438, -0.13787269592285156, -0.13402557373046875, -0.13017845153808594, -0.12633132934570312, -0.12248420715332031, -0.1186370849609375, -0.11478996276855469, -0.11094284057617188, -0.10709571838378906, -0.10324859619140625, -0.09940147399902344, -0.09555435180664062, -0.09170722961425781, -0.087860107421875, -0.08401298522949219, -0.08016586303710938, -0.07631874084472656, -0.07247161865234375, -0.06862449645996094, -0.06477737426757812, -0.06093025207519531, -0.0570831298828125, -0.05323600769042969, -0.049388885498046875, -0.04554176330566406, -0.04169464111328125, -0.03784751892089844, -0.034000396728515625, -0.030153274536132812, -0.02630615234375, -0.022459030151367188, -0.018611907958984375, -0.014764785766601562, -0.01091766357421875, -0.0070705413818359375, -0.003223419189453125, 0.0006237030029296875, 0.0044708251953125, 0.008317947387695312, 0.012165069580078125, 0.016012191772460938, 0.01985931396484375, 0.023706436157226562, 0.027553558349609375, 0.03140068054199219, 0.035247802734375, 0.03909492492675781, 0.042942047119140625, 0.04678916931152344, 0.05063629150390625, 0.05448341369628906, 0.058330535888671875, 0.06217765808105469, 0.0660247802734375, 0.06987190246582031, 0.07371902465820312, 0.07756614685058594, 0.08141326904296875, 0.08526039123535156, 0.08910751342773438, 0.09295463562011719, 0.0968017578125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 11.0, 20.0, 12.0, 23.0, 33.0, 29.0, 51.0, 59.0, 55.0, 79.0, 78.0, 57.0, 79.0, 73.0, 66.0, 71.0, 47.0, 36.0, 30.0, 21.0, 26.0, 10.0, 9.0, 2.0, 5.0, 2.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5107421875, -0.4915313720703125, -0.472320556640625, -0.4531097412109375, -0.43389892578125, -0.4146881103515625, -0.395477294921875, -0.3762664794921875, -0.3570556640625, -0.3378448486328125, -0.318634033203125, -0.2994232177734375, -0.28021240234375, -0.2610015869140625, -0.241790771484375, -0.2225799560546875, -0.203369140625, -0.1841583251953125, -0.164947509765625, -0.1457366943359375, -0.12652587890625, -0.1073150634765625, -0.088104248046875, -0.0688934326171875, -0.0496826171875, -0.0304718017578125, -0.011260986328125, 0.0079498291015625, 0.02716064453125, 0.0463714599609375, 0.065582275390625, 0.0847930908203125, 0.10400390625, 0.1232147216796875, 0.142425537109375, 0.1616363525390625, 0.18084716796875, 0.2000579833984375, 0.219268798828125, 0.2384796142578125, 0.2576904296875, 0.2769012451171875, 0.296112060546875, 0.3153228759765625, 0.33453369140625, 0.3537445068359375, 0.372955322265625, 0.3921661376953125, 0.411376953125, 0.4305877685546875, 0.449798583984375, 0.4690093994140625, 0.48822021484375, 0.5074310302734375, 0.526641845703125, 0.5458526611328125, 0.5650634765625, 0.5842742919921875, 0.603485107421875, 0.6226959228515625, 0.64190673828125, 0.6611175537109375, 0.680328369140625, 0.6995391845703125, 0.71875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 4.0, 3.0, 7.0, 3.0, 6.0, 17.0, 38.0, 36.0, 48.0, 70.0, 111.0, 184.0, 232.0, 385.0, 496.0, 750.0, 1095.0, 1729.0, 2469.0, 3770.0, 5727.0, 9074.0, 15037.0, 24983.0, 43084.0, 73880.0, 127604.0, 194417.0, 203265.0, 138702.0, 81675.0, 47627.0, 27595.0, 16271.0, 9903.0, 6216.0, 4094.0, 2526.0, 1717.0, 1206.0, 775.0, 525.0, 383.0, 264.0, 168.0, 107.0, 103.0, 46.0, 40.0, 35.0, 20.0, 10.0, 15.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.036468505859375, -0.03529548645019531, -0.034122467041015625, -0.03294944763183594, -0.03177642822265625, -0.030603408813476562, -0.029430389404296875, -0.028257369995117188, -0.0270843505859375, -0.025911331176757812, -0.024738311767578125, -0.023565292358398438, -0.02239227294921875, -0.021219253540039062, -0.020046234130859375, -0.018873214721679688, -0.0177001953125, -0.016527175903320312, -0.015354156494140625, -0.014181137084960938, -0.01300811767578125, -0.011835098266601562, -0.010662078857421875, -0.009489059448242188, -0.0083160400390625, -0.0071430206298828125, -0.005970001220703125, -0.0047969818115234375, -0.00362396240234375, -0.0024509429931640625, -0.001277923583984375, -0.0001049041748046875, 0.001068115234375, 0.0022411346435546875, 0.003414154052734375, 0.0045871734619140625, 0.00576019287109375, 0.0069332122802734375, 0.008106231689453125, 0.009279251098632812, 0.0104522705078125, 0.011625289916992188, 0.012798309326171875, 0.013971328735351562, 0.01514434814453125, 0.016317367553710938, 0.017490386962890625, 0.018663406372070312, 0.01983642578125, 0.021009445190429688, 0.022182464599609375, 0.023355484008789062, 0.02452850341796875, 0.025701522827148438, 0.026874542236328125, 0.028047561645507812, 0.0292205810546875, 0.030393600463867188, 0.031566619873046875, 0.03273963928222656, 0.03391265869140625, 0.03508567810058594, 0.036258697509765625, 0.03743171691894531, 0.038604736328125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 4.0, 4.0, 6.0, 8.0, 9.0, 10.0, 7.0, 11.0, 10.0, 13.0, 14.0, 11.0, 25.0, 22.0, 34.0, 28.0, 35.0, 55.0, 37.0, 52.0, 49.0, 39.0, 36.0, 52.0, 52.0, 62.0, 43.0, 38.0, 41.0, 31.0, 30.0, 36.0, 23.0, 12.0, 13.0, 14.0, 8.0, 4.0, 9.0, 6.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.912109375, -0.8861846923828125, -0.860260009765625, -0.8343353271484375, -0.80841064453125, -0.7824859619140625, -0.756561279296875, -0.7306365966796875, -0.7047119140625, -0.6787872314453125, -0.652862548828125, -0.6269378662109375, -0.60101318359375, -0.5750885009765625, -0.549163818359375, -0.5232391357421875, -0.497314453125, -0.4713897705078125, -0.445465087890625, -0.4195404052734375, -0.39361572265625, -0.3676910400390625, -0.341766357421875, -0.3158416748046875, -0.2899169921875, -0.2639923095703125, -0.238067626953125, -0.2121429443359375, -0.18621826171875, -0.1602935791015625, -0.134368896484375, -0.1084442138671875, -0.08251953125, -0.0565948486328125, -0.030670166015625, -0.0047454833984375, 0.02117919921875, 0.0471038818359375, 0.073028564453125, 0.0989532470703125, 0.1248779296875, 0.1508026123046875, 0.176727294921875, 0.2026519775390625, 0.22857666015625, 0.2545013427734375, 0.280426025390625, 0.3063507080078125, 0.332275390625, 0.3582000732421875, 0.384124755859375, 0.4100494384765625, 0.43597412109375, 0.4618988037109375, 0.487823486328125, 0.5137481689453125, 0.5396728515625, 0.5655975341796875, 0.591522216796875, 0.6174468994140625, 0.64337158203125, 0.6692962646484375, 0.695220947265625, 0.7211456298828125, 0.7470703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 16.0, 13.0, 14.0, 39.0, 56.0, 92.0, 113.0, 257.0, 510.0, 942.0, 1925.0, 4902.0, 17702.0, 125039.0, 716798.0, 149977.0, 20409.0, 5429.0, 2140.0, 995.0, 547.0, 231.0, 172.0, 85.0, 50.0, 33.0, 16.0, 17.0, 10.0, 4.0, 8.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0160675048828125, -0.015558004379272461, -0.015048503875732422, -0.014539003372192383, -0.014029502868652344, -0.013520002365112305, -0.013010501861572266, -0.012501001358032227, -0.011991500854492188, -0.011482000350952148, -0.01097249984741211, -0.01046299934387207, -0.009953498840332031, -0.009443998336791992, -0.008934497833251953, -0.008424997329711914, -0.007915496826171875, -0.007405996322631836, -0.006896495819091797, -0.006386995315551758, -0.005877494812011719, -0.00536799430847168, -0.004858493804931641, -0.0043489933013916016, -0.0038394927978515625, -0.0033299922943115234, -0.0028204917907714844, -0.0023109912872314453, -0.0018014907836914062, -0.0012919902801513672, -0.0007824897766113281, -0.00027298927307128906, 0.00023651123046875, 0.0007460117340087891, 0.0012555122375488281, 0.0017650127410888672, 0.0022745132446289062, 0.0027840137481689453, 0.0032935142517089844, 0.0038030147552490234, 0.0043125152587890625, 0.0048220157623291016, 0.005331516265869141, 0.00584101676940918, 0.006350517272949219, 0.006860017776489258, 0.007369518280029297, 0.007879018783569336, 0.008388519287109375, 0.008898019790649414, 0.009407520294189453, 0.009917020797729492, 0.010426521301269531, 0.01093602180480957, 0.01144552230834961, 0.011955022811889648, 0.012464523315429688, 0.012974023818969727, 0.013483524322509766, 0.013993024826049805, 0.014502525329589844, 0.015012025833129883, 0.015521526336669922, 0.01603102684020996, 0.01654052734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 10.0, 8.0, 11.0, 15.0, 16.0, 35.0, 65.0, 137.0, 204.0, 205.0, 126.0, 63.0, 44.0, 17.0, 17.0, 9.0, 6.0, 7.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.170967102050781e-05, -3.057718276977539e-05, -2.944469451904297e-05, -2.8312206268310547e-05, -2.7179718017578125e-05, -2.6047229766845703e-05, -2.491474151611328e-05, -2.378225326538086e-05, -2.2649765014648438e-05, -2.1517276763916016e-05, -2.0384788513183594e-05, -1.9252300262451172e-05, -1.811981201171875e-05, -1.6987323760986328e-05, -1.5854835510253906e-05, -1.4722347259521484e-05, -1.3589859008789062e-05, -1.245737075805664e-05, -1.1324882507324219e-05, -1.0192394256591797e-05, -9.059906005859375e-06, -7.927417755126953e-06, -6.794929504394531e-06, -5.662441253662109e-06, -4.5299530029296875e-06, -3.3974647521972656e-06, -2.2649765014648438e-06, -1.1324882507324219e-06, 0.0, 1.1324882507324219e-06, 2.2649765014648438e-06, 3.3974647521972656e-06, 4.5299530029296875e-06, 5.662441253662109e-06, 6.794929504394531e-06, 7.927417755126953e-06, 9.059906005859375e-06, 1.0192394256591797e-05, 1.1324882507324219e-05, 1.245737075805664e-05, 1.3589859008789062e-05, 1.4722347259521484e-05, 1.5854835510253906e-05, 1.6987323760986328e-05, 1.811981201171875e-05, 1.9252300262451172e-05, 2.0384788513183594e-05, 2.1517276763916016e-05, 2.2649765014648438e-05, 2.378225326538086e-05, 2.491474151611328e-05, 2.6047229766845703e-05, 2.7179718017578125e-05, 2.8312206268310547e-05, 2.944469451904297e-05, 3.057718276977539e-05, 3.170967102050781e-05, 3.2842159271240234e-05, 3.3974647521972656e-05, 3.510713577270508e-05, 3.62396240234375e-05, 3.737211227416992e-05, 3.8504600524902344e-05, 3.9637088775634766e-05, 4.076957702636719e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 5.0, 9.0, 8.0, 11.0, 20.0, 25.0, 42.0, 75.0, 211.0, 501.0, 1541.0, 6405.0, 57255.0, 879918.0, 91454.0, 8067.0, 1880.0, 627.0, 247.0, 107.0, 50.0, 20.0, 22.0, 13.0, 8.0, 10.0, 7.0, 5.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025177001953125, -0.02432560920715332, -0.02347421646118164, -0.02262282371520996, -0.02177143096923828, -0.0209200382232666, -0.020068645477294922, -0.019217252731323242, -0.018365859985351562, -0.017514467239379883, -0.016663074493408203, -0.015811681747436523, -0.014960289001464844, -0.014108896255493164, -0.013257503509521484, -0.012406110763549805, -0.011554718017578125, -0.010703325271606445, -0.009851932525634766, -0.009000539779663086, -0.008149147033691406, -0.0072977542877197266, -0.006446361541748047, -0.005594968795776367, -0.0047435760498046875, -0.003892183303833008, -0.003040790557861328, -0.0021893978118896484, -0.0013380050659179688, -0.00048661231994628906, 0.0003647804260253906, 0.0012161731719970703, 0.00206756591796875, 0.0029189586639404297, 0.0037703514099121094, 0.004621744155883789, 0.005473136901855469, 0.0063245296478271484, 0.007175922393798828, 0.008027315139770508, 0.008878707885742188, 0.009730100631713867, 0.010581493377685547, 0.011432886123657227, 0.012284278869628906, 0.013135671615600586, 0.013987064361572266, 0.014838457107543945, 0.015689849853515625, 0.016541242599487305, 0.017392635345458984, 0.018244028091430664, 0.019095420837402344, 0.019946813583374023, 0.020798206329345703, 0.021649599075317383, 0.022500991821289062, 0.023352384567260742, 0.024203777313232422, 0.0250551700592041, 0.02590656280517578, 0.02675795555114746, 0.02760934829711914, 0.02846074104309082, 0.0293121337890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 2.0, 2.0, 6.0, 5.0, 14.0, 24.0, 21.0, 42.0, 86.0, 136.0, 239.0, 177.0, 102.0, 56.0, 27.0, 18.0, 11.0, 10.0, 3.0, 4.0, 1.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00677490234375, -0.006579220294952393, -0.006383538246154785, -0.006187856197357178, -0.00599217414855957, -0.005796492099761963, -0.0056008100509643555, -0.005405128002166748, -0.005209445953369141, -0.005013763904571533, -0.004818081855773926, -0.004622399806976318, -0.004426717758178711, -0.0042310357093811035, -0.004035353660583496, -0.0038396716117858887, -0.0036439895629882812, -0.003448307514190674, -0.0032526254653930664, -0.003056943416595459, -0.0028612613677978516, -0.002665579319000244, -0.0024698972702026367, -0.0022742152214050293, -0.002078533172607422, -0.0018828511238098145, -0.001687169075012207, -0.0014914870262145996, -0.0012958049774169922, -0.0011001229286193848, -0.0009044408798217773, -0.0007087588310241699, -0.0005130767822265625, -0.0003173947334289551, -0.00012171268463134766, 7.396936416625977e-05, 0.0002696514129638672, 0.0004653334617614746, 0.000661015510559082, 0.0008566975593566895, 0.0010523796081542969, 0.0012480616569519043, 0.0014437437057495117, 0.0016394257545471191, 0.0018351078033447266, 0.002030789852142334, 0.0022264719009399414, 0.002422153949737549, 0.0026178359985351562, 0.0028135180473327637, 0.003009200096130371, 0.0032048821449279785, 0.003400564193725586, 0.0035962462425231934, 0.0037919282913208008, 0.003987610340118408, 0.004183292388916016, 0.004378974437713623, 0.0045746564865112305, 0.004770338535308838, 0.004966020584106445, 0.005161702632904053, 0.00535738468170166, 0.005553066730499268, 0.005748748779296875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 9.0, 6.0, 9.0, 9.0, 18.0, 17.0, 28.0, 34.0, 56.0, 67.0, 96.0, 109.0, 91.0, 100.0, 94.0, 70.0, 53.0, 43.0, 28.0, 19.0, 8.0, 14.0, 7.0, 5.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36570796370506287, -0.34694990515708923, -0.3281918466091156, -0.30943378806114197, -0.29067572951316833, -0.2719176709651947, -0.25315964221954346, -0.23440156877040863, -0.215643510222435, -0.19688545167446136, -0.17812739312648773, -0.1593693494796753, -0.14061129093170166, -0.12185322493314743, -0.1030951738357544, -0.08433711528778076, -0.06557905673980713, -0.046820998191833496, -0.028062943369150162, -0.009304888546466827, 0.009453170001506805, 0.028211228549480438, 0.046969279646873474, 0.0657273381948471, 0.08448539674282074, 0.10324345529079437, 0.122001513838768, 0.14075955748558044, 0.15951761603355408, 0.1782756745815277, 0.19703373312950134, 0.21579179167747498, 0.23454982042312622, 0.25330787897109985, 0.2720659375190735, 0.2908239960670471, 0.30958205461502075, 0.3283401131629944, 0.347098171710968, 0.36585623025894165, 0.3846142888069153, 0.4033723473548889, 0.42213040590286255, 0.4408884644508362, 0.4596465229988098, 0.47840458154678345, 0.4971626400947571, 0.5159206986427307, 0.5346786975860596, 0.5534367561340332, 0.5721948146820068, 0.5909528732299805, 0.6097109317779541, 0.6284689903259277, 0.6472270488739014, 0.665985107421875, 0.6847431659698486, 0.7035012245178223, 0.7222592830657959, 0.7410173416137695, 0.7597754001617432, 0.7785334587097168, 0.7972915172576904, 0.8160495758056641, 0.8348076343536377]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 18.0, 12.0, 11.0, 30.0, 40.0, 46.0, 56.0, 64.0, 51.0, 77.0, 82.0, 92.0, 75.0, 64.0, 67.0, 42.0, 41.0, 39.0, 22.0, 22.0, 15.0, 7.0, 3.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5722128748893738, -0.553123950958252, -0.5340349674224854, -0.5149460434913635, -0.4958570599555969, -0.4767681360244751, -0.4576791822910309, -0.43859022855758667, -0.41950127482414246, -0.40041232109069824, -0.38132336735725403, -0.3622344136238098, -0.343145489692688, -0.3240565061569214, -0.30496758222579956, -0.28587862849235535, -0.26678967475891113, -0.24770072102546692, -0.2286117672920227, -0.20952282845973969, -0.19043387472629547, -0.17134492099285126, -0.15225598216056824, -0.13316702842712402, -0.11407807469367981, -0.0949891209602356, -0.07590017467737198, -0.05681122466921806, -0.03772227466106415, -0.018633320927619934, 0.00045562535524368286, 0.0195445716381073, 0.03863358497619629, 0.057722534984350204, 0.07681148499250412, 0.09590043127536774, 0.11498938500881195, 0.13407833874225616, 0.15316727757453918, 0.1722562313079834, 0.1913451850414276, 0.21043413877487183, 0.22952309250831604, 0.24861203134059906, 0.2677009701728821, 0.2867899537086487, 0.3058788776397705, 0.3249678313732147, 0.34405678510665894, 0.36314573884010315, 0.38223469257354736, 0.4013236463069916, 0.4204126000404358, 0.4395015239715576, 0.45859047770500183, 0.47767943143844604, 0.49676838517189026, 0.5158573389053345, 0.5349462628364563, 0.5540352463722229, 0.5731241703033447, 0.5922131538391113, 0.6113020777702332, 0.630391001701355, 0.6494799852371216]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 8.0, 6.0, 8.0, 9.0, 20.0, 36.0, 34.0, 35.0, 60.0, 95.0, 150.0, 227.0, 317.0, 502.0, 769.0, 1117.0, 1970.0, 3473.0, 7132.0, 22321.0, 154366.0, 721992.0, 101523.0, 18059.0, 6440.0, 3134.0, 1686.0, 981.0, 681.0, 412.0, 300.0, 206.0, 128.0, 96.0, 73.0, 57.0, 43.0, 31.0, 11.0, 16.0, 14.0, 6.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.326904296875, -0.315399169921875, -0.30389404296875, -0.292388916015625, -0.2808837890625, -0.269378662109375, -0.25787353515625, -0.246368408203125, -0.23486328125, -0.223358154296875, -0.21185302734375, -0.200347900390625, -0.1888427734375, -0.177337646484375, -0.16583251953125, -0.154327392578125, -0.142822265625, -0.131317138671875, -0.11981201171875, -0.108306884765625, -0.0968017578125, -0.085296630859375, -0.07379150390625, -0.062286376953125, -0.05078125, -0.039276123046875, -0.02777099609375, -0.016265869140625, -0.0047607421875, 0.006744384765625, 0.01824951171875, 0.029754638671875, 0.041259765625, 0.052764892578125, 0.06427001953125, 0.075775146484375, 0.0872802734375, 0.098785400390625, 0.11029052734375, 0.121795654296875, 0.13330078125, 0.144805908203125, 0.15631103515625, 0.167816162109375, 0.1793212890625, 0.190826416015625, 0.20233154296875, 0.213836669921875, 0.225341796875, 0.236846923828125, 0.24835205078125, 0.259857177734375, 0.2713623046875, 0.282867431640625, 0.29437255859375, 0.305877685546875, 0.3173828125, 0.328887939453125, 0.34039306640625, 0.351898193359375, 0.3634033203125, 0.374908447265625, 0.38641357421875, 0.397918701171875, 0.409423828125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 6.0, 10.0, 11.0, 13.0, 24.0, 16.0, 29.0, 19.0, 36.0, 42.0, 47.0, 47.0, 60.0, 72.0, 57.0, 57.0, 58.0, 52.0, 55.0, 42.0, 50.0, 37.0, 27.0, 30.0, 21.0, 9.0, 16.0, 14.0, 11.0, 8.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.1630859375, -1.132537841796875, -1.10198974609375, -1.071441650390625, -1.0408935546875, -1.010345458984375, -0.97979736328125, -0.949249267578125, -0.918701171875, -0.888153076171875, -0.85760498046875, -0.827056884765625, -0.7965087890625, -0.765960693359375, -0.73541259765625, -0.704864501953125, -0.67431640625, -0.643768310546875, -0.61322021484375, -0.582672119140625, -0.5521240234375, -0.521575927734375, -0.49102783203125, -0.460479736328125, -0.429931640625, -0.399383544921875, -0.36883544921875, -0.338287353515625, -0.3077392578125, -0.277191162109375, -0.24664306640625, -0.216094970703125, -0.185546875, -0.154998779296875, -0.12445068359375, -0.093902587890625, -0.0633544921875, -0.032806396484375, -0.00225830078125, 0.028289794921875, 0.058837890625, 0.089385986328125, 0.11993408203125, 0.150482177734375, 0.1810302734375, 0.211578369140625, 0.24212646484375, 0.272674560546875, 0.30322265625, 0.333770751953125, 0.36431884765625, 0.394866943359375, 0.4254150390625, 0.455963134765625, 0.48651123046875, 0.517059326171875, 0.547607421875, 0.578155517578125, 0.60870361328125, 0.639251708984375, 0.6697998046875, 0.700347900390625, 0.73089599609375, 0.761444091796875, 0.7919921875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 13.0, 11.0, 11.0, 12.0, 17.0, 31.0, 27.0, 43.0, 56.0, 90.0, 122.0, 225.0, 368.0, 712.0, 1553.0, 3685.0, 14193.0, 418807.0, 584420.0, 16663.0, 4029.0, 1629.0, 773.0, 408.0, 219.0, 117.0, 93.0, 65.0, 42.0, 22.0, 22.0, 21.0, 18.0, 14.0, 6.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.615234375, -0.5954132080078125, -0.575592041015625, -0.5557708740234375, -0.53594970703125, -0.5161285400390625, -0.496307373046875, -0.4764862060546875, -0.4566650390625, -0.4368438720703125, -0.417022705078125, -0.3972015380859375, -0.37738037109375, -0.3575592041015625, -0.337738037109375, -0.3179168701171875, -0.298095703125, -0.2782745361328125, -0.258453369140625, -0.2386322021484375, -0.21881103515625, -0.1989898681640625, -0.179168701171875, -0.1593475341796875, -0.1395263671875, -0.1197052001953125, -0.099884033203125, -0.0800628662109375, -0.06024169921875, -0.0404205322265625, -0.020599365234375, -0.0007781982421875, 0.01904296875, 0.0388641357421875, 0.058685302734375, 0.0785064697265625, 0.09832763671875, 0.1181488037109375, 0.137969970703125, 0.1577911376953125, 0.1776123046875, 0.1974334716796875, 0.217254638671875, 0.2370758056640625, 0.25689697265625, 0.2767181396484375, 0.296539306640625, 0.3163604736328125, 0.336181640625, 0.3560028076171875, 0.375823974609375, 0.3956451416015625, 0.41546630859375, 0.4352874755859375, 0.455108642578125, 0.4749298095703125, 0.4947509765625, 0.5145721435546875, 0.534393310546875, 0.5542144775390625, 0.57403564453125, 0.5938568115234375, 0.613677978515625, 0.6334991455078125, 0.6533203125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 8.0, 13.0, 9.0, 26.0, 11.0, 33.0, 36.0, 44.0, 49.0, 49.0, 54.0, 69.0, 67.0, 67.0, 79.0, 58.0, 55.0, 56.0, 40.0, 40.0, 27.0, 29.0, 16.0, 14.0, 11.0, 13.0, 6.0, 2.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.455078125, -1.413726806640625, -1.37237548828125, -1.331024169921875, -1.2896728515625, -1.248321533203125, -1.20697021484375, -1.165618896484375, -1.124267578125, -1.082916259765625, -1.04156494140625, -1.000213623046875, -0.9588623046875, -0.917510986328125, -0.87615966796875, -0.834808349609375, -0.79345703125, -0.752105712890625, -0.71075439453125, -0.669403076171875, -0.6280517578125, -0.586700439453125, -0.54534912109375, -0.503997802734375, -0.462646484375, -0.421295166015625, -0.37994384765625, -0.338592529296875, -0.2972412109375, -0.255889892578125, -0.21453857421875, -0.173187255859375, -0.1318359375, -0.090484619140625, -0.04913330078125, -0.007781982421875, 0.0335693359375, 0.074920654296875, 0.11627197265625, 0.157623291015625, 0.198974609375, 0.240325927734375, 0.28167724609375, 0.323028564453125, 0.3643798828125, 0.405731201171875, 0.44708251953125, 0.488433837890625, 0.52978515625, 0.571136474609375, 0.61248779296875, 0.653839111328125, 0.6951904296875, 0.736541748046875, 0.77789306640625, 0.819244384765625, 0.860595703125, 0.901947021484375, 0.94329833984375, 0.984649658203125, 1.0260009765625, 1.067352294921875, 1.10870361328125, 1.150054931640625, 1.19140625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 13.0, 7.0, 16.0, 21.0, 41.0, 67.0, 127.0, 280.0, 712.0, 2890.0, 22545.0, 957652.0, 57898.0, 4589.0, 1007.0, 358.0, 133.0, 73.0, 39.0, 22.0, 11.0, 12.0, 11.0, 7.0, 7.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27392578125, -0.2646827697753906, -0.25543975830078125, -0.24619674682617188, -0.2369537353515625, -0.22771072387695312, -0.21846771240234375, -0.20922470092773438, -0.199981689453125, -0.19073867797851562, -0.18149566650390625, -0.17225265502929688, -0.1630096435546875, -0.15376663208007812, -0.14452362060546875, -0.13528060913085938, -0.12603759765625, -0.11679458618164062, -0.10755157470703125, -0.09830856323242188, -0.0890655517578125, -0.07982254028320312, -0.07057952880859375, -0.061336517333984375, -0.052093505859375, -0.042850494384765625, -0.03360748291015625, -0.024364471435546875, -0.0151214599609375, -0.005878448486328125, 0.00336456298828125, 0.012607574462890625, 0.0218505859375, 0.031093597412109375, 0.04033660888671875, 0.049579620361328125, 0.0588226318359375, 0.06806564331054688, 0.07730865478515625, 0.08655166625976562, 0.095794677734375, 0.10503768920898438, 0.11428070068359375, 0.12352371215820312, 0.1327667236328125, 0.14200973510742188, 0.15125274658203125, 0.16049575805664062, 0.16973876953125, 0.17898178100585938, 0.18822479248046875, 0.19746780395507812, 0.2067108154296875, 0.21595382690429688, 0.22519683837890625, 0.23443984985351562, 0.243682861328125, 0.2529258728027344, 0.26216888427734375, 0.2714118957519531, 0.2806549072265625, 0.2898979187011719, 0.29914093017578125, 0.3083839416503906, 0.317626953125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 0.0, 6.0, 9.0, 4.0, 15.0, 22.0, 41.0, 82.0, 88.0, 190.0, 188.0, 140.0, 88.0, 34.0, 27.0, 17.0, 12.0, 14.0, 5.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4616718292236328e-05, -2.3937784135341644e-05, -2.325884997844696e-05, -2.2579915821552277e-05, -2.1900981664657593e-05, -2.122204750776291e-05, -2.0543113350868225e-05, -1.986417919397354e-05, -1.9185245037078857e-05, -1.8506310880184174e-05, -1.782737672328949e-05, -1.7148442566394806e-05, -1.6469508409500122e-05, -1.5790574252605438e-05, -1.5111640095710754e-05, -1.443270593881607e-05, -1.3753771781921387e-05, -1.3074837625026703e-05, -1.2395903468132019e-05, -1.1716969311237335e-05, -1.1038035154342651e-05, -1.0359100997447968e-05, -9.680166840553284e-06, -9.0012326836586e-06, -8.322298526763916e-06, -7.643364369869232e-06, -6.964430212974548e-06, -6.2854960560798645e-06, -5.606561899185181e-06, -4.927627742290497e-06, -4.248693585395813e-06, -3.569759428501129e-06, -2.8908252716064453e-06, -2.2118911147117615e-06, -1.5329569578170776e-06, -8.540228009223938e-07, -1.7508864402770996e-07, 5.038455128669739e-07, 1.1827796697616577e-06, 1.8617138266563416e-06, 2.5406479835510254e-06, 3.2195821404457092e-06, 3.898516297340393e-06, 4.577450454235077e-06, 5.256384611129761e-06, 5.935318768024445e-06, 6.614252924919128e-06, 7.293187081813812e-06, 7.972121238708496e-06, 8.65105539560318e-06, 9.329989552497864e-06, 1.0008923709392548e-05, 1.0687857866287231e-05, 1.1366792023181915e-05, 1.2045726180076599e-05, 1.2724660336971283e-05, 1.3403594493865967e-05, 1.408252865076065e-05, 1.4761462807655334e-05, 1.544039696455002e-05, 1.6119331121444702e-05, 1.6798265278339386e-05, 1.747719943523407e-05, 1.8156133592128754e-05, 1.8835067749023438e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 5.0, 12.0, 20.0, 28.0, 33.0, 69.0, 123.0, 253.0, 517.0, 1457.0, 4153.0, 18383.0, 756315.0, 249119.0, 12652.0, 3314.0, 1135.0, 492.0, 189.0, 117.0, 61.0, 37.0, 17.0, 16.0, 8.0, 8.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.2548828125, -0.24635696411132812, -0.23783111572265625, -0.22930526733398438, -0.2207794189453125, -0.21225357055664062, -0.20372772216796875, -0.19520187377929688, -0.186676025390625, -0.17815017700195312, -0.16962432861328125, -0.16109848022460938, -0.1525726318359375, -0.14404678344726562, -0.13552093505859375, -0.12699508666992188, -0.11846923828125, -0.10994338989257812, -0.10141754150390625, -0.09289169311523438, -0.0843658447265625, -0.07583999633789062, -0.06731414794921875, -0.058788299560546875, -0.050262451171875, -0.041736602783203125, -0.03321075439453125, -0.024684906005859375, -0.0161590576171875, -0.007633209228515625, 0.00089263916015625, 0.009418487548828125, 0.0179443359375, 0.026470184326171875, 0.03499603271484375, 0.043521881103515625, 0.0520477294921875, 0.060573577880859375, 0.06909942626953125, 0.07762527465820312, 0.086151123046875, 0.09467697143554688, 0.10320281982421875, 0.11172866821289062, 0.1202545166015625, 0.12878036499023438, 0.13730621337890625, 0.14583206176757812, 0.15435791015625, 0.16288375854492188, 0.17140960693359375, 0.17993545532226562, 0.1884613037109375, 0.19698715209960938, 0.20551300048828125, 0.21403884887695312, 0.222564697265625, 0.23109054565429688, 0.23961639404296875, 0.24814224243164062, 0.2566680908203125, 0.2651939392089844, 0.27371978759765625, 0.2822456359863281, 0.290771484375]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 2.0, 5.0, 7.0, 15.0, 16.0, 33.0, 43.0, 102.0, 210.0, 255.0, 127.0, 63.0, 42.0, 18.0, 16.0, 11.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0982666015625, -0.0955495834350586, -0.09283256530761719, -0.09011554718017578, -0.08739852905273438, -0.08468151092529297, -0.08196449279785156, -0.07924747467041016, -0.07653045654296875, -0.07381343841552734, -0.07109642028808594, -0.06837940216064453, -0.06566238403320312, -0.06294536590576172, -0.06022834777832031, -0.057511329650878906, -0.0547943115234375, -0.052077293395996094, -0.04936027526855469, -0.04664325714111328, -0.043926239013671875, -0.04120922088623047, -0.03849220275878906, -0.035775184631347656, -0.03305816650390625, -0.030341148376464844, -0.027624130249023438, -0.02490711212158203, -0.022190093994140625, -0.01947307586669922, -0.016756057739257812, -0.014039039611816406, -0.011322021484375, -0.008605003356933594, -0.0058879852294921875, -0.0031709671020507812, -0.000453948974609375, 0.0022630691528320312, 0.0049800872802734375, 0.007697105407714844, 0.01041412353515625, 0.013131141662597656, 0.015848159790039062, 0.01856517791748047, 0.021282196044921875, 0.02399921417236328, 0.026716232299804688, 0.029433250427246094, 0.0321502685546875, 0.034867286682128906, 0.03758430480957031, 0.04030132293701172, 0.043018341064453125, 0.04573535919189453, 0.04845237731933594, 0.051169395446777344, 0.05388641357421875, 0.056603431701660156, 0.05932044982910156, 0.06203746795654297, 0.06475448608398438, 0.06747150421142578, 0.07018852233886719, 0.0729055404663086, 0.07562255859375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 12.0, 15.0, 18.0, 35.0, 49.0, 89.0, 135.0, 151.0, 126.0, 135.0, 88.0, 53.0, 28.0, 29.0, 8.0, 9.0, 4.0, 4.0, 6.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.826431155204773, -0.771565318107605, -0.7166994214057922, -0.6618335843086243, -0.6069676876068115, -0.5521018505096436, -0.4972360134124756, -0.44237014651298523, -0.3875042796134949, -0.3326384127140045, -0.27777254581451416, -0.2229067087173462, -0.16804084181785583, -0.11317497491836548, -0.05830913782119751, -0.0034432709217071533, 0.0514225959777832, 0.10628845542669296, 0.16115431487560272, 0.21602016687393188, 0.27088603377342224, 0.3257519006729126, 0.38061773777008057, 0.4354836046695709, 0.4903494715690613, 0.5452153086662292, 0.600081205368042, 0.65494704246521, 0.7098128795623779, 0.7646787762641907, 0.8195446133613586, 0.8744105100631714, 0.9292762279510498, 0.9841420650482178, 1.0390079021453857, 1.0938737392425537, 1.1487396955490112, 1.2036055326461792, 1.2584713697433472, 1.3133372068405151, 1.3682031631469727, 1.4230690002441406, 1.4779348373413086, 1.5328006744384766, 1.587666630744934, 1.642532467842102, 1.69739830493927, 1.752264142036438, 1.807129979133606, 1.861995816230774, 1.916861653327942, 1.9717276096343994, 2.0265934467315674, 2.0814592838287354, 2.1363251209259033, 2.1911909580230713, 2.2460567951202393, 2.3009226322174072, 2.355788469314575, 2.410654306411743, 2.465520143508911, 2.520386219024658, 2.575252056121826, 2.630117893218994, 2.684983730316162]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 2.0, 7.0, 8.0, 11.0, 3.0, 9.0, 16.0, 10.0, 21.0, 21.0, 31.0, 27.0, 28.0, 24.0, 44.0, 35.0, 30.0, 40.0, 32.0, 39.0, 46.0, 47.0, 62.0, 39.0, 42.0, 36.0, 36.0, 29.0, 36.0, 22.0, 20.0, 21.0, 15.0, 21.0, 10.0, 15.0, 13.0, 9.0, 14.0, 9.0, 5.0, 7.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.7301201820373535, -1.6773638725280762, -1.6246075630187988, -1.5718512535095215, -1.5190949440002441, -1.4663386344909668, -1.4135823249816895, -1.360826015472412, -1.3080697059631348, -1.2553133964538574, -1.20255708694458, -1.1498007774353027, -1.0970444679260254, -1.044288158416748, -0.9915318489074707, -0.9387755393981934, -0.886019229888916, -0.8332629203796387, -0.7805066108703613, -0.727750301361084, -0.6749939918518066, -0.6222376823425293, -0.569481372833252, -0.5167250633239746, -0.46396875381469727, -0.4112124443054199, -0.3584561347961426, -0.30569982528686523, -0.2529435157775879, -0.20018720626831055, -0.1474308967590332, -0.09467458724975586, -0.041918396949768066, 0.010837912559509277, 0.06359422206878662, 0.11635053157806396, 0.1691068410873413, 0.22186315059661865, 0.274619460105896, 0.32737576961517334, 0.3801320791244507, 0.432888388633728, 0.48564469814300537, 0.5384010076522827, 0.5911573171615601, 0.6439136266708374, 0.6966699361801147, 0.7494262456893921, 0.8021825551986694, 0.8549388647079468, 0.9076951742172241, 0.9604514837265015, 1.0132077932357788, 1.0659641027450562, 1.1187204122543335, 1.1714767217636108, 1.2242330312728882, 1.2769893407821655, 1.3297456502914429, 1.3825019598007202, 1.4352582693099976, 1.488014578819275, 1.5407708883285522, 1.5935271978378296, 1.646283507347107]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 9.0, 20.0, 23.0, 34.0, 46.0, 68.0, 99.0, 142.0, 254.0, 383.0, 630.0, 1062.0, 2107.0, 4630.0, 12475.0, 63189.0, 598328.0, 2914871.0, 525020.0, 50832.0, 10926.0, 4162.0, 1983.0, 1094.0, 645.0, 415.0, 276.0, 176.0, 116.0, 55.0, 47.0, 45.0, 34.0, 25.0, 16.0, 9.0, 10.0, 7.0, 4.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.95166015625, -0.9232330322265625, -0.894805908203125, -0.8663787841796875, -0.83795166015625, -0.8095245361328125, -0.781097412109375, -0.7526702880859375, -0.7242431640625, -0.6958160400390625, -0.667388916015625, -0.6389617919921875, -0.61053466796875, -0.5821075439453125, -0.553680419921875, -0.5252532958984375, -0.496826171875, -0.4683990478515625, -0.439971923828125, -0.4115447998046875, -0.38311767578125, -0.3546905517578125, -0.326263427734375, -0.2978363037109375, -0.2694091796875, -0.2409820556640625, -0.212554931640625, -0.1841278076171875, -0.15570068359375, -0.1272735595703125, -0.098846435546875, -0.0704193115234375, -0.0419921875, -0.0135650634765625, 0.014862060546875, 0.0432891845703125, 0.07171630859375, 0.1001434326171875, 0.128570556640625, 0.1569976806640625, 0.1854248046875, 0.2138519287109375, 0.242279052734375, 0.2707061767578125, 0.29913330078125, 0.3275604248046875, 0.355987548828125, 0.3844146728515625, 0.412841796875, 0.4412689208984375, 0.469696044921875, 0.4981231689453125, 0.52655029296875, 0.5549774169921875, 0.583404541015625, 0.6118316650390625, 0.6402587890625, 0.6686859130859375, 0.697113037109375, 0.7255401611328125, 0.75396728515625, 0.7823944091796875, 0.810821533203125, 0.8392486572265625, 0.86767578125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 0.0, 6.0, 5.0, 8.0, 11.0, 17.0, 16.0, 21.0, 29.0, 43.0, 47.0, 60.0, 43.0, 63.0, 65.0, 87.0, 68.0, 64.0, 61.0, 51.0, 45.0, 37.0, 31.0, 27.0, 22.0, 23.0, 16.0, 12.0, 2.0, 6.0, 5.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59228515625, -0.571014404296875, -0.54974365234375, -0.528472900390625, -0.5072021484375, -0.485931396484375, -0.46466064453125, -0.443389892578125, -0.422119140625, -0.400848388671875, -0.37957763671875, -0.358306884765625, -0.3370361328125, -0.315765380859375, -0.29449462890625, -0.273223876953125, -0.251953125, -0.230682373046875, -0.20941162109375, -0.188140869140625, -0.1668701171875, -0.145599365234375, -0.12432861328125, -0.103057861328125, -0.081787109375, -0.060516357421875, -0.03924560546875, -0.017974853515625, 0.0032958984375, 0.024566650390625, 0.04583740234375, 0.067108154296875, 0.08837890625, 0.109649658203125, 0.13092041015625, 0.152191162109375, 0.1734619140625, 0.194732666015625, 0.21600341796875, 0.237274169921875, 0.258544921875, 0.279815673828125, 0.30108642578125, 0.322357177734375, 0.3436279296875, 0.364898681640625, 0.38616943359375, 0.407440185546875, 0.4287109375, 0.449981689453125, 0.47125244140625, 0.492523193359375, 0.5137939453125, 0.535064697265625, 0.55633544921875, 0.577606201171875, 0.598876953125, 0.620147705078125, 0.64141845703125, 0.662689208984375, 0.6839599609375, 0.705230712890625, 0.72650146484375, 0.747772216796875, 0.76904296875]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 7.0, 6.0, 11.0, 22.0, 22.0, 51.0, 76.0, 137.0, 258.0, 546.0, 1392.0, 3960.0, 15459.0, 151437.0, 3867299.0, 133706.0, 13957.0, 3538.0, 1277.0, 551.0, 252.0, 128.0, 64.0, 47.0, 26.0, 13.0, 10.0, 9.0, 4.0, 2.0, 7.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1904296875, -1.145477294921875, -1.10052490234375, -1.055572509765625, -1.0106201171875, -0.965667724609375, -0.92071533203125, -0.875762939453125, -0.830810546875, -0.785858154296875, -0.74090576171875, -0.695953369140625, -0.6510009765625, -0.606048583984375, -0.56109619140625, -0.516143798828125, -0.47119140625, -0.426239013671875, -0.38128662109375, -0.336334228515625, -0.2913818359375, -0.246429443359375, -0.20147705078125, -0.156524658203125, -0.111572265625, -0.066619873046875, -0.02166748046875, 0.023284912109375, 0.0682373046875, 0.113189697265625, 0.15814208984375, 0.203094482421875, 0.248046875, 0.292999267578125, 0.33795166015625, 0.382904052734375, 0.4278564453125, 0.472808837890625, 0.51776123046875, 0.562713623046875, 0.607666015625, 0.652618408203125, 0.69757080078125, 0.742523193359375, 0.7874755859375, 0.832427978515625, 0.87738037109375, 0.922332763671875, 0.96728515625, 1.012237548828125, 1.05718994140625, 1.102142333984375, 1.1470947265625, 1.192047119140625, 1.23699951171875, 1.281951904296875, 1.326904296875, 1.371856689453125, 1.41680908203125, 1.461761474609375, 1.5067138671875, 1.551666259765625, 1.59661865234375, 1.641571044921875, 1.6865234375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 6.0, 6.0, 5.0, 8.0, 8.0, 37.0, 38.0, 75.0, 115.0, 248.0, 515.0, 1096.0, 978.0, 438.0, 206.0, 100.0, 55.0, 45.0, 30.0, 19.0, 11.0, 10.0, 8.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4755859375, -0.46335601806640625, -0.4511260986328125, -0.43889617919921875, -0.426666259765625, -0.41443634033203125, -0.4022064208984375, -0.38997650146484375, -0.37774658203125, -0.36551666259765625, -0.3532867431640625, -0.34105682373046875, -0.328826904296875, -0.31659698486328125, -0.3043670654296875, -0.29213714599609375, -0.2799072265625, -0.26767730712890625, -0.2554473876953125, -0.24321746826171875, -0.230987548828125, -0.21875762939453125, -0.2065277099609375, -0.19429779052734375, -0.18206787109375, -0.16983795166015625, -0.1576080322265625, -0.14537811279296875, -0.133148193359375, -0.12091827392578125, -0.1086883544921875, -0.09645843505859375, -0.084228515625, -0.07199859619140625, -0.0597686767578125, -0.04753875732421875, -0.035308837890625, -0.02307891845703125, -0.0108489990234375, 0.00138092041015625, 0.01361083984375, 0.02584075927734375, 0.0380706787109375, 0.05030059814453125, 0.062530517578125, 0.07476043701171875, 0.0869903564453125, 0.09922027587890625, 0.1114501953125, 0.12368011474609375, 0.1359100341796875, 0.14813995361328125, 0.160369873046875, 0.17259979248046875, 0.1848297119140625, 0.19705963134765625, 0.20928955078125, 0.22151947021484375, 0.2337493896484375, 0.24597930908203125, 0.258209228515625, 0.27043914794921875, 0.2826690673828125, 0.29489898681640625, 0.30712890625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 3.0, 3.0, 1.0, 7.0, 8.0, 10.0, 14.0, 7.0, 10.0, 19.0, 22.0, 25.0, 29.0, 47.0, 53.0, 35.0, 72.0, 84.0, 80.0, 72.0, 73.0, 54.0, 49.0, 31.0, 39.0, 33.0, 19.0, 24.0, 16.0, 12.0, 9.0, 6.0, 6.0, 5.0, 4.0, 3.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6451905965805054, -0.6239470839500427, -0.6027035713195801, -0.5814599990844727, -0.56021648645401, -0.5389729738235474, -0.5177294015884399, -0.4964858889579773, -0.47524237632751465, -0.453998863697052, -0.43275532126426697, -0.41151177883148193, -0.3902682662010193, -0.36902475357055664, -0.3477812111377716, -0.3265376687049866, -0.3052941560745239, -0.2840506434440613, -0.26280710101127625, -0.2415635734796524, -0.22032004594802856, -0.19907651841640472, -0.17783299088478088, -0.15658946335315704, -0.1353459358215332, -0.11410240828990936, -0.09285888075828552, -0.07161535322666168, -0.05037182569503784, -0.029128298163414, -0.007884770631790161, 0.01335875689983368, 0.03460228443145752, 0.05584581196308136, 0.0770893394947052, 0.09833286702632904, 0.11957639455795288, 0.14081992208957672, 0.16206344962120056, 0.1833069771528244, 0.20455050468444824, 0.22579403221607208, 0.24703755974769592, 0.26828110218048096, 0.2895246148109436, 0.31076812744140625, 0.3320116698741913, 0.3532552123069763, 0.37449872493743896, 0.3957422375679016, 0.41698578000068665, 0.4382293224334717, 0.4594728350639343, 0.480716347694397, 0.5019599199295044, 0.523203432559967, 0.5444469451904297, 0.5656904578208923, 0.586933970451355, 0.6081775426864624, 0.629421055316925, 0.6506645679473877, 0.6719081401824951, 0.6931516528129578, 0.7143951654434204]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 7.0, 4.0, 9.0, 15.0, 11.0, 22.0, 33.0, 30.0, 25.0, 42.0, 33.0, 48.0, 51.0, 57.0, 61.0, 69.0, 53.0, 70.0, 68.0, 46.0, 46.0, 41.0, 35.0, 27.0, 24.0, 21.0, 20.0, 14.0, 7.0, 7.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7658556699752808, -0.7404689788818359, -0.7150822877883911, -0.6896955966949463, -0.6643089056015015, -0.6389222145080566, -0.6135355234146118, -0.588148832321167, -0.5627621412277222, -0.5373754501342773, -0.5119887590408325, -0.4866020679473877, -0.46121537685394287, -0.43582868576049805, -0.41044196486473083, -0.385055273771286, -0.3596685528755188, -0.334281861782074, -0.30889517068862915, -0.2835084795951843, -0.2581217885017395, -0.23273508250713348, -0.20734837651252747, -0.18196168541908264, -0.15657499432563782, -0.131188303232193, -0.10580160468816757, -0.08041490614414215, -0.05502821505069733, -0.029641523957252502, -0.004254817962646484, 0.02113187313079834, 0.04651850461959839, 0.07190519571304321, 0.09729189425706863, 0.12267859280109406, 0.14806528389453888, 0.1734519749879837, 0.19883868098258972, 0.22422537207603455, 0.24961206316947937, 0.2749987542629242, 0.300385445356369, 0.32577216625213623, 0.35115885734558105, 0.3765455484390259, 0.4019322395324707, 0.4273189306259155, 0.45270562171936035, 0.4780923128128052, 0.50347900390625, 0.5288656949996948, 0.5542523860931396, 0.5796390771865845, 0.6050257682800293, 0.6304124593734741, 0.655799150466919, 0.6811858415603638, 0.7065725326538086, 0.7319592237472534, 0.7573459148406982, 0.7827326059341431, 0.8081192970275879, 0.8335059881210327, 0.8588927388191223]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 5.0, 14.0, 32.0, 43.0, 74.0, 107.0, 188.0, 368.0, 1097.0, 4007.0, 18622.0, 129785.0, 711250.0, 155070.0, 21230.0, 4540.0, 1222.0, 430.0, 200.0, 95.0, 69.0, 40.0, 27.0, 17.0, 9.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19384765625, -0.1875, -0.18115234375, -0.1748046875, -0.16845703125, -0.162109375, -0.15576171875, -0.1494140625, -0.14306640625, -0.13671875, -0.13037109375, -0.1240234375, -0.11767578125, -0.111328125, -0.10498046875, -0.0986328125, -0.09228515625, -0.0859375, -0.07958984375, -0.0732421875, -0.06689453125, -0.060546875, -0.05419921875, -0.0478515625, -0.04150390625, -0.03515625, -0.02880859375, -0.0224609375, -0.01611328125, -0.009765625, -0.00341796875, 0.0029296875, 0.00927734375, 0.015625, 0.02197265625, 0.0283203125, 0.03466796875, 0.041015625, 0.04736328125, 0.0537109375, 0.06005859375, 0.06640625, 0.07275390625, 0.0791015625, 0.08544921875, 0.091796875, 0.09814453125, 0.1044921875, 0.11083984375, 0.1171875, 0.12353515625, 0.1298828125, 0.13623046875, 0.142578125, 0.14892578125, 0.1552734375, 0.16162109375, 0.16796875, 0.17431640625, 0.1806640625, 0.18701171875, 0.193359375, 0.19970703125, 0.2060546875, 0.21240234375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 11.0, 8.0, 17.0, 24.0, 23.0, 31.0, 50.0, 51.0, 63.0, 92.0, 76.0, 75.0, 90.0, 74.0, 70.0, 75.0, 42.0, 40.0, 30.0, 22.0, 14.0, 12.0, 8.0, 8.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.576171875, -0.55291748046875, -0.5296630859375, -0.50640869140625, -0.483154296875, -0.45989990234375, -0.4366455078125, -0.41339111328125, -0.39013671875, -0.36688232421875, -0.3436279296875, -0.32037353515625, -0.297119140625, -0.27386474609375, -0.2506103515625, -0.22735595703125, -0.2041015625, -0.18084716796875, -0.1575927734375, -0.13433837890625, -0.111083984375, -0.08782958984375, -0.0645751953125, -0.04132080078125, -0.01806640625, 0.00518798828125, 0.0284423828125, 0.05169677734375, 0.074951171875, 0.09820556640625, 0.1214599609375, 0.14471435546875, 0.16796875, 0.19122314453125, 0.2144775390625, 0.23773193359375, 0.260986328125, 0.28424072265625, 0.3074951171875, 0.33074951171875, 0.35400390625, 0.37725830078125, 0.4005126953125, 0.42376708984375, 0.447021484375, 0.47027587890625, 0.4935302734375, 0.51678466796875, 0.5400390625, 0.56329345703125, 0.5865478515625, 0.60980224609375, 0.633056640625, 0.65631103515625, 0.6795654296875, 0.70281982421875, 0.72607421875, 0.74932861328125, 0.7725830078125, 0.79583740234375, 0.819091796875, 0.84234619140625, 0.8656005859375, 0.88885498046875, 0.912109375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 13.0, 13.0, 26.0, 28.0, 47.0, 55.0, 87.0, 126.0, 190.0, 275.0, 415.0, 547.0, 832.0, 1224.0, 1834.0, 2704.0, 4210.0, 6478.0, 9871.0, 15501.0, 24725.0, 40857.0, 69427.0, 115983.0, 177033.0, 196688.0, 147368.0, 91242.0, 53493.0, 31863.0, 19685.0, 12308.0, 7799.0, 4974.0, 3480.0, 2294.0, 1594.0, 1043.0, 695.0, 487.0, 324.0, 233.0, 141.0, 111.0, 63.0, 39.0, 46.0, 23.0, 19.0, 13.0, 9.0, 5.0, 7.0, 2.0, 4.0, 3.0, 1.0], "bins": [-0.036163330078125, -0.03504228591918945, -0.033921241760253906, -0.03280019760131836, -0.03167915344238281, -0.030558109283447266, -0.02943706512451172, -0.028316020965576172, -0.027194976806640625, -0.026073932647705078, -0.02495288848876953, -0.023831844329833984, -0.022710800170898438, -0.02158975601196289, -0.020468711853027344, -0.019347667694091797, -0.01822662353515625, -0.017105579376220703, -0.015984535217285156, -0.01486349105834961, -0.013742446899414062, -0.012621402740478516, -0.011500358581542969, -0.010379314422607422, -0.009258270263671875, -0.008137226104736328, -0.007016181945800781, -0.005895137786865234, -0.0047740936279296875, -0.0036530494689941406, -0.0025320053100585938, -0.0014109611511230469, -0.0002899169921875, 0.0008311271667480469, 0.0019521713256835938, 0.0030732154846191406, 0.0041942596435546875, 0.005315303802490234, 0.006436347961425781, 0.007557392120361328, 0.008678436279296875, 0.009799480438232422, 0.010920524597167969, 0.012041568756103516, 0.013162612915039062, 0.01428365707397461, 0.015404701232910156, 0.016525745391845703, 0.01764678955078125, 0.018767833709716797, 0.019888877868652344, 0.02100992202758789, 0.022130966186523438, 0.023252010345458984, 0.02437305450439453, 0.025494098663330078, 0.026615142822265625, 0.027736186981201172, 0.02885723114013672, 0.029978275299072266, 0.031099319458007812, 0.03222036361694336, 0.033341407775878906, 0.03446245193481445, 0.03558349609375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 11.0, 14.0, 16.0, 14.0, 18.0, 31.0, 12.0, 27.0, 23.0, 34.0, 41.0, 38.0, 40.0, 44.0, 52.0, 49.0, 53.0, 48.0, 42.0, 40.0, 37.0, 38.0, 43.0, 30.0, 28.0, 23.0, 22.0, 15.0, 20.0, 15.0, 7.0, 14.0, 13.0, 10.0, 8.0, 7.0, 2.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.80419921875, -0.7788848876953125, -0.753570556640625, -0.7282562255859375, -0.70294189453125, -0.6776275634765625, -0.652313232421875, -0.6269989013671875, -0.6016845703125, -0.5763702392578125, -0.551055908203125, -0.5257415771484375, -0.50042724609375, -0.4751129150390625, -0.449798583984375, -0.4244842529296875, -0.399169921875, -0.3738555908203125, -0.348541259765625, -0.3232269287109375, -0.29791259765625, -0.2725982666015625, -0.247283935546875, -0.2219696044921875, -0.1966552734375, -0.1713409423828125, -0.146026611328125, -0.1207122802734375, -0.09539794921875, -0.0700836181640625, -0.044769287109375, -0.0194549560546875, 0.005859375, 0.0311737060546875, 0.056488037109375, 0.0818023681640625, 0.10711669921875, 0.1324310302734375, 0.157745361328125, 0.1830596923828125, 0.2083740234375, 0.2336883544921875, 0.259002685546875, 0.2843170166015625, 0.30963134765625, 0.3349456787109375, 0.360260009765625, 0.3855743408203125, 0.410888671875, 0.4362030029296875, 0.461517333984375, 0.4868316650390625, 0.51214599609375, 0.5374603271484375, 0.562774658203125, 0.5880889892578125, 0.6134033203125, 0.6387176513671875, 0.664031982421875, 0.6893463134765625, 0.71466064453125, 0.7399749755859375, 0.765289306640625, 0.7906036376953125, 0.81591796875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 7.0, 19.0, 17.0, 27.0, 42.0, 73.0, 101.0, 130.0, 283.0, 426.0, 872.0, 2138.0, 6830.0, 27656.0, 173535.0, 648626.0, 152581.0, 25188.0, 6292.0, 2017.0, 801.0, 374.0, 223.0, 101.0, 66.0, 43.0, 27.0, 29.0, 6.0, 8.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01503753662109375, -0.014588236808776855, -0.014138936996459961, -0.013689637184143066, -0.013240337371826172, -0.012791037559509277, -0.012341737747192383, -0.011892437934875488, -0.011443138122558594, -0.0109938383102417, -0.010544538497924805, -0.01009523868560791, -0.009645938873291016, -0.009196639060974121, -0.008747339248657227, -0.008298039436340332, -0.007848739624023438, -0.007399439811706543, -0.0069501399993896484, -0.006500840187072754, -0.006051540374755859, -0.005602240562438965, -0.00515294075012207, -0.004703640937805176, -0.004254341125488281, -0.0038050413131713867, -0.003355741500854492, -0.0029064416885375977, -0.002457141876220703, -0.0020078420639038086, -0.001558542251586914, -0.0011092424392700195, -0.000659942626953125, -0.00021064281463623047, 0.00023865699768066406, 0.0006879568099975586, 0.0011372566223144531, 0.0015865564346313477, 0.002035856246948242, 0.0024851560592651367, 0.0029344558715820312, 0.0033837556838989258, 0.0038330554962158203, 0.004282355308532715, 0.004731655120849609, 0.005180954933166504, 0.0056302547454833984, 0.006079554557800293, 0.0065288543701171875, 0.006978154182434082, 0.0074274539947509766, 0.007876753807067871, 0.008326053619384766, 0.00877535343170166, 0.009224653244018555, 0.00967395305633545, 0.010123252868652344, 0.010572552680969238, 0.011021852493286133, 0.011471152305603027, 0.011920452117919922, 0.012369751930236816, 0.012819051742553711, 0.013268351554870605, 0.0137176513671875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 6.0, 6.0, 8.0, 7.0, 11.0, 5.0, 14.0, 24.0, 33.0, 40.0, 56.0, 64.0, 108.0, 113.0, 125.0, 94.0, 72.0, 62.0, 38.0, 33.0, 24.0, 19.0, 8.0, 11.0, 8.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.5139579772949219e-05, -1.4482066035270691e-05, -1.3824552297592163e-05, -1.3167038559913635e-05, -1.2509524822235107e-05, -1.185201108455658e-05, -1.1194497346878052e-05, -1.0536983609199524e-05, -9.879469871520996e-06, -9.221956133842468e-06, -8.56444239616394e-06, -7.906928658485413e-06, -7.249414920806885e-06, -6.591901183128357e-06, -5.934387445449829e-06, -5.276873707771301e-06, -4.6193599700927734e-06, -3.961846232414246e-06, -3.3043324947357178e-06, -2.64681875705719e-06, -1.989305019378662e-06, -1.3317912817001343e-06, -6.742775440216064e-07, -1.6763806343078613e-08, 6.407499313354492e-07, 1.298263669013977e-06, 1.955777406692505e-06, 2.6132911443710327e-06, 3.2708048820495605e-06, 3.928318619728088e-06, 4.585832357406616e-06, 5.243346095085144e-06, 5.900859832763672e-06, 6.5583735704422e-06, 7.2158873081207275e-06, 7.873401045799255e-06, 8.530914783477783e-06, 9.188428521156311e-06, 9.845942258834839e-06, 1.0503455996513367e-05, 1.1160969734191895e-05, 1.1818483471870422e-05, 1.247599720954895e-05, 1.3133510947227478e-05, 1.3791024684906006e-05, 1.4448538422584534e-05, 1.5106052160263062e-05, 1.576356589794159e-05, 1.6421079635620117e-05, 1.7078593373298645e-05, 1.7736107110977173e-05, 1.83936208486557e-05, 1.905113458633423e-05, 1.9708648324012756e-05, 2.0366162061691284e-05, 2.1023675799369812e-05, 2.168118953704834e-05, 2.2338703274726868e-05, 2.2996217012405396e-05, 2.3653730750083923e-05, 2.431124448776245e-05, 2.496875822544098e-05, 2.5626271963119507e-05, 2.6283785700798035e-05, 2.6941299438476562e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 16.0, 13.0, 13.0, 29.0, 38.0, 76.0, 126.0, 238.0, 463.0, 902.0, 2454.0, 8983.0, 53737.0, 525358.0, 404500.0, 40555.0, 7266.0, 2064.0, 778.0, 406.0, 214.0, 133.0, 78.0, 42.0, 26.0, 15.0, 4.0, 3.0, 2.0, 4.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01222991943359375, -0.011739373207092285, -0.01124882698059082, -0.010758280754089355, -0.01026773452758789, -0.009777188301086426, -0.009286642074584961, -0.008796095848083496, -0.008305549621582031, -0.007815003395080566, -0.0073244571685791016, -0.006833910942077637, -0.006343364715576172, -0.005852818489074707, -0.005362272262573242, -0.004871726036071777, -0.0043811798095703125, -0.0038906335830688477, -0.003400087356567383, -0.002909541130065918, -0.002418994903564453, -0.0019284486770629883, -0.0014379024505615234, -0.0009473562240600586, -0.00045680999755859375, 3.3736228942871094e-05, 0.0005242824554443359, 0.0010148286819458008, 0.0015053749084472656, 0.0019959211349487305, 0.0024864673614501953, 0.00297701358795166, 0.003467559814453125, 0.00395810604095459, 0.004448652267456055, 0.0049391984939575195, 0.005429744720458984, 0.005920290946960449, 0.006410837173461914, 0.006901383399963379, 0.007391929626464844, 0.007882475852966309, 0.008373022079467773, 0.008863568305969238, 0.009354114532470703, 0.009844660758972168, 0.010335206985473633, 0.010825753211975098, 0.011316299438476562, 0.011806845664978027, 0.012297391891479492, 0.012787938117980957, 0.013278484344482422, 0.013769030570983887, 0.014259576797485352, 0.014750123023986816, 0.015240669250488281, 0.015731215476989746, 0.01622176170349121, 0.016712307929992676, 0.01720285415649414, 0.017693400382995605, 0.01818394660949707, 0.018674492835998535, 0.0191650390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 10.0, 4.0, 8.0, 4.0, 15.0, 22.0, 30.0, 42.0, 55.0, 37.0, 67.0, 91.0, 98.0, 91.0, 83.0, 79.0, 70.0, 57.0, 34.0, 25.0, 20.0, 14.0, 15.0, 5.0, 9.0, 5.0, 6.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0033779144287109375, -0.0032819509506225586, -0.0031859874725341797, -0.0030900239944458008, -0.002994060516357422, -0.002898097038269043, -0.002802133560180664, -0.002706170082092285, -0.0026102066040039062, -0.0025142431259155273, -0.0024182796478271484, -0.0023223161697387695, -0.0022263526916503906, -0.0021303892135620117, -0.002034425735473633, -0.001938462257385254, -0.001842498779296875, -0.001746535301208496, -0.0016505718231201172, -0.0015546083450317383, -0.0014586448669433594, -0.0013626813888549805, -0.0012667179107666016, -0.0011707544326782227, -0.0010747909545898438, -0.0009788274765014648, -0.0008828639984130859, -0.000786900520324707, -0.0006909370422363281, -0.0005949735641479492, -0.0004990100860595703, -0.0004030466079711914, -0.0003070831298828125, -0.0002111196517944336, -0.00011515617370605469, -1.919269561767578e-05, 7.677078247070312e-05, 0.00017273426055908203, 0.00026869773864746094, 0.00036466121673583984, 0.00046062469482421875, 0.0005565881729125977, 0.0006525516510009766, 0.0007485151290893555, 0.0008444786071777344, 0.0009404420852661133, 0.0010364055633544922, 0.001132369041442871, 0.00122833251953125, 0.001324295997619629, 0.0014202594757080078, 0.0015162229537963867, 0.0016121864318847656, 0.0017081499099731445, 0.0018041133880615234, 0.0019000768661499023, 0.0019960403442382812, 0.00209200382232666, 0.002187967300415039, 0.002283930778503418, 0.002379894256591797, 0.0024758577346801758, 0.0025718212127685547, 0.0026677846908569336, 0.0027637481689453125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 3.0, 12.0, 14.0, 26.0, 37.0, 84.0, 134.0, 230.0, 191.0, 112.0, 71.0, 47.0, 18.0, 11.0, 8.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3113785982131958, -1.2737228870391846, -1.236067295074463, -1.1984115839004517, -1.1607558727264404, -1.1231001615524292, -1.085444450378418, -1.0477888584136963, -1.010133147239685, -0.9724774360656738, -0.9348217844963074, -0.8971661329269409, -0.8595104217529297, -0.8218547105789185, -0.784199059009552, -0.7465434074401855, -0.7088876962661743, -0.6712319850921631, -0.6335763335227966, -0.5959206819534302, -0.558264970779419, -0.5206092596054077, -0.48295360803604126, -0.4452979266643524, -0.4076422452926636, -0.36998656392097473, -0.3323308825492859, -0.29467520117759705, -0.2570195198059082, -0.21936383843421936, -0.18170815706253052, -0.14405247569084167, -0.10639667510986328, -0.06874099373817444, -0.031085312366485596, 0.006570369005203247, 0.04422605037689209, 0.08188173174858093, 0.11953741312026978, 0.15719309449195862, 0.19484877586364746, 0.2325044572353363, 0.27016013860702515, 0.307815819978714, 0.34547150135040283, 0.3831271827220917, 0.4207828640937805, 0.45843854546546936, 0.4960942268371582, 0.5337499380111694, 0.5714055895805359, 0.6090612411499023, 0.6467169523239136, 0.6843726634979248, 0.7220283150672913, 0.7596839666366577, 0.797339677810669, 0.8349953889846802, 0.8726510405540466, 0.9103066921234131, 0.9479624032974243, 0.9856181144714355, 1.0232737064361572, 1.0609294176101685, 1.0985851287841797]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 10.0, 11.0, 11.0, 25.0, 42.0, 35.0, 47.0, 49.0, 64.0, 73.0, 81.0, 88.0, 87.0, 76.0, 71.0, 51.0, 50.0, 36.0, 26.0, 26.0, 17.0, 9.0, 8.0, 9.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.563001275062561, -0.5409615635871887, -0.5189219117164612, -0.49688220024108887, -0.47484254837036133, -0.452802836894989, -0.4307631552219391, -0.40872347354888916, -0.38668379187583923, -0.3646441102027893, -0.3426044285297394, -0.32056474685668945, -0.29852503538131714, -0.2764853835105896, -0.2544456720352173, -0.23240599036216736, -0.21036630868911743, -0.1883266270160675, -0.16628694534301758, -0.14424724876880646, -0.12220756709575653, -0.1001678854227066, -0.07812818884849548, -0.05608850717544556, -0.03404882550239563, -0.012009140104055405, 0.01003054529428482, 0.032070234417915344, 0.05410991609096527, 0.0761495977640152, 0.09818929433822632, 0.12022897601127625, 0.1422685980796814, 0.16430827975273132, 0.18634796142578125, 0.20838765799999237, 0.2304273396730423, 0.2524670362472534, 0.27450671792030334, 0.29654639959335327, 0.3185860812664032, 0.3406257629394531, 0.36266544461250305, 0.384705126285553, 0.4067448377609253, 0.42878448963165283, 0.45082420110702515, 0.4728638827800751, 0.494903564453125, 0.5169432759284973, 0.5389829277992249, 0.5610226392745972, 0.5830622911453247, 0.605102002620697, 0.6271417140960693, 0.6491813659667969, 0.6712210178375244, 0.6932607293128967, 0.7153003811836243, 0.7373400926589966, 0.7593797445297241, 0.7814194560050964, 0.8034591674804688, 0.8254988193511963, 0.8475385308265686]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 12.0, 11.0, 18.0, 23.0, 29.0, 45.0, 62.0, 67.0, 132.0, 193.0, 278.0, 433.0, 632.0, 1037.0, 1729.0, 2821.0, 5121.0, 10679.0, 27767.0, 133715.0, 666360.0, 144217.0, 29330.0, 10922.0, 5297.0, 2953.0, 1757.0, 1029.0, 596.0, 411.0, 290.0, 173.0, 118.0, 76.0, 50.0, 35.0, 39.0, 19.0, 21.0, 14.0, 11.0, 7.0, 5.0, 3.0, 7.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.30322265625, -0.29360198974609375, -0.2839813232421875, -0.27436065673828125, -0.264739990234375, -0.25511932373046875, -0.2454986572265625, -0.23587799072265625, -0.22625732421875, -0.21663665771484375, -0.2070159912109375, -0.19739532470703125, -0.187774658203125, -0.17815399169921875, -0.1685333251953125, -0.15891265869140625, -0.1492919921875, -0.13967132568359375, -0.1300506591796875, -0.12042999267578125, -0.110809326171875, -0.10118865966796875, -0.0915679931640625, -0.08194732666015625, -0.07232666015625, -0.06270599365234375, -0.0530853271484375, -0.04346466064453125, -0.033843994140625, -0.02422332763671875, -0.0146026611328125, -0.00498199462890625, 0.004638671875, 0.01425933837890625, 0.0238800048828125, 0.03350067138671875, 0.043121337890625, 0.05274200439453125, 0.0623626708984375, 0.07198333740234375, 0.08160400390625, 0.09122467041015625, 0.1008453369140625, 0.11046600341796875, 0.120086669921875, 0.12970733642578125, 0.1393280029296875, 0.14894866943359375, 0.1585693359375, 0.16819000244140625, 0.1778106689453125, 0.18743133544921875, 0.197052001953125, 0.20667266845703125, 0.2162933349609375, 0.22591400146484375, 0.23553466796875, 0.24515533447265625, 0.2547760009765625, 0.26439666748046875, 0.274017333984375, 0.28363800048828125, 0.2932586669921875, 0.30287933349609375, 0.3125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 2.0, 5.0, 5.0, 4.0, 8.0, 13.0, 27.0, 27.0, 16.0, 26.0, 32.0, 39.0, 41.0, 39.0, 46.0, 70.0, 56.0, 62.0, 59.0, 56.0, 64.0, 46.0, 40.0, 36.0, 41.0, 26.0, 22.0, 24.0, 12.0, 17.0, 11.0, 7.0, 2.0, 7.0, 3.0, 9.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.171875, -1.1406402587890625, -1.109405517578125, -1.0781707763671875, -1.04693603515625, -1.0157012939453125, -0.984466552734375, -0.9532318115234375, -0.9219970703125, -0.8907623291015625, -0.859527587890625, -0.8282928466796875, -0.79705810546875, -0.7658233642578125, -0.734588623046875, -0.7033538818359375, -0.672119140625, -0.6408843994140625, -0.609649658203125, -0.5784149169921875, -0.54718017578125, -0.5159454345703125, -0.484710693359375, -0.4534759521484375, -0.4222412109375, -0.3910064697265625, -0.359771728515625, -0.3285369873046875, -0.29730224609375, -0.2660675048828125, -0.234832763671875, -0.2035980224609375, -0.17236328125, -0.1411285400390625, -0.109893798828125, -0.0786590576171875, -0.04742431640625, -0.0161895751953125, 0.015045166015625, 0.0462799072265625, 0.0775146484375, 0.1087493896484375, 0.139984130859375, 0.1712188720703125, 0.20245361328125, 0.2336883544921875, 0.264923095703125, 0.2961578369140625, 0.327392578125, 0.3586273193359375, 0.389862060546875, 0.4210968017578125, 0.45233154296875, 0.4835662841796875, 0.514801025390625, 0.5460357666015625, 0.5772705078125, 0.6085052490234375, 0.639739990234375, 0.6709747314453125, 0.70220947265625, 0.7334442138671875, 0.764678955078125, 0.7959136962890625, 0.8271484375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 6.0, 11.0, 12.0, 11.0, 16.0, 22.0, 30.0, 45.0, 61.0, 109.0, 180.0, 333.0, 794.0, 2826.0, 21125.0, 961220.0, 55120.0, 4557.0, 1068.0, 441.0, 216.0, 119.0, 70.0, 52.0, 28.0, 24.0, 15.0, 19.0, 9.0, 7.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0693359375, -1.0375518798828125, -1.005767822265625, -0.9739837646484375, -0.94219970703125, -0.9104156494140625, -0.878631591796875, -0.8468475341796875, -0.8150634765625, -0.7832794189453125, -0.751495361328125, -0.7197113037109375, -0.68792724609375, -0.6561431884765625, -0.624359130859375, -0.5925750732421875, -0.560791015625, -0.5290069580078125, -0.497222900390625, -0.4654388427734375, -0.43365478515625, -0.4018707275390625, -0.370086669921875, -0.3383026123046875, -0.3065185546875, -0.2747344970703125, -0.242950439453125, -0.2111663818359375, -0.17938232421875, -0.1475982666015625, -0.115814208984375, -0.0840301513671875, -0.05224609375, -0.0204620361328125, 0.011322021484375, 0.0431060791015625, 0.07489013671875, 0.1066741943359375, 0.138458251953125, 0.1702423095703125, 0.2020263671875, 0.2338104248046875, 0.265594482421875, 0.2973785400390625, 0.32916259765625, 0.3609466552734375, 0.392730712890625, 0.4245147705078125, 0.456298828125, 0.4880828857421875, 0.519866943359375, 0.5516510009765625, 0.58343505859375, 0.6152191162109375, 0.647003173828125, 0.6787872314453125, 0.7105712890625, 0.7423553466796875, 0.774139404296875, 0.8059234619140625, 0.83770751953125, 0.8694915771484375, 0.901275634765625, 0.9330596923828125, 0.96484375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 7.0, 6.0, 12.0, 8.0, 16.0, 13.0, 30.0, 37.0, 28.0, 47.0, 59.0, 62.0, 84.0, 50.0, 84.0, 83.0, 74.0, 63.0, 49.0, 47.0, 41.0, 22.0, 25.0, 19.0, 12.0, 9.0, 12.0, 2.0, 7.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8466796875, -1.795928955078125, -1.74517822265625, -1.694427490234375, -1.6436767578125, -1.592926025390625, -1.54217529296875, -1.491424560546875, -1.440673828125, -1.389923095703125, -1.33917236328125, -1.288421630859375, -1.2376708984375, -1.186920166015625, -1.13616943359375, -1.085418701171875, -1.03466796875, -0.983917236328125, -0.93316650390625, -0.882415771484375, -0.8316650390625, -0.780914306640625, -0.73016357421875, -0.679412841796875, -0.628662109375, -0.577911376953125, -0.52716064453125, -0.476409912109375, -0.4256591796875, -0.374908447265625, -0.32415771484375, -0.273406982421875, -0.22265625, -0.171905517578125, -0.12115478515625, -0.070404052734375, -0.0196533203125, 0.031097412109375, 0.08184814453125, 0.132598876953125, 0.183349609375, 0.234100341796875, 0.28485107421875, 0.335601806640625, 0.3863525390625, 0.437103271484375, 0.48785400390625, 0.538604736328125, 0.58935546875, 0.640106201171875, 0.69085693359375, 0.741607666015625, 0.7923583984375, 0.843109130859375, 0.89385986328125, 0.944610595703125, 0.995361328125, 1.046112060546875, 1.09686279296875, 1.147613525390625, 1.1983642578125, 1.249114990234375, 1.29986572265625, 1.350616455078125, 1.4013671875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 7.0, 11.0, 22.0, 41.0, 83.0, 235.0, 796.0, 6319.0, 847000.0, 189470.0, 3637.0, 567.0, 198.0, 70.0, 38.0, 13.0, 13.0, 10.0, 3.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.40576171875, -0.3950538635253906, -0.38434600830078125, -0.3736381530761719, -0.3629302978515625, -0.3522224426269531, -0.34151458740234375, -0.3308067321777344, -0.320098876953125, -0.3093910217285156, -0.29868316650390625, -0.2879753112792969, -0.2772674560546875, -0.2665596008300781, -0.25585174560546875, -0.24514389038085938, -0.23443603515625, -0.22372817993164062, -0.21302032470703125, -0.20231246948242188, -0.1916046142578125, -0.18089675903320312, -0.17018890380859375, -0.15948104858398438, -0.148773193359375, -0.13806533813476562, -0.12735748291015625, -0.11664962768554688, -0.1059417724609375, -0.09523391723632812, -0.08452606201171875, -0.07381820678710938, -0.0631103515625, -0.052402496337890625, -0.04169464111328125, -0.030986785888671875, -0.0202789306640625, -0.009571075439453125, 0.00113677978515625, 0.011844635009765625, 0.022552490234375, 0.033260345458984375, 0.04396820068359375, 0.054676055908203125, 0.0653839111328125, 0.07609176635742188, 0.08679962158203125, 0.09750747680664062, 0.10821533203125, 0.11892318725585938, 0.12963104248046875, 0.14033889770507812, 0.1510467529296875, 0.16175460815429688, 0.17246246337890625, 0.18317031860351562, 0.193878173828125, 0.20458602905273438, 0.21529388427734375, 0.22600173950195312, 0.2367095947265625, 0.24741744995117188, 0.25812530517578125, 0.2688331604003906, 0.279541015625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 6.0, 3.0, 7.0, 6.0, 12.0, 17.0, 13.0, 30.0, 51.0, 105.0, 166.0, 256.0, 126.0, 59.0, 41.0, 30.0, 20.0, 16.0, 11.0, 5.0, 8.0, 6.0, 2.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.777576446533203e-05, -2.7134083211421967e-05, -2.6492401957511902e-05, -2.5850720703601837e-05, -2.5209039449691772e-05, -2.4567358195781708e-05, -2.3925676941871643e-05, -2.328399568796158e-05, -2.2642314434051514e-05, -2.200063318014145e-05, -2.1358951926231384e-05, -2.071727067232132e-05, -2.0075589418411255e-05, -1.943390816450119e-05, -1.8792226910591125e-05, -1.815054565668106e-05, -1.7508864402770996e-05, -1.686718314886093e-05, -1.6225501894950867e-05, -1.5583820641040802e-05, -1.4942139387130737e-05, -1.4300458133220673e-05, -1.3658776879310608e-05, -1.3017095625400543e-05, -1.2375414371490479e-05, -1.1733733117580414e-05, -1.1092051863670349e-05, -1.0450370609760284e-05, -9.80868935585022e-06, -9.167008101940155e-06, -8.52532684803009e-06, -7.883645594120026e-06, -7.241964340209961e-06, -6.600283086299896e-06, -5.9586018323898315e-06, -5.316920578479767e-06, -4.675239324569702e-06, -4.0335580706596375e-06, -3.3918768167495728e-06, -2.750195562839508e-06, -2.1085143089294434e-06, -1.4668330550193787e-06, -8.25151801109314e-07, -1.8347054719924927e-07, 4.5821070671081543e-07, 1.0998919606208801e-06, 1.7415732145309448e-06, 2.3832544684410095e-06, 3.0249357223510742e-06, 3.666616976261139e-06, 4.308298230171204e-06, 4.949979484081268e-06, 5.591660737991333e-06, 6.233341991901398e-06, 6.875023245811462e-06, 7.516704499721527e-06, 8.158385753631592e-06, 8.800067007541656e-06, 9.441748261451721e-06, 1.0083429515361786e-05, 1.072511076927185e-05, 1.1366792023181915e-05, 1.200847327709198e-05, 1.2650154531002045e-05, 1.329183578491211e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 10.0, 5.0, 9.0, 26.0, 46.0, 73.0, 144.0, 324.0, 785.0, 3052.0, 39162.0, 968373.0, 32395.0, 2801.0, 753.0, 285.0, 142.0, 66.0, 32.0, 28.0, 12.0, 6.0, 3.0, 8.0, 4.0, 6.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.26220703125, -0.25266265869140625, -0.2431182861328125, -0.23357391357421875, -0.224029541015625, -0.21448516845703125, -0.2049407958984375, -0.19539642333984375, -0.18585205078125, -0.17630767822265625, -0.1667633056640625, -0.15721893310546875, -0.147674560546875, -0.13813018798828125, -0.1285858154296875, -0.11904144287109375, -0.1094970703125, -0.09995269775390625, -0.0904083251953125, -0.08086395263671875, -0.071319580078125, -0.06177520751953125, -0.0522308349609375, -0.04268646240234375, -0.03314208984375, -0.02359771728515625, -0.0140533447265625, -0.00450897216796875, 0.005035400390625, 0.01457977294921875, 0.0241241455078125, 0.03366851806640625, 0.043212890625, 0.05275726318359375, 0.0623016357421875, 0.07184600830078125, 0.081390380859375, 0.09093475341796875, 0.1004791259765625, 0.11002349853515625, 0.11956787109375, 0.12911224365234375, 0.1386566162109375, 0.14820098876953125, 0.157745361328125, 0.16728973388671875, 0.1768341064453125, 0.18637847900390625, 0.1959228515625, 0.20546722412109375, 0.2150115966796875, 0.22455596923828125, 0.234100341796875, 0.24364471435546875, 0.2531890869140625, 0.26273345947265625, 0.27227783203125, 0.28182220458984375, 0.2913665771484375, 0.30091094970703125, 0.310455322265625, 0.31999969482421875, 0.3295440673828125, 0.33908843994140625, 0.3486328125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 3.0, 9.0, 6.0, 8.0, 10.0, 19.0, 32.0, 44.0, 92.0, 134.0, 278.0, 142.0, 79.0, 56.0, 32.0, 17.0, 9.0, 8.0, 10.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1051025390625, -0.10256576538085938, -0.10002899169921875, -0.09749221801757812, -0.0949554443359375, -0.09241867065429688, -0.08988189697265625, -0.08734512329101562, -0.084808349609375, -0.08227157592773438, -0.07973480224609375, -0.07719802856445312, -0.0746612548828125, -0.07212448120117188, -0.06958770751953125, -0.06705093383789062, -0.06451416015625, -0.061977386474609375, -0.05944061279296875, -0.056903839111328125, -0.0543670654296875, -0.051830291748046875, -0.04929351806640625, -0.046756744384765625, -0.044219970703125, -0.041683197021484375, -0.03914642333984375, -0.036609649658203125, -0.0340728759765625, -0.031536102294921875, -0.02899932861328125, -0.026462554931640625, -0.02392578125, -0.021389007568359375, -0.01885223388671875, -0.016315460205078125, -0.0137786865234375, -0.011241912841796875, -0.00870513916015625, -0.006168365478515625, -0.003631591796875, -0.001094818115234375, 0.00144195556640625, 0.003978729248046875, 0.0065155029296875, 0.009052276611328125, 0.01158905029296875, 0.014125823974609375, 0.01666259765625, 0.019199371337890625, 0.02173614501953125, 0.024272918701171875, 0.0268096923828125, 0.029346466064453125, 0.03188323974609375, 0.034420013427734375, 0.036956787109375, 0.039493560791015625, 0.04203033447265625, 0.044567108154296875, 0.0471038818359375, 0.049640655517578125, 0.05217742919921875, 0.054714202880859375, 0.0572509765625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 7.0, 5.0, 10.0, 10.0, 9.0, 9.0, 15.0, 10.0, 29.0, 26.0, 28.0, 35.0, 62.0, 69.0, 76.0, 82.0, 83.0, 70.0, 61.0, 66.0, 50.0, 28.0, 34.0, 25.0, 21.0, 11.0, 23.0, 9.0, 2.0, 7.0, 6.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8745756149291992, -0.8464668989181519, -0.8183581233024597, -0.7902494072914124, -0.7621406316757202, -0.7340319156646729, -0.7059231996536255, -0.6778144836425781, -0.649705708026886, -0.6215969920158386, -0.5934882164001465, -0.5653795003890991, -0.5372707843780518, -0.5091620087623596, -0.48105329275131226, -0.4529445469379425, -0.42483580112457275, -0.396727055311203, -0.36861830949783325, -0.3405095934867859, -0.31240084767341614, -0.2842921018600464, -0.256183385848999, -0.22807464003562927, -0.19996589422225952, -0.17185714840888977, -0.1437484174966812, -0.11563967913389206, -0.0875309407711029, -0.059422194957733154, -0.0313134640455246, -0.00320473313331604, 0.024904072284698486, 0.05301281064748764, 0.0811215490102768, 0.10923028737306595, 0.1373390257358551, 0.16544777154922485, 0.1935565024614334, 0.22166523337364197, 0.24977397918701172, 0.27788272500038147, 0.3059914708137512, 0.3341001868247986, 0.36220893263816833, 0.3903176784515381, 0.41842639446258545, 0.4465351402759552, 0.47464388608932495, 0.5027526021003723, 0.5308613777160645, 0.5589700937271118, 0.5870788097381592, 0.6151875853538513, 0.6432963013648987, 0.6714050769805908, 0.6995137929916382, 0.7276225090026855, 0.7557312846183777, 0.783840000629425, 0.8119487762451172, 0.8400574922561646, 0.8681662082672119, 0.8962749242782593, 0.9243836998939514]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 9.0, 7.0, 16.0, 16.0, 21.0, 20.0, 26.0, 30.0, 35.0, 53.0, 50.0, 59.0, 49.0, 55.0, 52.0, 53.0, 52.0, 58.0, 43.0, 57.0, 42.0, 46.0, 35.0, 29.0, 16.0, 15.0, 18.0, 13.0, 11.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.043912887573242, -1.967638611793518, -1.891364336013794, -1.8150900602340698, -1.7388157844543457, -1.6625415086746216, -1.5862672328948975, -1.509993076324463, -1.4337186813354492, -1.357444405555725, -1.281170129776001, -1.2048958539962769, -1.1286215782165527, -1.0523473024368286, -0.9760730862617493, -0.8997988104820251, -0.8235245943069458, -0.7472503185272217, -0.6709760427474976, -0.5947017669677734, -0.5184274911880493, -0.4421532452106476, -0.36587899923324585, -0.28960472345352173, -0.2133304476737976, -0.1370561718940735, -0.06078191101551056, 0.015492349863052368, 0.09176662564277649, 0.1680409014225006, 0.24431514739990234, 0.32058942317962646, 0.3968636989593506, 0.4731379747390747, 0.5494122505187988, 0.625686526298523, 0.7019608020782471, 0.7782350778579712, 0.8545092940330505, 0.9307835698127747, 1.0070579051971436, 1.0833321809768677, 1.1596064567565918, 1.235880732536316, 1.31215500831604, 1.3884292840957642, 1.4647035598754883, 1.5409777164459229, 1.617251992225647, 1.693526268005371, 1.7698005437850952, 1.8460748195648193, 1.9223490953445435, 1.9986233711242676, 2.074897527694702, 2.151171922683716, 2.2274460792541504, 2.303720235824585, 2.3799946308135986, 2.456268787384033, 2.532543182373047, 2.6088173389434814, 2.685091733932495, 2.7613658905029297, 2.8376402854919434]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 11.0, 9.0, 13.0, 18.0, 29.0, 34.0, 59.0, 100.0, 123.0, 243.0, 358.0, 771.0, 1638.0, 4260.0, 16431.0, 252232.0, 3406726.0, 475302.0, 26940.0, 5220.0, 1866.0, 805.0, 417.0, 242.0, 137.0, 101.0, 55.0, 41.0, 39.0, 15.0, 17.0, 2.0, 9.0, 7.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2216796875, -1.178955078125, -1.13623046875, -1.093505859375, -1.05078125, -1.008056640625, -0.96533203125, -0.922607421875, -0.8798828125, -0.837158203125, -0.79443359375, -0.751708984375, -0.708984375, -0.666259765625, -0.62353515625, -0.580810546875, -0.5380859375, -0.495361328125, -0.45263671875, -0.409912109375, -0.3671875, -0.324462890625, -0.28173828125, -0.239013671875, -0.1962890625, -0.153564453125, -0.11083984375, -0.068115234375, -0.025390625, 0.017333984375, 0.06005859375, 0.102783203125, 0.1455078125, 0.188232421875, 0.23095703125, 0.273681640625, 0.31640625, 0.359130859375, 0.40185546875, 0.444580078125, 0.4873046875, 0.530029296875, 0.57275390625, 0.615478515625, 0.658203125, 0.700927734375, 0.74365234375, 0.786376953125, 0.8291015625, 0.871826171875, 0.91455078125, 0.957275390625, 1.0, 1.042724609375, 1.08544921875, 1.128173828125, 1.1708984375, 1.213623046875, 1.25634765625, 1.299072265625, 1.341796875, 1.384521484375, 1.42724609375, 1.469970703125, 1.5126953125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 1.0, 4.0, 5.0, 7.0, 11.0, 10.0, 16.0, 20.0, 27.0, 25.0, 41.0, 50.0, 51.0, 52.0, 64.0, 73.0, 67.0, 62.0, 69.0, 63.0, 41.0, 43.0, 56.0, 28.0, 19.0, 18.0, 23.0, 16.0, 15.0, 9.0, 4.0, 5.0, 5.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67529296875, -0.6533203125, -0.63134765625, -0.609375, -0.58740234375, -0.5654296875, -0.54345703125, -0.521484375, -0.49951171875, -0.4775390625, -0.45556640625, -0.43359375, -0.41162109375, -0.3896484375, -0.36767578125, -0.345703125, -0.32373046875, -0.3017578125, -0.27978515625, -0.2578125, -0.23583984375, -0.2138671875, -0.19189453125, -0.169921875, -0.14794921875, -0.1259765625, -0.10400390625, -0.08203125, -0.06005859375, -0.0380859375, -0.01611328125, 0.005859375, 0.02783203125, 0.0498046875, 0.07177734375, 0.09375, 0.11572265625, 0.1376953125, 0.15966796875, 0.181640625, 0.20361328125, 0.2255859375, 0.24755859375, 0.26953125, 0.29150390625, 0.3134765625, 0.33544921875, 0.357421875, 0.37939453125, 0.4013671875, 0.42333984375, 0.4453125, 0.46728515625, 0.4892578125, 0.51123046875, 0.533203125, 0.55517578125, 0.5771484375, 0.59912109375, 0.62109375, 0.64306640625, 0.6650390625, 0.68701171875, 0.708984375, 0.73095703125]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 7.0, 5.0, 7.0, 8.0, 12.0, 16.0, 30.0, 43.0, 114.0, 319.0, 996.0, 4767.0, 49756.0, 4038241.0, 91412.0, 6754.0, 1193.0, 325.0, 142.0, 65.0, 29.0, 16.0, 8.0, 7.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.984375, -2.90496826171875, -2.8255615234375, -2.74615478515625, -2.666748046875, -2.58734130859375, -2.5079345703125, -2.42852783203125, -2.34912109375, -2.26971435546875, -2.1903076171875, -2.11090087890625, -2.031494140625, -1.95208740234375, -1.8726806640625, -1.79327392578125, -1.7138671875, -1.63446044921875, -1.5550537109375, -1.47564697265625, -1.396240234375, -1.31683349609375, -1.2374267578125, -1.15802001953125, -1.07861328125, -0.99920654296875, -0.9197998046875, -0.84039306640625, -0.760986328125, -0.68157958984375, -0.6021728515625, -0.52276611328125, -0.443359375, -0.36395263671875, -0.2845458984375, -0.20513916015625, -0.125732421875, -0.04632568359375, 0.0330810546875, 0.11248779296875, 0.19189453125, 0.27130126953125, 0.3507080078125, 0.43011474609375, 0.509521484375, 0.58892822265625, 0.6683349609375, 0.74774169921875, 0.8271484375, 0.90655517578125, 0.9859619140625, 1.06536865234375, 1.144775390625, 1.22418212890625, 1.3035888671875, 1.38299560546875, 1.46240234375, 1.54180908203125, 1.6212158203125, 1.70062255859375, 1.780029296875, 1.85943603515625, 1.9388427734375, 2.01824951171875, 2.09765625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 6.0, 7.0, 7.0, 15.0, 8.0, 15.0, 13.0, 17.0, 31.0, 57.0, 88.0, 207.0, 500.0, 1073.0, 1096.0, 494.0, 185.0, 105.0, 53.0, 22.0, 23.0, 11.0, 11.0, 11.0, 7.0, 4.0, 5.0, 1.0, 3.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.47265625, -0.4583168029785156, -0.44397735595703125, -0.4296379089355469, -0.4152984619140625, -0.4009590148925781, -0.38661956787109375, -0.3722801208496094, -0.357940673828125, -0.3436012268066406, -0.32926177978515625, -0.3149223327636719, -0.3005828857421875, -0.2862434387207031, -0.27190399169921875, -0.2575645446777344, -0.24322509765625, -0.22888565063476562, -0.21454620361328125, -0.20020675659179688, -0.1858673095703125, -0.17152786254882812, -0.15718841552734375, -0.14284896850585938, -0.128509521484375, -0.11417007446289062, -0.09983062744140625, -0.08549118041992188, -0.0711517333984375, -0.056812286376953125, -0.04247283935546875, -0.028133392333984375, -0.0137939453125, 0.000545501708984375, 0.01488494873046875, 0.029224395751953125, 0.0435638427734375, 0.057903289794921875, 0.07224273681640625, 0.08658218383789062, 0.100921630859375, 0.11526107788085938, 0.12960052490234375, 0.14393997192382812, 0.1582794189453125, 0.17261886596679688, 0.18695831298828125, 0.20129776000976562, 0.21563720703125, 0.22997665405273438, 0.24431610107421875, 0.2586555480957031, 0.2729949951171875, 0.2873344421386719, 0.30167388916015625, 0.3160133361816406, 0.330352783203125, 0.3446922302246094, 0.35903167724609375, 0.3733711242675781, 0.3877105712890625, 0.4020500183105469, 0.41638946533203125, 0.4307289123535156, 0.445068359375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 1.0, 3.0, 4.0, 7.0, 8.0, 15.0, 18.0, 17.0, 17.0, 27.0, 40.0, 52.0, 51.0, 89.0, 82.0, 77.0, 91.0, 71.0, 58.0, 71.0, 45.0, 44.0, 26.0, 16.0, 18.0, 11.0, 14.0, 6.0, 4.0, 0.0, 8.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.803127646446228, -0.7754397988319397, -0.7477519512176514, -0.7200641632080078, -0.6923763155937195, -0.6646884679794312, -0.6370006203651428, -0.6093127727508545, -0.5816249847412109, -0.5539371371269226, -0.5262492895126343, -0.49856147170066833, -0.4708736538887024, -0.44318580627441406, -0.41549795866012573, -0.3878101408481598, -0.36012229323387146, -0.33243444561958313, -0.3047466278076172, -0.27705878019332886, -0.24937096238136292, -0.22168311476707458, -0.19399528205394745, -0.1663074493408203, -0.13861961662769318, -0.11093178391456604, -0.0832439512014389, -0.05555611103773117, -0.027868278324604034, -0.00018043816089630127, 0.027507394552230835, 0.05519522726535797, 0.08288305997848511, 0.11057089269161224, 0.13825872540473938, 0.1659465730190277, 0.19363439083099365, 0.22132223844528198, 0.24901007115840912, 0.27669790387153625, 0.3043857216835022, 0.3320735692977905, 0.35976138710975647, 0.3874492347240448, 0.41513705253601074, 0.4428249001502991, 0.4705127477645874, 0.49820056557655334, 0.5258884429931641, 0.5535762906074524, 0.5812641382217407, 0.6089519262313843, 0.6366397738456726, 0.6643276214599609, 0.6920154690742493, 0.7197033166885376, 0.7473911046981812, 0.7750789523124695, 0.8027667999267578, 0.8304545879364014, 0.8581424355506897, 0.885830283164978, 0.9135181307792664, 0.9412059783935547, 0.9688937664031982]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 6.0, 4.0, 7.0, 3.0, 9.0, 12.0, 13.0, 13.0, 28.0, 14.0, 17.0, 29.0, 35.0, 33.0, 33.0, 39.0, 33.0, 54.0, 41.0, 43.0, 45.0, 54.0, 45.0, 38.0, 38.0, 43.0, 37.0, 27.0, 19.0, 19.0, 21.0, 28.0, 21.0, 16.0, 23.0, 13.0, 14.0, 7.0, 7.0, 10.0, 1.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5212469696998596, -0.5023834705352783, -0.4835200011730194, -0.4646565318107605, -0.4457930326461792, -0.4269295632839203, -0.4080660939216614, -0.3892025947570801, -0.37033912539482117, -0.35147565603256226, -0.33261215686798096, -0.31374868750572205, -0.29488521814346313, -0.27602171897888184, -0.2571582496166229, -0.23829476535320282, -0.21943128108978271, -0.2005677968263626, -0.1817043125629425, -0.1628408432006836, -0.1439773589372635, -0.12511387467384338, -0.10625039786100388, -0.08738692104816437, -0.06852343678474426, -0.049659956246614456, -0.03079647570848465, -0.011932995170354843, 0.006930485367774963, 0.02579396963119507, 0.044657446444034576, 0.06352092325687408, 0.08238440752029419, 0.1012478917837143, 0.1201113685965538, 0.1389748454093933, 0.15783832967281342, 0.17670181393623352, 0.19556528329849243, 0.21442876756191254, 0.23329225182533264, 0.25215572118759155, 0.27101922035217285, 0.28988268971443176, 0.3087461590766907, 0.327609658241272, 0.3464731276035309, 0.3653365969657898, 0.3842000961303711, 0.40306356549263, 0.4219270646572113, 0.4407905340194702, 0.4596540331840515, 0.4785175025463104, 0.49738097190856934, 0.5162444710731506, 0.5351079702377319, 0.5539714694023132, 0.5728349089622498, 0.591698408126831, 0.6105619072914124, 0.6294254064559937, 0.6482888460159302, 0.6671523451805115, 0.686015784740448]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 12.0, 17.0, 24.0, 24.0, 58.0, 59.0, 110.0, 135.0, 230.0, 379.0, 589.0, 976.0, 1629.0, 2816.0, 5382.0, 11018.0, 23546.0, 57641.0, 178040.0, 460682.0, 194180.0, 61542.0, 25122.0, 11526.0, 5570.0, 2972.0, 1652.0, 961.0, 592.0, 369.0, 237.0, 130.0, 101.0, 72.0, 50.0, 36.0, 19.0, 17.0, 12.0, 13.0, 4.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10882568359375, -0.10558032989501953, -0.10233497619628906, -0.0990896224975586, -0.09584426879882812, -0.09259891510009766, -0.08935356140136719, -0.08610820770263672, -0.08286285400390625, -0.07961750030517578, -0.07637214660644531, -0.07312679290771484, -0.06988143920898438, -0.0666360855102539, -0.06339073181152344, -0.06014537811279297, -0.0569000244140625, -0.05365467071533203, -0.05040931701660156, -0.047163963317871094, -0.043918609619140625, -0.040673255920410156, -0.03742790222167969, -0.03418254852294922, -0.03093719482421875, -0.02769184112548828, -0.024446487426757812, -0.021201133728027344, -0.017955780029296875, -0.014710426330566406, -0.011465072631835938, -0.008219718933105469, -0.004974365234375, -0.0017290115356445312, 0.0015163421630859375, 0.004761695861816406, 0.008007049560546875, 0.011252403259277344, 0.014497756958007812, 0.01774311065673828, 0.02098846435546875, 0.02423381805419922, 0.027479171752929688, 0.030724525451660156, 0.033969879150390625, 0.037215232849121094, 0.04046058654785156, 0.04370594024658203, 0.0469512939453125, 0.05019664764404297, 0.05344200134277344, 0.056687355041503906, 0.059932708740234375, 0.06317806243896484, 0.06642341613769531, 0.06966876983642578, 0.07291412353515625, 0.07615947723388672, 0.07940483093261719, 0.08265018463134766, 0.08589553833007812, 0.0891408920288086, 0.09238624572753906, 0.09563159942626953, 0.098876953125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 4.0, 6.0, 7.0, 7.0, 12.0, 16.0, 20.0, 24.0, 29.0, 30.0, 27.0, 44.0, 39.0, 42.0, 44.0, 51.0, 61.0, 54.0, 51.0, 47.0, 50.0, 48.0, 41.0, 32.0, 18.0, 29.0, 22.0, 24.0, 22.0, 16.0, 24.0, 15.0, 8.0, 7.0, 5.0, 4.0, 7.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.466064453125, -0.4521942138671875, -0.438323974609375, -0.4244537353515625, -0.41058349609375, -0.3967132568359375, -0.382843017578125, -0.3689727783203125, -0.3551025390625, -0.3412322998046875, -0.327362060546875, -0.3134918212890625, -0.29962158203125, -0.2857513427734375, -0.271881103515625, -0.2580108642578125, -0.244140625, -0.2302703857421875, -0.216400146484375, -0.2025299072265625, -0.18865966796875, -0.1747894287109375, -0.160919189453125, -0.1470489501953125, -0.1331787109375, -0.1193084716796875, -0.105438232421875, -0.0915679931640625, -0.07769775390625, -0.0638275146484375, -0.049957275390625, -0.0360870361328125, -0.022216796875, -0.0083465576171875, 0.005523681640625, 0.0193939208984375, 0.03326416015625, 0.0471343994140625, 0.061004638671875, 0.0748748779296875, 0.0887451171875, 0.1026153564453125, 0.116485595703125, 0.1303558349609375, 0.14422607421875, 0.1580963134765625, 0.171966552734375, 0.1858367919921875, 0.19970703125, 0.2135772705078125, 0.227447509765625, 0.2413177490234375, 0.25518798828125, 0.2690582275390625, 0.282928466796875, 0.2967987060546875, 0.3106689453125, 0.3245391845703125, 0.338409423828125, 0.3522796630859375, 0.36614990234375, 0.3800201416015625, 0.393890380859375, 0.4077606201171875, 0.421630859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 6.0, 3.0, 9.0, 9.0, 17.0, 18.0, 28.0, 56.0, 72.0, 109.0, 165.0, 263.0, 399.0, 663.0, 1059.0, 1684.0, 2834.0, 4607.0, 8057.0, 14258.0, 27161.0, 54709.0, 116224.0, 239283.0, 279198.0, 150997.0, 70192.0, 34843.0, 17741.0, 9771.0, 5568.0, 3227.0, 2029.0, 1193.0, 753.0, 469.0, 286.0, 188.0, 120.0, 97.0, 56.0, 45.0, 29.0, 25.0, 8.0, 16.0, 8.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.04693603515625, -0.04543018341064453, -0.04392433166503906, -0.042418479919433594, -0.040912628173828125, -0.039406776428222656, -0.03790092468261719, -0.03639507293701172, -0.03488922119140625, -0.03338336944580078, -0.03187751770019531, -0.030371665954589844, -0.028865814208984375, -0.027359962463378906, -0.025854110717773438, -0.02434825897216797, -0.0228424072265625, -0.02133655548095703, -0.019830703735351562, -0.018324851989746094, -0.016819000244140625, -0.015313148498535156, -0.013807296752929688, -0.012301445007324219, -0.01079559326171875, -0.009289741516113281, -0.0077838897705078125, -0.006278038024902344, -0.004772186279296875, -0.0032663345336914062, -0.0017604827880859375, -0.00025463104248046875, 0.001251220703125, 0.0027570724487304688, 0.0042629241943359375, 0.005768775939941406, 0.007274627685546875, 0.008780479431152344, 0.010286331176757812, 0.011792182922363281, 0.01329803466796875, 0.014803886413574219, 0.016309738159179688, 0.017815589904785156, 0.019321441650390625, 0.020827293395996094, 0.022333145141601562, 0.02383899688720703, 0.0253448486328125, 0.02685070037841797, 0.028356552124023438, 0.029862403869628906, 0.031368255615234375, 0.032874107360839844, 0.03437995910644531, 0.03588581085205078, 0.03739166259765625, 0.03889751434326172, 0.04040336608886719, 0.041909217834472656, 0.043415069580078125, 0.044920921325683594, 0.04642677307128906, 0.04793262481689453, 0.0494384765625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 2.0, 8.0, 9.0, 5.0, 7.0, 13.0, 16.0, 17.0, 26.0, 33.0, 36.0, 45.0, 48.0, 34.0, 34.0, 55.0, 58.0, 57.0, 75.0, 48.0, 45.0, 45.0, 46.0, 38.0, 34.0, 41.0, 23.0, 23.0, 15.0, 13.0, 10.0, 6.0, 10.0, 7.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7822265625, -0.753875732421875, -0.72552490234375, -0.697174072265625, -0.6688232421875, -0.640472412109375, -0.61212158203125, -0.583770751953125, -0.555419921875, -0.527069091796875, -0.49871826171875, -0.470367431640625, -0.4420166015625, -0.413665771484375, -0.38531494140625, -0.356964111328125, -0.32861328125, -0.300262451171875, -0.27191162109375, -0.243560791015625, -0.2152099609375, -0.186859130859375, -0.15850830078125, -0.130157470703125, -0.101806640625, -0.073455810546875, -0.04510498046875, -0.016754150390625, 0.0115966796875, 0.039947509765625, 0.06829833984375, 0.096649169921875, 0.125, 0.153350830078125, 0.18170166015625, 0.210052490234375, 0.2384033203125, 0.266754150390625, 0.29510498046875, 0.323455810546875, 0.351806640625, 0.380157470703125, 0.40850830078125, 0.436859130859375, 0.4652099609375, 0.493560791015625, 0.52191162109375, 0.550262451171875, 0.57861328125, 0.606964111328125, 0.63531494140625, 0.663665771484375, 0.6920166015625, 0.720367431640625, 0.74871826171875, 0.777069091796875, 0.805419921875, 0.833770751953125, 0.86212158203125, 0.890472412109375, 0.9188232421875, 0.947174072265625, 0.97552490234375, 1.003875732421875, 1.0322265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 11.0, 1.0, 7.0, 13.0, 14.0, 27.0, 46.0, 49.0, 64.0, 106.0, 145.0, 249.0, 406.0, 624.0, 1106.0, 1978.0, 3805.0, 8107.0, 19797.0, 57224.0, 204055.0, 463058.0, 197044.0, 55828.0, 18939.0, 7441.0, 3591.0, 1850.0, 1151.0, 649.0, 406.0, 241.0, 176.0, 106.0, 82.0, 51.0, 33.0, 19.0, 21.0, 12.0, 11.0, 7.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007648468017578125, -0.007397592067718506, -0.007146716117858887, -0.006895840167999268, -0.0066449642181396484, -0.006394088268280029, -0.00614321231842041, -0.005892336368560791, -0.005641460418701172, -0.005390584468841553, -0.005139708518981934, -0.0048888325691223145, -0.004637956619262695, -0.004387080669403076, -0.004136204719543457, -0.003885328769683838, -0.0036344528198242188, -0.0033835768699645996, -0.0031327009201049805, -0.0028818249702453613, -0.002630949020385742, -0.002380073070526123, -0.002129197120666504, -0.0018783211708068848, -0.0016274452209472656, -0.0013765692710876465, -0.0011256933212280273, -0.0008748173713684082, -0.0006239414215087891, -0.0003730654716491699, -0.00012218952178955078, 0.00012868642807006836, 0.0003795623779296875, 0.0006304383277893066, 0.0008813142776489258, 0.001132190227508545, 0.001383066177368164, 0.0016339421272277832, 0.0018848180770874023, 0.0021356940269470215, 0.0023865699768066406, 0.0026374459266662598, 0.002888321876525879, 0.003139197826385498, 0.003390073776245117, 0.0036409497261047363, 0.0038918256759643555, 0.004142701625823975, 0.004393577575683594, 0.004644453525543213, 0.004895329475402832, 0.005146205425262451, 0.00539708137512207, 0.0056479573249816895, 0.005898833274841309, 0.006149709224700928, 0.006400585174560547, 0.006651461124420166, 0.006902337074279785, 0.007153213024139404, 0.0074040889739990234, 0.007654964923858643, 0.007905840873718262, 0.00815671682357788, 0.0084075927734375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 6.0, 11.0, 16.0, 28.0, 57.0, 95.0, 173.0, 200.0, 170.0, 94.0, 58.0, 40.0, 17.0, 11.0, 4.0, 5.0, 7.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.6312808990478516e-05, -4.5200809836387634e-05, -4.408881068229675e-05, -4.297681152820587e-05, -4.186481237411499e-05, -4.075281322002411e-05, -3.964081406593323e-05, -3.8528814911842346e-05, -3.7416815757751465e-05, -3.6304816603660583e-05, -3.51928174495697e-05, -3.408081829547882e-05, -3.296881914138794e-05, -3.185681998729706e-05, -3.074482083320618e-05, -2.9632821679115295e-05, -2.8520822525024414e-05, -2.7408823370933533e-05, -2.629682421684265e-05, -2.518482506275177e-05, -2.407282590866089e-05, -2.2960826754570007e-05, -2.1848827600479126e-05, -2.0736828446388245e-05, -1.9624829292297363e-05, -1.8512830138206482e-05, -1.74008309841156e-05, -1.628883183002472e-05, -1.5176832675933838e-05, -1.4064833521842957e-05, -1.2952834367752075e-05, -1.1840835213661194e-05, -1.0728836059570312e-05, -9.616836905479431e-06, -8.50483775138855e-06, -7.3928385972976685e-06, -6.280839443206787e-06, -5.168840289115906e-06, -4.056841135025024e-06, -2.944841980934143e-06, -1.8328428268432617e-06, -7.208436727523804e-07, 3.91155481338501e-07, 1.5031546354293823e-06, 2.6151537895202637e-06, 3.727152943611145e-06, 4.839152097702026e-06, 5.951151251792908e-06, 7.063150405883789e-06, 8.17514955997467e-06, 9.287148714065552e-06, 1.0399147868156433e-05, 1.1511147022247314e-05, 1.2623146176338196e-05, 1.3735145330429077e-05, 1.4847144484519958e-05, 1.595914363861084e-05, 1.707114279270172e-05, 1.8183141946792603e-05, 1.9295141100883484e-05, 2.0407140254974365e-05, 2.1519139409065247e-05, 2.2631138563156128e-05, 2.374313771724701e-05, 2.485513687133789e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 8.0, 10.0, 17.0, 22.0, 38.0, 45.0, 86.0, 132.0, 218.0, 363.0, 667.0, 1208.0, 2704.0, 6563.0, 19024.0, 69253.0, 343605.0, 465566.0, 99121.0, 25081.0, 8378.0, 3177.0, 1470.0, 756.0, 390.0, 236.0, 152.0, 79.0, 59.0, 33.0, 29.0, 13.0, 20.0, 8.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.011138916015625, -0.010830521583557129, -0.010522127151489258, -0.010213732719421387, -0.009905338287353516, -0.009596943855285645, -0.009288549423217773, -0.008980154991149902, -0.008671760559082031, -0.00836336612701416, -0.008054971694946289, -0.007746577262878418, -0.007438182830810547, -0.007129788398742676, -0.006821393966674805, -0.006512999534606934, -0.0062046051025390625, -0.005896210670471191, -0.00558781623840332, -0.005279421806335449, -0.004971027374267578, -0.004662632942199707, -0.004354238510131836, -0.004045844078063965, -0.0037374496459960938, -0.0034290552139282227, -0.0031206607818603516, -0.0028122663497924805, -0.0025038719177246094, -0.0021954774856567383, -0.0018870830535888672, -0.001578688621520996, -0.001270294189453125, -0.0009618997573852539, -0.0006535053253173828, -0.0003451108932495117, -3.6716461181640625e-05, 0.00027167797088623047, 0.0005800724029541016, 0.0008884668350219727, 0.0011968612670898438, 0.0015052556991577148, 0.001813650131225586, 0.002122044563293457, 0.002430438995361328, 0.0027388334274291992, 0.0030472278594970703, 0.0033556222915649414, 0.0036640167236328125, 0.003972411155700684, 0.004280805587768555, 0.004589200019836426, 0.004897594451904297, 0.005205988883972168, 0.005514383316040039, 0.00582277774810791, 0.006131172180175781, 0.006439566612243652, 0.0067479610443115234, 0.0070563554763793945, 0.007364749908447266, 0.007673144340515137, 0.007981538772583008, 0.008289933204650879, 0.00859832763671875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 1.0, 0.0, 4.0, 13.0, 4.0, 13.0, 5.0, 16.0, 21.0, 29.0, 32.0, 46.0, 53.0, 80.0, 72.0, 94.0, 105.0, 78.0, 77.0, 60.0, 47.0, 34.0, 28.0, 21.0, 15.0, 11.0, 12.0, 5.0, 10.0, 11.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022373199462890625, -0.002144843339920044, -0.0020523667335510254, -0.001959890127182007, -0.0018674135208129883, -0.0017749369144439697, -0.0016824603080749512, -0.0015899837017059326, -0.001497507095336914, -0.0014050304889678955, -0.001312553882598877, -0.0012200772762298584, -0.0011276006698608398, -0.0010351240634918213, -0.0009426474571228027, -0.0008501708507537842, -0.0007576942443847656, -0.0006652176380157471, -0.0005727410316467285, -0.00048026442527770996, -0.0003877878189086914, -0.00029531121253967285, -0.0002028346061706543, -0.00011035799980163574, -1.7881393432617188e-05, 7.459521293640137e-05, 0.00016707181930541992, 0.0002595484256744385, 0.00035202503204345703, 0.0004445016384124756, 0.0005369782447814941, 0.0006294548511505127, 0.0007219314575195312, 0.0008144080638885498, 0.0009068846702575684, 0.000999361276626587, 0.0010918378829956055, 0.001184314489364624, 0.0012767910957336426, 0.0013692677021026611, 0.0014617443084716797, 0.0015542209148406982, 0.0016466975212097168, 0.0017391741275787354, 0.001831650733947754, 0.0019241273403167725, 0.002016603946685791, 0.0021090805530548096, 0.002201557159423828, 0.0022940337657928467, 0.0023865103721618652, 0.002478986978530884, 0.0025714635848999023, 0.002663940191268921, 0.0027564167976379395, 0.002848893404006958, 0.0029413700103759766, 0.003033846616744995, 0.0031263232231140137, 0.0032187998294830322, 0.0033112764358520508, 0.0034037530422210693, 0.003496229648590088, 0.0035887062549591064, 0.003681182861328125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 10.0, 10.0, 20.0, 20.0, 37.0, 43.0, 69.0, 87.0, 112.0, 131.0, 108.0, 104.0, 63.0, 61.0, 37.0, 22.0, 16.0, 9.0, 7.0, 12.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8220674395561218, -0.7995972633361816, -0.7771270871162415, -0.7546569108963013, -0.7321867942810059, -0.7097166180610657, -0.6872464418411255, -0.6647762656211853, -0.6423060894012451, -0.6198359131813049, -0.5973657369613647, -0.5748955607414246, -0.5524253845214844, -0.529955267906189, -0.5074850916862488, -0.4850149154663086, -0.4625447392463684, -0.4400745630264282, -0.41760438680648804, -0.39513424038887024, -0.37266406416893005, -0.35019388794898987, -0.32772374153137207, -0.3052535653114319, -0.2827833890914917, -0.2603132128715515, -0.23784305155277252, -0.21537289023399353, -0.19290271401405334, -0.17043253779411316, -0.14796237647533417, -0.12549221515655518, -0.10302197933197021, -0.08055181056261063, -0.05808164179325104, -0.03561147302389145, -0.01314130425453186, 0.009328864514827728, 0.03179903328418732, 0.05426919460296631, 0.0767393708229065, 0.09920953959226608, 0.12167970836162567, 0.14414986968040466, 0.16662004590034485, 0.18909022212028503, 0.21156038343906403, 0.23403054475784302, 0.2565007209777832, 0.2789708971977234, 0.3014410734176636, 0.32391121983528137, 0.34638139605522156, 0.36885157227516174, 0.39132171869277954, 0.4137918949127197, 0.4362620711326599, 0.4587322473526001, 0.4812024235725403, 0.5036725997924805, 0.5261427164077759, 0.5486128926277161, 0.5710830688476562, 0.5935532450675964, 0.6160234212875366]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 3.0, 7.0, 4.0, 7.0, 18.0, 21.0, 23.0, 24.0, 24.0, 40.0, 41.0, 49.0, 42.0, 43.0, 71.0, 49.0, 55.0, 60.0, 51.0, 49.0, 55.0, 38.0, 20.0, 31.0, 26.0, 29.0, 26.0, 19.0, 17.0, 20.0, 13.0, 5.0, 3.0, 1.0, 7.0, 1.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4200538694858551, -0.4058607220649719, -0.39166760444641113, -0.37747445702552795, -0.3632813096046448, -0.349088191986084, -0.3348950445652008, -0.3207018971443176, -0.30650877952575684, -0.29231563210487366, -0.27812251448631287, -0.2639293670654297, -0.2497362345457077, -0.23554310202598572, -0.22134995460510254, -0.20715682208538055, -0.19296368956565857, -0.17877055704593658, -0.1645774245262146, -0.15038427710533142, -0.13619114458560944, -0.12199801206588745, -0.10780487209558487, -0.09361173212528229, -0.0794185996055603, -0.06522546708583832, -0.051032327115535736, -0.03683919087052345, -0.02264605462551117, -0.008452922105789185, 0.005740217864513397, 0.01993335783481598, 0.034126490354537964, 0.04831962659955025, 0.06251276284456253, 0.07670590281486511, 0.0908990353345871, 0.10509216785430908, 0.11928530782461166, 0.13347844779491425, 0.14767158031463623, 0.16186471283435822, 0.1760578453540802, 0.19025099277496338, 0.20444412529468536, 0.21863725781440735, 0.23283040523529053, 0.2470235377550125, 0.2612166702747345, 0.2754098176956177, 0.28960293531417847, 0.30379608273506165, 0.3179892301559448, 0.3321823477745056, 0.3463754951953888, 0.360568642616272, 0.37476176023483276, 0.38895490765571594, 0.40314802527427673, 0.4173411726951599, 0.4315342903137207, 0.4457274377346039, 0.45992058515548706, 0.47411370277404785, 0.48830685019493103]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 2.0, 8.0, 11.0, 12.0, 14.0, 16.0, 32.0, 32.0, 55.0, 81.0, 132.0, 237.0, 440.0, 877.0, 1911.0, 5376.0, 17793.0, 98181.0, 818443.0, 80912.0, 15598.0, 4725.0, 1808.0, 817.0, 394.0, 240.0, 128.0, 85.0, 48.0, 44.0, 17.0, 20.0, 15.0, 8.0, 9.0, 4.0, 4.0, 4.0, 2.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.5234375, -0.5086746215820312, -0.4939117431640625, -0.47914886474609375, -0.464385986328125, -0.44962310791015625, -0.4348602294921875, -0.42009735107421875, -0.40533447265625, -0.39057159423828125, -0.3758087158203125, -0.36104583740234375, -0.346282958984375, -0.33152008056640625, -0.3167572021484375, -0.30199432373046875, -0.2872314453125, -0.27246856689453125, -0.2577056884765625, -0.24294281005859375, -0.228179931640625, -0.21341705322265625, -0.1986541748046875, -0.18389129638671875, -0.16912841796875, -0.15436553955078125, -0.1396026611328125, -0.12483978271484375, -0.110076904296875, -0.09531402587890625, -0.0805511474609375, -0.06578826904296875, -0.051025390625, -0.03626251220703125, -0.0214996337890625, -0.00673675537109375, 0.008026123046875, 0.02278900146484375, 0.0375518798828125, 0.05231475830078125, 0.06707763671875, 0.08184051513671875, 0.0966033935546875, 0.11136627197265625, 0.126129150390625, 0.14089202880859375, 0.1556549072265625, 0.17041778564453125, 0.1851806640625, 0.19994354248046875, 0.2147064208984375, 0.22946929931640625, 0.244232177734375, 0.25899505615234375, 0.2737579345703125, 0.28852081298828125, 0.30328369140625, 0.31804656982421875, 0.3328094482421875, 0.34757232666015625, 0.362335205078125, 0.37709808349609375, 0.3918609619140625, 0.40662384033203125, 0.42138671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 1.0, 7.0, 7.0, 2.0, 12.0, 12.0, 22.0, 21.0, 20.0, 35.0, 31.0, 38.0, 36.0, 47.0, 51.0, 45.0, 53.0, 63.0, 79.0, 50.0, 39.0, 58.0, 44.0, 33.0, 34.0, 23.0, 17.0, 23.0, 14.0, 15.0, 16.0, 11.0, 16.0, 10.0, 4.0, 2.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.998046875, -0.9693145751953125, -0.940582275390625, -0.9118499755859375, -0.88311767578125, -0.8543853759765625, -0.825653076171875, -0.7969207763671875, -0.7681884765625, -0.7394561767578125, -0.710723876953125, -0.6819915771484375, -0.65325927734375, -0.6245269775390625, -0.595794677734375, -0.5670623779296875, -0.538330078125, -0.5095977783203125, -0.480865478515625, -0.4521331787109375, -0.42340087890625, -0.3946685791015625, -0.365936279296875, -0.3372039794921875, -0.3084716796875, -0.2797393798828125, -0.251007080078125, -0.2222747802734375, -0.19354248046875, -0.1648101806640625, -0.136077880859375, -0.1073455810546875, -0.07861328125, -0.0498809814453125, -0.021148681640625, 0.0075836181640625, 0.03631591796875, 0.0650482177734375, 0.093780517578125, 0.1225128173828125, 0.1512451171875, 0.1799774169921875, 0.208709716796875, 0.2374420166015625, 0.26617431640625, 0.2949066162109375, 0.323638916015625, 0.3523712158203125, 0.381103515625, 0.4098358154296875, 0.438568115234375, 0.4673004150390625, 0.49603271484375, 0.5247650146484375, 0.553497314453125, 0.5822296142578125, 0.6109619140625, 0.6396942138671875, 0.668426513671875, 0.6971588134765625, 0.72589111328125, 0.7546234130859375, 0.783355712890625, 0.8120880126953125, 0.8408203125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 7.0, 5.0, 12.0, 6.0, 12.0, 16.0, 27.0, 24.0, 43.0, 37.0, 34.0, 52.0, 103.0, 328.0, 5017.0, 1036938.0, 5170.0, 302.0, 94.0, 74.0, 50.0, 48.0, 30.0, 31.0, 25.0, 11.0, 20.0, 8.0, 6.0, 5.0, 4.0, 7.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2734375, -2.19891357421875, -2.1243896484375, -2.04986572265625, -1.975341796875, -1.90081787109375, -1.8262939453125, -1.75177001953125, -1.67724609375, -1.60272216796875, -1.5281982421875, -1.45367431640625, -1.379150390625, -1.30462646484375, -1.2301025390625, -1.15557861328125, -1.0810546875, -1.00653076171875, -0.9320068359375, -0.85748291015625, -0.782958984375, -0.70843505859375, -0.6339111328125, -0.55938720703125, -0.48486328125, -0.41033935546875, -0.3358154296875, -0.26129150390625, -0.186767578125, -0.11224365234375, -0.0377197265625, 0.03680419921875, 0.111328125, 0.18585205078125, 0.2603759765625, 0.33489990234375, 0.409423828125, 0.48394775390625, 0.5584716796875, 0.63299560546875, 0.70751953125, 0.78204345703125, 0.8565673828125, 0.93109130859375, 1.005615234375, 1.08013916015625, 1.1546630859375, 1.22918701171875, 1.3037109375, 1.37823486328125, 1.4527587890625, 1.52728271484375, 1.601806640625, 1.67633056640625, 1.7508544921875, 1.82537841796875, 1.89990234375, 1.97442626953125, 2.0489501953125, 2.12347412109375, 2.197998046875, 2.27252197265625, 2.3470458984375, 2.42156982421875, 2.49609375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 6.0, 2.0, 9.0, 7.0, 14.0, 15.0, 25.0, 30.0, 30.0, 41.0, 42.0, 46.0, 63.0, 72.0, 76.0, 76.0, 63.0, 64.0, 62.0, 59.0, 36.0, 41.0, 34.0, 28.0, 22.0, 14.0, 7.0, 5.0, 5.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4853515625, -1.4378662109375, -1.390380859375, -1.3428955078125, -1.29541015625, -1.2479248046875, -1.200439453125, -1.1529541015625, -1.10546875, -1.0579833984375, -1.010498046875, -0.9630126953125, -0.91552734375, -0.8680419921875, -0.820556640625, -0.7730712890625, -0.7255859375, -0.6781005859375, -0.630615234375, -0.5831298828125, -0.53564453125, -0.4881591796875, -0.440673828125, -0.3931884765625, -0.345703125, -0.2982177734375, -0.250732421875, -0.2032470703125, -0.15576171875, -0.1082763671875, -0.060791015625, -0.0133056640625, 0.0341796875, 0.0816650390625, 0.129150390625, 0.1766357421875, 0.22412109375, 0.2716064453125, 0.319091796875, 0.3665771484375, 0.4140625, 0.4615478515625, 0.509033203125, 0.5565185546875, 0.60400390625, 0.6514892578125, 0.698974609375, 0.7464599609375, 0.7939453125, 0.8414306640625, 0.888916015625, 0.9364013671875, 0.98388671875, 1.0313720703125, 1.078857421875, 1.1263427734375, 1.173828125, 1.2213134765625, 1.268798828125, 1.3162841796875, 1.36376953125, 1.4112548828125, 1.458740234375, 1.5062255859375, 1.5537109375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 7.0, 11.0, 13.0, 10.0, 18.0, 27.0, 48.0, 80.0, 182.0, 393.0, 899.0, 2640.0, 7686.0, 40543.0, 957990.0, 27732.0, 6439.0, 2299.0, 832.0, 359.0, 156.0, 72.0, 37.0, 23.0, 17.0, 11.0, 3.0, 2.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34765625, -0.3372535705566406, -0.32685089111328125, -0.3164482116699219, -0.3060455322265625, -0.2956428527832031, -0.28524017333984375, -0.2748374938964844, -0.264434814453125, -0.2540321350097656, -0.24362945556640625, -0.23322677612304688, -0.2228240966796875, -0.21242141723632812, -0.20201873779296875, -0.19161605834960938, -0.18121337890625, -0.17081069946289062, -0.16040802001953125, -0.15000534057617188, -0.1396026611328125, -0.12919998168945312, -0.11879730224609375, -0.10839462280273438, -0.097991943359375, -0.08758926391601562, -0.07718658447265625, -0.06678390502929688, -0.0563812255859375, -0.045978546142578125, -0.03557586669921875, -0.025173187255859375, -0.0147705078125, -0.004367828369140625, 0.00603485107421875, 0.016437530517578125, 0.0268402099609375, 0.037242889404296875, 0.04764556884765625, 0.058048248291015625, 0.068450927734375, 0.07885360717773438, 0.08925628662109375, 0.09965896606445312, 0.1100616455078125, 0.12046432495117188, 0.13086700439453125, 0.14126968383789062, 0.15167236328125, 0.16207504272460938, 0.17247772216796875, 0.18288040161132812, 0.1932830810546875, 0.20368576049804688, 0.21408843994140625, 0.22449111938476562, 0.234893798828125, 0.24529647827148438, 0.25569915771484375, 0.2661018371582031, 0.2765045166015625, 0.2869071960449219, 0.29730987548828125, 0.3077125549316406, 0.318115234375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 8.0, 4.0, 4.0, 8.0, 13.0, 28.0, 76.0, 444.0, 293.0, 61.0, 25.0, 8.0, 4.0, 8.0, 6.0, 5.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.794929504394531e-05, -6.643589586019516e-05, -6.492249667644501e-05, -6.340909749269485e-05, -6.18956983089447e-05, -6.038229912519455e-05, -5.88688999414444e-05, -5.7355500757694244e-05, -5.584210157394409e-05, -5.432870239019394e-05, -5.281530320644379e-05, -5.1301904022693634e-05, -4.978850483894348e-05, -4.827510565519333e-05, -4.6761706471443176e-05, -4.5248307287693024e-05, -4.373490810394287e-05, -4.222150892019272e-05, -4.0708109736442566e-05, -3.919471055269241e-05, -3.768131136894226e-05, -3.616791218519211e-05, -3.4654513001441956e-05, -3.31411138176918e-05, -3.162771463394165e-05, -3.0114315450191498e-05, -2.8600916266441345e-05, -2.7087517082691193e-05, -2.557411789894104e-05, -2.4060718715190887e-05, -2.2547319531440735e-05, -2.1033920347690582e-05, -1.952052116394043e-05, -1.8007121980190277e-05, -1.6493722796440125e-05, -1.4980323612689972e-05, -1.346692442893982e-05, -1.1953525245189667e-05, -1.0440126061439514e-05, -8.926726877689362e-06, -7.413327693939209e-06, -5.899928510189056e-06, -4.386529326438904e-06, -2.8731301426887512e-06, -1.3597309589385986e-06, 1.5366822481155396e-07, 1.6670674085617065e-06, 3.180466592311859e-06, 4.693865776062012e-06, 6.207264959812164e-06, 7.720664143562317e-06, 9.23406332731247e-06, 1.0747462511062622e-05, 1.2260861694812775e-05, 1.3774260878562927e-05, 1.528766006231308e-05, 1.6801059246063232e-05, 1.8314458429813385e-05, 1.9827857613563538e-05, 2.134125679731369e-05, 2.2854655981063843e-05, 2.4368055164813995e-05, 2.5881454348564148e-05, 2.73948535323143e-05, 2.8908252716064453e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 11.0, 11.0, 12.0, 36.0, 55.0, 84.0, 154.0, 257.0, 503.0, 986.0, 2193.0, 5062.0, 13155.0, 88172.0, 899098.0, 24859.0, 7719.0, 3175.0, 1471.0, 738.0, 335.0, 204.0, 100.0, 63.0, 40.0, 19.0, 17.0, 9.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.243408203125, -0.2337646484375, -0.22412109375, -0.2144775390625, -0.204833984375, -0.1951904296875, -0.185546875, -0.1759033203125, -0.166259765625, -0.1566162109375, -0.14697265625, -0.1373291015625, -0.127685546875, -0.1180419921875, -0.1083984375, -0.0987548828125, -0.089111328125, -0.0794677734375, -0.06982421875, -0.0601806640625, -0.050537109375, -0.0408935546875, -0.03125, -0.0216064453125, -0.011962890625, -0.0023193359375, 0.00732421875, 0.0169677734375, 0.026611328125, 0.0362548828125, 0.0458984375, 0.0555419921875, 0.065185546875, 0.0748291015625, 0.08447265625, 0.0941162109375, 0.103759765625, 0.1134033203125, 0.123046875, 0.1326904296875, 0.142333984375, 0.1519775390625, 0.16162109375, 0.1712646484375, 0.180908203125, 0.1905517578125, 0.2001953125, 0.2098388671875, 0.219482421875, 0.2291259765625, 0.23876953125, 0.2484130859375, 0.258056640625, 0.2677001953125, 0.27734375, 0.2869873046875, 0.296630859375, 0.3062744140625, 0.31591796875, 0.3255615234375, 0.335205078125, 0.3448486328125, 0.3544921875, 0.3641357421875, 0.373779296875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 6.0, 2.0, 12.0, 15.0, 14.0, 42.0, 59.0, 142.0, 502.0, 69.0, 53.0, 30.0, 13.0, 10.0, 9.0, 2.0, 4.0, 6.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11346435546875, -0.10994625091552734, -0.10642814636230469, -0.10291004180908203, -0.09939193725585938, -0.09587383270263672, -0.09235572814941406, -0.0888376235961914, -0.08531951904296875, -0.0818014144897461, -0.07828330993652344, -0.07476520538330078, -0.07124710083007812, -0.06772899627685547, -0.06421089172363281, -0.060692787170410156, -0.0571746826171875, -0.053656578063964844, -0.05013847351074219, -0.04662036895751953, -0.043102264404296875, -0.03958415985107422, -0.03606605529785156, -0.032547950744628906, -0.02902984619140625, -0.025511741638183594, -0.021993637084960938, -0.01847553253173828, -0.014957427978515625, -0.011439323425292969, -0.007921218872070312, -0.004403114318847656, -0.000885009765625, 0.0026330947875976562, 0.0061511993408203125, 0.009669303894042969, 0.013187408447265625, 0.01670551300048828, 0.020223617553710938, 0.023741722106933594, 0.02725982666015625, 0.030777931213378906, 0.03429603576660156, 0.03781414031982422, 0.041332244873046875, 0.04485034942626953, 0.04836845397949219, 0.051886558532714844, 0.0554046630859375, 0.058922767639160156, 0.06244087219238281, 0.06595897674560547, 0.06947708129882812, 0.07299518585205078, 0.07651329040527344, 0.0800313949584961, 0.08354949951171875, 0.0870676040649414, 0.09058570861816406, 0.09410381317138672, 0.09762191772460938, 0.10114002227783203, 0.10465812683105469, 0.10817623138427734, 0.1116943359375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 10.0, 7.0, 11.0, 17.0, 26.0, 25.0, 34.0, 63.0, 72.0, 100.0, 110.0, 113.0, 80.0, 85.0, 82.0, 46.0, 29.0, 18.0, 21.0, 15.0, 8.0, 10.0, 5.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.587047815322876, -1.5433791875839233, -1.4997106790542603, -1.4560420513153076, -1.4123735427856445, -1.368704915046692, -1.3250362873077393, -1.2813677787780762, -1.2376991510391235, -1.194030523300171, -1.1503620147705078, -1.1066933870315552, -1.0630247592926025, -1.0193562507629395, -0.9756876230239868, -0.932019054889679, -0.8883504867553711, -0.8446819186210632, -0.8010133504867554, -0.7573447227478027, -0.7136761546134949, -0.670007586479187, -0.6263389587402344, -0.5826703906059265, -0.5390018224716187, -0.4953332543373108, -0.45166465640068054, -0.4079960584640503, -0.36432749032974243, -0.32065892219543457, -0.2769903242588043, -0.23332172632217407, -0.18965303897857666, -0.1459844559431076, -0.10231587290763855, -0.058647289872169495, -0.01497870683670044, 0.028689876198768616, 0.07235845923423767, 0.11602705717086792, 0.15969562530517578, 0.20336420834064484, 0.2470327913761139, 0.29070138931274414, 0.334369957447052, 0.37803852558135986, 0.4217071235179901, 0.46537572145462036, 0.5090442895889282, 0.5527128577232361, 0.596381425857544, 0.6400500535964966, 0.6837186217308044, 0.7273871898651123, 0.7710558176040649, 0.8147243857383728, 0.8583929538726807, 0.9020615220069885, 0.9457300901412964, 0.989398717880249, 1.033067226409912, 1.0767358541488647, 1.1204044818878174, 1.1640729904174805, 1.207741618156433]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 4.0, 6.0, 11.0, 14.0, 9.0, 13.0, 15.0, 18.0, 26.0, 28.0, 26.0, 31.0, 33.0, 32.0, 33.0, 47.0, 36.0, 35.0, 46.0, 47.0, 38.0, 41.0, 52.0, 46.0, 34.0, 44.0, 27.0, 24.0, 24.0, 24.0, 26.0, 17.0, 19.0, 12.0, 12.0, 9.0, 13.0, 6.0, 7.0, 3.0, 4.0, 5.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.5790503025054932, -1.52711021900177, -1.4751700162887573, -1.4232299327850342, -1.371289849281311, -1.319349765777588, -1.2674095630645752, -1.215469479560852, -1.163529396057129, -1.1115893125534058, -1.059649109840393, -1.00770902633667, -0.9557689428329468, -0.9038287997245789, -0.8518886566162109, -0.7999485731124878, -0.7480083703994751, -0.6960682272911072, -0.644128143787384, -0.5921880006790161, -0.540247917175293, -0.48830777406692505, -0.43636763095855713, -0.3844275176525116, -0.33248740434646606, -0.28054729104042053, -0.2286071628332138, -0.17666703462600708, -0.12472692131996155, -0.07278680801391602, -0.020846664905548096, 0.031093448400497437, 0.08303344249725342, 0.13497355580329895, 0.18691368401050568, 0.2388538122177124, 0.29079392552375793, 0.34273403882980347, 0.3946741819381714, 0.4466142952442169, 0.49855440855026245, 0.5504945516586304, 0.6024346351623535, 0.6543747782707214, 0.7063149213790894, 0.7582550048828125, 0.8101951479911804, 0.8621352910995483, 0.9140753746032715, 0.9660155177116394, 1.0179556608200073, 1.0698957443237305, 1.1218358278274536, 1.1737759113311768, 1.2257161140441895, 1.2776561975479126, 1.3295962810516357, 1.3815363645553589, 1.4334765672683716, 1.4854166507720947, 1.5373567342758179, 1.589296817779541, 1.6412370204925537, 1.6931771039962769, 1.7451173067092896]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [4.0, 5.0, 3.0, 2.0, 7.0, 9.0, 12.0, 13.0, 10.0, 21.0, 25.0, 46.0, 52.0, 56.0, 88.0, 162.0, 258.0, 366.0, 644.0, 1188.0, 2411.0, 5905.0, 25487.0, 438903.0, 3418274.0, 271268.0, 19008.0, 5135.0, 2135.0, 1137.0, 572.0, 360.0, 230.0, 157.0, 91.0, 61.0, 48.0, 31.0, 28.0, 19.0, 16.0, 13.0, 11.0, 7.0, 5.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9853515625, -0.9450225830078125, -0.904693603515625, -0.8643646240234375, -0.82403564453125, -0.7837066650390625, -0.743377685546875, -0.7030487060546875, -0.6627197265625, -0.6223907470703125, -0.582061767578125, -0.5417327880859375, -0.50140380859375, -0.4610748291015625, -0.420745849609375, -0.3804168701171875, -0.340087890625, -0.2997589111328125, -0.259429931640625, -0.2191009521484375, -0.17877197265625, -0.1384429931640625, -0.098114013671875, -0.0577850341796875, -0.0174560546875, 0.0228729248046875, 0.063201904296875, 0.1035308837890625, 0.14385986328125, 0.1841888427734375, 0.224517822265625, 0.2648468017578125, 0.30517578125, 0.3455047607421875, 0.385833740234375, 0.4261627197265625, 0.46649169921875, 0.5068206787109375, 0.547149658203125, 0.5874786376953125, 0.6278076171875, 0.6681365966796875, 0.708465576171875, 0.7487945556640625, 0.78912353515625, 0.8294525146484375, 0.869781494140625, 0.9101104736328125, 0.950439453125, 0.9907684326171875, 1.031097412109375, 1.0714263916015625, 1.11175537109375, 1.1520843505859375, 1.192413330078125, 1.2327423095703125, 1.2730712890625, 1.3134002685546875, 1.353729248046875, 1.3940582275390625, 1.43438720703125, 1.4747161865234375, 1.515045166015625, 1.5553741455078125, 1.595703125]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 7.0, 7.0, 9.0, 6.0, 14.0, 13.0, 17.0, 36.0, 18.0, 38.0, 32.0, 29.0, 44.0, 45.0, 44.0, 58.0, 53.0, 46.0, 57.0, 40.0, 45.0, 48.0, 45.0, 40.0, 22.0, 23.0, 26.0, 19.0, 31.0, 15.0, 13.0, 11.0, 12.0, 9.0, 8.0, 2.0, 5.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.489501953125, -0.4735145568847656, -0.45752716064453125, -0.4415397644042969, -0.4255523681640625, -0.4095649719238281, -0.39357757568359375, -0.3775901794433594, -0.361602783203125, -0.3456153869628906, -0.32962799072265625, -0.3136405944824219, -0.2976531982421875, -0.2816658020019531, -0.26567840576171875, -0.24969100952148438, -0.23370361328125, -0.21771621704101562, -0.20172882080078125, -0.18574142456054688, -0.1697540283203125, -0.15376663208007812, -0.13777923583984375, -0.12179183959960938, -0.105804443359375, -0.08981704711914062, -0.07382965087890625, -0.057842254638671875, -0.0418548583984375, -0.025867462158203125, -0.00988006591796875, 0.006107330322265625, 0.0220947265625, 0.038082122802734375, 0.05406951904296875, 0.07005691528320312, 0.0860443115234375, 0.10203170776367188, 0.11801910400390625, 0.13400650024414062, 0.149993896484375, 0.16598129272460938, 0.18196868896484375, 0.19795608520507812, 0.2139434814453125, 0.22993087768554688, 0.24591827392578125, 0.2619056701660156, 0.27789306640625, 0.2938804626464844, 0.30986785888671875, 0.3258552551269531, 0.3418426513671875, 0.3578300476074219, 0.37381744384765625, 0.3898048400878906, 0.405792236328125, 0.4217796325683594, 0.43776702880859375, 0.4537544250488281, 0.4697418212890625, 0.4857292175292969, 0.5017166137695312, 0.5177040100097656, 0.53369140625]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 10.0, 7.0, 20.0, 32.0, 36.0, 49.0, 104.0, 158.0, 328.0, 640.0, 1487.0, 4294.0, 17886.0, 216953.0, 3853912.0, 82171.0, 10999.0, 2978.0, 1111.0, 510.0, 239.0, 128.0, 83.0, 63.0, 34.0, 14.0, 7.0, 9.0, 2.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.81640625, -1.7650299072265625, -1.713653564453125, -1.6622772216796875, -1.61090087890625, -1.5595245361328125, -1.508148193359375, -1.4567718505859375, -1.4053955078125, -1.3540191650390625, -1.302642822265625, -1.2512664794921875, -1.19989013671875, -1.1485137939453125, -1.097137451171875, -1.0457611083984375, -0.994384765625, -0.9430084228515625, -0.891632080078125, -0.8402557373046875, -0.78887939453125, -0.7375030517578125, -0.686126708984375, -0.6347503662109375, -0.5833740234375, -0.5319976806640625, -0.480621337890625, -0.4292449951171875, -0.37786865234375, -0.3264923095703125, -0.275115966796875, -0.2237396240234375, -0.17236328125, -0.1209869384765625, -0.069610595703125, -0.0182342529296875, 0.03314208984375, 0.0845184326171875, 0.135894775390625, 0.1872711181640625, 0.2386474609375, 0.2900238037109375, 0.341400146484375, 0.3927764892578125, 0.44415283203125, 0.4955291748046875, 0.546905517578125, 0.5982818603515625, 0.649658203125, 0.7010345458984375, 0.752410888671875, 0.8037872314453125, 0.85516357421875, 0.9065399169921875, 0.957916259765625, 1.0092926025390625, 1.0606689453125, 1.1120452880859375, 1.163421630859375, 1.2147979736328125, 1.26617431640625, 1.3175506591796875, 1.368927001953125, 1.4203033447265625, 1.4716796875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 1.0, 2.0, 4.0, 5.0, 7.0, 14.0, 26.0, 31.0, 40.0, 72.0, 168.0, 379.0, 916.0, 1217.0, 633.0, 260.0, 101.0, 62.0, 46.0, 30.0, 18.0, 12.0, 9.0, 5.0, 4.0, 5.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.390380859375, -0.37659454345703125, -0.3628082275390625, -0.34902191162109375, -0.335235595703125, -0.32144927978515625, -0.3076629638671875, -0.29387664794921875, -0.28009033203125, -0.26630401611328125, -0.2525177001953125, -0.23873138427734375, -0.224945068359375, -0.21115875244140625, -0.1973724365234375, -0.18358612060546875, -0.1697998046875, -0.15601348876953125, -0.1422271728515625, -0.12844085693359375, -0.114654541015625, -0.10086822509765625, -0.0870819091796875, -0.07329559326171875, -0.05950927734375, -0.04572296142578125, -0.0319366455078125, -0.01815032958984375, -0.004364013671875, 0.00942230224609375, 0.0232086181640625, 0.03699493408203125, 0.05078125, 0.06456756591796875, 0.0783538818359375, 0.09214019775390625, 0.105926513671875, 0.11971282958984375, 0.1334991455078125, 0.14728546142578125, 0.16107177734375, 0.17485809326171875, 0.1886444091796875, 0.20243072509765625, 0.216217041015625, 0.23000335693359375, 0.2437896728515625, 0.25757598876953125, 0.2713623046875, 0.28514862060546875, 0.2989349365234375, 0.31272125244140625, 0.326507568359375, 0.34029388427734375, 0.3540802001953125, 0.36786651611328125, 0.38165283203125, 0.39543914794921875, 0.4092254638671875, 0.42301177978515625, 0.436798095703125, 0.45058441162109375, 0.4643707275390625, 0.47815704345703125, 0.491943359375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 11.0, 13.0, 13.0, 11.0, 23.0, 16.0, 32.0, 36.0, 56.0, 58.0, 87.0, 101.0, 96.0, 94.0, 71.0, 62.0, 45.0, 40.0, 38.0, 16.0, 21.0, 8.0, 12.0, 11.0, 2.0, 9.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0983513593673706, -1.0688427686691284, -1.0393342971801758, -1.0098257064819336, -0.9803171753883362, -0.9508086442947388, -0.9213001132011414, -0.891791582107544, -0.8622830510139465, -0.8327745199203491, -0.8032659888267517, -0.7737574577331543, -0.7442488670349121, -0.7147403359413147, -0.6852318048477173, -0.6557232737541199, -0.6262147426605225, -0.596706211566925, -0.5671976804733276, -0.5376890897750854, -0.508180558681488, -0.4786720275878906, -0.4491634964942932, -0.4196549654006958, -0.3901463747024536, -0.3606378436088562, -0.3311292827129364, -0.301620751619339, -0.2721122205257416, -0.24260367453098297, -0.21309512853622437, -0.18358659744262695, -0.15407806634902954, -0.12456952780485153, -0.09506098926067352, -0.06555244326591492, -0.03604390472173691, -0.006535366177558899, 0.022973179817199707, 0.05248171091079712, 0.08199025690555573, 0.11149879544973373, 0.14100733399391174, 0.17051587998867035, 0.20002442598342896, 0.22953295707702637, 0.2590414881706238, 0.2885500192642212, 0.318058580160141, 0.3475671112537384, 0.3770756721496582, 0.4065842032432556, 0.436092734336853, 0.46560126543045044, 0.49510982632637024, 0.52461838722229, 0.5541269183158875, 0.5836354494094849, 0.6131439805030823, 0.6426525115966797, 0.6721611022949219, 0.7016696333885193, 0.7311781644821167, 0.7606866955757141, 0.7901952266693115]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 6.0, 3.0, 3.0, 4.0, 4.0, 6.0, 11.0, 11.0, 14.0, 21.0, 22.0, 18.0, 34.0, 28.0, 26.0, 30.0, 31.0, 30.0, 34.0, 36.0, 49.0, 34.0, 39.0, 38.0, 40.0, 40.0, 45.0, 32.0, 31.0, 40.0, 36.0, 32.0, 40.0, 24.0, 20.0, 14.0, 8.0, 16.0, 12.0, 14.0, 7.0, 8.0, 5.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.6165400147438049, -0.5979072451591492, -0.5792744159698486, -0.5606416463851929, -0.5420088768005371, -0.5233761072158813, -0.5047432780265808, -0.48611050844192505, -0.4674777090549469, -0.44884490966796875, -0.430212140083313, -0.41157934069633484, -0.3929465413093567, -0.3743137717247009, -0.3556809723377228, -0.33704817295074463, -0.31841540336608887, -0.2997826039791107, -0.28114983439445496, -0.2625170350074768, -0.24388425052165985, -0.2252514660358429, -0.20661866664886475, -0.1879858821630478, -0.16935309767723083, -0.15072031319141388, -0.13208752870559692, -0.11345472931861877, -0.09482194483280182, -0.07618916034698486, -0.05755636841058731, -0.03892357647418976, -0.020290851593017578, -0.001658063381910324, 0.01697472482919693, 0.035607513040304184, 0.05424030125141144, 0.0728730857372284, 0.09150587767362595, 0.1101386696100235, 0.12877145409584045, 0.1474042385816574, 0.16603702306747437, 0.18466982245445251, 0.20330260694026947, 0.22193539142608643, 0.24056819081306458, 0.2592009902000427, 0.2778337597846985, 0.29646655917167664, 0.3150993287563324, 0.33373212814331055, 0.3523648977279663, 0.37099769711494446, 0.3896304965019226, 0.40826326608657837, 0.4268960654735565, 0.44552886486053467, 0.46416163444519043, 0.4827944338321686, 0.5014272332191467, 0.5200600028038025, 0.5386927723884583, 0.5573256015777588, 0.5759583711624146]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 9.0, 9.0, 5.0, 15.0, 16.0, 20.0, 28.0, 37.0, 44.0, 60.0, 104.0, 140.0, 224.0, 297.0, 515.0, 795.0, 1541.0, 2901.0, 6545.0, 17612.0, 56713.0, 260125.0, 535964.0, 113897.0, 30880.0, 10556.0, 4304.0, 2147.0, 1117.0, 659.0, 369.0, 280.0, 196.0, 120.0, 77.0, 75.0, 52.0, 26.0, 21.0, 17.0, 8.0, 9.0, 14.0, 6.0, 0.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.184814453125, -0.17925643920898438, -0.17369842529296875, -0.16814041137695312, -0.1625823974609375, -0.15702438354492188, -0.15146636962890625, -0.14590835571289062, -0.140350341796875, -0.13479232788085938, -0.12923431396484375, -0.12367630004882812, -0.1181182861328125, -0.11256027221679688, -0.10700225830078125, -0.10144424438476562, -0.09588623046875, -0.09032821655273438, -0.08477020263671875, -0.07921218872070312, -0.0736541748046875, -0.06809616088867188, -0.06253814697265625, -0.056980133056640625, -0.051422119140625, -0.045864105224609375, -0.04030609130859375, -0.034748077392578125, -0.0291900634765625, -0.023632049560546875, -0.01807403564453125, -0.012516021728515625, -0.0069580078125, -0.001399993896484375, 0.00415802001953125, 0.009716033935546875, 0.0152740478515625, 0.020832061767578125, 0.02639007568359375, 0.031948089599609375, 0.037506103515625, 0.043064117431640625, 0.04862213134765625, 0.054180145263671875, 0.0597381591796875, 0.06529617309570312, 0.07085418701171875, 0.07641220092773438, 0.08197021484375, 0.08752822875976562, 0.09308624267578125, 0.09864425659179688, 0.1042022705078125, 0.10976028442382812, 0.11531829833984375, 0.12087631225585938, 0.126434326171875, 0.13199234008789062, 0.13755035400390625, 0.14310836791992188, 0.1486663818359375, 0.15422439575195312, 0.15978240966796875, 0.16534042358398438, 0.1708984375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 9.0, 3.0, 3.0, 3.0, 7.0, 12.0, 13.0, 16.0, 20.0, 24.0, 26.0, 27.0, 37.0, 25.0, 27.0, 51.0, 33.0, 37.0, 50.0, 46.0, 43.0, 41.0, 48.0, 45.0, 41.0, 39.0, 33.0, 34.0, 32.0, 27.0, 32.0, 29.0, 19.0, 15.0, 8.0, 11.0, 13.0, 6.0, 6.0, 6.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41943359375, -0.40528106689453125, -0.3911285400390625, -0.37697601318359375, -0.362823486328125, -0.34867095947265625, -0.3345184326171875, -0.32036590576171875, -0.30621337890625, -0.29206085205078125, -0.2779083251953125, -0.26375579833984375, -0.249603271484375, -0.23545074462890625, -0.2212982177734375, -0.20714569091796875, -0.1929931640625, -0.17884063720703125, -0.1646881103515625, -0.15053558349609375, -0.136383056640625, -0.12223052978515625, -0.1080780029296875, -0.09392547607421875, -0.07977294921875, -0.06562042236328125, -0.0514678955078125, -0.03731536865234375, -0.023162841796875, -0.00901031494140625, 0.0051422119140625, 0.01929473876953125, 0.033447265625, 0.04759979248046875, 0.0617523193359375, 0.07590484619140625, 0.090057373046875, 0.10420989990234375, 0.1183624267578125, 0.13251495361328125, 0.14666748046875, 0.16082000732421875, 0.1749725341796875, 0.18912506103515625, 0.203277587890625, 0.21743011474609375, 0.2315826416015625, 0.24573516845703125, 0.2598876953125, 0.27404022216796875, 0.2881927490234375, 0.30234527587890625, 0.316497802734375, 0.33065032958984375, 0.3448028564453125, 0.35895538330078125, 0.37310791015625, 0.38726043701171875, 0.4014129638671875, 0.41556549072265625, 0.429718017578125, 0.44387054443359375, 0.4580230712890625, 0.47217559814453125, 0.486328125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 7.0, 10.0, 14.0, 18.0, 30.0, 48.0, 73.0, 105.0, 142.0, 200.0, 301.0, 444.0, 705.0, 994.0, 1472.0, 2313.0, 3241.0, 5034.0, 7613.0, 11899.0, 19237.0, 31833.0, 56229.0, 105556.0, 198293.0, 250989.0, 155206.0, 81670.0, 44106.0, 25627.0, 15831.0, 10101.0, 6400.0, 4282.0, 2760.0, 1852.0, 1280.0, 844.0, 550.0, 431.0, 266.0, 155.0, 126.0, 69.0, 59.0, 42.0, 37.0, 23.0, 13.0, 7.0, 9.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.0479736328125, -0.046488285064697266, -0.04500293731689453, -0.0435175895690918, -0.04203224182128906, -0.04054689407348633, -0.039061546325683594, -0.03757619857788086, -0.036090850830078125, -0.03460550308227539, -0.033120155334472656, -0.03163480758666992, -0.030149459838867188, -0.028664112091064453, -0.02717876434326172, -0.025693416595458984, -0.02420806884765625, -0.022722721099853516, -0.02123737335205078, -0.019752025604248047, -0.018266677856445312, -0.016781330108642578, -0.015295982360839844, -0.01381063461303711, -0.012325286865234375, -0.01083993911743164, -0.009354591369628906, -0.007869243621826172, -0.0063838958740234375, -0.004898548126220703, -0.0034132003784179688, -0.0019278526306152344, -0.0004425048828125, 0.0010428428649902344, 0.0025281906127929688, 0.004013538360595703, 0.0054988861083984375, 0.006984233856201172, 0.008469581604003906, 0.00995492935180664, 0.011440277099609375, 0.01292562484741211, 0.014410972595214844, 0.015896320343017578, 0.017381668090820312, 0.018867015838623047, 0.02035236358642578, 0.021837711334228516, 0.02332305908203125, 0.024808406829833984, 0.02629375457763672, 0.027779102325439453, 0.029264450073242188, 0.030749797821044922, 0.032235145568847656, 0.03372049331665039, 0.035205841064453125, 0.03669118881225586, 0.038176536560058594, 0.03966188430786133, 0.04114723205566406, 0.0426325798034668, 0.04411792755126953, 0.045603275299072266, 0.047088623046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 7.0, 1.0, 7.0, 6.0, 8.0, 8.0, 7.0, 8.0, 10.0, 13.0, 15.0, 18.0, 28.0, 21.0, 27.0, 36.0, 38.0, 36.0, 50.0, 50.0, 46.0, 41.0, 49.0, 38.0, 55.0, 50.0, 63.0, 28.0, 44.0, 27.0, 24.0, 24.0, 14.0, 20.0, 20.0, 21.0, 8.0, 11.0, 12.0, 8.0, 6.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9638671875, -0.9322967529296875, -0.900726318359375, -0.8691558837890625, -0.83758544921875, -0.8060150146484375, -0.774444580078125, -0.7428741455078125, -0.7113037109375, -0.6797332763671875, -0.648162841796875, -0.6165924072265625, -0.58502197265625, -0.5534515380859375, -0.521881103515625, -0.4903106689453125, -0.458740234375, -0.4271697998046875, -0.395599365234375, -0.3640289306640625, -0.33245849609375, -0.3008880615234375, -0.269317626953125, -0.2377471923828125, -0.2061767578125, -0.1746063232421875, -0.143035888671875, -0.1114654541015625, -0.07989501953125, -0.0483245849609375, -0.016754150390625, 0.0148162841796875, 0.04638671875, 0.0779571533203125, 0.109527587890625, 0.1410980224609375, 0.17266845703125, 0.2042388916015625, 0.235809326171875, 0.2673797607421875, 0.2989501953125, 0.3305206298828125, 0.362091064453125, 0.3936614990234375, 0.42523193359375, 0.4568023681640625, 0.488372802734375, 0.5199432373046875, 0.551513671875, 0.5830841064453125, 0.614654541015625, 0.6462249755859375, 0.67779541015625, 0.7093658447265625, 0.740936279296875, 0.7725067138671875, 0.8040771484375, 0.8356475830078125, 0.867218017578125, 0.8987884521484375, 0.93035888671875, 0.9619293212890625, 0.993499755859375, 1.0250701904296875, 1.056640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 5.0, 2.0, 13.0, 11.0, 22.0, 30.0, 44.0, 60.0, 112.0, 220.0, 346.0, 795.0, 2288.0, 9599.0, 79916.0, 830273.0, 109289.0, 11094.0, 2566.0, 879.0, 446.0, 215.0, 131.0, 95.0, 32.0, 29.0, 15.0, 13.0, 8.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0260772705078125, -0.025300025939941406, -0.024522781372070312, -0.02374553680419922, -0.022968292236328125, -0.02219104766845703, -0.021413803100585938, -0.020636558532714844, -0.01985931396484375, -0.019082069396972656, -0.018304824829101562, -0.01752758026123047, -0.016750335693359375, -0.01597309112548828, -0.015195846557617188, -0.014418601989746094, -0.013641357421875, -0.012864112854003906, -0.012086868286132812, -0.011309623718261719, -0.010532379150390625, -0.009755134582519531, -0.008977890014648438, -0.008200645446777344, -0.00742340087890625, -0.006646156311035156, -0.0058689117431640625, -0.005091667175292969, -0.004314422607421875, -0.0035371780395507812, -0.0027599334716796875, -0.0019826889038085938, -0.0012054443359375, -0.00042819976806640625, 0.0003490447998046875, 0.0011262893676757812, 0.001903533935546875, 0.0026807785034179688, 0.0034580230712890625, 0.004235267639160156, 0.00501251220703125, 0.005789756774902344, 0.0065670013427734375, 0.007344245910644531, 0.008121490478515625, 0.008898735046386719, 0.009675979614257812, 0.010453224182128906, 0.01123046875, 0.012007713317871094, 0.012784957885742188, 0.013562202453613281, 0.014339447021484375, 0.015116691589355469, 0.015893936157226562, 0.016671180725097656, 0.01744842529296875, 0.018225669860839844, 0.019002914428710938, 0.01978015899658203, 0.020557403564453125, 0.02133464813232422, 0.022111892700195312, 0.022889137268066406, 0.0236663818359375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 11.0, 18.0, 30.0, 38.0, 67.0, 129.0, 214.0, 198.0, 122.0, 73.0, 41.0, 22.0, 17.0, 5.0, 4.0, 0.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1576881408691406e-05, -2.0233914256095886e-05, -1.8890947103500366e-05, -1.7547979950904846e-05, -1.6205012798309326e-05, -1.4862045645713806e-05, -1.3519078493118286e-05, -1.2176111340522766e-05, -1.0833144187927246e-05, -9.490177035331726e-06, -8.147209882736206e-06, -6.804242730140686e-06, -5.461275577545166e-06, -4.118308424949646e-06, -2.775341272354126e-06, -1.432374119758606e-06, -8.940696716308594e-08, 1.253560185432434e-06, 2.596527338027954e-06, 3.939494490623474e-06, 5.282461643218994e-06, 6.625428795814514e-06, 7.968395948410034e-06, 9.311363101005554e-06, 1.0654330253601074e-05, 1.1997297406196594e-05, 1.3340264558792114e-05, 1.4683231711387634e-05, 1.6026198863983154e-05, 1.7369166016578674e-05, 1.8712133169174194e-05, 2.0055100321769714e-05, 2.1398067474365234e-05, 2.2741034626960754e-05, 2.4084001779556274e-05, 2.5426968932151794e-05, 2.6769936084747314e-05, 2.8112903237342834e-05, 2.9455870389938354e-05, 3.0798837542533875e-05, 3.2141804695129395e-05, 3.3484771847724915e-05, 3.4827739000320435e-05, 3.6170706152915955e-05, 3.7513673305511475e-05, 3.8856640458106995e-05, 4.0199607610702515e-05, 4.1542574763298035e-05, 4.2885541915893555e-05, 4.4228509068489075e-05, 4.5571476221084595e-05, 4.6914443373680115e-05, 4.8257410526275635e-05, 4.9600377678871155e-05, 5.0943344831466675e-05, 5.2286311984062195e-05, 5.3629279136657715e-05, 5.4972246289253235e-05, 5.6315213441848755e-05, 5.7658180594444275e-05, 5.9001147747039795e-05, 6.0344114899635315e-05, 6.168708205223083e-05, 6.303004920482635e-05, 6.437301635742188e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 7.0, 1.0, 4.0, 7.0, 7.0, 9.0, 12.0, 20.0, 17.0, 38.0, 38.0, 105.0, 144.0, 274.0, 528.0, 1116.0, 2671.0, 8469.0, 62229.0, 871735.0, 85655.0, 9731.0, 2989.0, 1367.0, 626.0, 351.0, 183.0, 84.0, 57.0, 32.0, 16.0, 11.0, 10.0, 6.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0341796875, -0.03324460983276367, -0.032309532165527344, -0.031374454498291016, -0.030439376831054688, -0.02950429916381836, -0.02856922149658203, -0.027634143829345703, -0.026699066162109375, -0.025763988494873047, -0.02482891082763672, -0.02389383316040039, -0.022958755493164062, -0.022023677825927734, -0.021088600158691406, -0.020153522491455078, -0.01921844482421875, -0.018283367156982422, -0.017348289489746094, -0.016413211822509766, -0.015478134155273438, -0.01454305648803711, -0.013607978820800781, -0.012672901153564453, -0.011737823486328125, -0.010802745819091797, -0.009867668151855469, -0.00893259048461914, -0.007997512817382812, -0.007062435150146484, -0.006127357482910156, -0.005192279815673828, -0.0042572021484375, -0.003322124481201172, -0.0023870468139648438, -0.0014519691467285156, -0.0005168914794921875, 0.0004181861877441406, 0.0013532638549804688, 0.002288341522216797, 0.003223419189453125, 0.004158496856689453, 0.005093574523925781, 0.006028652191162109, 0.0069637298583984375, 0.007898807525634766, 0.008833885192871094, 0.009768962860107422, 0.01070404052734375, 0.011639118194580078, 0.012574195861816406, 0.013509273529052734, 0.014444351196289062, 0.01537942886352539, 0.01631450653076172, 0.017249584197998047, 0.018184661865234375, 0.019119739532470703, 0.02005481719970703, 0.02098989486694336, 0.021924972534179688, 0.022860050201416016, 0.023795127868652344, 0.024730205535888672, 0.025665283203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 0.0, 6.0, 5.0, 5.0, 3.0, 17.0, 13.0, 25.0, 43.0, 60.0, 120.0, 197.0, 194.0, 127.0, 63.0, 44.0, 21.0, 16.0, 7.0, 8.0, 8.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006626129150390625, -0.006381094455718994, -0.006136059761047363, -0.005891025066375732, -0.0056459903717041016, -0.005400955677032471, -0.00515592098236084, -0.004910886287689209, -0.004665851593017578, -0.004420816898345947, -0.004175782203674316, -0.0039307475090026855, -0.0036857128143310547, -0.003440678119659424, -0.003195643424987793, -0.002950608730316162, -0.0027055740356445312, -0.0024605393409729004, -0.0022155046463012695, -0.0019704699516296387, -0.0017254352569580078, -0.001480400562286377, -0.001235365867614746, -0.0009903311729431152, -0.0007452964782714844, -0.0005002617835998535, -0.00025522708892822266, -1.0192394256591797e-05, 0.00023484230041503906, 0.0004798769950866699, 0.0007249116897583008, 0.0009699463844299316, 0.0012149810791015625, 0.0014600157737731934, 0.0017050504684448242, 0.001950085163116455, 0.002195119857788086, 0.002440154552459717, 0.0026851892471313477, 0.0029302239418029785, 0.0031752586364746094, 0.0034202933311462402, 0.003665328025817871, 0.003910362720489502, 0.004155397415161133, 0.004400432109832764, 0.0046454668045043945, 0.004890501499176025, 0.005135536193847656, 0.005380570888519287, 0.005625605583190918, 0.005870640277862549, 0.00611567497253418, 0.0063607096672058105, 0.006605744361877441, 0.006850779056549072, 0.007095813751220703, 0.007340848445892334, 0.007585883140563965, 0.007830917835235596, 0.008075952529907227, 0.008320987224578857, 0.008566021919250488, 0.00881105661392212, 0.00905609130859375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 3.0, 12.0, 12.0, 11.0, 20.0, 22.0, 31.0, 20.0, 32.0, 61.0, 72.0, 94.0, 97.0, 106.0, 82.0, 69.0, 62.0, 47.0, 46.0, 21.0, 12.0, 16.0, 12.0, 10.0, 6.0, 10.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7597463130950928, -0.7397879362106323, -0.7198296189308167, -0.6998712420463562, -0.6799129247665405, -0.6599545478820801, -0.6399961709976196, -0.620037853717804, -0.6000794768333435, -0.5801210999488831, -0.5601627826690674, -0.5402044057846069, -0.5202460885047913, -0.5002877116203308, -0.48032936453819275, -0.4603710174560547, -0.4404126703739166, -0.42045432329177856, -0.4004959762096405, -0.38053762912750244, -0.360579252243042, -0.34062090516090393, -0.32066255807876587, -0.3007041811943054, -0.28074586391448975, -0.2607875168323517, -0.24082915484905243, -0.22087080776691437, -0.2009124457836151, -0.18095409870147705, -0.160995751619339, -0.14103738963603973, -0.12107902765274048, -0.10112067312002182, -0.08116231858730316, -0.0612039715051651, -0.04124561697244644, -0.021287262439727783, -0.0013289153575897217, 0.018629446625709534, 0.038587793707847595, 0.058546148240566254, 0.07850450277328491, 0.09846284985542297, 0.11842120438814163, 0.1383795589208603, 0.15833790600299835, 0.1782962679862976, 0.19825461506843567, 0.21821296215057373, 0.23817132413387299, 0.25812965631484985, 0.2780880331993103, 0.29804638028144836, 0.3180047273635864, 0.3379631042480469, 0.35792142152786255, 0.3778797686100006, 0.39783811569213867, 0.4177964925765991, 0.4377548396587372, 0.45771318674087524, 0.4776715338230133, 0.49762988090515137, 0.5175882577896118]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 5.0, 3.0, 5.0, 5.0, 4.0, 12.0, 20.0, 20.0, 20.0, 27.0, 33.0, 31.0, 30.0, 30.0, 36.0, 41.0, 36.0, 43.0, 44.0, 39.0, 42.0, 46.0, 41.0, 38.0, 50.0, 37.0, 37.0, 45.0, 37.0, 32.0, 19.0, 12.0, 17.0, 10.0, 14.0, 9.0, 11.0, 7.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42468205094337463, -0.41093510389328003, -0.39718812704086304, -0.38344117999076843, -0.36969423294067383, -0.3559472858905792, -0.3422003388404846, -0.3284533619880676, -0.314706414937973, -0.3009594678878784, -0.2872124910354614, -0.2734655439853668, -0.2597185969352722, -0.2459716498851776, -0.23222468793392181, -0.21847772598266602, -0.2047307789325714, -0.1909838318824768, -0.177236869931221, -0.1634899079799652, -0.1497429609298706, -0.135996013879776, -0.1222490519285202, -0.108502097427845, -0.0947551429271698, -0.0810081884264946, -0.0672612339258194, -0.053514279425144196, -0.039767324924468994, -0.026020370423793793, -0.012273415923118591, 0.00147353857755661, 0.015220493078231812, 0.028967447578907013, 0.042714402079582214, 0.056461356580257416, 0.07020831108093262, 0.08395526558160782, 0.09770222008228302, 0.11144917458295822, 0.12519612908363342, 0.13894307613372803, 0.15269003808498383, 0.16643700003623962, 0.18018394708633423, 0.19393089413642883, 0.20767785608768463, 0.22142481803894043, 0.23517176508903503, 0.24891871213912964, 0.26266568899154663, 0.27641263604164124, 0.29015958309173584, 0.30390653014183044, 0.31765347719192505, 0.33140045404434204, 0.34514740109443665, 0.35889434814453125, 0.37264132499694824, 0.38638827204704285, 0.40013521909713745, 0.41388216614723206, 0.42762911319732666, 0.44137609004974365, 0.45512303709983826]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 12.0, 14.0, 6.0, 26.0, 35.0, 35.0, 68.0, 85.0, 128.0, 175.0, 275.0, 472.0, 802.0, 1257.0, 2501.0, 5309.0, 13697.0, 52268.0, 393283.0, 490158.0, 60726.0, 15061.0, 5756.0, 2779.0, 1378.0, 839.0, 485.0, 306.0, 201.0, 118.0, 90.0, 60.0, 44.0, 31.0, 15.0, 13.0, 13.0, 8.0, 8.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.62646484375, -0.6095542907714844, -0.5926437377929688, -0.5757331848144531, -0.5588226318359375, -0.5419120788574219, -0.5250015258789062, -0.5080909729003906, -0.491180419921875, -0.4742698669433594, -0.45735931396484375, -0.4404487609863281, -0.4235382080078125, -0.4066276550292969, -0.38971710205078125, -0.3728065490722656, -0.35589599609375, -0.3389854431152344, -0.32207489013671875, -0.3051643371582031, -0.2882537841796875, -0.2713432312011719, -0.25443267822265625, -0.23752212524414062, -0.220611572265625, -0.20370101928710938, -0.18679046630859375, -0.16987991333007812, -0.1529693603515625, -0.13605880737304688, -0.11914825439453125, -0.10223770141601562, -0.0853271484375, -0.06841659545898438, -0.05150604248046875, -0.034595489501953125, -0.0176849365234375, -0.000774383544921875, 0.01613616943359375, 0.033046722412109375, 0.049957275390625, 0.06686782836914062, 0.08377838134765625, 0.10068893432617188, 0.1175994873046875, 0.13451004028320312, 0.15142059326171875, 0.16833114624023438, 0.18524169921875, 0.20215225219726562, 0.21906280517578125, 0.23597335815429688, 0.2528839111328125, 0.2697944641113281, 0.28670501708984375, 0.3036155700683594, 0.320526123046875, 0.3374366760253906, 0.35434722900390625, 0.3712577819824219, 0.3881683349609375, 0.4050788879394531, 0.42198944091796875, 0.4388999938964844, 0.455810546875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 5.0, 7.0, 6.0, 6.0, 9.0, 11.0, 14.0, 31.0, 21.0, 28.0, 33.0, 33.0, 33.0, 51.0, 40.0, 52.0, 53.0, 55.0, 54.0, 62.0, 49.0, 50.0, 34.0, 56.0, 40.0, 38.0, 36.0, 27.0, 14.0, 14.0, 6.0, 10.0, 8.0, 11.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.1689453125, -1.1388092041015625, -1.108673095703125, -1.0785369873046875, -1.04840087890625, -1.0182647705078125, -0.988128662109375, -0.9579925537109375, -0.9278564453125, -0.8977203369140625, -0.867584228515625, -0.8374481201171875, -0.80731201171875, -0.7771759033203125, -0.747039794921875, -0.7169036865234375, -0.686767578125, -0.6566314697265625, -0.626495361328125, -0.5963592529296875, -0.56622314453125, -0.5360870361328125, -0.505950927734375, -0.4758148193359375, -0.4456787109375, -0.4155426025390625, -0.385406494140625, -0.3552703857421875, -0.32513427734375, -0.2949981689453125, -0.264862060546875, -0.2347259521484375, -0.20458984375, -0.1744537353515625, -0.144317626953125, -0.1141815185546875, -0.08404541015625, -0.0539093017578125, -0.023773193359375, 0.0063629150390625, 0.0364990234375, 0.0666351318359375, 0.096771240234375, 0.1269073486328125, 0.15704345703125, 0.1871795654296875, 0.217315673828125, 0.2474517822265625, 0.277587890625, 0.3077239990234375, 0.337860107421875, 0.3679962158203125, 0.39813232421875, 0.4282684326171875, 0.458404541015625, 0.4885406494140625, 0.5186767578125, 0.5488128662109375, 0.578948974609375, 0.6090850830078125, 0.63922119140625, 0.6693572998046875, 0.699493408203125, 0.7296295166015625, 0.759765625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 9.0, 8.0, 7.0, 15.0, 12.0, 19.0, 21.0, 18.0, 18.0, 40.0, 45.0, 81.0, 143.0, 316.0, 957.0, 5815.0, 442122.0, 590921.0, 6131.0, 1072.0, 320.0, 122.0, 71.0, 48.0, 45.0, 33.0, 24.0, 18.0, 18.0, 20.0, 10.0, 6.0, 10.0, 7.0, 2.0, 3.0, 5.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7802734375, -1.7209625244140625, -1.661651611328125, -1.6023406982421875, -1.54302978515625, -1.4837188720703125, -1.424407958984375, -1.3650970458984375, -1.3057861328125, -1.2464752197265625, -1.187164306640625, -1.1278533935546875, -1.06854248046875, -1.0092315673828125, -0.949920654296875, -0.8906097412109375, -0.831298828125, -0.7719879150390625, -0.712677001953125, -0.6533660888671875, -0.59405517578125, -0.5347442626953125, -0.475433349609375, -0.4161224365234375, -0.3568115234375, -0.2975006103515625, -0.238189697265625, -0.1788787841796875, -0.11956787109375, -0.0602569580078125, -0.000946044921875, 0.0583648681640625, 0.11767578125, 0.1769866943359375, 0.236297607421875, 0.2956085205078125, 0.35491943359375, 0.4142303466796875, 0.473541259765625, 0.5328521728515625, 0.5921630859375, 0.6514739990234375, 0.710784912109375, 0.7700958251953125, 0.82940673828125, 0.8887176513671875, 0.948028564453125, 1.0073394775390625, 1.066650390625, 1.1259613037109375, 1.185272216796875, 1.2445831298828125, 1.30389404296875, 1.3632049560546875, 1.422515869140625, 1.4818267822265625, 1.5411376953125, 1.6004486083984375, 1.659759521484375, 1.7190704345703125, 1.77838134765625, 1.8376922607421875, 1.897003173828125, 1.9563140869140625, 2.015625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 8.0, 6.0, 11.0, 13.0, 16.0, 17.0, 22.0, 16.0, 21.0, 46.0, 45.0, 44.0, 47.0, 47.0, 47.0, 38.0, 43.0, 49.0, 40.0, 45.0, 44.0, 32.0, 35.0, 32.0, 29.0, 22.0, 38.0, 18.0, 23.0, 25.0, 15.0, 7.0, 6.0, 9.0, 4.0, 5.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92724609375, -0.8963088989257812, -0.8653717041015625, -0.8344345092773438, -0.803497314453125, -0.7725601196289062, -0.7416229248046875, -0.7106857299804688, -0.67974853515625, -0.6488113403320312, -0.6178741455078125, -0.5869369506835938, -0.555999755859375, -0.5250625610351562, -0.4941253662109375, -0.46318817138671875, -0.4322509765625, -0.40131378173828125, -0.3703765869140625, -0.33943939208984375, -0.308502197265625, -0.27756500244140625, -0.2466278076171875, -0.21569061279296875, -0.18475341796875, -0.15381622314453125, -0.1228790283203125, -0.09194183349609375, -0.061004638671875, -0.03006744384765625, 0.0008697509765625, 0.03180694580078125, 0.062744140625, 0.09368133544921875, 0.1246185302734375, 0.15555572509765625, 0.186492919921875, 0.21743011474609375, 0.2483673095703125, 0.27930450439453125, 0.31024169921875, 0.34117889404296875, 0.3721160888671875, 0.40305328369140625, 0.433990478515625, 0.46492767333984375, 0.4958648681640625, 0.5268020629882812, 0.5577392578125, 0.5886764526367188, 0.6196136474609375, 0.6505508422851562, 0.681488037109375, 0.7124252319335938, 0.7433624267578125, 0.7742996215820312, 0.80523681640625, 0.8361740112304688, 0.8671112060546875, 0.8980484008789062, 0.928985595703125, 0.9599227905273438, 0.9908599853515625, 1.0217971801757812, 1.052734375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 5.0, 3.0, 8.0, 12.0, 10.0, 10.0, 23.0, 27.0, 31.0, 32.0, 55.0, 90.0, 173.0, 303.0, 603.0, 1559.0, 4901.0, 17832.0, 96555.0, 817512.0, 84779.0, 16466.0, 4591.0, 1572.0, 629.0, 298.0, 151.0, 87.0, 60.0, 46.0, 26.0, 20.0, 27.0, 11.0, 12.0, 7.0, 9.0, 5.0, 2.0, 2.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1358642578125, -0.1312541961669922, -0.12664413452148438, -0.12203407287597656, -0.11742401123046875, -0.11281394958496094, -0.10820388793945312, -0.10359382629394531, -0.0989837646484375, -0.09437370300292969, -0.08976364135742188, -0.08515357971191406, -0.08054351806640625, -0.07593345642089844, -0.07132339477539062, -0.06671333312988281, -0.062103271484375, -0.05749320983886719, -0.052883148193359375, -0.04827308654785156, -0.04366302490234375, -0.03905296325683594, -0.034442901611328125, -0.029832839965820312, -0.0252227783203125, -0.020612716674804688, -0.016002655029296875, -0.011392593383789062, -0.00678253173828125, -0.0021724700927734375, 0.002437591552734375, 0.0070476531982421875, 0.01165771484375, 0.016267776489257812, 0.020877838134765625, 0.025487899780273438, 0.03009796142578125, 0.03470802307128906, 0.039318084716796875, 0.04392814636230469, 0.0485382080078125, 0.05314826965332031, 0.057758331298828125, 0.06236839294433594, 0.06697845458984375, 0.07158851623535156, 0.07619857788085938, 0.08080863952636719, 0.085418701171875, 0.09002876281738281, 0.09463882446289062, 0.09924888610839844, 0.10385894775390625, 0.10846900939941406, 0.11307907104492188, 0.11768913269042969, 0.1222991943359375, 0.1269092559814453, 0.13151931762695312, 0.13612937927246094, 0.14073944091796875, 0.14534950256347656, 0.14995956420898438, 0.1545696258544922, 0.1591796875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 5.0, 1.0, 12.0, 11.0, 10.0, 20.0, 25.0, 28.0, 42.0, 76.0, 95.0, 141.0, 159.0, 107.0, 72.0, 41.0, 36.0, 27.0, 19.0, 14.0, 13.0, 8.0, 3.0, 5.0, 7.0, 4.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8537044525146484e-05, -1.7898157238960266e-05, -1.7259269952774048e-05, -1.662038266658783e-05, -1.598149538040161e-05, -1.5342608094215393e-05, -1.4703720808029175e-05, -1.4064833521842957e-05, -1.3425946235656738e-05, -1.278705894947052e-05, -1.2148171663284302e-05, -1.1509284377098083e-05, -1.0870397090911865e-05, -1.0231509804725647e-05, -9.592622518539429e-06, -8.95373523235321e-06, -8.314847946166992e-06, -7.675960659980774e-06, -7.037073373794556e-06, -6.398186087608337e-06, -5.759298801422119e-06, -5.120411515235901e-06, -4.481524229049683e-06, -3.842636942863464e-06, -3.203749656677246e-06, -2.564862370491028e-06, -1.9259750843048096e-06, -1.2870877981185913e-06, -6.48200511932373e-07, -9.313225746154785e-09, 6.295740604400635e-07, 1.2684613466262817e-06, 1.9073486328125e-06, 2.5462359189987183e-06, 3.1851232051849365e-06, 3.824010491371155e-06, 4.462897777557373e-06, 5.101785063743591e-06, 5.7406723499298096e-06, 6.379559636116028e-06, 7.018446922302246e-06, 7.657334208488464e-06, 8.296221494674683e-06, 8.935108780860901e-06, 9.573996067047119e-06, 1.0212883353233337e-05, 1.0851770639419556e-05, 1.1490657925605774e-05, 1.2129545211791992e-05, 1.276843249797821e-05, 1.3407319784164429e-05, 1.4046207070350647e-05, 1.4685094356536865e-05, 1.5323981642723083e-05, 1.5962868928909302e-05, 1.660175621509552e-05, 1.7240643501281738e-05, 1.7879530787467957e-05, 1.8518418073654175e-05, 1.9157305359840393e-05, 1.979619264602661e-05, 2.043507993221283e-05, 2.1073967218399048e-05, 2.1712854504585266e-05, 2.2351741790771484e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 6.0, 9.0, 16.0, 27.0, 63.0, 108.0, 275.0, 561.0, 1380.0, 5444.0, 65238.0, 942693.0, 27087.0, 3542.0, 1140.0, 502.0, 193.0, 121.0, 65.0, 29.0, 14.0, 11.0, 5.0, 6.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.4912109375, -0.48013877868652344, -0.4690666198730469, -0.4579944610595703, -0.44692230224609375, -0.4358501434326172, -0.4247779846191406, -0.41370582580566406, -0.4026336669921875, -0.39156150817871094, -0.3804893493652344, -0.3694171905517578, -0.35834503173828125, -0.3472728729248047, -0.3362007141113281, -0.32512855529785156, -0.314056396484375, -0.30298423767089844, -0.2919120788574219, -0.2808399200439453, -0.26976776123046875, -0.2586956024169922, -0.24762344360351562, -0.23655128479003906, -0.2254791259765625, -0.21440696716308594, -0.20333480834960938, -0.1922626495361328, -0.18119049072265625, -0.1701183319091797, -0.15904617309570312, -0.14797401428222656, -0.13690185546875, -0.12582969665527344, -0.11475753784179688, -0.10368537902832031, -0.09261322021484375, -0.08154106140136719, -0.07046890258789062, -0.05939674377441406, -0.0483245849609375, -0.03725242614746094, -0.026180267333984375, -0.015108108520507812, -0.00403594970703125, 0.0070362091064453125, 0.018108367919921875, 0.029180526733398438, 0.040252685546875, 0.05132484436035156, 0.062397003173828125, 0.07346916198730469, 0.08454132080078125, 0.09561347961425781, 0.10668563842773438, 0.11775779724121094, 0.1288299560546875, 0.13990211486816406, 0.15097427368164062, 0.1620464324951172, 0.17311859130859375, 0.1841907501220703, 0.19526290893554688, 0.20633506774902344, 0.2174072265625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 9.0, 18.0, 21.0, 27.0, 44.0, 77.0, 175.0, 395.0, 113.0, 40.0, 31.0, 13.0, 13.0, 8.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07977294921875, -0.07562541961669922, -0.07147789001464844, -0.06733036041259766, -0.06318283081054688, -0.059035301208496094, -0.05488777160644531, -0.05074024200439453, -0.04659271240234375, -0.04244518280029297, -0.03829765319824219, -0.034150123596191406, -0.030002593994140625, -0.025855064392089844, -0.021707534790039062, -0.01756000518798828, -0.0134124755859375, -0.009264945983886719, -0.0051174163818359375, -0.0009698867797851562, 0.003177642822265625, 0.007325172424316406, 0.011472702026367188, 0.015620231628417969, 0.01976776123046875, 0.02391529083251953, 0.028062820434570312, 0.032210350036621094, 0.036357879638671875, 0.040505409240722656, 0.04465293884277344, 0.04880046844482422, 0.052947998046875, 0.05709552764892578, 0.06124305725097656, 0.06539058685302734, 0.06953811645507812, 0.0736856460571289, 0.07783317565917969, 0.08198070526123047, 0.08612823486328125, 0.09027576446533203, 0.09442329406738281, 0.0985708236694336, 0.10271835327148438, 0.10686588287353516, 0.11101341247558594, 0.11516094207763672, 0.1193084716796875, 0.12345600128173828, 0.12760353088378906, 0.13175106048583984, 0.13589859008789062, 0.1400461196899414, 0.1441936492919922, 0.14834117889404297, 0.15248870849609375, 0.15663623809814453, 0.1607837677001953, 0.1649312973022461, 0.16907882690429688, 0.17322635650634766, 0.17737388610839844, 0.18152141571044922, 0.1856689453125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 7.0, 11.0, 15.0, 15.0, 17.0, 16.0, 22.0, 44.0, 53.0, 57.0, 94.0, 100.0, 85.0, 96.0, 87.0, 70.0, 50.0, 48.0, 28.0, 14.0, 21.0, 17.0, 9.0, 6.0, 0.0, 3.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.6432907581329346, -1.6036268472671509, -1.5639630556106567, -1.524299144744873, -1.4846352338790894, -1.4449713230133057, -1.4053075313568115, -1.3656436204910278, -1.3259797096252441, -1.2863157987594604, -1.2466520071029663, -1.2069880962371826, -1.167324185371399, -1.1276602745056152, -1.087996482849121, -1.0483325719833374, -1.0086686611175537, -0.9690048098564148, -0.9293408989906311, -0.8896770477294922, -0.8500131368637085, -0.8103492856025696, -0.7706854343414307, -0.731021523475647, -0.6913577318191528, -0.6516938805580139, -0.6120299696922302, -0.5723661184310913, -0.5327022075653076, -0.4930383563041687, -0.4533744752407074, -0.4137105941772461, -0.3740467429161072, -0.3343828618526459, -0.29471898078918457, -0.25505512952804565, -0.21539123356342316, -0.17572735249996185, -0.13606348633766174, -0.09639960527420044, -0.056735724210739136, -0.01707184687256813, 0.022592030465602875, 0.06225590407848358, 0.10191978514194489, 0.1415836662054062, 0.1812475323677063, 0.2209114134311676, 0.2605752944946289, 0.3002391755580902, 0.3399030566215515, 0.37956690788269043, 0.4192308187484741, 0.45889467000961304, 0.49855855107307434, 0.5382224321365356, 0.5778863430023193, 0.6175501942634583, 0.6572141051292419, 0.6968779563903809, 0.7365418672561646, 0.7762057185173035, 0.8158695697784424, 0.8555334806442261, 0.895197331905365]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 4.0, 5.0, 5.0, 8.0, 13.0, 15.0, 16.0, 22.0, 30.0, 29.0, 37.0, 38.0, 46.0, 57.0, 49.0, 53.0, 52.0, 70.0, 62.0, 62.0, 65.0, 59.0, 41.0, 33.0, 25.0, 20.0, 21.0, 16.0, 15.0, 21.0, 8.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.650493860244751, -2.583235263824463, -2.515976667404175, -2.4487180709838867, -2.3814594745635986, -2.3142008781433105, -2.2469422817230225, -2.1796836853027344, -2.112424850463867, -2.045166254043579, -1.977907657623291, -1.910649061203003, -1.8433904647827148, -1.7761318683624268, -1.7088731527328491, -1.641614556312561, -1.5743560791015625, -1.5070974826812744, -1.4398388862609863, -1.3725802898406982, -1.3053216934204102, -1.238063097000122, -1.1708043813705444, -1.1035457849502563, -1.0362871885299683, -0.9690285921096802, -0.9017699956893921, -0.8345113396644592, -0.7672527432441711, -0.6999941468238831, -0.6327354907989502, -0.5654768943786621, -0.4982184171676636, -0.4309598207473755, -0.363701194524765, -0.29644256830215454, -0.22918397188186646, -0.16192537546157837, -0.0946667492389679, -0.027408123016357422, 0.039850473403930664, 0.10710908472537994, 0.17436769604682922, 0.2416263073682785, 0.3088849186897278, 0.37614351511001587, 0.44340214133262634, 0.5106607675552368, 0.5779193639755249, 0.645177960395813, 0.7124365568161011, 0.7796952128410339, 0.846953809261322, 0.9142124056816101, 0.981471061706543, 1.048729658126831, 1.1159882545471191, 1.1832468509674072, 1.2505054473876953, 1.3177640438079834, 1.3850226402282715, 1.4522812366485596, 1.5195399522781372, 1.5867985486984253, 1.6540571451187134]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 6.0, 0.0, 4.0, 3.0, 9.0, 12.0, 13.0, 13.0, 21.0, 23.0, 32.0, 63.0, 71.0, 97.0, 152.0, 215.0, 317.0, 470.0, 692.0, 1055.0, 1672.0, 2878.0, 5296.0, 11293.0, 36011.0, 332132.0, 2778930.0, 906097.0, 81995.0, 18213.0, 7083.0, 3608.0, 2123.0, 1250.0, 828.0, 513.0, 355.0, 238.0, 156.0, 111.0, 64.0, 51.0, 39.0, 22.0, 19.0, 15.0, 13.0, 8.0, 5.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.9267578125, -0.8992538452148438, -0.8717498779296875, -0.8442459106445312, -0.816741943359375, -0.7892379760742188, -0.7617340087890625, -0.7342300415039062, -0.70672607421875, -0.6792221069335938, -0.6517181396484375, -0.6242141723632812, -0.596710205078125, -0.5692062377929688, -0.5417022705078125, -0.5141983032226562, -0.4866943359375, -0.45919036865234375, -0.4316864013671875, -0.40418243408203125, -0.376678466796875, -0.34917449951171875, -0.3216705322265625, -0.29416656494140625, -0.26666259765625, -0.23915863037109375, -0.2116546630859375, -0.18415069580078125, -0.156646728515625, -0.12914276123046875, -0.1016387939453125, -0.07413482666015625, -0.046630859375, -0.01912689208984375, 0.0083770751953125, 0.03588104248046875, 0.063385009765625, 0.09088897705078125, 0.1183929443359375, 0.14589691162109375, 0.17340087890625, 0.20090484619140625, 0.2284088134765625, 0.25591278076171875, 0.283416748046875, 0.31092071533203125, 0.3384246826171875, 0.36592864990234375, 0.3934326171875, 0.42093658447265625, 0.4484405517578125, 0.47594451904296875, 0.503448486328125, 0.5309524536132812, 0.5584564208984375, 0.5859603881835938, 0.61346435546875, 0.6409683227539062, 0.6684722900390625, 0.6959762573242188, 0.723480224609375, 0.7509841918945312, 0.7784881591796875, 0.8059921264648438, 0.83349609375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 3.0, 6.0, 7.0, 6.0, 9.0, 17.0, 23.0, 23.0, 27.0, 29.0, 39.0, 42.0, 36.0, 50.0, 59.0, 62.0, 55.0, 43.0, 48.0, 54.0, 49.0, 58.0, 48.0, 39.0, 38.0, 27.0, 30.0, 22.0, 11.0, 7.0, 10.0, 10.0, 5.0, 5.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.587890625, -0.570159912109375, -0.55242919921875, -0.534698486328125, -0.5169677734375, -0.499237060546875, -0.48150634765625, -0.463775634765625, -0.446044921875, -0.428314208984375, -0.41058349609375, -0.392852783203125, -0.3751220703125, -0.357391357421875, -0.33966064453125, -0.321929931640625, -0.30419921875, -0.286468505859375, -0.26873779296875, -0.251007080078125, -0.2332763671875, -0.215545654296875, -0.19781494140625, -0.180084228515625, -0.162353515625, -0.144622802734375, -0.12689208984375, -0.109161376953125, -0.0914306640625, -0.073699951171875, -0.05596923828125, -0.038238525390625, -0.0205078125, -0.002777099609375, 0.01495361328125, 0.032684326171875, 0.0504150390625, 0.068145751953125, 0.08587646484375, 0.103607177734375, 0.121337890625, 0.139068603515625, 0.15679931640625, 0.174530029296875, 0.1922607421875, 0.209991455078125, 0.22772216796875, 0.245452880859375, 0.26318359375, 0.280914306640625, 0.29864501953125, 0.316375732421875, 0.3341064453125, 0.351837158203125, 0.36956787109375, 0.387298583984375, 0.405029296875, 0.422760009765625, 0.44049072265625, 0.458221435546875, 0.4759521484375, 0.493682861328125, 0.51141357421875, 0.529144287109375, 0.546875]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 14.0, 19.0, 15.0, 21.0, 43.0, 64.0, 115.0, 132.0, 265.0, 561.0, 1165.0, 2919.0, 8009.0, 27925.0, 186335.0, 3695809.0, 226985.0, 29776.0, 8418.0, 3096.0, 1223.0, 604.0, 296.0, 149.0, 90.0, 82.0, 43.0, 23.0, 24.0, 17.0, 12.0, 8.0, 6.0, 3.0, 3.0, 0.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3193359375, -1.2811279296875, -1.242919921875, -1.2047119140625, -1.16650390625, -1.1282958984375, -1.090087890625, -1.0518798828125, -1.013671875, -0.9754638671875, -0.937255859375, -0.8990478515625, -0.86083984375, -0.8226318359375, -0.784423828125, -0.7462158203125, -0.7080078125, -0.6697998046875, -0.631591796875, -0.5933837890625, -0.55517578125, -0.5169677734375, -0.478759765625, -0.4405517578125, -0.40234375, -0.3641357421875, -0.325927734375, -0.2877197265625, -0.24951171875, -0.2113037109375, -0.173095703125, -0.1348876953125, -0.0966796875, -0.0584716796875, -0.020263671875, 0.0179443359375, 0.05615234375, 0.0943603515625, 0.132568359375, 0.1707763671875, 0.208984375, 0.2471923828125, 0.285400390625, 0.3236083984375, 0.36181640625, 0.4000244140625, 0.438232421875, 0.4764404296875, 0.5146484375, 0.5528564453125, 0.591064453125, 0.6292724609375, 0.66748046875, 0.7056884765625, 0.743896484375, 0.7821044921875, 0.8203125, 0.8585205078125, 0.896728515625, 0.9349365234375, 0.97314453125, 1.0113525390625, 1.049560546875, 1.0877685546875, 1.1259765625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 8.0, 12.0, 5.0, 8.0, 19.0, 17.0, 33.0, 30.0, 59.0, 56.0, 99.0, 143.0, 298.0, 558.0, 832.0, 760.0, 461.0, 258.0, 131.0, 70.0, 51.0, 24.0, 35.0, 12.0, 12.0, 15.0, 14.0, 5.0, 11.0, 6.0, 7.0, 4.0, 2.0, 1.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.28466796875, -0.2747993469238281, -0.26493072509765625, -0.2550621032714844, -0.2451934814453125, -0.23532485961914062, -0.22545623779296875, -0.21558761596679688, -0.205718994140625, -0.19585037231445312, -0.18598175048828125, -0.17611312866210938, -0.1662445068359375, -0.15637588500976562, -0.14650726318359375, -0.13663864135742188, -0.12677001953125, -0.11690139770507812, -0.10703277587890625, -0.09716415405273438, -0.0872955322265625, -0.07742691040039062, -0.06755828857421875, -0.057689666748046875, -0.047821044921875, -0.037952423095703125, -0.02808380126953125, -0.018215179443359375, -0.0083465576171875, 0.001522064208984375, 0.01139068603515625, 0.021259307861328125, 0.0311279296875, 0.040996551513671875, 0.05086517333984375, 0.060733795166015625, 0.0706024169921875, 0.08047103881835938, 0.09033966064453125, 0.10020828247070312, 0.110076904296875, 0.11994552612304688, 0.12981414794921875, 0.13968276977539062, 0.1495513916015625, 0.15942001342773438, 0.16928863525390625, 0.17915725708007812, 0.18902587890625, 0.19889450073242188, 0.20876312255859375, 0.21863174438476562, 0.2285003662109375, 0.23836898803710938, 0.24823760986328125, 0.2581062316894531, 0.267974853515625, 0.2778434753417969, 0.28771209716796875, 0.2975807189941406, 0.3074493408203125, 0.3173179626464844, 0.32718658447265625, 0.3370552062988281, 0.346923828125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 4.0, 3.0, 3.0, 13.0, 14.0, 6.0, 14.0, 33.0, 35.0, 56.0, 62.0, 82.0, 96.0, 113.0, 95.0, 95.0, 60.0, 53.0, 51.0, 26.0, 27.0, 19.0, 13.0, 8.0, 5.0, 6.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.083686113357544, -1.052344560623169, -1.0210031270980835, -0.9896615743637085, -0.9583200216293335, -0.9269785284996033, -0.895637035369873, -0.864295482635498, -0.832953929901123, -0.8016124367713928, -0.7702708840370178, -0.7389293909072876, -0.7075878381729126, -0.6762463450431824, -0.6449048519134521, -0.6135632991790771, -0.5822218060493469, -0.5508803129196167, -0.5195387601852417, -0.4881972670555115, -0.4568557143211365, -0.42551422119140625, -0.39417269825935364, -0.362831175327301, -0.3314896523952484, -0.3001481294631958, -0.2688066065311432, -0.23746509850025177, -0.20612357556819916, -0.17478205263614655, -0.14344054460525513, -0.11209902167320251, -0.08075755834579468, -0.049416039139032364, -0.01807451993227005, 0.013266995549201965, 0.04460851848125458, 0.07595004141330719, 0.10729154944419861, 0.13863307237625122, 0.16997459530830383, 0.20131611824035645, 0.23265764117240906, 0.26399916410446167, 0.2953406572341919, 0.3266822099685669, 0.3580237030982971, 0.38936522603034973, 0.42070674896240234, 0.45204827189445496, 0.48338979482650757, 0.5147312879562378, 0.5460728406906128, 0.577414333820343, 0.6087558269500732, 0.6400973796844482, 0.6714389324188232, 0.7027804255485535, 0.7341219782829285, 0.7654634714126587, 0.7968050241470337, 0.8281465172767639, 0.8594880104064941, 0.8908295631408691, 0.9221710562705994]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 3.0, 3.0, 8.0, 11.0, 14.0, 9.0, 6.0, 15.0, 11.0, 27.0, 23.0, 26.0, 22.0, 29.0, 42.0, 45.0, 40.0, 30.0, 34.0, 62.0, 50.0, 41.0, 42.0, 44.0, 31.0, 42.0, 27.0, 29.0, 22.0, 35.0, 24.0, 29.0, 22.0, 24.0, 16.0, 15.0, 19.0, 9.0, 4.0, 1.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5944231152534485, -0.576090395450592, -0.5577577352523804, -0.5394250154495239, -0.5210923552513123, -0.5027596354484558, -0.48442694544792175, -0.4660942554473877, -0.44776156544685364, -0.4294288754463196, -0.4110961854457855, -0.39276349544525146, -0.374430775642395, -0.35609811544418335, -0.3377653956413269, -0.31943270564079285, -0.3011000156402588, -0.28276732563972473, -0.2644346356391907, -0.24610193073749542, -0.22776924073696136, -0.2094365507364273, -0.19110384583473206, -0.172771155834198, -0.15443846583366394, -0.13610577583312988, -0.11777307838201523, -0.09944038093090057, -0.08110769093036652, -0.06277500092983246, -0.044442303478717804, -0.02610960602760315, -0.007776856422424316, 0.01055583730340004, 0.028888531029224396, 0.04722122475504875, 0.06555391848087311, 0.08388660848140717, 0.10221930593252182, 0.12055200338363647, 0.13888469338417053, 0.1572173833847046, 0.17555007338523865, 0.1938827782869339, 0.21221546828746796, 0.23054815828800201, 0.24888086318969727, 0.2672135531902313, 0.2855462431907654, 0.30387893319129944, 0.3222116231918335, 0.34054431319236755, 0.3588770031929016, 0.37720972299575806, 0.3955424129962921, 0.41387510299682617, 0.43220779299736023, 0.4505404829978943, 0.46887317299842834, 0.4872058629989624, 0.5055385828018188, 0.5238712430000305, 0.542203962802887, 0.5605366230010986, 0.5788693428039551]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 6.0, 11.0, 13.0, 15.0, 18.0, 20.0, 32.0, 43.0, 75.0, 84.0, 118.0, 254.0, 436.0, 717.0, 1602.0, 3646.0, 9341.0, 29426.0, 125476.0, 620303.0, 195619.0, 40511.0, 12130.0, 4557.0, 1936.0, 897.0, 480.0, 264.0, 145.0, 115.0, 73.0, 49.0, 36.0, 31.0, 13.0, 20.0, 15.0, 4.0, 5.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0], "bins": [-0.1905517578125, -0.1853485107421875, -0.180145263671875, -0.1749420166015625, -0.16973876953125, -0.1645355224609375, -0.159332275390625, -0.1541290283203125, -0.14892578125, -0.1437225341796875, -0.138519287109375, -0.1333160400390625, -0.12811279296875, -0.1229095458984375, -0.117706298828125, -0.1125030517578125, -0.1072998046875, -0.1020965576171875, -0.096893310546875, -0.0916900634765625, -0.08648681640625, -0.0812835693359375, -0.076080322265625, -0.0708770751953125, -0.065673828125, -0.0604705810546875, -0.055267333984375, -0.0500640869140625, -0.04486083984375, -0.0396575927734375, -0.034454345703125, -0.0292510986328125, -0.0240478515625, -0.0188446044921875, -0.013641357421875, -0.0084381103515625, -0.00323486328125, 0.0019683837890625, 0.007171630859375, 0.0123748779296875, 0.017578125, 0.0227813720703125, 0.027984619140625, 0.0331878662109375, 0.03839111328125, 0.0435943603515625, 0.048797607421875, 0.0540008544921875, 0.0592041015625, 0.0644073486328125, 0.069610595703125, 0.0748138427734375, 0.08001708984375, 0.0852203369140625, 0.090423583984375, 0.0956268310546875, 0.100830078125, 0.1060333251953125, 0.111236572265625, 0.1164398193359375, 0.12164306640625, 0.1268463134765625, 0.132049560546875, 0.1372528076171875, 0.1424560546875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 9.0, 11.0, 16.0, 8.0, 12.0, 26.0, 21.0, 20.0, 36.0, 37.0, 34.0, 39.0, 41.0, 43.0, 50.0, 63.0, 43.0, 39.0, 53.0, 54.0, 38.0, 44.0, 32.0, 34.0, 24.0, 28.0, 21.0, 22.0, 19.0, 12.0, 16.0, 10.0, 9.0, 8.0, 2.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.427734375, -0.4160308837890625, -0.404327392578125, -0.3926239013671875, -0.38092041015625, -0.3692169189453125, -0.357513427734375, -0.3458099365234375, -0.3341064453125, -0.3224029541015625, -0.310699462890625, -0.2989959716796875, -0.28729248046875, -0.2755889892578125, -0.263885498046875, -0.2521820068359375, -0.240478515625, -0.2287750244140625, -0.217071533203125, -0.2053680419921875, -0.19366455078125, -0.1819610595703125, -0.170257568359375, -0.1585540771484375, -0.1468505859375, -0.1351470947265625, -0.123443603515625, -0.1117401123046875, -0.10003662109375, -0.0883331298828125, -0.076629638671875, -0.0649261474609375, -0.05322265625, -0.0415191650390625, -0.029815673828125, -0.0181121826171875, -0.00640869140625, 0.0052947998046875, 0.016998291015625, 0.0287017822265625, 0.0404052734375, 0.0521087646484375, 0.063812255859375, 0.0755157470703125, 0.08721923828125, 0.0989227294921875, 0.110626220703125, 0.1223297119140625, 0.134033203125, 0.1457366943359375, 0.157440185546875, 0.1691436767578125, 0.18084716796875, 0.1925506591796875, 0.204254150390625, 0.2159576416015625, 0.2276611328125, 0.2393646240234375, 0.251068115234375, 0.2627716064453125, 0.27447509765625, 0.2861785888671875, 0.297882080078125, 0.3095855712890625, 0.3212890625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 7.0, 2.0, 5.0, 4.0, 3.0, 3.0, 15.0, 18.0, 26.0, 42.0, 55.0, 79.0, 107.0, 163.0, 185.0, 302.0, 428.0, 688.0, 1034.0, 1539.0, 2269.0, 3513.0, 5496.0, 8682.0, 13714.0, 22194.0, 38462.0, 67663.0, 128344.0, 222494.0, 226474.0, 132031.0, 70585.0, 39509.0, 23188.0, 13932.0, 8844.0, 5615.0, 3635.0, 2385.0, 1537.0, 1037.0, 713.0, 478.0, 324.0, 226.0, 154.0, 116.0, 74.0, 58.0, 29.0, 22.0, 23.0, 17.0, 6.0, 12.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.03594970703125, -0.034827232360839844, -0.03370475769042969, -0.03258228302001953, -0.031459808349609375, -0.03033733367919922, -0.029214859008789062, -0.028092384338378906, -0.02696990966796875, -0.025847434997558594, -0.024724960327148438, -0.02360248565673828, -0.022480010986328125, -0.02135753631591797, -0.020235061645507812, -0.019112586975097656, -0.0179901123046875, -0.016867637634277344, -0.015745162963867188, -0.014622688293457031, -0.013500213623046875, -0.012377738952636719, -0.011255264282226562, -0.010132789611816406, -0.00901031494140625, -0.007887840270996094, -0.0067653656005859375, -0.005642890930175781, -0.004520416259765625, -0.0033979415893554688, -0.0022754669189453125, -0.0011529922485351562, -3.0517578125e-05, 0.0010919570922851562, 0.0022144317626953125, 0.0033369064331054688, 0.004459381103515625, 0.005581855773925781, 0.0067043304443359375, 0.007826805114746094, 0.00894927978515625, 0.010071754455566406, 0.011194229125976562, 0.012316703796386719, 0.013439178466796875, 0.014561653137207031, 0.015684127807617188, 0.016806602478027344, 0.0179290771484375, 0.019051551818847656, 0.020174026489257812, 0.02129650115966797, 0.022418975830078125, 0.02354145050048828, 0.024663925170898438, 0.025786399841308594, 0.02690887451171875, 0.028031349182128906, 0.029153823852539062, 0.03027629852294922, 0.031398773193359375, 0.03252124786376953, 0.03364372253417969, 0.034766197204589844, 0.035888671875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 3.0, 10.0, 5.0, 7.0, 17.0, 15.0, 13.0, 24.0, 14.0, 19.0, 34.0, 29.0, 30.0, 41.0, 49.0, 50.0, 54.0, 44.0, 53.0, 47.0, 31.0, 48.0, 37.0, 45.0, 36.0, 39.0, 44.0, 25.0, 28.0, 16.0, 18.0, 14.0, 11.0, 9.0, 5.0, 8.0, 7.0, 6.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.74853515625, -0.7251739501953125, -0.701812744140625, -0.6784515380859375, -0.65509033203125, -0.6317291259765625, -0.608367919921875, -0.5850067138671875, -0.5616455078125, -0.5382843017578125, -0.514923095703125, -0.4915618896484375, -0.46820068359375, -0.4448394775390625, -0.421478271484375, -0.3981170654296875, -0.374755859375, -0.3513946533203125, -0.328033447265625, -0.3046722412109375, -0.28131103515625, -0.2579498291015625, -0.234588623046875, -0.2112274169921875, -0.1878662109375, -0.1645050048828125, -0.141143798828125, -0.1177825927734375, -0.09442138671875, -0.0710601806640625, -0.047698974609375, -0.0243377685546875, -0.0009765625, 0.0223846435546875, 0.045745849609375, 0.0691070556640625, 0.09246826171875, 0.1158294677734375, 0.139190673828125, 0.1625518798828125, 0.1859130859375, 0.2092742919921875, 0.232635498046875, 0.2559967041015625, 0.27935791015625, 0.3027191162109375, 0.326080322265625, 0.3494415283203125, 0.372802734375, 0.3961639404296875, 0.419525146484375, 0.4428863525390625, 0.46624755859375, 0.4896087646484375, 0.512969970703125, 0.5363311767578125, 0.5596923828125, 0.5830535888671875, 0.606414794921875, 0.6297760009765625, 0.65313720703125, 0.6764984130859375, 0.699859619140625, 0.7232208251953125, 0.74658203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 0.0, 3.0, 4.0, 4.0, 0.0, 9.0, 5.0, 9.0, 13.0, 16.0, 23.0, 47.0, 84.0, 144.0, 246.0, 434.0, 877.0, 1961.0, 4908.0, 15892.0, 75521.0, 460907.0, 400283.0, 64502.0, 14288.0, 4551.0, 1876.0, 917.0, 436.0, 241.0, 130.0, 78.0, 45.0, 32.0, 27.0, 14.0, 7.0, 9.0, 3.0, 7.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01210784912109375, -0.01170361042022705, -0.011299371719360352, -0.010895133018493652, -0.010490894317626953, -0.010086655616760254, -0.009682416915893555, -0.009278178215026855, -0.008873939514160156, -0.008469700813293457, -0.008065462112426758, -0.007661223411560059, -0.007256984710693359, -0.00685274600982666, -0.006448507308959961, -0.006044268608093262, -0.0056400299072265625, -0.005235791206359863, -0.004831552505493164, -0.004427313804626465, -0.004023075103759766, -0.0036188364028930664, -0.003214597702026367, -0.002810359001159668, -0.0024061203002929688, -0.0020018815994262695, -0.0015976428985595703, -0.001193404197692871, -0.0007891654968261719, -0.00038492679595947266, 1.9311904907226562e-05, 0.0004235506057739258, 0.000827789306640625, 0.0012320280075073242, 0.0016362667083740234, 0.0020405054092407227, 0.002444744110107422, 0.002848982810974121, 0.0032532215118408203, 0.0036574602127075195, 0.004061698913574219, 0.004465937614440918, 0.004870176315307617, 0.005274415016174316, 0.005678653717041016, 0.006082892417907715, 0.006487131118774414, 0.006891369819641113, 0.0072956085205078125, 0.007699847221374512, 0.008104085922241211, 0.00850832462310791, 0.00891256332397461, 0.009316802024841309, 0.009721040725708008, 0.010125279426574707, 0.010529518127441406, 0.010933756828308105, 0.011337995529174805, 0.011742234230041504, 0.012146472930908203, 0.012550711631774902, 0.012954950332641602, 0.0133591890335083, 0.013763427734375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 1.0, 3.0, 9.0, 5.0, 9.0, 17.0, 10.0, 23.0, 24.0, 27.0, 26.0, 50.0, 57.0, 64.0, 72.0, 100.0, 108.0, 85.0, 72.0, 51.0, 37.0, 35.0, 25.0, 20.0, 20.0, 6.0, 10.0, 12.0, 5.0, 4.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.341104507446289e-05, -1.2821517884731293e-05, -1.2231990694999695e-05, -1.1642463505268097e-05, -1.1052936315536499e-05, -1.0463409125804901e-05, -9.873881936073303e-06, -9.284354746341705e-06, -8.694827556610107e-06, -8.10530036687851e-06, -7.515773177146912e-06, -6.926245987415314e-06, -6.336718797683716e-06, -5.747191607952118e-06, -5.15766441822052e-06, -4.568137228488922e-06, -3.978610038757324e-06, -3.3890828490257263e-06, -2.7995556592941284e-06, -2.2100284695625305e-06, -1.6205012798309326e-06, -1.0309740900993347e-06, -4.414469003677368e-07, 1.4808028936386108e-07, 7.37607479095459e-07, 1.3271346688270569e-06, 1.9166618585586548e-06, 2.5061890482902527e-06, 3.0957162380218506e-06, 3.6852434277534485e-06, 4.274770617485046e-06, 4.864297807216644e-06, 5.453824996948242e-06, 6.04335218667984e-06, 6.632879376411438e-06, 7.222406566143036e-06, 7.811933755874634e-06, 8.401460945606232e-06, 8.99098813533783e-06, 9.580515325069427e-06, 1.0170042514801025e-05, 1.0759569704532623e-05, 1.1349096894264221e-05, 1.1938624083995819e-05, 1.2528151273727417e-05, 1.3117678463459015e-05, 1.3707205653190613e-05, 1.429673284292221e-05, 1.4886260032653809e-05, 1.5475787222385406e-05, 1.6065314412117004e-05, 1.6654841601848602e-05, 1.72443687915802e-05, 1.7833895981311798e-05, 1.8423423171043396e-05, 1.9012950360774994e-05, 1.9602477550506592e-05, 2.019200474023819e-05, 2.0781531929969788e-05, 2.1371059119701385e-05, 2.1960586309432983e-05, 2.255011349916458e-05, 2.313964068889618e-05, 2.3729167878627777e-05, 2.4318695068359375e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 1.0, 7.0, 9.0, 15.0, 21.0, 28.0, 39.0, 55.0, 81.0, 118.0, 219.0, 417.0, 1041.0, 3361.0, 15809.0, 189758.0, 776628.0, 50203.0, 7397.0, 1854.0, 704.0, 300.0, 177.0, 96.0, 64.0, 55.0, 26.0, 20.0, 13.0, 11.0, 12.0, 8.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0281524658203125, -0.02739715576171875, -0.026641845703125, -0.02588653564453125, -0.0251312255859375, -0.02437591552734375, -0.02362060546875, -0.02286529541015625, -0.0221099853515625, -0.02135467529296875, -0.020599365234375, -0.01984405517578125, -0.0190887451171875, -0.01833343505859375, -0.017578125, -0.01682281494140625, -0.0160675048828125, -0.01531219482421875, -0.014556884765625, -0.01380157470703125, -0.0130462646484375, -0.01229095458984375, -0.01153564453125, -0.01078033447265625, -0.0100250244140625, -0.00926971435546875, -0.008514404296875, -0.00775909423828125, -0.0070037841796875, -0.00624847412109375, -0.0054931640625, -0.00473785400390625, -0.0039825439453125, -0.00322723388671875, -0.002471923828125, -0.00171661376953125, -0.0009613037109375, -0.00020599365234375, 0.00054931640625, 0.00130462646484375, 0.0020599365234375, 0.00281524658203125, 0.003570556640625, 0.00432586669921875, 0.0050811767578125, 0.00583648681640625, 0.006591796875, 0.00734710693359375, 0.0081024169921875, 0.00885772705078125, 0.009613037109375, 0.01036834716796875, 0.0111236572265625, 0.01187896728515625, 0.01263427734375, 0.01338958740234375, 0.0141448974609375, 0.01490020751953125, 0.015655517578125, 0.01641082763671875, 0.0171661376953125, 0.01792144775390625, 0.0186767578125, 0.01943206787109375, 0.0201873779296875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 6.0, 17.0, 23.0, 20.0, 39.0, 50.0, 107.0, 165.0, 208.0, 136.0, 77.0, 49.0, 25.0, 26.0, 11.0, 12.0, 8.0, 10.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004070281982421875, -0.003915369510650635, -0.0037604570388793945, -0.0036055445671081543, -0.003450632095336914, -0.003295719623565674, -0.0031408071517944336, -0.0029858946800231934, -0.002830982208251953, -0.002676069736480713, -0.0025211572647094727, -0.0023662447929382324, -0.002211332321166992, -0.002056419849395752, -0.0019015073776245117, -0.0017465949058532715, -0.0015916824340820312, -0.001436769962310791, -0.0012818574905395508, -0.0011269450187683105, -0.0009720325469970703, -0.0008171200752258301, -0.0006622076034545898, -0.0005072951316833496, -0.0003523826599121094, -0.00019747018814086914, -4.2557716369628906e-05, 0.00011235475540161133, 0.00026726722717285156, 0.0004221796989440918, 0.000577092170715332, 0.0007320046424865723, 0.0008869171142578125, 0.0010418295860290527, 0.001196742057800293, 0.0013516545295715332, 0.0015065670013427734, 0.0016614794731140137, 0.001816391944885254, 0.001971304416656494, 0.0021262168884277344, 0.0022811293601989746, 0.002436041831970215, 0.002590954303741455, 0.0027458667755126953, 0.0029007792472839355, 0.0030556917190551758, 0.003210604190826416, 0.0033655166625976562, 0.0035204291343688965, 0.0036753416061401367, 0.003830254077911377, 0.003985166549682617, 0.004140079021453857, 0.004294991493225098, 0.004449903964996338, 0.004604816436767578, 0.004759728908538818, 0.004914641380310059, 0.005069553852081299, 0.005224466323852539, 0.005379378795623779, 0.0055342912673950195, 0.00568920373916626, 0.0058441162109375]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 4.0, 7.0, 20.0, 15.0, 15.0, 34.0, 43.0, 63.0, 77.0, 99.0, 103.0, 128.0, 89.0, 68.0, 57.0, 53.0, 34.0, 28.0, 24.0, 9.0, 9.0, 5.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7030730247497559, -0.6840977072715759, -0.665122389793396, -0.6461471319198608, -0.6271718144416809, -0.608196496963501, -0.589221179485321, -0.5702458620071411, -0.551270604133606, -0.532295286655426, -0.5133199691772461, -0.49434468150138855, -0.475369393825531, -0.4563940763473511, -0.43741875886917114, -0.4184434413909912, -0.3994681239128113, -0.38049280643463135, -0.3615175187587738, -0.34254220128059387, -0.32356691360473633, -0.3045915961265564, -0.28561627864837646, -0.26664096117019653, -0.247665673494339, -0.22869037091732025, -0.2097150683403015, -0.19073975086212158, -0.17176444828510284, -0.1527891457080841, -0.13381382822990417, -0.11483852565288544, -0.0958632230758667, -0.07688792049884796, -0.05791261047124863, -0.03893730416893959, -0.019961997866630554, -0.0009866952896118164, 0.01798861473798752, 0.03696392476558685, 0.05593922734260559, 0.07491452991962433, 0.09388983994722366, 0.112865149974823, 0.13184045255184174, 0.15081575512886047, 0.1697910726070404, 0.18876637518405914, 0.20774167776107788, 0.22671698033809662, 0.24569228291511536, 0.2646676003932953, 0.28364288806915283, 0.30261820554733276, 0.3215935230255127, 0.3405688405036926, 0.35954412817955017, 0.3785194456577301, 0.39749473333358765, 0.4164700508117676, 0.4354453682899475, 0.45442065596580505, 0.473395973443985, 0.49237126111984253, 0.5113465785980225]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 6.0, 4.0, 12.0, 7.0, 14.0, 9.0, 12.0, 10.0, 22.0, 31.0, 21.0, 34.0, 37.0, 49.0, 38.0, 38.0, 40.0, 60.0, 57.0, 47.0, 48.0, 41.0, 32.0, 52.0, 27.0, 26.0, 31.0, 37.0, 20.0, 31.0, 23.0, 17.0, 21.0, 13.0, 10.0, 5.0, 3.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.4061678349971771, -0.3949478268623352, -0.3837278187274933, -0.37250781059265137, -0.36128777265548706, -0.35006776452064514, -0.3388477563858032, -0.3276277482509613, -0.3164077401161194, -0.30518773198127747, -0.29396772384643555, -0.28274768590927124, -0.2715276777744293, -0.2603076696395874, -0.24908766150474548, -0.23786765336990356, -0.22664761543273926, -0.21542760729789734, -0.20420758426189423, -0.1929875761270523, -0.1817675530910492, -0.17054754495620728, -0.15932753682136536, -0.14810752868652344, -0.13688750565052032, -0.1256674975156784, -0.11444747447967529, -0.10322746634483337, -0.09200745075941086, -0.08078743517398834, -0.06956742703914642, -0.05834741145372391, -0.04712739586830139, -0.035907380282878876, -0.02468736842274666, -0.013467356562614441, -0.002247340977191925, 0.00897267460823059, 0.02019268274307251, 0.031412698328495026, 0.04263271391391754, 0.05385272949934006, 0.06507274508476257, 0.07629275321960449, 0.08751276880502701, 0.09873278439044952, 0.10995279252529144, 0.12117280811071396, 0.13239282369613647, 0.1436128318309784, 0.1548328548669815, 0.16605286300182343, 0.17727288603782654, 0.18849289417266846, 0.19971290230751038, 0.2109329104423523, 0.2221529334783554, 0.23337294161319733, 0.24459296464920044, 0.25581297278404236, 0.2670329809188843, 0.2782530188560486, 0.2894729971885681, 0.3006930351257324, 0.31191304326057434]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 4.0, 10.0, 9.0, 16.0, 11.0, 16.0, 43.0, 38.0, 57.0, 84.0, 118.0, 174.0, 234.0, 339.0, 505.0, 801.0, 1205.0, 1966.0, 3208.0, 5491.0, 10023.0, 19083.0, 40215.0, 113802.0, 560512.0, 184432.0, 53119.0, 23818.0, 12220.0, 6669.0, 3820.0, 2288.0, 1443.0, 916.0, 580.0, 365.0, 278.0, 201.0, 136.0, 85.0, 68.0, 39.0, 31.0, 25.0, 24.0, 10.0, 8.0, 6.0, 3.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.53955078125, -0.5225067138671875, -0.505462646484375, -0.4884185791015625, -0.47137451171875, -0.4543304443359375, -0.437286376953125, -0.4202423095703125, -0.4031982421875, -0.3861541748046875, -0.369110107421875, -0.3520660400390625, -0.33502197265625, -0.3179779052734375, -0.300933837890625, -0.2838897705078125, -0.266845703125, -0.2498016357421875, -0.232757568359375, -0.2157135009765625, -0.19866943359375, -0.1816253662109375, -0.164581298828125, -0.1475372314453125, -0.1304931640625, -0.1134490966796875, -0.096405029296875, -0.0793609619140625, -0.06231689453125, -0.0452728271484375, -0.028228759765625, -0.0111846923828125, 0.005859375, 0.0229034423828125, 0.039947509765625, 0.0569915771484375, 0.07403564453125, 0.0910797119140625, 0.108123779296875, 0.1251678466796875, 0.1422119140625, 0.1592559814453125, 0.176300048828125, 0.1933441162109375, 0.21038818359375, 0.2274322509765625, 0.244476318359375, 0.2615203857421875, 0.278564453125, 0.2956085205078125, 0.312652587890625, 0.3296966552734375, 0.34674072265625, 0.3637847900390625, 0.380828857421875, 0.3978729248046875, 0.4149169921875, 0.4319610595703125, 0.449005126953125, 0.4660491943359375, 0.48309326171875, 0.5001373291015625, 0.517181396484375, 0.5342254638671875, 0.55126953125]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 9.0, 9.0, 7.0, 11.0, 22.0, 18.0, 22.0, 17.0, 30.0, 34.0, 43.0, 50.0, 51.0, 55.0, 60.0, 54.0, 54.0, 55.0, 58.0, 41.0, 30.0, 46.0, 34.0, 33.0, 24.0, 20.0, 17.0, 20.0, 17.0, 16.0, 11.0, 10.0, 6.0, 5.0, 1.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87255859375, -0.8478240966796875, -0.823089599609375, -0.7983551025390625, -0.77362060546875, -0.7488861083984375, -0.724151611328125, -0.6994171142578125, -0.6746826171875, -0.6499481201171875, -0.625213623046875, -0.6004791259765625, -0.57574462890625, -0.5510101318359375, -0.526275634765625, -0.5015411376953125, -0.476806640625, -0.4520721435546875, -0.427337646484375, -0.4026031494140625, -0.37786865234375, -0.3531341552734375, -0.328399658203125, -0.3036651611328125, -0.2789306640625, -0.2541961669921875, -0.229461669921875, -0.2047271728515625, -0.17999267578125, -0.1552581787109375, -0.130523681640625, -0.1057891845703125, -0.0810546875, -0.0563201904296875, -0.031585693359375, -0.0068511962890625, 0.01788330078125, 0.0426177978515625, 0.067352294921875, 0.0920867919921875, 0.1168212890625, 0.1415557861328125, 0.166290283203125, 0.1910247802734375, 0.21575927734375, 0.2404937744140625, 0.265228271484375, 0.2899627685546875, 0.314697265625, 0.3394317626953125, 0.364166259765625, 0.3889007568359375, 0.41363525390625, 0.4383697509765625, 0.463104248046875, 0.4878387451171875, 0.5125732421875, 0.5373077392578125, 0.562042236328125, 0.5867767333984375, 0.61151123046875, 0.6362457275390625, 0.660980224609375, 0.6857147216796875, 0.71044921875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 8.0, 3.0, 9.0, 14.0, 14.0, 26.0, 33.0, 30.0, 65.0, 104.0, 136.0, 231.0, 401.0, 635.0, 1249.0, 2219.0, 4547.0, 10626.0, 28951.0, 116547.0, 746267.0, 92830.0, 25139.0, 9501.0, 4203.0, 2063.0, 1081.0, 618.0, 353.0, 218.0, 131.0, 78.0, 72.0, 46.0, 25.0, 22.0, 19.0, 11.0, 7.0, 5.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89501953125, -0.8646163940429688, -0.8342132568359375, -0.8038101196289062, -0.773406982421875, -0.7430038452148438, -0.7126007080078125, -0.6821975708007812, -0.65179443359375, -0.6213912963867188, -0.5909881591796875, -0.5605850219726562, -0.530181884765625, -0.49977874755859375, -0.4693756103515625, -0.43897247314453125, -0.4085693359375, -0.37816619873046875, -0.3477630615234375, -0.31735992431640625, -0.286956787109375, -0.25655364990234375, -0.2261505126953125, -0.19574737548828125, -0.16534423828125, -0.13494110107421875, -0.1045379638671875, -0.07413482666015625, -0.043731689453125, -0.01332855224609375, 0.0170745849609375, 0.04747772216796875, 0.077880859375, 0.10828399658203125, 0.1386871337890625, 0.16909027099609375, 0.199493408203125, 0.22989654541015625, 0.2602996826171875, 0.29070281982421875, 0.32110595703125, 0.35150909423828125, 0.3819122314453125, 0.41231536865234375, 0.442718505859375, 0.47312164306640625, 0.5035247802734375, 0.5339279174804688, 0.5643310546875, 0.5947341918945312, 0.6251373291015625, 0.6555404663085938, 0.685943603515625, 0.7163467407226562, 0.7467498779296875, 0.7771530151367188, 0.80755615234375, 0.8379592895507812, 0.8683624267578125, 0.8987655639648438, 0.929168701171875, 0.9595718383789062, 0.9899749755859375, 1.0203781127929688, 1.05078125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 9.0, 3.0, 12.0, 8.0, 10.0, 10.0, 21.0, 24.0, 25.0, 27.0, 25.0, 36.0, 44.0, 40.0, 45.0, 55.0, 48.0, 48.0, 62.0, 51.0, 50.0, 50.0, 40.0, 44.0, 39.0, 28.0, 21.0, 26.0, 18.0, 21.0, 9.0, 13.0, 6.0, 6.0, 3.0, 5.0, 5.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8271484375, -0.7976226806640625, -0.768096923828125, -0.7385711669921875, -0.70904541015625, -0.6795196533203125, -0.649993896484375, -0.6204681396484375, -0.5909423828125, -0.5614166259765625, -0.531890869140625, -0.5023651123046875, -0.47283935546875, -0.4433135986328125, -0.413787841796875, -0.3842620849609375, -0.354736328125, -0.3252105712890625, -0.295684814453125, -0.2661590576171875, -0.23663330078125, -0.2071075439453125, -0.177581787109375, -0.1480560302734375, -0.1185302734375, -0.0890045166015625, -0.059478759765625, -0.0299530029296875, -0.00042724609375, 0.0290985107421875, 0.058624267578125, 0.0881500244140625, 0.11767578125, 0.1472015380859375, 0.176727294921875, 0.2062530517578125, 0.23577880859375, 0.2653045654296875, 0.294830322265625, 0.3243560791015625, 0.3538818359375, 0.3834075927734375, 0.412933349609375, 0.4424591064453125, 0.47198486328125, 0.5015106201171875, 0.531036376953125, 0.5605621337890625, 0.590087890625, 0.6196136474609375, 0.649139404296875, 0.6786651611328125, 0.70819091796875, 0.7377166748046875, 0.767242431640625, 0.7967681884765625, 0.8262939453125, 0.8558197021484375, 0.885345458984375, 0.9148712158203125, 0.94439697265625, 0.9739227294921875, 1.003448486328125, 1.0329742431640625, 1.0625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 7.0, 3.0, 6.0, 10.0, 14.0, 15.0, 18.0, 32.0, 58.0, 90.0, 126.0, 220.0, 392.0, 790.0, 1327.0, 2829.0, 6376.0, 19683.0, 248593.0, 729266.0, 24650.0, 7515.0, 3116.0, 1474.0, 809.0, 447.0, 252.0, 144.0, 86.0, 68.0, 41.0, 24.0, 18.0, 15.0, 18.0, 4.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.60205078125, -0.5848884582519531, -0.5677261352539062, -0.5505638122558594, -0.5334014892578125, -0.5162391662597656, -0.49907684326171875, -0.4819145202636719, -0.464752197265625, -0.4475898742675781, -0.43042755126953125, -0.4132652282714844, -0.3961029052734375, -0.3789405822753906, -0.36177825927734375, -0.3446159362792969, -0.32745361328125, -0.3102912902832031, -0.29312896728515625, -0.2759666442871094, -0.2588043212890625, -0.24164199829101562, -0.22447967529296875, -0.20731735229492188, -0.190155029296875, -0.17299270629882812, -0.15583038330078125, -0.13866806030273438, -0.1215057373046875, -0.10434341430664062, -0.08718109130859375, -0.07001876831054688, -0.0528564453125, -0.035694122314453125, -0.01853179931640625, -0.001369476318359375, 0.0157928466796875, 0.032955169677734375, 0.05011749267578125, 0.06727981567382812, 0.084442138671875, 0.10160446166992188, 0.11876678466796875, 0.13592910766601562, 0.1530914306640625, 0.17025375366210938, 0.18741607666015625, 0.20457839965820312, 0.22174072265625, 0.23890304565429688, 0.25606536865234375, 0.2732276916503906, 0.2903900146484375, 0.3075523376464844, 0.32471466064453125, 0.3418769836425781, 0.359039306640625, 0.3762016296386719, 0.39336395263671875, 0.4105262756347656, 0.4276885986328125, 0.4448509216308594, 0.46201324462890625, 0.4791755676269531, 0.496337890625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 6.0, 2.0, 4.0, 5.0, 9.0, 9.0, 7.0, 27.0, 40.0, 135.0, 476.0, 160.0, 52.0, 38.0, 10.0, 8.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.250640869140625e-05, -8.957833051681519e-05, -8.665025234222412e-05, -8.372217416763306e-05, -8.079409599304199e-05, -7.786601781845093e-05, -7.493793964385986e-05, -7.20098614692688e-05, -6.908178329467773e-05, -6.615370512008667e-05, -6.32256269454956e-05, -6.029754877090454e-05, -5.7369470596313477e-05, -5.444139242172241e-05, -5.151331424713135e-05, -4.858523607254028e-05, -4.565715789794922e-05, -4.2729079723358154e-05, -3.980100154876709e-05, -3.6872923374176025e-05, -3.394484519958496e-05, -3.1016767024993896e-05, -2.8088688850402832e-05, -2.5160610675811768e-05, -2.2232532501220703e-05, -1.930445432662964e-05, -1.6376376152038574e-05, -1.344829797744751e-05, -1.0520219802856445e-05, -7.592141628265381e-06, -4.664063453674316e-06, -1.735985279083252e-06, 1.1920928955078125e-06, 4.120171070098877e-06, 7.048249244689941e-06, 9.976327419281006e-06, 1.290440559387207e-05, 1.5832483768463135e-05, 1.87605619430542e-05, 2.1688640117645264e-05, 2.4616718292236328e-05, 2.7544796466827393e-05, 3.0472874641418457e-05, 3.340095281600952e-05, 3.6329030990600586e-05, 3.925710916519165e-05, 4.2185187339782715e-05, 4.511326551437378e-05, 4.8041343688964844e-05, 5.096942186355591e-05, 5.389750003814697e-05, 5.682557821273804e-05, 5.97536563873291e-05, 6.268173456192017e-05, 6.560981273651123e-05, 6.85378909111023e-05, 7.146596908569336e-05, 7.439404726028442e-05, 7.732212543487549e-05, 8.025020360946655e-05, 8.317828178405762e-05, 8.610635995864868e-05, 8.903443813323975e-05, 9.196251630783081e-05, 9.489059448242188e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 3.0, 3.0, 6.0, 9.0, 11.0, 20.0, 34.0, 53.0, 58.0, 87.0, 140.0, 228.0, 369.0, 541.0, 927.0, 1800.0, 3359.0, 7350.0, 20139.0, 127431.0, 825224.0, 38867.0, 11600.0, 4656.0, 2441.0, 1246.0, 696.0, 434.0, 270.0, 199.0, 108.0, 79.0, 58.0, 36.0, 17.0, 14.0, 11.0, 12.0, 4.0, 3.0, 1.0, 5.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.525390625, -0.50909423828125, -0.4927978515625, -0.47650146484375, -0.460205078125, -0.44390869140625, -0.4276123046875, -0.41131591796875, -0.39501953125, -0.37872314453125, -0.3624267578125, -0.34613037109375, -0.329833984375, -0.31353759765625, -0.2972412109375, -0.28094482421875, -0.2646484375, -0.24835205078125, -0.2320556640625, -0.21575927734375, -0.199462890625, -0.18316650390625, -0.1668701171875, -0.15057373046875, -0.13427734375, -0.11798095703125, -0.1016845703125, -0.08538818359375, -0.069091796875, -0.05279541015625, -0.0364990234375, -0.02020263671875, -0.00390625, 0.01239013671875, 0.0286865234375, 0.04498291015625, 0.061279296875, 0.07757568359375, 0.0938720703125, 0.11016845703125, 0.12646484375, 0.14276123046875, 0.1590576171875, 0.17535400390625, 0.191650390625, 0.20794677734375, 0.2242431640625, 0.24053955078125, 0.2568359375, 0.27313232421875, 0.2894287109375, 0.30572509765625, 0.322021484375, 0.33831787109375, 0.3546142578125, 0.37091064453125, 0.38720703125, 0.40350341796875, 0.4197998046875, 0.43609619140625, 0.452392578125, 0.46868896484375, 0.4849853515625, 0.50128173828125, 0.517578125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 8.0, 6.0, 3.0, 10.0, 8.0, 11.0, 13.0, 21.0, 18.0, 31.0, 89.0, 309.0, 280.0, 85.0, 25.0, 20.0, 16.0, 13.0, 4.0, 5.0, 5.0, 5.0, 5.0, 3.0, 0.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25146484375, -0.24306488037109375, -0.2346649169921875, -0.22626495361328125, -0.217864990234375, -0.20946502685546875, -0.2010650634765625, -0.19266510009765625, -0.18426513671875, -0.17586517333984375, -0.1674652099609375, -0.15906524658203125, -0.150665283203125, -0.14226531982421875, -0.1338653564453125, -0.12546539306640625, -0.1170654296875, -0.10866546630859375, -0.1002655029296875, -0.09186553955078125, -0.083465576171875, -0.07506561279296875, -0.0666656494140625, -0.05826568603515625, -0.04986572265625, -0.04146575927734375, -0.0330657958984375, -0.02466583251953125, -0.016265869140625, -0.00786590576171875, 0.0005340576171875, 0.00893402099609375, 0.017333984375, 0.02573394775390625, 0.0341339111328125, 0.04253387451171875, 0.050933837890625, 0.05933380126953125, 0.0677337646484375, 0.07613372802734375, 0.08453369140625, 0.09293365478515625, 0.1013336181640625, 0.10973358154296875, 0.118133544921875, 0.12653350830078125, 0.1349334716796875, 0.14333343505859375, 0.1517333984375, 0.16013336181640625, 0.1685333251953125, 0.17693328857421875, 0.185333251953125, 0.19373321533203125, 0.2021331787109375, 0.21053314208984375, 0.21893310546875, 0.22733306884765625, 0.2357330322265625, 0.24413299560546875, 0.252532958984375, 0.26093292236328125, 0.2693328857421875, 0.27773284912109375, 0.2861328125]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 10.0, 24.0, 59.0, 117.0, 226.0, 259.0, 162.0, 84.0, 39.0, 18.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.932828903198242, -5.8145527839660645, -5.6962761878967285, -5.578000068664551, -5.459723949432373, -5.341447353363037, -5.223171234130859, -5.104895114898682, -4.986618518829346, -4.868342399597168, -4.750065803527832, -4.631789684295654, -4.513513565063477, -4.395236968994141, -4.276960849761963, -4.158684730529785, -4.040408134460449, -3.9221317768096924, -3.8038556575775146, -3.685579299926758, -3.567302942276001, -3.449026584625244, -3.3307504653930664, -3.2124741077423096, -3.094198226928711, -2.975921869277954, -2.8576457500457764, -2.7393693923950195, -2.6210930347442627, -2.502816677093506, -2.384540557861328, -2.2662642002105713, -2.1479876041412354, -2.0297112464904785, -1.9114350080490112, -1.793158769607544, -1.674882411956787, -1.5566061735153198, -1.4383299350738525, -1.3200535774230957, -1.2017773389816284, -1.0835011005401611, -0.9652247428894043, -0.846948504447937, -0.728672206401825, -0.6103959083557129, -0.4921196699142456, -0.37384337186813354, -0.2555670738220215, -0.13729079067707062, -0.01901450753211975, 0.09926176071166992, 0.21753805875778198, 0.33581435680389404, 0.45409059524536133, 0.5723668932914734, 0.6906431913375854, 0.8089194893836975, 0.9271957874298096, 1.0454720258712769, 1.1637482643127441, 1.282024621963501, 1.4003008604049683, 1.5185770988464355, 1.6368534564971924]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 6.0, 1.0, 8.0, 10.0, 14.0, 13.0, 19.0, 23.0, 13.0, 17.0, 27.0, 23.0, 29.0, 33.0, 28.0, 35.0, 28.0, 34.0, 41.0, 46.0, 45.0, 30.0, 38.0, 42.0, 33.0, 32.0, 31.0, 28.0, 28.0, 33.0, 17.0, 28.0, 26.0, 20.0, 16.0, 20.0, 11.0, 7.0, 12.0, 11.0, 12.0, 7.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.1897069215774536, -1.1516214609146118, -1.11353600025177, -1.0754504203796387, -1.0373649597167969, -0.9992794990539551, -0.9611940383911133, -0.9231085181236267, -0.8850229978561401, -0.8469375371932983, -0.8088520169258118, -0.77076655626297, -0.7326810359954834, -0.6945955753326416, -0.6565101146697998, -0.6184245944023132, -0.5803391337394714, -0.5422536730766296, -0.5041681528091431, -0.46608269214630127, -0.4279971718788147, -0.3899117112159729, -0.3518262207508087, -0.31374073028564453, -0.27565523982048035, -0.23756974935531616, -0.19948425889015198, -0.161398783326149, -0.1233132928609848, -0.08522780239582062, -0.04714232683181763, -0.009056836366653442, 0.029028654098510742, 0.06711414456367493, 0.10519962757825851, 0.1432851105928421, 0.1813706010580063, 0.21945609152317047, 0.25754156708717346, 0.29562705755233765, 0.33371254801750183, 0.371798038482666, 0.4098835289478302, 0.4479690194129944, 0.4860544800758362, 0.5241400003433228, 0.5622254610061646, 0.6003109216690063, 0.6383964419364929, 0.6764819025993347, 0.7145674228668213, 0.7526528835296631, 0.7907384037971497, 0.8288238644599915, 0.866909384727478, 0.9049948453903198, 0.9430803060531616, 0.9811657667160034, 1.0192512273788452, 1.0573368072509766, 1.0954222679138184, 1.1335077285766602, 1.171593189239502, 1.2096786499023438, 1.247764229774475]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 8.0, 6.0, 13.0, 7.0, 13.0, 15.0, 27.0, 45.0, 59.0, 91.0, 102.0, 161.0, 235.0, 365.0, 561.0, 847.0, 1570.0, 2895.0, 5938.0, 18758.0, 463788.0, 3511679.0, 164043.0, 12714.0, 4636.0, 2291.0, 1265.0, 779.0, 432.0, 286.0, 177.0, 143.0, 90.0, 69.0, 41.0, 40.0, 25.0, 22.0, 15.0, 10.0, 4.0, 7.0, 2.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.5341796875, -1.489532470703125, -1.44488525390625, -1.400238037109375, -1.3555908203125, -1.310943603515625, -1.26629638671875, -1.221649169921875, -1.177001953125, -1.132354736328125, -1.08770751953125, -1.043060302734375, -0.9984130859375, -0.953765869140625, -0.90911865234375, -0.864471435546875, -0.81982421875, -0.775177001953125, -0.73052978515625, -0.685882568359375, -0.6412353515625, -0.596588134765625, -0.55194091796875, -0.507293701171875, -0.462646484375, -0.417999267578125, -0.37335205078125, -0.328704833984375, -0.2840576171875, -0.239410400390625, -0.19476318359375, -0.150115966796875, -0.10546875, -0.060821533203125, -0.01617431640625, 0.028472900390625, 0.0731201171875, 0.117767333984375, 0.16241455078125, 0.207061767578125, 0.251708984375, 0.296356201171875, 0.34100341796875, 0.385650634765625, 0.4302978515625, 0.474945068359375, 0.51959228515625, 0.564239501953125, 0.60888671875, 0.653533935546875, 0.69818115234375, 0.742828369140625, 0.7874755859375, 0.832122802734375, 0.87677001953125, 0.921417236328125, 0.966064453125, 1.010711669921875, 1.05535888671875, 1.100006103515625, 1.1446533203125, 1.189300537109375, 1.23394775390625, 1.278594970703125, 1.3232421875]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 8.0, 12.0, 4.0, 12.0, 13.0, 16.0, 14.0, 21.0, 20.0, 27.0, 33.0, 31.0, 34.0, 47.0, 50.0, 44.0, 48.0, 47.0, 58.0, 46.0, 44.0, 40.0, 42.0, 38.0, 45.0, 46.0, 27.0, 29.0, 16.0, 16.0, 15.0, 11.0, 10.0, 10.0, 5.0, 1.0, 8.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5107421875, -0.4962272644042969, -0.48171234130859375, -0.4671974182128906, -0.4526824951171875, -0.4381675720214844, -0.42365264892578125, -0.4091377258300781, -0.394622802734375, -0.3801078796386719, -0.36559295654296875, -0.3510780334472656, -0.3365631103515625, -0.3220481872558594, -0.30753326416015625, -0.2930183410644531, -0.27850341796875, -0.2639884948730469, -0.24947357177734375, -0.23495864868164062, -0.2204437255859375, -0.20592880249023438, -0.19141387939453125, -0.17689895629882812, -0.162384033203125, -0.14786911010742188, -0.13335418701171875, -0.11883926391601562, -0.1043243408203125, -0.08980941772460938, -0.07529449462890625, -0.060779571533203125, -0.0462646484375, -0.031749725341796875, -0.01723480224609375, -0.002719879150390625, 0.0117950439453125, 0.026309967041015625, 0.04082489013671875, 0.055339813232421875, 0.069854736328125, 0.08436965942382812, 0.09888458251953125, 0.11339950561523438, 0.1279144287109375, 0.14242935180664062, 0.15694427490234375, 0.17145919799804688, 0.18597412109375, 0.20048904418945312, 0.21500396728515625, 0.22951889038085938, 0.2440338134765625, 0.2585487365722656, 0.27306365966796875, 0.2875785827636719, 0.302093505859375, 0.3166084289550781, 0.33112335205078125, 0.3456382751464844, 0.3601531982421875, 0.3746681213378906, 0.38918304443359375, 0.4036979675292969, 0.418212890625]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 9.0, 9.0, 10.0, 14.0, 35.0, 53.0, 93.0, 162.0, 344.0, 728.0, 1911.0, 5889.0, 29072.0, 2162094.0, 1956299.0, 28265.0, 5939.0, 1904.0, 773.0, 307.0, 144.0, 92.0, 34.0, 25.0, 23.0, 8.0, 7.0, 10.0, 8.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-2.337890625, -2.2794342041015625, -2.220977783203125, -2.1625213623046875, -2.10406494140625, -2.0456085205078125, -1.987152099609375, -1.9286956787109375, -1.8702392578125, -1.8117828369140625, -1.753326416015625, -1.6948699951171875, -1.63641357421875, -1.5779571533203125, -1.519500732421875, -1.4610443115234375, -1.402587890625, -1.3441314697265625, -1.285675048828125, -1.2272186279296875, -1.16876220703125, -1.1103057861328125, -1.051849365234375, -0.9933929443359375, -0.9349365234375, -0.8764801025390625, -0.818023681640625, -0.7595672607421875, -0.70111083984375, -0.6426544189453125, -0.584197998046875, -0.5257415771484375, -0.46728515625, -0.4088287353515625, -0.350372314453125, -0.2919158935546875, -0.23345947265625, -0.1750030517578125, -0.116546630859375, -0.0580902099609375, 0.0003662109375, 0.0588226318359375, 0.117279052734375, 0.1757354736328125, 0.23419189453125, 0.2926483154296875, 0.351104736328125, 0.4095611572265625, 0.468017578125, 0.5264739990234375, 0.584930419921875, 0.6433868408203125, 0.70184326171875, 0.7602996826171875, 0.818756103515625, 0.8772125244140625, 0.9356689453125, 0.9941253662109375, 1.052581787109375, 1.1110382080078125, 1.16949462890625, 1.2279510498046875, 1.286407470703125, 1.3448638916015625, 1.4033203125]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 4.0, 4.0, 1.0, 1.0, 4.0, 3.0, 3.0, 8.0, 10.0, 16.0, 13.0, 19.0, 36.0, 51.0, 89.0, 198.0, 428.0, 762.0, 950.0, 670.0, 383.0, 171.0, 83.0, 42.0, 28.0, 23.0, 13.0, 15.0, 14.0, 12.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3701171875, -0.3583221435546875, -0.346527099609375, -0.3347320556640625, -0.32293701171875, -0.3111419677734375, -0.299346923828125, -0.2875518798828125, -0.2757568359375, -0.2639617919921875, -0.252166748046875, -0.2403717041015625, -0.22857666015625, -0.2167816162109375, -0.204986572265625, -0.1931915283203125, -0.181396484375, -0.1696014404296875, -0.157806396484375, -0.1460113525390625, -0.13421630859375, -0.1224212646484375, -0.110626220703125, -0.0988311767578125, -0.0870361328125, -0.0752410888671875, -0.063446044921875, -0.0516510009765625, -0.03985595703125, -0.0280609130859375, -0.016265869140625, -0.0044708251953125, 0.00732421875, 0.0191192626953125, 0.030914306640625, 0.0427093505859375, 0.05450439453125, 0.0662994384765625, 0.078094482421875, 0.0898895263671875, 0.1016845703125, 0.1134796142578125, 0.125274658203125, 0.1370697021484375, 0.14886474609375, 0.1606597900390625, 0.172454833984375, 0.1842498779296875, 0.196044921875, 0.2078399658203125, 0.219635009765625, 0.2314300537109375, 0.24322509765625, 0.2550201416015625, 0.266815185546875, 0.2786102294921875, 0.2904052734375, 0.3022003173828125, 0.313995361328125, 0.3257904052734375, 0.33758544921875, 0.3493804931640625, 0.361175537109375, 0.3729705810546875, 0.384765625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 6.0, 6.0, 2.0, 10.0, 8.0, 8.0, 15.0, 20.0, 18.0, 25.0, 30.0, 46.0, 60.0, 61.0, 79.0, 66.0, 87.0, 73.0, 63.0, 69.0, 50.0, 68.0, 36.0, 34.0, 18.0, 11.0, 4.0, 9.0, 7.0, 2.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8555957674980164, -0.8292353749275208, -0.8028750419616699, -0.7765146493911743, -0.7501542568206787, -0.7237939238548279, -0.6974335312843323, -0.6710731983184814, -0.6447128057479858, -0.6183524131774902, -0.5919920802116394, -0.5656316876411438, -0.539271354675293, -0.5129109621047974, -0.48655056953430176, -0.46019020676612854, -0.4338298439979553, -0.4074694812297821, -0.3811091184616089, -0.3547487258911133, -0.32838836312294006, -0.30202800035476685, -0.27566760778427124, -0.24930724501609802, -0.2229468822479248, -0.1965865194797516, -0.17022614181041718, -0.14386576414108276, -0.11750540137290955, -0.09114503860473633, -0.06478466093540192, -0.038424283266067505, -0.012063860893249512, 0.014296509325504303, 0.04065687954425812, 0.06701724976301193, 0.09337761998176575, 0.11973798274993896, 0.14609836041927338, 0.1724587380886078, 0.198819100856781, 0.22517946362495422, 0.25153982639312744, 0.27790021896362305, 0.30426058173179626, 0.3306209444999695, 0.3569813370704651, 0.3833416998386383, 0.4097020626068115, 0.43606242537498474, 0.46242278814315796, 0.48878318071365356, 0.5151435136795044, 0.54150390625, 0.5678642988204956, 0.5942246913909912, 0.620585024356842, 0.6469454169273376, 0.6733057498931885, 0.6996661424636841, 0.7260265350341797, 0.7523868680000305, 0.7787472605705261, 0.805107593536377, 0.8314679861068726]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 1.0, 5.0, 6.0, 7.0, 11.0, 19.0, 15.0, 21.0, 19.0, 38.0, 35.0, 34.0, 32.0, 41.0, 47.0, 51.0, 43.0, 42.0, 34.0, 38.0, 46.0, 36.0, 47.0, 40.0, 26.0, 30.0, 26.0, 28.0, 25.0, 22.0, 24.0, 21.0, 17.0, 14.0, 7.0, 13.0, 4.0, 5.0, 2.0, 2.0, 6.0, 5.0, 0.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5326315760612488, -0.5152978301048279, -0.497964084148407, -0.4806303381919861, -0.4632965922355652, -0.4459628462791443, -0.4286291003227234, -0.4112953543663025, -0.3939616084098816, -0.3766278624534607, -0.3592941164970398, -0.3419603705406189, -0.324626624584198, -0.3072928786277771, -0.2899591326713562, -0.2726253867149353, -0.2552916407585144, -0.2379578948020935, -0.2206241488456726, -0.2032904028892517, -0.1859566569328308, -0.1686229109764099, -0.151289165019989, -0.13395541906356812, -0.11662167310714722, -0.09928792715072632, -0.08195418119430542, -0.06462043523788452, -0.04728668928146362, -0.029952943325042725, -0.012619197368621826, 0.004714548587799072, 0.022048234939575195, 0.039381980895996094, 0.05671572685241699, 0.07404947280883789, 0.09138321876525879, 0.10871696472167969, 0.12605071067810059, 0.14338445663452148, 0.16071820259094238, 0.17805194854736328, 0.19538569450378418, 0.21271944046020508, 0.23005318641662598, 0.24738693237304688, 0.2647206783294678, 0.28205442428588867, 0.29938817024230957, 0.31672191619873047, 0.33405566215515137, 0.35138940811157227, 0.36872315406799316, 0.38605690002441406, 0.40339064598083496, 0.42072439193725586, 0.43805813789367676, 0.45539188385009766, 0.47272562980651855, 0.49005937576293945, 0.5073931217193604, 0.5247268676757812, 0.5420606136322021, 0.559394359588623, 0.576728105545044]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 2.0, 8.0, 5.0, 2.0, 9.0, 12.0, 22.0, 19.0, 17.0, 30.0, 40.0, 54.0, 88.0, 93.0, 110.0, 140.0, 175.0, 248.0, 327.0, 533.0, 931.0, 1925.0, 4816.0, 15830.0, 73732.0, 582882.0, 306066.0, 42596.0, 10535.0, 3444.0, 1385.0, 745.0, 451.0, 340.0, 235.0, 171.0, 114.0, 108.0, 82.0, 49.0, 47.0, 27.0, 30.0, 24.0, 16.0, 13.0, 15.0, 2.0, 2.0, 2.0, 7.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1683349609375, -0.16269302368164062, -0.15705108642578125, -0.15140914916992188, -0.1457672119140625, -0.14012527465820312, -0.13448333740234375, -0.12884140014648438, -0.123199462890625, -0.11755752563476562, -0.11191558837890625, -0.10627365112304688, -0.1006317138671875, -0.09498977661132812, -0.08934783935546875, -0.08370590209960938, -0.07806396484375, -0.07242202758789062, -0.06678009033203125, -0.061138153076171875, -0.0554962158203125, -0.049854278564453125, -0.04421234130859375, -0.038570404052734375, -0.032928466796875, -0.027286529541015625, -0.02164459228515625, -0.016002655029296875, -0.0103607177734375, -0.004718780517578125, 0.00092315673828125, 0.006565093994140625, 0.01220703125, 0.017848968505859375, 0.02349090576171875, 0.029132843017578125, 0.0347747802734375, 0.040416717529296875, 0.04605865478515625, 0.051700592041015625, 0.057342529296875, 0.06298446655273438, 0.06862640380859375, 0.07426834106445312, 0.0799102783203125, 0.08555221557617188, 0.09119415283203125, 0.09683609008789062, 0.10247802734375, 0.10811996459960938, 0.11376190185546875, 0.11940383911132812, 0.1250457763671875, 0.13068771362304688, 0.13632965087890625, 0.14197158813476562, 0.147613525390625, 0.15325546264648438, 0.15889739990234375, 0.16453933715820312, 0.1701812744140625, 0.17582321166992188, 0.18146514892578125, 0.18710708618164062, 0.1927490234375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 5.0, 6.0, 5.0, 13.0, 17.0, 15.0, 20.0, 25.0, 30.0, 28.0, 39.0, 32.0, 44.0, 44.0, 52.0, 42.0, 54.0, 42.0, 43.0, 56.0, 37.0, 44.0, 37.0, 27.0, 33.0, 30.0, 25.0, 22.0, 18.0, 25.0, 13.0, 16.0, 14.0, 11.0, 5.0, 5.0, 3.0, 2.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.352783203125, -0.3408203125, -0.328857421875, -0.31689453125, -0.304931640625, -0.29296875, -0.281005859375, -0.26904296875, -0.257080078125, -0.2451171875, -0.233154296875, -0.22119140625, -0.209228515625, -0.197265625, -0.185302734375, -0.17333984375, -0.161376953125, -0.1494140625, -0.137451171875, -0.12548828125, -0.113525390625, -0.1015625, -0.089599609375, -0.07763671875, -0.065673828125, -0.0537109375, -0.041748046875, -0.02978515625, -0.017822265625, -0.005859375, 0.006103515625, 0.01806640625, 0.030029296875, 0.0419921875, 0.053955078125, 0.06591796875, 0.077880859375, 0.08984375, 0.101806640625, 0.11376953125, 0.125732421875, 0.1376953125, 0.149658203125, 0.16162109375, 0.173583984375, 0.185546875, 0.197509765625, 0.20947265625, 0.221435546875, 0.2333984375, 0.245361328125, 0.25732421875, 0.269287109375, 0.28125, 0.293212890625, 0.30517578125, 0.317138671875, 0.3291015625, 0.341064453125, 0.35302734375, 0.364990234375, 0.376953125, 0.388916015625, 0.40087890625, 0.412841796875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 10.0, 6.0, 6.0, 15.0, 29.0, 37.0, 74.0, 86.0, 118.0, 189.0, 300.0, 419.0, 631.0, 982.0, 1456.0, 2214.0, 3423.0, 5328.0, 8179.0, 12839.0, 20766.0, 35147.0, 63257.0, 125033.0, 243837.0, 243076.0, 125257.0, 63481.0, 35485.0, 20672.0, 12607.0, 8240.0, 5245.0, 3438.0, 2304.0, 1432.0, 1003.0, 666.0, 446.0, 249.0, 191.0, 143.0, 86.0, 49.0, 29.0, 25.0, 25.0, 14.0, 6.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.045074462890625, -0.04362058639526367, -0.042166709899902344, -0.040712833404541016, -0.03925895690917969, -0.03780508041381836, -0.03635120391845703, -0.0348973274230957, -0.033443450927734375, -0.03198957443237305, -0.03053569793701172, -0.02908182144165039, -0.027627944946289062, -0.026174068450927734, -0.024720191955566406, -0.023266315460205078, -0.02181243896484375, -0.020358562469482422, -0.018904685974121094, -0.017450809478759766, -0.015996932983398438, -0.01454305648803711, -0.013089179992675781, -0.011635303497314453, -0.010181427001953125, -0.008727550506591797, -0.007273674011230469, -0.005819797515869141, -0.0043659210205078125, -0.0029120445251464844, -0.0014581680297851562, -4.291534423828125e-06, 0.0014495849609375, 0.002903461456298828, 0.004357337951660156, 0.005811214447021484, 0.0072650909423828125, 0.00871896743774414, 0.010172843933105469, 0.011626720428466797, 0.013080596923828125, 0.014534473419189453, 0.01598834991455078, 0.01744222640991211, 0.018896102905273438, 0.020349979400634766, 0.021803855895996094, 0.023257732391357422, 0.02471160888671875, 0.026165485382080078, 0.027619361877441406, 0.029073238372802734, 0.030527114868164062, 0.03198099136352539, 0.03343486785888672, 0.03488874435424805, 0.036342620849609375, 0.0377964973449707, 0.03925037384033203, 0.04070425033569336, 0.04215812683105469, 0.043612003326416016, 0.045065879821777344, 0.04651975631713867, 0.0479736328125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 2.0, 1.0, 4.0, 5.0, 7.0, 9.0, 12.0, 9.0, 13.0, 15.0, 11.0, 27.0, 29.0, 25.0, 26.0, 31.0, 38.0, 31.0, 43.0, 48.0, 52.0, 41.0, 45.0, 54.0, 44.0, 50.0, 32.0, 40.0, 36.0, 32.0, 38.0, 21.0, 18.0, 12.0, 15.0, 15.0, 17.0, 4.0, 9.0, 10.0, 5.0, 6.0, 5.0, 5.0, 3.0, 6.0, 2.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.966796875, -0.9393692016601562, -0.9119415283203125, -0.8845138549804688, -0.857086181640625, -0.8296585083007812, -0.8022308349609375, -0.7748031616210938, -0.74737548828125, -0.7199478149414062, -0.6925201416015625, -0.6650924682617188, -0.637664794921875, -0.6102371215820312, -0.5828094482421875, -0.5553817749023438, -0.5279541015625, -0.5005264282226562, -0.4730987548828125, -0.44567108154296875, -0.418243408203125, -0.39081573486328125, -0.3633880615234375, -0.33596038818359375, -0.30853271484375, -0.28110504150390625, -0.2536773681640625, -0.22624969482421875, -0.198822021484375, -0.17139434814453125, -0.1439666748046875, -0.11653900146484375, -0.089111328125, -0.06168365478515625, -0.0342559814453125, -0.00682830810546875, 0.020599365234375, 0.04802703857421875, 0.0754547119140625, 0.10288238525390625, 0.13031005859375, 0.15773773193359375, 0.1851654052734375, 0.21259307861328125, 0.240020751953125, 0.26744842529296875, 0.2948760986328125, 0.32230377197265625, 0.3497314453125, 0.37715911865234375, 0.4045867919921875, 0.43201446533203125, 0.459442138671875, 0.48686981201171875, 0.5142974853515625, 0.5417251586914062, 0.56915283203125, 0.5965805053710938, 0.6240081787109375, 0.6514358520507812, 0.678863525390625, 0.7062911987304688, 0.7337188720703125, 0.7611465454101562, 0.78857421875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 0.0, 3.0, 5.0, 6.0, 9.0, 25.0, 25.0, 43.0, 77.0, 113.0, 210.0, 462.0, 1141.0, 3547.0, 14337.0, 131140.0, 797473.0, 83850.0, 11107.0, 2963.0, 1022.0, 420.0, 215.0, 141.0, 85.0, 47.0, 38.0, 22.0, 9.0, 9.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023681640625, -0.02284836769104004, -0.022015094757080078, -0.021181821823120117, -0.020348548889160156, -0.019515275955200195, -0.018682003021240234, -0.017848730087280273, -0.017015457153320312, -0.01618218421936035, -0.01534891128540039, -0.01451563835144043, -0.013682365417480469, -0.012849092483520508, -0.012015819549560547, -0.011182546615600586, -0.010349273681640625, -0.009516000747680664, -0.008682727813720703, -0.007849454879760742, -0.007016181945800781, -0.00618290901184082, -0.005349636077880859, -0.0045163631439208984, -0.0036830902099609375, -0.0028498172760009766, -0.0020165443420410156, -0.0011832714080810547, -0.00034999847412109375, 0.0004832744598388672, 0.0013165473937988281, 0.002149820327758789, 0.00298309326171875, 0.003816366195678711, 0.004649639129638672, 0.005482912063598633, 0.006316184997558594, 0.007149457931518555, 0.007982730865478516, 0.008816003799438477, 0.009649276733398438, 0.010482549667358398, 0.01131582260131836, 0.01214909553527832, 0.012982368469238281, 0.013815641403198242, 0.014648914337158203, 0.015482187271118164, 0.016315460205078125, 0.017148733139038086, 0.017982006072998047, 0.018815279006958008, 0.01964855194091797, 0.02048182487487793, 0.02131509780883789, 0.02214837074279785, 0.022981643676757812, 0.023814916610717773, 0.024648189544677734, 0.025481462478637695, 0.026314735412597656, 0.027148008346557617, 0.027981281280517578, 0.02881455421447754, 0.0296478271484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 6.0, 11.0, 8.0, 21.0, 25.0, 35.0, 62.0, 81.0, 109.0, 104.0, 151.0, 106.0, 77.0, 61.0, 45.0, 23.0, 29.0, 10.0, 9.0, 7.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.950429916381836e-05, -2.8584152460098267e-05, -2.7664005756378174e-05, -2.674385905265808e-05, -2.5823712348937988e-05, -2.4903565645217896e-05, -2.3983418941497803e-05, -2.306327223777771e-05, -2.2143125534057617e-05, -2.1222978830337524e-05, -2.030283212661743e-05, -1.938268542289734e-05, -1.8462538719177246e-05, -1.7542392015457153e-05, -1.662224531173706e-05, -1.5702098608016968e-05, -1.4781951904296875e-05, -1.3861805200576782e-05, -1.294165849685669e-05, -1.2021511793136597e-05, -1.1101365089416504e-05, -1.0181218385696411e-05, -9.261071681976318e-06, -8.340924978256226e-06, -7.420778274536133e-06, -6.50063157081604e-06, -5.580484867095947e-06, -4.6603381633758545e-06, -3.7401914596557617e-06, -2.820044755935669e-06, -1.8998980522155762e-06, -9.797513484954834e-07, -5.960464477539063e-08, 8.605420589447021e-07, 1.780688762664795e-06, 2.7008354663848877e-06, 3.6209821701049805e-06, 4.541128873825073e-06, 5.461275577545166e-06, 6.381422281265259e-06, 7.3015689849853516e-06, 8.221715688705444e-06, 9.141862392425537e-06, 1.006200909614563e-05, 1.0982155799865723e-05, 1.1902302503585815e-05, 1.2822449207305908e-05, 1.3742595911026001e-05, 1.4662742614746094e-05, 1.5582889318466187e-05, 1.650303602218628e-05, 1.7423182725906372e-05, 1.8343329429626465e-05, 1.9263476133346558e-05, 2.018362283706665e-05, 2.1103769540786743e-05, 2.2023916244506836e-05, 2.294406294822693e-05, 2.386420965194702e-05, 2.4784356355667114e-05, 2.5704503059387207e-05, 2.66246497631073e-05, 2.7544796466827393e-05, 2.8464943170547485e-05, 2.9385089874267578e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 5.0, 11.0, 16.0, 18.0, 30.0, 44.0, 71.0, 97.0, 109.0, 163.0, 250.0, 380.0, 581.0, 909.0, 1563.0, 2707.0, 5049.0, 10752.0, 24902.0, 69768.0, 258366.0, 453844.0, 140091.0, 43873.0, 17385.0, 7868.0, 3902.0, 2154.0, 1238.0, 785.0, 486.0, 325.0, 281.0, 148.0, 111.0, 89.0, 50.0, 41.0, 31.0, 14.0, 12.0, 9.0, 6.0, 6.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.01119232177734375, -0.010834455490112305, -0.01047658920288086, -0.010118722915649414, -0.009760856628417969, -0.009402990341186523, -0.009045124053955078, -0.008687257766723633, -0.008329391479492188, -0.007971525192260742, -0.007613658905029297, -0.0072557926177978516, -0.006897926330566406, -0.006540060043334961, -0.006182193756103516, -0.00582432746887207, -0.005466461181640625, -0.00510859489440918, -0.004750728607177734, -0.004392862319946289, -0.004034996032714844, -0.0036771297454833984, -0.003319263458251953, -0.002961397171020508, -0.0026035308837890625, -0.002245664596557617, -0.0018877983093261719, -0.0015299320220947266, -0.0011720657348632812, -0.0008141994476318359, -0.0004563331604003906, -9.846687316894531e-05, 0.0002593994140625, 0.0006172657012939453, 0.0009751319885253906, 0.001332998275756836, 0.0016908645629882812, 0.0020487308502197266, 0.002406597137451172, 0.002764463424682617, 0.0031223297119140625, 0.003480195999145508, 0.003838062286376953, 0.0041959285736083984, 0.004553794860839844, 0.004911661148071289, 0.005269527435302734, 0.00562739372253418, 0.005985260009765625, 0.00634312629699707, 0.006700992584228516, 0.007058858871459961, 0.007416725158691406, 0.0077745914459228516, 0.008132457733154297, 0.008490324020385742, 0.008848190307617188, 0.009206056594848633, 0.009563922882080078, 0.009921789169311523, 0.010279655456542969, 0.010637521743774414, 0.01099538803100586, 0.011353254318237305, 0.01171112060546875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 3.0, 3.0, 3.0, 7.0, 8.0, 11.0, 13.0, 23.0, 29.0, 55.0, 61.0, 76.0, 115.0, 145.0, 129.0, 83.0, 53.0, 37.0, 41.0, 28.0, 13.0, 19.0, 14.0, 8.0, 5.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.00505828857421875, -0.004892170429229736, -0.004726052284240723, -0.004559934139251709, -0.004393815994262695, -0.004227697849273682, -0.004061579704284668, -0.0038954615592956543, -0.0037293434143066406, -0.003563225269317627, -0.0033971071243286133, -0.0032309889793395996, -0.003064870834350586, -0.0028987526893615723, -0.0027326345443725586, -0.002566516399383545, -0.0024003982543945312, -0.0022342801094055176, -0.002068161964416504, -0.0019020438194274902, -0.0017359256744384766, -0.0015698075294494629, -0.0014036893844604492, -0.0012375712394714355, -0.0010714530944824219, -0.0009053349494934082, -0.0007392168045043945, -0.0005730986595153809, -0.0004069805145263672, -0.00024086236953735352, -7.474422454833984e-05, 9.137392044067383e-05, 0.0002574920654296875, 0.00042361021041870117, 0.0005897283554077148, 0.0007558465003967285, 0.0009219646453857422, 0.0010880827903747559, 0.0012542009353637695, 0.0014203190803527832, 0.0015864372253417969, 0.0017525553703308105, 0.0019186735153198242, 0.002084791660308838, 0.0022509098052978516, 0.0024170279502868652, 0.002583146095275879, 0.0027492642402648926, 0.0029153823852539062, 0.00308150053024292, 0.0032476186752319336, 0.0034137368202209473, 0.003579854965209961, 0.0037459731101989746, 0.003912091255187988, 0.004078209400177002, 0.004244327545166016, 0.004410445690155029, 0.004576563835144043, 0.004742681980133057, 0.00490880012512207, 0.005074918270111084, 0.005241036415100098, 0.005407154560089111, 0.005573272705078125]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 8.0, 10.0, 11.0, 17.0, 28.0, 38.0, 45.0, 74.0, 89.0, 96.0, 111.0, 84.0, 90.0, 102.0, 56.0, 45.0, 27.0, 28.0, 11.0, 8.0, 6.0, 6.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.8398318886756897, -0.8192303776741028, -0.7986288070678711, -0.7780272960662842, -0.7574257850646973, -0.7368242740631104, -0.7162227034568787, -0.6956211924552917, -0.6750196218490601, -0.6544181108474731, -0.6338165402412415, -0.6132150292396545, -0.5926135182380676, -0.5720119476318359, -0.551410436630249, -0.5308089256286621, -0.5102074146270752, -0.4896058738231659, -0.469004362821579, -0.4484028220176697, -0.42780131101608276, -0.40719977021217346, -0.38659822940826416, -0.36599671840667725, -0.34539517760276794, -0.32479363679885864, -0.30419212579727173, -0.2835905849933624, -0.2629890441894531, -0.2423875331878662, -0.2217859923839569, -0.2011844664812088, -0.18058300018310547, -0.15998147428035736, -0.13937994837760925, -0.11877840757369995, -0.09817688167095184, -0.07757535576820374, -0.05697382241487503, -0.036372289061546326, -0.015770763158798218, 0.004830766469240189, 0.025432296097278595, 0.046033825725317, 0.06663535535335541, 0.08723688125610352, 0.10783841460943222, 0.12843994796276093, 0.14904147386550903, 0.16964299976825714, 0.19024452567100525, 0.21084606647491455, 0.23144759237766266, 0.25204911828041077, 0.27265065908432007, 0.293252170085907, 0.3138537108898163, 0.3344552516937256, 0.3550567626953125, 0.3756583034992218, 0.3962598443031311, 0.416861355304718, 0.4374628961086273, 0.4580644369125366, 0.47866594791412354]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 6.0, 4.0, 4.0, 8.0, 5.0, 9.0, 10.0, 19.0, 12.0, 22.0, 20.0, 34.0, 41.0, 32.0, 31.0, 46.0, 54.0, 53.0, 48.0, 37.0, 43.0, 37.0, 44.0, 47.0, 37.0, 36.0, 28.0, 26.0, 32.0, 22.0, 26.0, 25.0, 23.0, 18.0, 15.0, 9.0, 10.0, 5.0, 6.0, 2.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3273007869720459, -0.3163032829761505, -0.3053057789802551, -0.29430827498435974, -0.28331077098846436, -0.27231326699256897, -0.2613157629966736, -0.2503182590007782, -0.2393207550048828, -0.22832325100898743, -0.21732574701309204, -0.20632824301719666, -0.19533073902130127, -0.18433323502540588, -0.1733357310295105, -0.1623382270336151, -0.15134072303771973, -0.14034321904182434, -0.12934571504592896, -0.11834821105003357, -0.10735070705413818, -0.0963532030582428, -0.08535569906234741, -0.07435819506645203, -0.06336069107055664, -0.052363187074661255, -0.04136568307876587, -0.030368179082870483, -0.019370675086975098, -0.008373171091079712, 0.002624332904815674, 0.01362183690071106, 0.024619340896606445, 0.03561684489250183, 0.04661434888839722, 0.0576118528842926, 0.06860935688018799, 0.07960686087608337, 0.09060436487197876, 0.10160186886787415, 0.11259937286376953, 0.12359687685966492, 0.1345943808555603, 0.1455918848514557, 0.15658938884735107, 0.16758689284324646, 0.17858439683914185, 0.18958190083503723, 0.20057940483093262, 0.211576908826828, 0.2225744128227234, 0.23357191681861877, 0.24456942081451416, 0.25556692481040955, 0.26656442880630493, 0.2775619328022003, 0.2885594367980957, 0.2995569407939911, 0.3105544447898865, 0.32155194878578186, 0.33254945278167725, 0.34354695677757263, 0.354544460773468, 0.3655419647693634, 0.3765394687652588]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 5.0, 5.0, 6.0, 13.0, 16.0, 27.0, 41.0, 57.0, 78.0, 100.0, 175.0, 217.0, 334.0, 456.0, 802.0, 1147.0, 1867.0, 2911.0, 4729.0, 7918.0, 13779.0, 25994.0, 53414.0, 135694.0, 409575.0, 232179.0, 77421.0, 35152.0, 18280.0, 10215.0, 5882.0, 3506.0, 2272.0, 1472.0, 927.0, 609.0, 418.0, 281.0, 193.0, 132.0, 66.0, 65.0, 40.0, 32.0, 25.0, 5.0, 10.0, 10.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0], "bins": [-0.60400390625, -0.58660888671875, -0.5692138671875, -0.55181884765625, -0.534423828125, -0.51702880859375, -0.4996337890625, -0.48223876953125, -0.46484375, -0.44744873046875, -0.4300537109375, -0.41265869140625, -0.395263671875, -0.37786865234375, -0.3604736328125, -0.34307861328125, -0.32568359375, -0.30828857421875, -0.2908935546875, -0.27349853515625, -0.256103515625, -0.23870849609375, -0.2213134765625, -0.20391845703125, -0.1865234375, -0.16912841796875, -0.1517333984375, -0.13433837890625, -0.116943359375, -0.09954833984375, -0.0821533203125, -0.06475830078125, -0.04736328125, -0.02996826171875, -0.0125732421875, 0.00482177734375, 0.022216796875, 0.03961181640625, 0.0570068359375, 0.07440185546875, 0.091796875, 0.10919189453125, 0.1265869140625, 0.14398193359375, 0.161376953125, 0.17877197265625, 0.1961669921875, 0.21356201171875, 0.23095703125, 0.24835205078125, 0.2657470703125, 0.28314208984375, 0.300537109375, 0.31793212890625, 0.3353271484375, 0.35272216796875, 0.3701171875, 0.38751220703125, 0.4049072265625, 0.42230224609375, 0.439697265625, 0.45709228515625, 0.4744873046875, 0.49188232421875, 0.50927734375]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 6.0, 7.0, 5.0, 8.0, 6.0, 12.0, 16.0, 26.0, 22.0, 32.0, 35.0, 28.0, 34.0, 42.0, 51.0, 45.0, 67.0, 41.0, 48.0, 50.0, 46.0, 46.0, 38.0, 35.0, 33.0, 32.0, 29.0, 24.0, 19.0, 21.0, 23.0, 14.0, 16.0, 7.0, 5.0, 7.0, 5.0, 4.0, 1.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6162109375, -0.5967330932617188, -0.5772552490234375, -0.5577774047851562, -0.538299560546875, -0.5188217163085938, -0.4993438720703125, -0.47986602783203125, -0.46038818359375, -0.44091033935546875, -0.4214324951171875, -0.40195465087890625, -0.382476806640625, -0.36299896240234375, -0.3435211181640625, -0.32404327392578125, -0.3045654296875, -0.28508758544921875, -0.2656097412109375, -0.24613189697265625, -0.226654052734375, -0.20717620849609375, -0.1876983642578125, -0.16822052001953125, -0.14874267578125, -0.12926483154296875, -0.1097869873046875, -0.09030914306640625, -0.070831298828125, -0.05135345458984375, -0.0318756103515625, -0.01239776611328125, 0.007080078125, 0.02655792236328125, 0.0460357666015625, 0.06551361083984375, 0.084991455078125, 0.10446929931640625, 0.1239471435546875, 0.14342498779296875, 0.16290283203125, 0.18238067626953125, 0.2018585205078125, 0.22133636474609375, 0.240814208984375, 0.26029205322265625, 0.2797698974609375, 0.29924774169921875, 0.3187255859375, 0.33820343017578125, 0.3576812744140625, 0.37715911865234375, 0.396636962890625, 0.41611480712890625, 0.4355926513671875, 0.45507049560546875, 0.47454833984375, 0.49402618408203125, 0.5135040283203125, 0.5329818725585938, 0.552459716796875, 0.5719375610351562, 0.5914154052734375, 0.6108932495117188, 0.63037109375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 5.0, 8.0, 15.0, 16.0, 22.0, 36.0, 35.0, 45.0, 74.0, 123.0, 153.0, 219.0, 343.0, 578.0, 819.0, 1460.0, 2429.0, 4477.0, 8718.0, 18592.0, 43039.0, 127737.0, 485368.0, 236318.0, 65977.0, 25962.0, 12028.0, 6032.0, 3160.0, 1780.0, 1028.0, 636.0, 417.0, 274.0, 188.0, 118.0, 88.0, 66.0, 57.0, 32.0, 22.0, 19.0, 14.0, 9.0, 5.0, 6.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.810546875, -0.7849884033203125, -0.759429931640625, -0.7338714599609375, -0.70831298828125, -0.6827545166015625, -0.657196044921875, -0.6316375732421875, -0.6060791015625, -0.5805206298828125, -0.554962158203125, -0.5294036865234375, -0.50384521484375, -0.4782867431640625, -0.452728271484375, -0.4271697998046875, -0.401611328125, -0.3760528564453125, -0.350494384765625, -0.3249359130859375, -0.29937744140625, -0.2738189697265625, -0.248260498046875, -0.2227020263671875, -0.1971435546875, -0.1715850830078125, -0.146026611328125, -0.1204681396484375, -0.09490966796875, -0.0693511962890625, -0.043792724609375, -0.0182342529296875, 0.00732421875, 0.0328826904296875, 0.058441162109375, 0.0839996337890625, 0.10955810546875, 0.1351165771484375, 0.160675048828125, 0.1862335205078125, 0.2117919921875, 0.2373504638671875, 0.262908935546875, 0.2884674072265625, 0.31402587890625, 0.3395843505859375, 0.365142822265625, 0.3907012939453125, 0.416259765625, 0.4418182373046875, 0.467376708984375, 0.4929351806640625, 0.51849365234375, 0.5440521240234375, 0.569610595703125, 0.5951690673828125, 0.6207275390625, 0.6462860107421875, 0.671844482421875, 0.6974029541015625, 0.72296142578125, 0.7485198974609375, 0.774078369140625, 0.7996368408203125, 0.8251953125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 3.0, 9.0, 6.0, 9.0, 11.0, 14.0, 14.0, 26.0, 28.0, 38.0, 35.0, 48.0, 52.0, 54.0, 58.0, 57.0, 64.0, 76.0, 74.0, 63.0, 53.0, 34.0, 40.0, 29.0, 30.0, 18.0, 11.0, 12.0, 16.0, 8.0, 1.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.09375, -1.0624160766601562, -1.0310821533203125, -0.9997482299804688, -0.968414306640625, -0.9370803833007812, -0.9057464599609375, -0.8744125366210938, -0.84307861328125, -0.8117446899414062, -0.7804107666015625, -0.7490768432617188, -0.717742919921875, -0.6864089965820312, -0.6550750732421875, -0.6237411499023438, -0.5924072265625, -0.5610733032226562, -0.5297393798828125, -0.49840545654296875, -0.467071533203125, -0.43573760986328125, -0.4044036865234375, -0.37306976318359375, -0.34173583984375, -0.31040191650390625, -0.2790679931640625, -0.24773406982421875, -0.216400146484375, -0.18506622314453125, -0.1537322998046875, -0.12239837646484375, -0.091064453125, -0.05973052978515625, -0.0283966064453125, 0.00293731689453125, 0.034271240234375, 0.06560516357421875, 0.0969390869140625, 0.12827301025390625, 0.15960693359375, 0.19094085693359375, 0.2222747802734375, 0.25360870361328125, 0.284942626953125, 0.31627655029296875, 0.3476104736328125, 0.37894439697265625, 0.4102783203125, 0.44161224365234375, 0.4729461669921875, 0.5042800903320312, 0.535614013671875, 0.5669479370117188, 0.5982818603515625, 0.6296157836914062, 0.66094970703125, 0.6922836303710938, 0.7236175537109375, 0.7549514770507812, 0.786285400390625, 0.8176193237304688, 0.8489532470703125, 0.8802871704101562, 0.91162109375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 11.0, 13.0, 18.0, 17.0, 27.0, 41.0, 57.0, 69.0, 116.0, 133.0, 198.0, 319.0, 491.0, 765.0, 1134.0, 1896.0, 3174.0, 5658.0, 12474.0, 38113.0, 205791.0, 638439.0, 96388.0, 22960.0, 8776.0, 4393.0, 2529.0, 1527.0, 975.0, 675.0, 412.0, 326.0, 204.0, 147.0, 91.0, 56.0, 43.0, 28.0, 21.0, 11.0, 18.0, 6.0, 2.0, 4.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.223388671875, -0.21706008911132812, -0.21073150634765625, -0.20440292358398438, -0.1980743408203125, -0.19174575805664062, -0.18541717529296875, -0.17908859252929688, -0.172760009765625, -0.16643142700195312, -0.16010284423828125, -0.15377426147460938, -0.1474456787109375, -0.14111709594726562, -0.13478851318359375, -0.12845993041992188, -0.12213134765625, -0.11580276489257812, -0.10947418212890625, -0.10314559936523438, -0.0968170166015625, -0.09048843383789062, -0.08415985107421875, -0.07783126831054688, -0.071502685546875, -0.06517410278320312, -0.05884552001953125, -0.052516937255859375, -0.0461883544921875, -0.039859771728515625, -0.03353118896484375, -0.027202606201171875, -0.0208740234375, -0.014545440673828125, -0.00821685791015625, -0.001888275146484375, 0.0044403076171875, 0.010768890380859375, 0.01709747314453125, 0.023426055908203125, 0.029754638671875, 0.036083221435546875, 0.04241180419921875, 0.048740386962890625, 0.0550689697265625, 0.061397552490234375, 0.06772613525390625, 0.07405471801757812, 0.08038330078125, 0.08671188354492188, 0.09304046630859375, 0.09936904907226562, 0.1056976318359375, 0.11202621459960938, 0.11835479736328125, 0.12468338012695312, 0.131011962890625, 0.13734054565429688, 0.14366912841796875, 0.14999771118164062, 0.1563262939453125, 0.16265487670898438, 0.16898345947265625, 0.17531204223632812, 0.181640625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 12.0, 10.0, 17.0, 24.0, 44.0, 89.0, 171.0, 294.0, 154.0, 67.0, 52.0, 26.0, 10.0, 6.0, 5.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.633996963500977e-05, -6.428547203540802e-05, -6.223097443580627e-05, -6.017647683620453e-05, -5.812197923660278e-05, -5.606748163700104e-05, -5.401298403739929e-05, -5.1958486437797546e-05, -4.99039888381958e-05, -4.7849491238594055e-05, -4.579499363899231e-05, -4.3740496039390564e-05, -4.168599843978882e-05, -3.963150084018707e-05, -3.757700324058533e-05, -3.552250564098358e-05, -3.3468008041381836e-05, -3.141351044178009e-05, -2.9359012842178345e-05, -2.73045152425766e-05, -2.5250017642974854e-05, -2.3195520043373108e-05, -2.1141022443771362e-05, -1.9086524844169617e-05, -1.703202724456787e-05, -1.4977529644966125e-05, -1.292303204536438e-05, -1.0868534445762634e-05, -8.814036846160889e-06, -6.759539246559143e-06, -4.7050416469573975e-06, -2.650544047355652e-06, -5.960464477539062e-07, 1.4584511518478394e-06, 3.512948751449585e-06, 5.5674463510513306e-06, 7.621943950653076e-06, 9.676441550254822e-06, 1.1730939149856567e-05, 1.3785436749458313e-05, 1.583993434906006e-05, 1.7894431948661804e-05, 1.994892954826355e-05, 2.2003427147865295e-05, 2.405792474746704e-05, 2.6112422347068787e-05, 2.8166919946670532e-05, 3.0221417546272278e-05, 3.2275915145874023e-05, 3.433041274547577e-05, 3.6384910345077515e-05, 3.843940794467926e-05, 4.0493905544281006e-05, 4.254840314388275e-05, 4.46029007434845e-05, 4.665739834308624e-05, 4.871189594268799e-05, 5.0766393542289734e-05, 5.282089114189148e-05, 5.4875388741493225e-05, 5.692988634109497e-05, 5.8984383940696716e-05, 6.103888154029846e-05, 6.309337913990021e-05, 6.514787673950195e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 3.0, 6.0, 7.0, 7.0, 14.0, 11.0, 28.0, 34.0, 38.0, 43.0, 78.0, 134.0, 186.0, 250.0, 422.0, 654.0, 1073.0, 1964.0, 3682.0, 8107.0, 22239.0, 110951.0, 777836.0, 86360.0, 19294.0, 7289.0, 3333.0, 1730.0, 1032.0, 590.0, 380.0, 262.0, 164.0, 107.0, 69.0, 48.0, 38.0, 39.0, 18.0, 7.0, 3.0, 9.0, 5.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.37353515625, -0.36236572265625, -0.3511962890625, -0.34002685546875, -0.328857421875, -0.31768798828125, -0.3065185546875, -0.29534912109375, -0.2841796875, -0.27301025390625, -0.2618408203125, -0.25067138671875, -0.239501953125, -0.22833251953125, -0.2171630859375, -0.20599365234375, -0.19482421875, -0.18365478515625, -0.1724853515625, -0.16131591796875, -0.150146484375, -0.13897705078125, -0.1278076171875, -0.11663818359375, -0.10546875, -0.09429931640625, -0.0831298828125, -0.07196044921875, -0.060791015625, -0.04962158203125, -0.0384521484375, -0.02728271484375, -0.01611328125, -0.00494384765625, 0.0062255859375, 0.01739501953125, 0.028564453125, 0.03973388671875, 0.0509033203125, 0.06207275390625, 0.0732421875, 0.08441162109375, 0.0955810546875, 0.10675048828125, 0.117919921875, 0.12908935546875, 0.1402587890625, 0.15142822265625, 0.16259765625, 0.17376708984375, 0.1849365234375, 0.19610595703125, 0.207275390625, 0.21844482421875, 0.2296142578125, 0.24078369140625, 0.251953125, 0.26312255859375, 0.2742919921875, 0.28546142578125, 0.296630859375, 0.30780029296875, 0.3189697265625, 0.33013916015625, 0.34130859375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 4.0, 7.0, 13.0, 13.0, 21.0, 29.0, 38.0, 58.0, 101.0, 254.0, 206.0, 101.0, 43.0, 25.0, 22.0, 15.0, 7.0, 8.0, 5.0, 6.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3369140625, -0.3290748596191406, -0.32123565673828125, -0.3133964538574219, -0.3055572509765625, -0.2977180480957031, -0.28987884521484375, -0.2820396423339844, -0.274200439453125, -0.2663612365722656, -0.25852203369140625, -0.2506828308105469, -0.2428436279296875, -0.23500442504882812, -0.22716522216796875, -0.21932601928710938, -0.21148681640625, -0.20364761352539062, -0.19580841064453125, -0.18796920776367188, -0.1801300048828125, -0.17229080200195312, -0.16445159912109375, -0.15661239624023438, -0.148773193359375, -0.14093399047851562, -0.13309478759765625, -0.12525558471679688, -0.1174163818359375, -0.10957717895507812, -0.10173797607421875, -0.09389877319335938, -0.0860595703125, -0.07822036743164062, -0.07038116455078125, -0.06254196166992188, -0.0547027587890625, -0.046863555908203125, -0.03902435302734375, -0.031185150146484375, -0.023345947265625, -0.015506744384765625, -0.00766754150390625, 0.000171661376953125, 0.0080108642578125, 0.015850067138671875, 0.02368927001953125, 0.031528472900390625, 0.03936767578125, 0.047206878662109375, 0.05504608154296875, 0.06288528442382812, 0.0707244873046875, 0.07856369018554688, 0.08640289306640625, 0.09424209594726562, 0.102081298828125, 0.10992050170898438, 0.11775970458984375, 0.12559890747070312, 0.1334381103515625, 0.14127731323242188, 0.14911651611328125, 0.15695571899414062, 0.164794921875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 6.0, 18.0, 43.0, 113.0, 216.0, 281.0, 183.0, 68.0, 43.0, 16.0, 8.0, 6.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9394304156303406, -0.8274624347686768, -0.7154945135116577, -0.6035265326499939, -0.49155858159065247, -0.37959063053131104, -0.2676226496696472, -0.15565472841262817, -0.043686747550964355, 0.06828121095895767, 0.1802491694688797, 0.2922171354293823, 0.40418508648872375, 0.5161530375480652, 0.628121018409729, 0.740088939666748, 0.8520569205284119, 0.9640249013900757, 1.0759928226470947, 1.1879608631134033, 1.2999287843704224, 1.4118967056274414, 1.52386474609375, 1.6358325481414795, 1.747800588607788, 1.8597685098648071, 1.9717365503311157, 2.0837044715881348, 2.1956725120544434, 2.307640314102173, 2.4196083545684814, 2.531576156616211, 2.6435444355010986, 2.7555124759674072, 2.8674802780151367, 2.9794483184814453, 3.091416358947754, 3.2033841609954834, 3.315352201461792, 3.4273200035095215, 3.53928804397583, 3.6512560844421387, 3.763223886489868, 3.8751919269561768, 3.9871599674224854, 4.099127769470215, 4.211095809936523, 4.323063850402832, 4.435031890869141, 4.546999931335449, 4.658967971801758, 4.770936012268066, 4.882903575897217, 4.994871616363525, 5.106839656829834, 5.218807697296143, 5.330775260925293, 5.442743301391602, 5.55471134185791, 5.666679382324219, 5.778646945953369, 5.890614986419678, 6.002583026885986, 6.114551067352295, 6.2265191078186035]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 3.0, 9.0, 14.0, 9.0, 17.0, 18.0, 19.0, 19.0, 28.0, 20.0, 33.0, 41.0, 36.0, 43.0, 50.0, 34.0, 45.0, 44.0, 46.0, 43.0, 40.0, 41.0, 38.0, 38.0, 36.0, 38.0, 26.0, 26.0, 26.0, 18.0, 11.0, 22.0, 10.0, 10.0, 5.0, 10.0, 6.0, 6.0, 3.0, 3.0, 6.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.1712275743484497, -1.1353005170822144, -1.0993733406066895, -1.063446283340454, -1.0275192260742188, -0.9915920495986938, -0.9556649923324585, -0.9197378754615784, -0.8838107585906982, -0.8478836417198181, -0.811956524848938, -0.7760294675827026, -0.7401023507118225, -0.7041752338409424, -0.668248176574707, -0.6323210597038269, -0.5963939428329468, -0.5604668259620667, -0.5245397090911865, -0.48861265182495117, -0.45268553495407104, -0.4167584180831909, -0.3808313310146332, -0.34490424394607544, -0.3089771270751953, -0.2730500102043152, -0.23712292313575745, -0.2011958211660385, -0.16526871919631958, -0.12934161722660065, -0.09341451525688171, -0.057487428188323975, -0.021560311317443848, 0.014366790652275085, 0.05029389262199402, 0.08622099459171295, 0.12214809656143188, 0.15807519853115082, 0.19400230050086975, 0.2299293875694275, 0.2658565044403076, 0.30178362131118774, 0.3377107083797455, 0.3736377954483032, 0.40956491231918335, 0.4454920291900635, 0.4814191162586212, 0.517346203327179, 0.5532733201980591, 0.5892004370689392, 0.6251275539398193, 0.6610546112060547, 0.6969817280769348, 0.7329088449478149, 0.7688359022140503, 0.8047630190849304, 0.8406901359558105, 0.8766172528266907, 0.9125443696975708, 0.9484714269638062, 0.9843985438346863, 1.0203256607055664, 1.0562527179718018, 1.092179775238037, 1.128106951713562]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 10.0, 3.0, 7.0, 9.0, 10.0, 12.0, 10.0, 20.0, 19.0, 37.0, 32.0, 29.0, 49.0, 66.0, 85.0, 114.0, 134.0, 186.0, 266.0, 367.0, 511.0, 775.0, 1117.0, 1043700.0, 852.0, 609.0, 348.0, 285.0, 183.0, 143.0, 138.0, 115.0, 82.0, 49.0, 42.0, 44.0, 33.0, 23.0, 17.0, 18.0, 16.0, 6.0, 4.0, 12.0, 3.0, 2.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0], "bins": [-2.249666213989258, -2.185634136199951, -2.1216020584106445, -2.057570219039917, -1.9935381412506104, -1.9295060634613037, -1.865473985671997, -1.8014419078826904, -1.7374099493026733, -1.6733778715133667, -1.6093459129333496, -1.545313835144043, -1.4812817573547363, -1.4172497987747192, -1.3532177209854126, -1.2891857624053955, -1.2251536846160889, -1.1611216068267822, -1.0970896482467651, -1.0330575704574585, -0.9690255522727966, -0.9049935340881348, -0.8409614562988281, -0.7769294381141663, -0.7128974199295044, -0.6488654017448425, -0.5848333835601807, -0.520801305770874, -0.45676928758621216, -0.3927372694015503, -0.32870522141456604, -0.2646731734275818, -0.20064115524291992, -0.13660912215709686, -0.0725770890712738, -0.008545055985450745, 0.055486977100372314, 0.11951899528503418, 0.18355104327201843, 0.24758309125900269, 0.31161510944366455, 0.3756471276283264, 0.43967917561531067, 0.5037112236022949, 0.5677432417869568, 0.6317752599716187, 0.6958073377609253, 0.7598393559455872, 0.823871374130249, 0.8879033923149109, 0.9519354104995728, 1.0159674882888794, 1.0799994468688965, 1.1440315246582031, 1.2080636024475098, 1.2720956802368164, 1.3361276388168335, 1.4001597166061401, 1.4641916751861572, 1.5282237529754639, 1.5922558307647705, 1.6562877893447876, 1.7203198671340942, 1.7843518257141113, 1.848383903503418]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 11.0, 9.0, 4.0, 9.0, 14.0, 19.0, 63.0, 185.0, 698.0, 3999.0, 51457136.0, 7224.0, 1441.0, 365.0, 100.0, 35.0, 18.0, 9.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3515625, -11.8868408203125, -11.422119140625, -10.9573974609375, -10.49267578125, -10.0279541015625, -9.563232421875, -9.0985107421875, -8.6337890625, -8.1690673828125, -7.704345703125, -7.2396240234375, -6.77490234375, -6.3101806640625, -5.845458984375, -5.3807373046875, -4.916015625, -4.4512939453125, -3.986572265625, -3.5218505859375, -3.05712890625, -2.5924072265625, -2.127685546875, -1.6629638671875, -1.1982421875, -0.7335205078125, -0.268798828125, 0.1959228515625, 0.66064453125, 1.1253662109375, 1.590087890625, 2.0548095703125, 2.51953125, 2.9842529296875, 3.448974609375, 3.9136962890625, 4.37841796875, 4.8431396484375, 5.307861328125, 5.7725830078125, 6.2373046875, 6.7020263671875, 7.166748046875, 7.6314697265625, 8.09619140625, 8.5609130859375, 9.025634765625, 9.4903564453125, 9.955078125, 10.4197998046875, 10.884521484375, 11.3492431640625, 11.81396484375, 12.2786865234375, 12.743408203125, 13.2081298828125, 13.6728515625, 14.1375732421875, 14.602294921875, 15.0670166015625, 15.53173828125, 15.9964599609375, 16.461181640625, 16.9259033203125, 17.390625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 8.0, 8.0, 10.0, 24.0, 40.0, 57.0, 89.0, 115.0, 205.0, 345.0, 502.0, 821.0, 1259.0, 2018.0, 3374.0, 5373.0, 9025.0, 14975.0, 25358.0, 43325.0, 75257.0, 130813.0, 221859.0, 358504.0, 512447.0, 3692920.0, 452098.0, 301953.0, 182433.0, 106533.0, 61483.0, 35471.0, 20959.0, 12297.0, 7465.0, 4435.0, 2779.0, 1778.0, 1095.0, 683.0, 462.0, 294.0, 178.0, 110.0, 74.0, 43.0, 25.0, 27.0, 8.0, 12.0, 8.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.322265625, -0.312591552734375, -0.30291748046875, -0.293243408203125, -0.2835693359375, -0.273895263671875, -0.26422119140625, -0.254547119140625, -0.244873046875, -0.235198974609375, -0.22552490234375, -0.215850830078125, -0.2061767578125, -0.196502685546875, -0.18682861328125, -0.177154541015625, -0.16748046875, -0.157806396484375, -0.14813232421875, -0.138458251953125, -0.1287841796875, -0.119110107421875, -0.10943603515625, -0.099761962890625, -0.090087890625, -0.080413818359375, -0.07073974609375, -0.061065673828125, -0.0513916015625, -0.041717529296875, -0.03204345703125, -0.022369384765625, -0.0126953125, -0.003021240234375, 0.00665283203125, 0.016326904296875, 0.0260009765625, 0.035675048828125, 0.04534912109375, 0.055023193359375, 0.064697265625, 0.074371337890625, 0.08404541015625, 0.093719482421875, 0.1033935546875, 0.113067626953125, 0.12274169921875, 0.132415771484375, 0.14208984375, 0.151763916015625, 0.16143798828125, 0.171112060546875, 0.1807861328125, 0.190460205078125, 0.20013427734375, 0.209808349609375, 0.219482421875, 0.229156494140625, 0.23883056640625, 0.248504638671875, 0.2581787109375, 0.267852783203125, 0.27752685546875, 0.287200927734375, 0.296875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 8.0, 5.0, 5.0, 11.0, 9.0, 6.0, 11.0, 19.0, 16.0, 33.0, 16.0, 26.0, 23.0, 25.0, 30.0, 33.0, 33.0, 43.0, 61.0, 45.0, 610.0, 502.0, 35.0, 43.0, 26.0, 32.0, 44.0, 40.0, 33.0, 40.0, 20.0, 28.0, 17.0, 19.0, 18.0, 11.0, 15.0, 10.0, 4.0, 7.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-5.3046875, -5.148681640625, -4.99267578125, -4.836669921875, -4.6806640625, -4.524658203125, -4.36865234375, -4.212646484375, -4.056640625, -3.900634765625, -3.74462890625, -3.588623046875, -3.4326171875, -3.276611328125, -3.12060546875, -2.964599609375, -2.80859375, -2.652587890625, -2.49658203125, -2.340576171875, -2.1845703125, -2.028564453125, -1.87255859375, -1.716552734375, -1.560546875, -1.404541015625, -1.24853515625, -1.092529296875, -0.9365234375, -0.780517578125, -0.62451171875, -0.468505859375, -0.3125, -0.156494140625, -0.00048828125, 0.155517578125, 0.3115234375, 0.467529296875, 0.62353515625, 0.779541015625, 0.935546875, 1.091552734375, 1.24755859375, 1.403564453125, 1.5595703125, 1.715576171875, 1.87158203125, 2.027587890625, 2.18359375, 2.339599609375, 2.49560546875, 2.651611328125, 2.8076171875, 2.963623046875, 3.11962890625, 3.275634765625, 3.431640625, 3.587646484375, 3.74365234375, 3.899658203125, 4.0556640625, 4.211669921875, 4.36767578125, 4.523681640625, 4.6796875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 9.0, 3.0, 10.0, 14.0, 21.0, 29.0, 32.0, 61.0, 77.0, 128.0, 177.0, 258.0, 381.0, 583.0, 958.0, 1404.0, 2111.0, 3271.0, 5117.0, 7762.0, 12517.0, 19873.0, 32267.0, 52670.0, 85573.0, 136418.0, 210961.0, 302270.0, 392185.0, 3530138.0, 465793.0, 342411.0, 247783.0, 164393.0, 104271.0, 64130.0, 39428.0, 23947.0, 15160.0, 9361.0, 6158.0, 3786.0, 2541.0, 1687.0, 1168.0, 681.0, 500.0, 324.0, 249.0, 138.0, 89.0, 65.0, 31.0, 27.0, 19.0, 11.0, 13.0, 2.0, 3.0, 2.0], "bins": [-0.25439453125, -0.24684715270996094, -0.23929977416992188, -0.2317523956298828, -0.22420501708984375, -0.2166576385498047, -0.20911026000976562, -0.20156288146972656, -0.1940155029296875, -0.18646812438964844, -0.17892074584960938, -0.1713733673095703, -0.16382598876953125, -0.1562786102294922, -0.14873123168945312, -0.14118385314941406, -0.133636474609375, -0.12608909606933594, -0.11854171752929688, -0.11099433898925781, -0.10344696044921875, -0.09589958190917969, -0.08835220336914062, -0.08080482482910156, -0.0732574462890625, -0.06571006774902344, -0.058162689208984375, -0.05061531066894531, -0.04306793212890625, -0.03552055358886719, -0.027973175048828125, -0.020425796508789062, -0.01287841796875, -0.0053310394287109375, 0.002216339111328125, 0.009763717651367188, 0.01731109619140625, 0.024858474731445312, 0.032405853271484375, 0.03995323181152344, 0.0475006103515625, 0.05504798889160156, 0.06259536743164062, 0.07014274597167969, 0.07769012451171875, 0.08523750305175781, 0.09278488159179688, 0.10033226013183594, 0.107879638671875, 0.11542701721191406, 0.12297439575195312, 0.1305217742919922, 0.13806915283203125, 0.1456165313720703, 0.15316390991210938, 0.16071128845214844, 0.1682586669921875, 0.17580604553222656, 0.18335342407226562, 0.1909008026123047, 0.19844818115234375, 0.2059955596923828, 0.21354293823242188, 0.22109031677246094, 0.2286376953125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 7.0, 2.0, 4.0, 5.0, 5.0, 10.0, 15.0, 12.0, 9.0, 19.0, 8.0, 13.0, 13.0, 14.0, 25.0, 25.0, 26.0, 27.0, 23.0, 34.0, 37.0, 35.0, 27.0, 41.0, 39.0, 979.0, 109.0, 42.0, 31.0, 23.0, 41.0, 35.0, 32.0, 34.0, 28.0, 20.0, 28.0, 24.0, 16.0, 23.0, 16.0, 15.0, 10.0, 9.0, 11.0, 4.0, 5.0, 8.0, 5.0, 5.0, 3.0, 1.0, 1.0, 4.0], "bins": [-3.482421875, -3.385040283203125, -3.28765869140625, -3.190277099609375, -3.0928955078125, -2.995513916015625, -2.89813232421875, -2.800750732421875, -2.703369140625, -2.605987548828125, -2.50860595703125, -2.411224365234375, -2.3138427734375, -2.216461181640625, -2.11907958984375, -2.021697998046875, -1.92431640625, -1.826934814453125, -1.72955322265625, -1.632171630859375, -1.5347900390625, -1.437408447265625, -1.34002685546875, -1.242645263671875, -1.145263671875, -1.047882080078125, -0.95050048828125, -0.853118896484375, -0.7557373046875, -0.658355712890625, -0.56097412109375, -0.463592529296875, -0.3662109375, -0.268829345703125, -0.17144775390625, -0.074066162109375, 0.0233154296875, 0.120697021484375, 0.21807861328125, 0.315460205078125, 0.412841796875, 0.510223388671875, 0.60760498046875, 0.704986572265625, 0.8023681640625, 0.899749755859375, 0.99713134765625, 1.094512939453125, 1.19189453125, 1.289276123046875, 1.38665771484375, 1.484039306640625, 1.5814208984375, 1.678802490234375, 1.77618408203125, 1.873565673828125, 1.970947265625, 2.068328857421875, 2.16571044921875, 2.263092041015625, 2.3604736328125, 2.457855224609375, 2.55523681640625, 2.652618408203125, 2.75]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 7.0, 4.0, 11.0, 20.0, 34.0, 38.0, 62.0, 103.0, 137.0, 205.0, 322.0, 439.0, 679.0, 1164.0, 1856.0, 3252.0, 5970.0, 11436.0, 23553.0, 53166.0, 125515.0, 303906.0, 662726.0, 4030590.0, 601022.0, 267490.0, 108642.0, 45866.0, 20841.0, 10019.0, 5111.0, 2789.0, 1574.0, 982.0, 628.0, 415.0, 292.0, 181.0, 127.0, 94.0, 64.0, 30.0, 21.0, 27.0, 12.0, 4.0, 5.0, 7.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.452392578125, -0.4379997253417969, -0.42360687255859375, -0.4092140197753906, -0.3948211669921875, -0.3804283142089844, -0.36603546142578125, -0.3516426086425781, -0.337249755859375, -0.3228569030761719, -0.30846405029296875, -0.2940711975097656, -0.2796783447265625, -0.2652854919433594, -0.25089263916015625, -0.23649978637695312, -0.22210693359375, -0.20771408081054688, -0.19332122802734375, -0.17892837524414062, -0.1645355224609375, -0.15014266967773438, -0.13574981689453125, -0.12135696411132812, -0.106964111328125, -0.09257125854492188, -0.07817840576171875, -0.06378555297851562, -0.0493927001953125, -0.034999847412109375, -0.02060699462890625, -0.006214141845703125, 0.0081787109375, 0.022571563720703125, 0.03696441650390625, 0.051357269287109375, 0.0657501220703125, 0.08014297485351562, 0.09453582763671875, 0.10892868041992188, 0.123321533203125, 0.13771438598632812, 0.15210723876953125, 0.16650009155273438, 0.1808929443359375, 0.19528579711914062, 0.20967864990234375, 0.22407150268554688, 0.23846435546875, 0.2528572082519531, 0.26725006103515625, 0.2816429138183594, 0.2960357666015625, 0.3104286193847656, 0.32482147216796875, 0.3392143249511719, 0.353607177734375, 0.3680000305175781, 0.38239288330078125, 0.3967857360839844, 0.4111785888671875, 0.4255714416503906, 0.43996429443359375, 0.4543571472167969, 0.46875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 4.0, 8.0, 4.0, 9.0, 4.0, 11.0, 8.0, 12.0, 18.0, 18.0, 20.0, 30.0, 22.0, 28.0, 27.0, 30.0, 27.0, 42.0, 52.0, 49.0, 50.0, 249.0, 855.0, 49.0, 41.0, 38.0, 44.0, 37.0, 34.0, 25.0, 26.0, 26.0, 14.0, 15.0, 20.0, 17.0, 11.0, 15.0, 12.0, 6.0, 7.0, 5.0, 7.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.375, -2.290771484375, -2.20654296875, -2.122314453125, -2.0380859375, -1.953857421875, -1.86962890625, -1.785400390625, -1.701171875, -1.616943359375, -1.53271484375, -1.448486328125, -1.3642578125, -1.280029296875, -1.19580078125, -1.111572265625, -1.02734375, -0.943115234375, -0.85888671875, -0.774658203125, -0.6904296875, -0.606201171875, -0.52197265625, -0.437744140625, -0.353515625, -0.269287109375, -0.18505859375, -0.100830078125, -0.0166015625, 0.067626953125, 0.15185546875, 0.236083984375, 0.3203125, 0.404541015625, 0.48876953125, 0.572998046875, 0.6572265625, 0.741455078125, 0.82568359375, 0.909912109375, 0.994140625, 1.078369140625, 1.16259765625, 1.246826171875, 1.3310546875, 1.415283203125, 1.49951171875, 1.583740234375, 1.66796875, 1.752197265625, 1.83642578125, 1.920654296875, 2.0048828125, 2.089111328125, 2.17333984375, 2.257568359375, 2.341796875, 2.426025390625, 2.51025390625, 2.594482421875, 2.6787109375, 2.762939453125, 2.84716796875, 2.931396484375, 3.015625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 22.0, 71.0, 440.0, 393.0, 68.0, 11.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.576021194458008, -11.245546340942383, -10.915071487426758, -10.584595680236816, -10.254120826721191, -9.923645973205566, -9.593171119689941, -9.2626953125, -8.932220458984375, -8.60174560546875, -8.271270751953125, -7.940795421600342, -7.610320091247559, -7.279845237731934, -6.949370384216309, -6.618895053863525, -6.2884202003479, -5.957945346832275, -5.627470016479492, -5.296995162963867, -4.966519832611084, -4.636044979095459, -4.305569648742676, -3.975094795227051, -3.6446197032928467, -3.3141446113586426, -2.9836695194244385, -2.6531944274902344, -2.3227195739746094, -1.9922443628311157, -1.6617693901062012, -1.331294298171997, -1.000819206237793, -0.6703441143035889, -0.33986908197402954, -0.009394049644470215, 0.3210810422897339, 0.651556134223938, 0.9820311069488525, 1.3125061988830566, 1.6429812908172607, 1.9734563827514648, 2.303931474685669, 2.634406566619873, 2.964881420135498, 3.2953567504882812, 3.6258316040039062, 3.9563066959381104, 4.2867817878723145, 4.6172566413879395, 4.947731971740723, 5.278206825256348, 5.608682155609131, 5.939157009124756, 6.269632339477539, 6.600107192993164, 6.930582046508789, 7.261056900024414, 7.591532230377197, 7.922007083892822, 8.252482414245605, 8.58295726776123, 8.913432121276855, 9.243907928466797, 9.574382781982422]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 0.0, 8.0, 8.0, 6.0, 6.0, 15.0, 15.0, 13.0, 12.0, 27.0, 18.0, 30.0, 21.0, 34.0, 37.0, 34.0, 35.0, 51.0, 38.0, 57.0, 44.0, 48.0, 51.0, 43.0, 36.0, 42.0, 40.0, 33.0, 33.0, 29.0, 19.0, 17.0, 18.0, 24.0, 9.0, 9.0, 12.0, 8.0, 8.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.067220211029053, -3.930452346801758, -3.793684482574463, -3.656916618347168, -3.520148754119873, -3.383380889892578, -3.246613025665283, -3.1098451614379883, -2.9730772972106934, -2.8363094329833984, -2.6995415687561035, -2.5627737045288086, -2.4260058403015137, -2.2892379760742188, -2.152470111846924, -2.015702247619629, -1.878934383392334, -1.742166519165039, -1.6053986549377441, -1.4686307907104492, -1.3318629264831543, -1.1950950622558594, -1.0583271980285645, -0.9215593338012695, -0.7847914695739746, -0.6480236053466797, -0.5112557411193848, -0.37448787689208984, -0.23772001266479492, -0.1009521484375, 0.03581571578979492, 0.17258358001708984, 0.30935144424438477, 0.4461193084716797, 0.5828871726989746, 0.7196550369262695, 0.8564229011535645, 0.9931907653808594, 1.1299586296081543, 1.2667264938354492, 1.4034943580627441, 1.540262222290039, 1.677030086517334, 1.813797950744629, 1.9505658149719238, 2.0873336791992188, 2.2241015434265137, 2.3608694076538086, 2.4976372718811035, 2.6344051361083984, 2.7711730003356934, 2.9079408645629883, 3.044708728790283, 3.181476593017578, 3.318244457244873, 3.455012321472168, 3.591780185699463, 3.728548049926758, 3.8653159141540527, 4.002083778381348, 4.138851642608643, 4.2756195068359375, 4.412387371063232, 4.549155235290527, 4.685923099517822]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 5.0, 6.0, 9.0, 8.0, 13.0, 14.0, 19.0, 31.0, 37.0, 89.0, 217.0, 389.0, 699.0, 1252.0, 2402.0, 4600.0, 9864.0, 23965.0, 71892.0, 2795938.0, 1193620.0, 54360.0, 19032.0, 7834.0, 3467.0, 1872.0, 966.0, 574.0, 405.0, 239.0, 160.0, 107.0, 77.0, 42.0, 24.0, 13.0, 7.0, 5.0, 6.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.17822265625, -0.17205810546875, -0.1658935546875, -0.15972900390625, -0.153564453125, -0.14739990234375, -0.1412353515625, -0.13507080078125, -0.12890625, -0.12274169921875, -0.1165771484375, -0.11041259765625, -0.104248046875, -0.09808349609375, -0.0919189453125, -0.08575439453125, -0.07958984375, -0.07342529296875, -0.0672607421875, -0.06109619140625, -0.054931640625, -0.04876708984375, -0.0426025390625, -0.03643798828125, -0.0302734375, -0.02410888671875, -0.0179443359375, -0.01177978515625, -0.005615234375, 0.00054931640625, 0.0067138671875, 0.01287841796875, 0.01904296875, 0.02520751953125, 0.0313720703125, 0.03753662109375, 0.043701171875, 0.04986572265625, 0.0560302734375, 0.06219482421875, 0.068359375, 0.07452392578125, 0.0806884765625, 0.08685302734375, 0.093017578125, 0.09918212890625, 0.1053466796875, 0.11151123046875, 0.11767578125, 0.12384033203125, 0.1300048828125, 0.13616943359375, 0.142333984375, 0.14849853515625, 0.1546630859375, 0.16082763671875, 0.1669921875, 0.17315673828125, 0.1793212890625, 0.18548583984375, 0.191650390625, 0.19781494140625, 0.2039794921875, 0.21014404296875, 0.21630859375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 5.0, 8.0, 9.0, 14.0, 17.0, 14.0, 25.0, 33.0, 34.0, 49.0, 52.0, 59.0, 74.0, 80.0, 60.0, 73.0, 71.0, 64.0, 55.0, 36.0, 35.0, 36.0, 22.0, 13.0, 9.0, 6.0, 11.0, 10.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05181884765625, -0.050046443939208984, -0.04827404022216797, -0.04650163650512695, -0.04472923278808594, -0.04295682907104492, -0.041184425354003906, -0.03941202163696289, -0.037639617919921875, -0.03586721420288086, -0.034094810485839844, -0.03232240676879883, -0.030550003051757812, -0.028777599334716797, -0.02700519561767578, -0.025232791900634766, -0.02346038818359375, -0.021687984466552734, -0.01991558074951172, -0.018143177032470703, -0.016370773315429688, -0.014598369598388672, -0.012825965881347656, -0.01105356216430664, -0.009281158447265625, -0.007508754730224609, -0.005736351013183594, -0.003963947296142578, -0.0021915435791015625, -0.0004191398620605469, 0.0013532638549804688, 0.0031256675720214844, 0.0048980712890625, 0.006670475006103516, 0.008442878723144531, 0.010215282440185547, 0.011987686157226562, 0.013760089874267578, 0.015532493591308594, 0.01730489730834961, 0.019077301025390625, 0.02084970474243164, 0.022622108459472656, 0.024394512176513672, 0.026166915893554688, 0.027939319610595703, 0.02971172332763672, 0.031484127044677734, 0.03325653076171875, 0.035028934478759766, 0.03680133819580078, 0.0385737419128418, 0.04034614562988281, 0.04211854934692383, 0.043890953063964844, 0.04566335678100586, 0.047435760498046875, 0.04920816421508789, 0.050980567932128906, 0.05275297164916992, 0.05452537536621094, 0.05629777908325195, 0.05807018280029297, 0.059842586517333984, 0.061614990234375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 1.0, 8.0, 5.0, 4.0, 12.0, 9.0, 13.0, 17.0, 20.0, 24.0, 29.0, 30.0, 62.0, 134.0, 519.0, 4561.0, 161992.0, 4009330.0, 15784.0, 1235.0, 208.0, 64.0, 48.0, 34.0, 18.0, 20.0, 18.0, 10.0, 12.0, 5.0, 9.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.2978515625, -0.28914642333984375, -0.2804412841796875, -0.27173614501953125, -0.263031005859375, -0.25432586669921875, -0.2456207275390625, -0.23691558837890625, -0.22821044921875, -0.21950531005859375, -0.2108001708984375, -0.20209503173828125, -0.193389892578125, -0.18468475341796875, -0.1759796142578125, -0.16727447509765625, -0.1585693359375, -0.14986419677734375, -0.1411590576171875, -0.13245391845703125, -0.123748779296875, -0.11504364013671875, -0.1063385009765625, -0.09763336181640625, -0.08892822265625, -0.08022308349609375, -0.0715179443359375, -0.06281280517578125, -0.054107666015625, -0.04540252685546875, -0.0366973876953125, -0.02799224853515625, -0.019287109375, -0.01058197021484375, -0.0018768310546875, 0.00682830810546875, 0.015533447265625, 0.02423858642578125, 0.0329437255859375, 0.04164886474609375, 0.05035400390625, 0.05905914306640625, 0.0677642822265625, 0.07646942138671875, 0.085174560546875, 0.09387969970703125, 0.1025848388671875, 0.11128997802734375, 0.1199951171875, 0.12870025634765625, 0.1374053955078125, 0.14611053466796875, 0.154815673828125, 0.16352081298828125, 0.1722259521484375, 0.18093109130859375, 0.18963623046875, 0.19834136962890625, 0.2070465087890625, 0.21575164794921875, 0.224456787109375, 0.23316192626953125, 0.2418670654296875, 0.25057220458984375, 0.25927734375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 2.0, 0.0, 4.0, 4.0, 12.0, 8.0, 12.0, 19.0, 17.0, 28.0, 31.0, 38.0, 54.0, 78.0, 143.0, 425.0, 1467.0, 1048.0, 272.0, 105.0, 70.0, 49.0, 36.0, 22.0, 22.0, 20.0, 12.0, 10.0, 14.0, 5.0, 6.0, 5.0, 3.0, 7.0, 8.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08636474609375, -0.0834646224975586, -0.08056449890136719, -0.07766437530517578, -0.07476425170898438, -0.07186412811279297, -0.06896400451660156, -0.06606388092041016, -0.06316375732421875, -0.060263633728027344, -0.05736351013183594, -0.05446338653564453, -0.051563262939453125, -0.04866313934326172, -0.04576301574707031, -0.042862892150878906, -0.0399627685546875, -0.037062644958496094, -0.03416252136230469, -0.03126239776611328, -0.028362274169921875, -0.02546215057373047, -0.022562026977539062, -0.019661903381347656, -0.01676177978515625, -0.013861656188964844, -0.010961532592773438, -0.008061408996582031, -0.005161285400390625, -0.0022611618041992188, 0.0006389617919921875, 0.0035390853881835938, 0.006439208984375, 0.009339332580566406, 0.012239456176757812, 0.015139579772949219, 0.018039703369140625, 0.02093982696533203, 0.023839950561523438, 0.026740074157714844, 0.02964019775390625, 0.032540321350097656, 0.03544044494628906, 0.03834056854248047, 0.041240692138671875, 0.04414081573486328, 0.04704093933105469, 0.049941062927246094, 0.0528411865234375, 0.055741310119628906, 0.05864143371582031, 0.06154155731201172, 0.06444168090820312, 0.06734180450439453, 0.07024192810058594, 0.07314205169677734, 0.07604217529296875, 0.07894229888916016, 0.08184242248535156, 0.08474254608154297, 0.08764266967773438, 0.09054279327392578, 0.09344291687011719, 0.0963430404663086, 0.0992431640625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 11.0, 52.0, 482.0, 401.0, 62.0, 9.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2368580847978592, -0.21297499537467957, -0.18909189105033875, -0.16520880162715912, -0.1413257122039795, -0.11744262278079987, -0.09355951845645905, -0.06967642903327942, -0.04579333961009979, -0.021910246461629868, 0.0019728466868400574, 0.02585594356060028, 0.04973903298377991, 0.07362212240695953, 0.09750522673130035, 0.12138831615447998, 0.1452714055776596, 0.16915449500083923, 0.19303759932518005, 0.21692068874835968, 0.2408037781715393, 0.2646868824958801, 0.28856998682022095, 0.3124530613422394, 0.3363361358642578, 0.36021924018859863, 0.38410231471061707, 0.4079854190349579, 0.4318684935569763, 0.45575159788131714, 0.47963470220565796, 0.5035178065299988, 0.5274008512496948, 0.5512839555740356, 0.5751670598983765, 0.5990501642227173, 0.6229332089424133, 0.6468163132667542, 0.670699417591095, 0.6945825219154358, 0.7184655666351318, 0.7423486709594727, 0.7662317752838135, 0.7901148796081543, 0.8139979243278503, 0.8378810286521912, 0.861764132976532, 0.8856472373008728, 0.9095303416252136, 0.9334134459495544, 0.9572965502738953, 0.9811795949935913, 1.0050626993179321, 1.028945803642273, 1.0528289079666138, 1.0767120122909546, 1.1005951166152954, 1.1244782209396362, 1.148361325263977, 1.1722444295883179, 1.1961275339126587, 1.22001051902771, 1.2438936233520508, 1.2677767276763916, 1.2916598320007324]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 9.0, 9.0, 10.0, 11.0, 17.0, 14.0, 17.0, 19.0, 33.0, 22.0, 36.0, 32.0, 32.0, 38.0, 40.0, 45.0, 48.0, 59.0, 44.0, 51.0, 43.0, 46.0, 46.0, 41.0, 35.0, 31.0, 31.0, 22.0, 25.0, 16.0, 11.0, 9.0, 15.0, 10.0, 6.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.176777184009552, -0.17117714881896973, -0.16557711362838745, -0.15997707843780518, -0.1543770432472229, -0.14877702295780182, -0.14317698776721954, -0.13757695257663727, -0.131976917386055, -0.12637688219547272, -0.12077684700489044, -0.11517681926488876, -0.10957678407430649, -0.10397674888372421, -0.09837672114372253, -0.09277668595314026, -0.08717665076255798, -0.08157661557197571, -0.07597658038139343, -0.07037655264139175, -0.06477651745080948, -0.0591764822602272, -0.053576450794935226, -0.04797641932964325, -0.042376384139060974, -0.0367763489484787, -0.031176317483186722, -0.025576284155249596, -0.01997625082731247, -0.014376217499375343, -0.008776184171438217, -0.0031761527061462402, 0.002423882484436035, 0.008023915812373161, 0.013623949140310287, 0.019223982468247414, 0.02482401579618454, 0.030424049124121666, 0.03602408245205879, 0.04162411391735077, 0.047224149107933044, 0.05282418429851532, 0.0584242157638073, 0.06402424722909927, 0.06962428241968155, 0.07522431761026382, 0.0808243453502655, 0.08642438054084778, 0.09202441573143005, 0.09762445092201233, 0.1032244861125946, 0.10882451385259628, 0.11442454904317856, 0.12002458423376083, 0.1256246119737625, 0.1312246471643448, 0.13682468235492706, 0.14242471754550934, 0.1480247527360916, 0.1536247879266739, 0.15922480821609497, 0.16482484340667725, 0.17042487859725952, 0.1760249137878418, 0.18162494897842407]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 6.0, 1.0, 8.0, 5.0, 4.0, 8.0, 11.0, 10.0, 22.0, 25.0, 45.0, 64.0, 96.0, 153.0, 239.0, 382.0, 679.0, 1329.0, 2729.0, 7119.0, 35710.0, 888502.0, 93166.0, 10935.0, 3595.0, 1565.0, 819.0, 458.0, 301.0, 187.0, 117.0, 87.0, 52.0, 38.0, 27.0, 20.0, 12.0, 13.0, 4.0, 7.0, 4.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.60693359375, -0.5908203125, -0.57470703125, -0.55859375, -0.54248046875, -0.5263671875, -0.51025390625, -0.494140625, -0.47802734375, -0.4619140625, -0.44580078125, -0.4296875, -0.41357421875, -0.3974609375, -0.38134765625, -0.365234375, -0.34912109375, -0.3330078125, -0.31689453125, -0.30078125, -0.28466796875, -0.2685546875, -0.25244140625, -0.236328125, -0.22021484375, -0.2041015625, -0.18798828125, -0.171875, -0.15576171875, -0.1396484375, -0.12353515625, -0.107421875, -0.09130859375, -0.0751953125, -0.05908203125, -0.04296875, -0.02685546875, -0.0107421875, 0.00537109375, 0.021484375, 0.03759765625, 0.0537109375, 0.06982421875, 0.0859375, 0.10205078125, 0.1181640625, 0.13427734375, 0.150390625, 0.16650390625, 0.1826171875, 0.19873046875, 0.21484375, 0.23095703125, 0.2470703125, 0.26318359375, 0.279296875, 0.29541015625, 0.3115234375, 0.32763671875, 0.34375, 0.35986328125, 0.3759765625, 0.39208984375, 0.408203125, 0.42431640625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 7.0, 6.0, 10.0, 7.0, 7.0, 9.0, 18.0, 24.0, 22.0, 38.0, 37.0, 60.0, 51.0, 62.0, 85.0, 58.0, 87.0, 65.0, 66.0, 57.0, 58.0, 34.0, 29.0, 24.0, 29.0, 7.0, 11.0, 6.0, 7.0, 6.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0496826171875, -0.04788970947265625, -0.0460968017578125, -0.04430389404296875, -0.042510986328125, -0.04071807861328125, -0.0389251708984375, -0.03713226318359375, -0.03533935546875, -0.03354644775390625, -0.0317535400390625, -0.02996063232421875, -0.028167724609375, -0.02637481689453125, -0.0245819091796875, -0.02278900146484375, -0.02099609375, -0.01920318603515625, -0.0174102783203125, -0.01561737060546875, -0.013824462890625, -0.01203155517578125, -0.0102386474609375, -0.00844573974609375, -0.00665283203125, -0.00485992431640625, -0.0030670166015625, -0.00127410888671875, 0.000518798828125, 0.00231170654296875, 0.0041046142578125, 0.00589752197265625, 0.0076904296875, 0.00948333740234375, 0.0112762451171875, 0.01306915283203125, 0.014862060546875, 0.01665496826171875, 0.0184478759765625, 0.02024078369140625, 0.02203369140625, 0.02382659912109375, 0.0256195068359375, 0.02741241455078125, 0.029205322265625, 0.03099822998046875, 0.0327911376953125, 0.03458404541015625, 0.036376953125, 0.03816986083984375, 0.0399627685546875, 0.04175567626953125, 0.043548583984375, 0.04534149169921875, 0.0471343994140625, 0.04892730712890625, 0.05072021484375, 0.05251312255859375, 0.0543060302734375, 0.05609893798828125, 0.057891845703125, 0.05968475341796875, 0.0614776611328125, 0.06327056884765625, 0.0650634765625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 0.0, 8.0, 3.0, 8.0, 10.0, 9.0, 20.0, 21.0, 38.0, 56.0, 95.0, 183.0, 291.0, 519.0, 984.0, 1835.0, 3924.0, 8903.0, 21330.0, 58882.0, 193496.0, 448164.0, 206900.0, 62465.0, 22824.0, 9307.0, 4067.0, 1870.0, 946.0, 518.0, 327.0, 192.0, 117.0, 76.0, 48.0, 38.0, 30.0, 19.0, 10.0, 5.0, 2.0, 4.0, 1.0, 6.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0850830078125, -0.08254528045654297, -0.08000755310058594, -0.0774698257446289, -0.07493209838867188, -0.07239437103271484, -0.06985664367675781, -0.06731891632080078, -0.06478118896484375, -0.06224346160888672, -0.05970573425292969, -0.057168006896972656, -0.054630279541015625, -0.052092552185058594, -0.04955482482910156, -0.04701709747314453, -0.0444793701171875, -0.04194164276123047, -0.03940391540527344, -0.036866188049316406, -0.034328460693359375, -0.031790733337402344, -0.029253005981445312, -0.02671527862548828, -0.02417755126953125, -0.02163982391357422, -0.019102096557617188, -0.016564369201660156, -0.014026641845703125, -0.011488914489746094, -0.008951187133789062, -0.006413459777832031, -0.003875732421875, -0.0013380050659179688, 0.0011997222900390625, 0.0037374496459960938, 0.006275177001953125, 0.008812904357910156, 0.011350631713867188, 0.013888359069824219, 0.01642608642578125, 0.01896381378173828, 0.021501541137695312, 0.024039268493652344, 0.026576995849609375, 0.029114723205566406, 0.03165245056152344, 0.03419017791748047, 0.0367279052734375, 0.03926563262939453, 0.04180335998535156, 0.044341087341308594, 0.046878814697265625, 0.049416542053222656, 0.05195426940917969, 0.05449199676513672, 0.05702972412109375, 0.05956745147705078, 0.06210517883300781, 0.06464290618896484, 0.06718063354492188, 0.0697183609008789, 0.07225608825683594, 0.07479381561279297, 0.07733154296875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 6.0, 7.0, 5.0, 4.0, 11.0, 7.0, 8.0, 9.0, 15.0, 14.0, 25.0, 23.0, 36.0, 25.0, 26.0, 35.0, 28.0, 47.0, 44.0, 44.0, 41.0, 39.0, 44.0, 45.0, 33.0, 39.0, 42.0, 53.0, 29.0, 30.0, 28.0, 27.0, 28.0, 13.0, 21.0, 12.0, 12.0, 12.0, 8.0, 6.0, 4.0, 6.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1090087890625, -0.10559940338134766, -0.10219001770019531, -0.09878063201904297, -0.09537124633789062, -0.09196186065673828, -0.08855247497558594, -0.0851430892944336, -0.08173370361328125, -0.0783243179321289, -0.07491493225097656, -0.07150554656982422, -0.06809616088867188, -0.06468677520751953, -0.06127738952636719, -0.057868003845214844, -0.0544586181640625, -0.051049232482910156, -0.04763984680175781, -0.04423046112060547, -0.040821075439453125, -0.03741168975830078, -0.03400230407714844, -0.030592918395996094, -0.02718353271484375, -0.023774147033691406, -0.020364761352539062, -0.01695537567138672, -0.013545989990234375, -0.010136604309082031, -0.0067272186279296875, -0.0033178329467773438, 9.1552734375e-05, 0.0035009384155273438, 0.0069103240966796875, 0.010319709777832031, 0.013729095458984375, 0.01713848114013672, 0.020547866821289062, 0.023957252502441406, 0.02736663818359375, 0.030776023864746094, 0.03418540954589844, 0.03759479522705078, 0.041004180908203125, 0.04441356658935547, 0.04782295227050781, 0.051232337951660156, 0.0546417236328125, 0.058051109313964844, 0.06146049499511719, 0.06486988067626953, 0.06827926635742188, 0.07168865203857422, 0.07509803771972656, 0.0785074234008789, 0.08191680908203125, 0.0853261947631836, 0.08873558044433594, 0.09214496612548828, 0.09555435180664062, 0.09896373748779297, 0.10237312316894531, 0.10578250885009766, 0.10919189453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 7.0, 11.0, 11.0, 16.0, 28.0, 38.0, 55.0, 95.0, 121.0, 191.0, 338.0, 475.0, 831.0, 1505.0, 3100.0, 7256.0, 24809.0, 231166.0, 702127.0, 55206.0, 11734.0, 4455.0, 2166.0, 1114.0, 594.0, 364.0, 237.0, 132.0, 110.0, 72.0, 53.0, 30.0, 28.0, 22.0, 11.0, 10.0, 7.0, 3.0, 6.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.059783935546875, -0.05803728103637695, -0.056290626525878906, -0.05454397201538086, -0.05279731750488281, -0.051050662994384766, -0.04930400848388672, -0.04755735397338867, -0.045810699462890625, -0.04406404495239258, -0.04231739044189453, -0.040570735931396484, -0.03882408142089844, -0.03707742691040039, -0.035330772399902344, -0.0335841178894043, -0.03183746337890625, -0.030090808868408203, -0.028344154357910156, -0.02659749984741211, -0.024850845336914062, -0.023104190826416016, -0.02135753631591797, -0.019610881805419922, -0.017864227294921875, -0.016117572784423828, -0.014370918273925781, -0.012624263763427734, -0.010877609252929688, -0.00913095474243164, -0.007384300231933594, -0.005637645721435547, -0.0038909912109375, -0.002144336700439453, -0.00039768218994140625, 0.0013489723205566406, 0.0030956268310546875, 0.004842281341552734, 0.006588935852050781, 0.008335590362548828, 0.010082244873046875, 0.011828899383544922, 0.013575553894042969, 0.015322208404541016, 0.017068862915039062, 0.01881551742553711, 0.020562171936035156, 0.022308826446533203, 0.02405548095703125, 0.025802135467529297, 0.027548789978027344, 0.02929544448852539, 0.031042098999023438, 0.032788753509521484, 0.03453540802001953, 0.03628206253051758, 0.038028717041015625, 0.03977537155151367, 0.04152202606201172, 0.043268680572509766, 0.04501533508300781, 0.04676198959350586, 0.048508644104003906, 0.05025529861450195, 0.052001953125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 2.0, 6.0, 7.0, 7.0, 18.0, 32.0, 29.0, 45.0, 42.0, 57.0, 67.0, 67.0, 80.0, 109.0, 77.0, 68.0, 48.0, 41.0, 36.0, 31.0, 19.0, 42.0, 13.0, 5.0, 9.0, 11.0, 6.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0531158447265625e-06, -3.926455974578857e-06, -3.7997961044311523e-06, -3.6731362342834473e-06, -3.546476364135742e-06, -3.419816493988037e-06, -3.293156623840332e-06, -3.166496753692627e-06, -3.039836883544922e-06, -2.913177013397217e-06, -2.7865171432495117e-06, -2.6598572731018066e-06, -2.5331974029541016e-06, -2.4065375328063965e-06, -2.2798776626586914e-06, -2.1532177925109863e-06, -2.0265579223632812e-06, -1.8998980522155762e-06, -1.773238182067871e-06, -1.646578311920166e-06, -1.519918441772461e-06, -1.3932585716247559e-06, -1.2665987014770508e-06, -1.1399388313293457e-06, -1.0132789611816406e-06, -8.866190910339355e-07, -7.599592208862305e-07, -6.332993507385254e-07, -5.066394805908203e-07, -3.7997961044311523e-07, -2.5331974029541016e-07, -1.2665987014770508e-07, 0.0, 1.2665987014770508e-07, 2.5331974029541016e-07, 3.7997961044311523e-07, 5.066394805908203e-07, 6.332993507385254e-07, 7.599592208862305e-07, 8.866190910339355e-07, 1.0132789611816406e-06, 1.1399388313293457e-06, 1.2665987014770508e-06, 1.3932585716247559e-06, 1.519918441772461e-06, 1.646578311920166e-06, 1.773238182067871e-06, 1.8998980522155762e-06, 2.0265579223632812e-06, 2.1532177925109863e-06, 2.2798776626586914e-06, 2.4065375328063965e-06, 2.5331974029541016e-06, 2.6598572731018066e-06, 2.7865171432495117e-06, 2.913177013397217e-06, 3.039836883544922e-06, 3.166496753692627e-06, 3.293156623840332e-06, 3.419816493988037e-06, 3.546476364135742e-06, 3.6731362342834473e-06, 3.7997961044311523e-06, 3.926455974578857e-06, 4.0531158447265625e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 6.0, 8.0, 13.0, 18.0, 32.0, 76.0, 119.0, 209.0, 435.0, 1193.0, 3199.0, 10418.0, 78669.0, 898259.0, 43705.0, 7933.0, 2497.0, 953.0, 384.0, 186.0, 91.0, 58.0, 37.0, 14.0, 17.0, 5.0, 5.0, 3.0, 0.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12310791015625, -0.11905765533447266, -0.11500740051269531, -0.11095714569091797, -0.10690689086914062, -0.10285663604736328, -0.09880638122558594, -0.0947561264038086, -0.09070587158203125, -0.0866556167602539, -0.08260536193847656, -0.07855510711669922, -0.07450485229492188, -0.07045459747314453, -0.06640434265136719, -0.062354087829589844, -0.0583038330078125, -0.054253578186035156, -0.05020332336425781, -0.04615306854248047, -0.042102813720703125, -0.03805255889892578, -0.03400230407714844, -0.029952049255371094, -0.02590179443359375, -0.021851539611816406, -0.017801284790039062, -0.013751029968261719, -0.009700775146484375, -0.005650520324707031, -0.0016002655029296875, 0.0024499893188476562, 0.006500244140625, 0.010550498962402344, 0.014600753784179688, 0.01865100860595703, 0.022701263427734375, 0.02675151824951172, 0.030801773071289062, 0.034852027893066406, 0.03890228271484375, 0.042952537536621094, 0.04700279235839844, 0.05105304718017578, 0.055103302001953125, 0.05915355682373047, 0.06320381164550781, 0.06725406646728516, 0.0713043212890625, 0.07535457611083984, 0.07940483093261719, 0.08345508575439453, 0.08750534057617188, 0.09155559539794922, 0.09560585021972656, 0.0996561050415039, 0.10370635986328125, 0.1077566146850586, 0.11180686950683594, 0.11585712432861328, 0.11990737915039062, 0.12395763397216797, 0.1280078887939453, 0.13205814361572266, 0.1361083984375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 2.0, 4.0, 5.0, 9.0, 2.0, 6.0, 11.0, 22.0, 33.0, 63.0, 156.0, 312.0, 174.0, 68.0, 38.0, 33.0, 16.0, 13.0, 4.0, 3.0, 9.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.183837890625, -0.17942047119140625, -0.1750030517578125, -0.17058563232421875, -0.166168212890625, -0.16175079345703125, -0.1573333740234375, -0.15291595458984375, -0.14849853515625, -0.14408111572265625, -0.1396636962890625, -0.13524627685546875, -0.130828857421875, -0.12641143798828125, -0.1219940185546875, -0.11757659912109375, -0.1131591796875, -0.10874176025390625, -0.1043243408203125, -0.09990692138671875, -0.095489501953125, -0.09107208251953125, -0.0866546630859375, -0.08223724365234375, -0.07781982421875, -0.07340240478515625, -0.0689849853515625, -0.06456756591796875, -0.060150146484375, -0.05573272705078125, -0.0513153076171875, -0.04689788818359375, -0.04248046875, -0.03806304931640625, -0.0336456298828125, -0.02922821044921875, -0.024810791015625, -0.02039337158203125, -0.0159759521484375, -0.01155853271484375, -0.00714111328125, -0.00272369384765625, 0.0016937255859375, 0.00611114501953125, 0.010528564453125, 0.01494598388671875, 0.0193634033203125, 0.02378082275390625, 0.0281982421875, 0.03261566162109375, 0.0370330810546875, 0.04145050048828125, 0.045867919921875, 0.05028533935546875, 0.0547027587890625, 0.05912017822265625, 0.06353759765625, 0.06795501708984375, 0.0723724365234375, 0.07678985595703125, 0.081207275390625, 0.08562469482421875, 0.0900421142578125, 0.09445953369140625, 0.098876953125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 15.0, 27.0, 114.0, 393.0, 306.0, 116.0, 23.0, 17.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32399025559425354, -0.2689192295074463, -0.21384820342063904, -0.1587771624326706, -0.10370613634586334, -0.0486350953578949, 0.0064359307289123535, 0.061506956815719604, 0.11657798290252686, 0.1716490089893341, 0.22672003507614136, 0.281791090965271, 0.33686208724975586, 0.3919331431388855, 0.44700416922569275, 0.5020751953125, 0.5571461915969849, 0.6122172474861145, 0.6672882437705994, 0.722359299659729, 0.7774302959442139, 0.8325013518333435, 0.8875724077224731, 0.942643404006958, 0.9977144598960876, 1.0527855157852173, 1.1078565120697021, 1.162927508354187, 1.2179986238479614, 1.2730696201324463, 1.3281406164169312, 1.383211612701416, 1.4382826089859009, 1.4933536052703857, 1.5484247207641602, 1.603495717048645, 1.6585667133331299, 1.7136378288269043, 1.7687088251113892, 1.823779821395874, 1.8788508176803589, 1.9339218139648438, 1.9889929294586182, 2.0440638065338135, 2.099134922027588, 2.1542060375213623, 2.2092769145965576, 2.264348030090332, 2.3194191455841064, 2.374490261077881, 2.429561138153076, 2.4846322536468506, 2.539703369140625, 2.5947742462158203, 2.6498453617095947, 2.704916477203369, 2.7599873542785645, 2.815058469772339, 2.870129346847534, 2.9252004623413086, 2.980271577835083, 3.0353424549102783, 3.0904135704040527, 3.145484447479248, 3.2005555629730225]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 2.0, 2.0, 5.0, 8.0, 13.0, 10.0, 13.0, 13.0, 19.0, 16.0, 25.0, 32.0, 26.0, 29.0, 30.0, 39.0, 34.0, 41.0, 43.0, 49.0, 50.0, 44.0, 44.0, 28.0, 44.0, 45.0, 34.0, 27.0, 38.0, 24.0, 38.0, 23.0, 26.0, 12.0, 13.0, 15.0, 6.0, 6.0, 10.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5913479328155518, -0.5734646916389465, -0.5555815100669861, -0.5376982688903809, -0.5198150873184204, -0.5019318461418152, -0.48404860496520996, -0.4661653935909271, -0.4482821822166443, -0.43039897084236145, -0.4125157594680786, -0.3946325182914734, -0.37674930691719055, -0.3588660955429077, -0.3409828543663025, -0.32309964299201965, -0.3052164316177368, -0.287333220243454, -0.26945000886917114, -0.2515667676925659, -0.23368355631828308, -0.21580034494400024, -0.1979171186685562, -0.18003389239311218, -0.16215068101882935, -0.1442674696445465, -0.12638424336910248, -0.10850102454423904, -0.09061780571937561, -0.07273458689451218, -0.05485136806964874, -0.03696814179420471, -0.0190848708152771, -0.0012016519904136658, 0.016681566834449768, 0.0345647856593132, 0.052448004484176636, 0.07033122330904007, 0.0882144421339035, 0.10609766840934753, 0.12398087978363037, 0.1418640911579132, 0.15974731743335724, 0.17763054370880127, 0.1955137550830841, 0.21339696645736694, 0.23128019273281097, 0.249163419008255, 0.26704663038253784, 0.2849298417568207, 0.3028130531311035, 0.32069629430770874, 0.3385795056819916, 0.3564627170562744, 0.37434595823287964, 0.3922291696071625, 0.4101123809814453, 0.42799559235572815, 0.445878803730011, 0.4637620449066162, 0.48164525628089905, 0.4995284676551819, 0.5174117088317871, 0.5352948904037476, 0.5531781315803528]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 10.0, 4.0, 10.0, 7.0, 11.0, 10.0, 20.0, 23.0, 47.0, 57.0, 86.0, 85.0, 140.0, 225.0, 303.0, 511.0, 751.0, 1203.0, 2272.0, 4558.0, 11537.0, 41731.0, 660416.0, 3356693.0, 83190.0, 17130.0, 6165.0, 2910.0, 1512.0, 925.0, 567.0, 369.0, 236.0, 132.0, 113.0, 71.0, 51.0, 63.0, 30.0, 36.0, 22.0, 12.0, 8.0, 6.0, 8.0, 6.0, 6.0, 3.0, 2.0, 0.0, 4.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.15283203125, -0.1475963592529297, -0.14236068725585938, -0.13712501525878906, -0.13188934326171875, -0.12665367126464844, -0.12141799926757812, -0.11618232727050781, -0.1109466552734375, -0.10571098327636719, -0.10047531127929688, -0.09523963928222656, -0.09000396728515625, -0.08476829528808594, -0.07953262329101562, -0.07429695129394531, -0.069061279296875, -0.06382560729980469, -0.058589935302734375, -0.05335426330566406, -0.04811859130859375, -0.04288291931152344, -0.037647247314453125, -0.03241157531738281, -0.0271759033203125, -0.021940231323242188, -0.016704559326171875, -0.011468887329101562, -0.00623321533203125, -0.0009975433349609375, 0.004238128662109375, 0.009473800659179688, 0.01470947265625, 0.019945144653320312, 0.025180816650390625, 0.030416488647460938, 0.03565216064453125, 0.04088783264160156, 0.046123504638671875, 0.05135917663574219, 0.0565948486328125, 0.06183052062988281, 0.06706619262695312, 0.07230186462402344, 0.07753753662109375, 0.08277320861816406, 0.08800888061523438, 0.09324455261230469, 0.098480224609375, 0.10371589660644531, 0.10895156860351562, 0.11418724060058594, 0.11942291259765625, 0.12465858459472656, 0.12989425659179688, 0.1351299285888672, 0.1403656005859375, 0.1456012725830078, 0.15083694458007812, 0.15607261657714844, 0.16130828857421875, 0.16654396057128906, 0.17177963256835938, 0.1770153045654297, 0.1822509765625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 4.0, 8.0, 12.0, 16.0, 10.0, 5.0, 18.0, 24.0, 31.0, 39.0, 44.0, 42.0, 45.0, 60.0, 68.0, 59.0, 63.0, 63.0, 59.0, 47.0, 44.0, 40.0, 34.0, 29.0, 29.0, 24.0, 11.0, 10.0, 16.0, 10.0, 10.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0447998046875, -0.04325675964355469, -0.041713714599609375, -0.04017066955566406, -0.03862762451171875, -0.03708457946777344, -0.035541534423828125, -0.03399848937988281, -0.0324554443359375, -0.030912399291992188, -0.029369354248046875, -0.027826309204101562, -0.02628326416015625, -0.024740219116210938, -0.023197174072265625, -0.021654129028320312, -0.020111083984375, -0.018568038940429688, -0.017024993896484375, -0.015481948852539062, -0.01393890380859375, -0.012395858764648438, -0.010852813720703125, -0.009309768676757812, -0.0077667236328125, -0.0062236785888671875, -0.004680633544921875, -0.0031375885009765625, -0.00159454345703125, -5.14984130859375e-05, 0.001491546630859375, 0.0030345916748046875, 0.00457763671875, 0.0061206817626953125, 0.007663726806640625, 0.009206771850585938, 0.01074981689453125, 0.012292861938476562, 0.013835906982421875, 0.015378952026367188, 0.0169219970703125, 0.018465042114257812, 0.020008087158203125, 0.021551132202148438, 0.02309417724609375, 0.024637222290039062, 0.026180267333984375, 0.027723312377929688, 0.029266357421875, 0.030809402465820312, 0.032352447509765625, 0.03389549255371094, 0.03543853759765625, 0.03698158264160156, 0.038524627685546875, 0.04006767272949219, 0.0416107177734375, 0.04315376281738281, 0.044696807861328125, 0.04623985290527344, 0.04778289794921875, 0.04932594299316406, 0.050868988037109375, 0.05241203308105469, 0.053955078125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 6.0, 7.0, 18.0, 15.0, 29.0, 65.0, 145.0, 295.0, 672.0, 1604.0, 4795.0, 17682.0, 109175.0, 2297937.0, 1647483.0, 91596.0, 15790.0, 4305.0, 1518.0, 585.0, 286.0, 120.0, 51.0, 31.0, 21.0, 17.0, 7.0, 7.0, 7.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1900634765625, -0.1854228973388672, -0.18078231811523438, -0.17614173889160156, -0.17150115966796875, -0.16686058044433594, -0.16222000122070312, -0.1575794219970703, -0.1529388427734375, -0.1482982635498047, -0.14365768432617188, -0.13901710510253906, -0.13437652587890625, -0.12973594665527344, -0.12509536743164062, -0.12045478820800781, -0.115814208984375, -0.11117362976074219, -0.10653305053710938, -0.10189247131347656, -0.09725189208984375, -0.09261131286621094, -0.08797073364257812, -0.08333015441894531, -0.0786895751953125, -0.07404899597167969, -0.06940841674804688, -0.06476783752441406, -0.06012725830078125, -0.05548667907714844, -0.050846099853515625, -0.04620552062988281, -0.04156494140625, -0.03692436218261719, -0.032283782958984375, -0.027643203735351562, -0.02300262451171875, -0.018362045288085938, -0.013721466064453125, -0.009080886840820312, -0.0044403076171875, 0.0002002716064453125, 0.004840850830078125, 0.009481430053710938, 0.01412200927734375, 0.018762588500976562, 0.023403167724609375, 0.028043746948242188, 0.032684326171875, 0.03732490539550781, 0.041965484619140625, 0.04660606384277344, 0.05124664306640625, 0.05588722229003906, 0.060527801513671875, 0.06516838073730469, 0.0698089599609375, 0.07444953918457031, 0.07909011840820312, 0.08373069763183594, 0.08837127685546875, 0.09301185607910156, 0.09765243530273438, 0.10229301452636719, 0.10693359375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 4.0, 8.0, 9.0, 7.0, 12.0, 18.0, 20.0, 45.0, 62.0, 69.0, 104.0, 199.0, 347.0, 716.0, 1050.0, 628.0, 292.0, 168.0, 97.0, 64.0, 42.0, 29.0, 25.0, 17.0, 6.0, 9.0, 9.0, 1.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.060089111328125, -0.05797529220581055, -0.055861473083496094, -0.05374765396118164, -0.05163383483886719, -0.049520015716552734, -0.04740619659423828, -0.04529237747192383, -0.043178558349609375, -0.04106473922729492, -0.03895092010498047, -0.036837100982666016, -0.03472328186035156, -0.03260946273803711, -0.030495643615722656, -0.028381824493408203, -0.02626800537109375, -0.024154186248779297, -0.022040367126464844, -0.01992654800415039, -0.017812728881835938, -0.015698909759521484, -0.013585090637207031, -0.011471271514892578, -0.009357452392578125, -0.007243633270263672, -0.005129814147949219, -0.0030159950256347656, -0.0009021759033203125, 0.0012116432189941406, 0.0033254623413085938, 0.005439281463623047, 0.0075531005859375, 0.009666919708251953, 0.011780738830566406, 0.01389455795288086, 0.016008377075195312, 0.018122196197509766, 0.02023601531982422, 0.022349834442138672, 0.024463653564453125, 0.026577472686767578, 0.02869129180908203, 0.030805110931396484, 0.03291893005371094, 0.03503274917602539, 0.037146568298339844, 0.0392603874206543, 0.04137420654296875, 0.0434880256652832, 0.045601844787597656, 0.04771566390991211, 0.04982948303222656, 0.051943302154541016, 0.05405712127685547, 0.05617094039916992, 0.058284759521484375, 0.06039857864379883, 0.06251239776611328, 0.06462621688842773, 0.06674003601074219, 0.06885385513305664, 0.0709676742553711, 0.07308149337768555, 0.0751953125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 11.0, 30.0, 118.0, 338.0, 320.0, 138.0, 45.0, 8.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.014899492263794, -0.9949918389320374, -0.9750841856002808, -0.9551765322685242, -0.9352688789367676, -0.9153611660003662, -0.8954535126686096, -0.875545859336853, -0.8556382060050964, -0.8357305526733398, -0.8158228993415833, -0.7959152460098267, -0.7760075330734253, -0.7560998797416687, -0.7361922264099121, -0.7162845730781555, -0.6963769197463989, -0.6764692664146423, -0.6565616130828857, -0.6366539597511292, -0.6167463064193726, -0.5968385934829712, -0.5769309401512146, -0.557023286819458, -0.5371156334877014, -0.5172079801559448, -0.49730032682418823, -0.47739264369010925, -0.45748499035835266, -0.43757733702659607, -0.4176696538925171, -0.3977620005607605, -0.3778543174266815, -0.3579466640949249, -0.33803898096084595, -0.31813132762908936, -0.29822367429733276, -0.27831602096557617, -0.2584083676338196, -0.2385006844997406, -0.218593031167984, -0.19868537783622742, -0.17877770960330963, -0.15887004137039185, -0.13896238803863525, -0.11905472725629807, -0.09914706647396088, -0.07923939824104309, -0.0593317449092865, -0.03942408412694931, -0.01951642334461212, 0.00039123743772506714, 0.020298898220062256, 0.040206559002399445, 0.06011421978473663, 0.08002188801765442, 0.09992954134941101, 0.1198372021317482, 0.1397448629140854, 0.15965253114700317, 0.17956018447875977, 0.19946783781051636, 0.21937550604343414, 0.23928317427635193, 0.2591908276081085]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 7.0, 8.0, 13.0, 18.0, 17.0, 13.0, 19.0, 14.0, 21.0, 15.0, 26.0, 28.0, 37.0, 35.0, 46.0, 48.0, 47.0, 51.0, 51.0, 50.0, 30.0, 47.0, 35.0, 30.0, 38.0, 33.0, 35.0, 26.0, 21.0, 29.0, 17.0, 14.0, 18.0, 11.0, 5.0, 9.0, 8.0, 9.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.15671849250793457, -0.15233047306537628, -0.147942453622818, -0.1435544490814209, -0.1391664296388626, -0.13477841019630432, -0.13039040565490723, -0.12600238621234894, -0.12161436676979065, -0.11722634732723236, -0.11283833533525467, -0.10845032334327698, -0.10406230390071869, -0.0996742844581604, -0.09528627246618271, -0.09089826047420502, -0.08651024103164673, -0.08212222158908844, -0.07773420959711075, -0.07334619760513306, -0.06895817816257477, -0.06457015872001648, -0.06018214672803879, -0.0557941310107708, -0.05140611529350281, -0.04701809957623482, -0.04263008385896683, -0.03824206814169884, -0.03385405242443085, -0.029466036707162857, -0.025078020989894867, -0.020690005272626877, -0.016301989555358887, -0.011913973838090897, -0.0075259581208229065, -0.0031379424035549164, 0.0012500733137130737, 0.005638089030981064, 0.010026104748249054, 0.014414120465517044, 0.018802136182785034, 0.023190151900053024, 0.027578167617321014, 0.031966183334589005, 0.036354199051856995, 0.040742214769124985, 0.045130230486392975, 0.049518246203660965, 0.053906261920928955, 0.058294277638196945, 0.06268229335546494, 0.06707030534744263, 0.07145832479000092, 0.0758463442325592, 0.0802343562245369, 0.08462236821651459, 0.08901038765907288, 0.09339840710163116, 0.09778641909360886, 0.10217443108558655, 0.10656245052814484, 0.11095046997070312, 0.11533848196268082, 0.11972649395465851, 0.1241145133972168]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 3.0, 7.0, 4.0, 12.0, 11.0, 26.0, 30.0, 36.0, 64.0, 85.0, 152.0, 231.0, 410.0, 698.0, 1163.0, 2003.0, 3733.0, 7351.0, 15102.0, 33762.0, 87453.0, 259007.0, 389511.0, 149997.0, 53102.0, 22395.0, 10500.0, 5173.0, 2801.0, 1541.0, 823.0, 512.0, 290.0, 171.0, 111.0, 98.0, 62.0, 50.0, 19.0, 20.0, 12.0, 12.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1444091796875, -0.14006614685058594, -0.13572311401367188, -0.1313800811767578, -0.12703704833984375, -0.12269401550292969, -0.11835098266601562, -0.11400794982910156, -0.1096649169921875, -0.10532188415527344, -0.10097885131835938, -0.09663581848144531, -0.09229278564453125, -0.08794975280761719, -0.08360671997070312, -0.07926368713378906, -0.074920654296875, -0.07057762145996094, -0.06623458862304688, -0.06189155578613281, -0.05754852294921875, -0.05320549011230469, -0.048862457275390625, -0.04451942443847656, -0.0401763916015625, -0.03583335876464844, -0.031490325927734375, -0.027147293090820312, -0.02280426025390625, -0.018461227416992188, -0.014118194580078125, -0.009775161743164062, -0.00543212890625, -0.0010890960693359375, 0.003253936767578125, 0.0075969696044921875, 0.01194000244140625, 0.016283035278320312, 0.020626068115234375, 0.024969100952148438, 0.0293121337890625, 0.03365516662597656, 0.037998199462890625, 0.04234123229980469, 0.04668426513671875, 0.05102729797363281, 0.055370330810546875, 0.05971336364746094, 0.064056396484375, 0.06839942932128906, 0.07274246215820312, 0.07708549499511719, 0.08142852783203125, 0.08577156066894531, 0.09011459350585938, 0.09445762634277344, 0.0988006591796875, 0.10314369201660156, 0.10748672485351562, 0.11182975769042969, 0.11617279052734375, 0.12051582336425781, 0.12485885620117188, 0.12920188903808594, 0.133544921875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 1.0, 5.0, 2.0, 2.0, 17.0, 15.0, 9.0, 13.0, 10.0, 14.0, 22.0, 26.0, 22.0, 42.0, 48.0, 46.0, 46.0, 49.0, 49.0, 38.0, 55.0, 49.0, 54.0, 62.0, 49.0, 37.0, 33.0, 32.0, 29.0, 24.0, 27.0, 18.0, 12.0, 9.0, 9.0, 5.0, 8.0, 1.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.035064697265625, -0.033724308013916016, -0.03238391876220703, -0.031043529510498047, -0.029703140258789062, -0.028362751007080078, -0.027022361755371094, -0.02568197250366211, -0.024341583251953125, -0.02300119400024414, -0.021660804748535156, -0.020320415496826172, -0.018980026245117188, -0.017639636993408203, -0.01629924774169922, -0.014958858489990234, -0.01361846923828125, -0.012278079986572266, -0.010937690734863281, -0.009597301483154297, -0.008256912231445312, -0.006916522979736328, -0.005576133728027344, -0.004235744476318359, -0.002895355224609375, -0.0015549659729003906, -0.00021457672119140625, 0.0011258125305175781, 0.0024662017822265625, 0.003806591033935547, 0.005146980285644531, 0.006487369537353516, 0.0078277587890625, 0.009168148040771484, 0.010508537292480469, 0.011848926544189453, 0.013189315795898438, 0.014529705047607422, 0.015870094299316406, 0.01721048355102539, 0.018550872802734375, 0.01989126205444336, 0.021231651306152344, 0.022572040557861328, 0.023912429809570312, 0.025252819061279297, 0.02659320831298828, 0.027933597564697266, 0.02927398681640625, 0.030614376068115234, 0.03195476531982422, 0.0332951545715332, 0.03463554382324219, 0.03597593307495117, 0.037316322326660156, 0.03865671157836914, 0.039997100830078125, 0.04133749008178711, 0.042677879333496094, 0.04401826858520508, 0.04535865783691406, 0.04669904708862305, 0.04803943634033203, 0.049379825592041016, 0.05072021484375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 6.0, 6.0, 10.0, 13.0, 11.0, 20.0, 19.0, 26.0, 32.0, 20.0, 29.0, 41.0, 46.0, 85.0, 148.0, 443.0, 1991.0, 23855.0, 745638.0, 264911.0, 9306.0, 1112.0, 332.0, 91.0, 77.0, 63.0, 33.0, 36.0, 26.0, 27.0, 15.0, 20.0, 13.0, 14.0, 12.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.463134765625, -0.4494476318359375, -0.435760498046875, -0.4220733642578125, -0.40838623046875, -0.3946990966796875, -0.381011962890625, -0.3673248291015625, -0.3536376953125, -0.3399505615234375, -0.326263427734375, -0.3125762939453125, -0.29888916015625, -0.2852020263671875, -0.271514892578125, -0.2578277587890625, -0.244140625, -0.2304534912109375, -0.216766357421875, -0.2030792236328125, -0.18939208984375, -0.1757049560546875, -0.162017822265625, -0.1483306884765625, -0.1346435546875, -0.1209564208984375, -0.107269287109375, -0.0935821533203125, -0.07989501953125, -0.0662078857421875, -0.052520751953125, -0.0388336181640625, -0.025146484375, -0.0114593505859375, 0.002227783203125, 0.0159149169921875, 0.02960205078125, 0.0432891845703125, 0.056976318359375, 0.0706634521484375, 0.0843505859375, 0.0980377197265625, 0.111724853515625, 0.1254119873046875, 0.13909912109375, 0.1527862548828125, 0.166473388671875, 0.1801605224609375, 0.19384765625, 0.2075347900390625, 0.221221923828125, 0.2349090576171875, 0.24859619140625, 0.2622833251953125, 0.275970458984375, 0.2896575927734375, 0.3033447265625, 0.3170318603515625, 0.330718994140625, 0.3444061279296875, 0.35809326171875, 0.3717803955078125, 0.385467529296875, 0.3991546630859375, 0.412841796875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 5.0, 6.0, 4.0, 7.0, 11.0, 12.0, 16.0, 13.0, 21.0, 18.0, 19.0, 23.0, 26.0, 30.0, 25.0, 33.0, 38.0, 42.0, 52.0, 49.0, 33.0, 46.0, 41.0, 39.0, 49.0, 44.0, 31.0, 27.0, 46.0, 28.0, 23.0, 27.0, 23.0, 17.0, 14.0, 14.0, 12.0, 15.0, 5.0, 8.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.088134765625, -0.08543968200683594, -0.08274459838867188, -0.08004951477050781, -0.07735443115234375, -0.07465934753417969, -0.07196426391601562, -0.06926918029785156, -0.0665740966796875, -0.06387901306152344, -0.061183929443359375, -0.05848884582519531, -0.05579376220703125, -0.05309867858886719, -0.050403594970703125, -0.04770851135253906, -0.045013427734375, -0.04231834411621094, -0.039623260498046875, -0.03692817687988281, -0.03423309326171875, -0.03153800964355469, -0.028842926025390625, -0.026147842407226562, -0.0234527587890625, -0.020757675170898438, -0.018062591552734375, -0.015367507934570312, -0.01267242431640625, -0.009977340698242188, -0.007282257080078125, -0.0045871734619140625, -0.00189208984375, 0.0008029937744140625, 0.003498077392578125, 0.0061931610107421875, 0.00888824462890625, 0.011583328247070312, 0.014278411865234375, 0.016973495483398438, 0.0196685791015625, 0.022363662719726562, 0.025058746337890625, 0.027753829956054688, 0.03044891357421875, 0.03314399719238281, 0.035839080810546875, 0.03853416442871094, 0.041229248046875, 0.04392433166503906, 0.046619415283203125, 0.04931449890136719, 0.05200958251953125, 0.05470466613769531, 0.057399749755859375, 0.06009483337402344, 0.0627899169921875, 0.06548500061035156, 0.06818008422851562, 0.07087516784667969, 0.07357025146484375, 0.07626533508300781, 0.07896041870117188, 0.08165550231933594, 0.0843505859375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 7.0, 10.0, 6.0, 13.0, 22.0, 16.0, 24.0, 35.0, 48.0, 78.0, 123.0, 194.0, 331.0, 643.0, 1388.0, 3564.0, 13542.0, 145982.0, 822248.0, 48038.0, 7526.0, 2370.0, 1017.0, 533.0, 278.0, 151.0, 90.0, 76.0, 52.0, 29.0, 21.0, 20.0, 12.0, 11.0, 12.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2427978515625, -0.23390769958496094, -0.22501754760742188, -0.2161273956298828, -0.20723724365234375, -0.1983470916748047, -0.18945693969726562, -0.18056678771972656, -0.1716766357421875, -0.16278648376464844, -0.15389633178710938, -0.1450061798095703, -0.13611602783203125, -0.1272258758544922, -0.11833572387695312, -0.10944557189941406, -0.100555419921875, -0.09166526794433594, -0.08277511596679688, -0.07388496398925781, -0.06499481201171875, -0.05610466003417969, -0.047214508056640625, -0.03832435607910156, -0.0294342041015625, -0.020544052124023438, -0.011653900146484375, -0.0027637481689453125, 0.00612640380859375, 0.015016555786132812, 0.023906707763671875, 0.03279685974121094, 0.04168701171875, 0.05057716369628906, 0.059467315673828125, 0.06835746765136719, 0.07724761962890625, 0.08613777160644531, 0.09502792358398438, 0.10391807556152344, 0.1128082275390625, 0.12169837951660156, 0.13058853149414062, 0.1394786834716797, 0.14836883544921875, 0.1572589874267578, 0.16614913940429688, 0.17503929138183594, 0.183929443359375, 0.19281959533691406, 0.20170974731445312, 0.2105998992919922, 0.21949005126953125, 0.2283802032470703, 0.23727035522460938, 0.24616050720214844, 0.2550506591796875, 0.26394081115722656, 0.2728309631347656, 0.2817211151123047, 0.29061126708984375, 0.2995014190673828, 0.3083915710449219, 0.31728172302246094, 0.326171875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 4.0, 6.0, 10.0, 5.0, 9.0, 14.0, 18.0, 20.0, 23.0, 42.0, 60.0, 87.0, 118.0, 126.0, 105.0, 97.0, 69.0, 45.0, 22.0, 26.0, 16.0, 12.0, 11.0, 10.0, 10.0, 5.0, 8.0, 1.0, 2.0, 3.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1755695343017578e-05, -2.112705260515213e-05, -2.0498409867286682e-05, -1.9869767129421234e-05, -1.9241124391555786e-05, -1.8612481653690338e-05, -1.798383891582489e-05, -1.7355196177959442e-05, -1.6726553440093994e-05, -1.6097910702228546e-05, -1.5469267964363098e-05, -1.484062522649765e-05, -1.4211982488632202e-05, -1.3583339750766754e-05, -1.2954697012901306e-05, -1.2326054275035858e-05, -1.169741153717041e-05, -1.1068768799304962e-05, -1.0440126061439514e-05, -9.811483323574066e-06, -9.182840585708618e-06, -8.55419784784317e-06, -7.925555109977722e-06, -7.296912372112274e-06, -6.668269634246826e-06, -6.039626896381378e-06, -5.41098415851593e-06, -4.782341420650482e-06, -4.153698682785034e-06, -3.525055944919586e-06, -2.896413207054138e-06, -2.26777046918869e-06, -1.6391277313232422e-06, -1.0104849934577942e-06, -3.818422555923462e-07, 2.468004822731018e-07, 8.754432201385498e-07, 1.5040859580039978e-06, 2.132728695869446e-06, 2.761371433734894e-06, 3.390014171600342e-06, 4.01865690946579e-06, 4.647299647331238e-06, 5.275942385196686e-06, 5.904585123062134e-06, 6.533227860927582e-06, 7.16187059879303e-06, 7.790513336658478e-06, 8.419156074523926e-06, 9.047798812389374e-06, 9.676441550254822e-06, 1.030508428812027e-05, 1.0933727025985718e-05, 1.1562369763851166e-05, 1.2191012501716614e-05, 1.2819655239582062e-05, 1.344829797744751e-05, 1.4076940715312958e-05, 1.4705583453178406e-05, 1.5334226191043854e-05, 1.5962868928909302e-05, 1.659151166677475e-05, 1.7220154404640198e-05, 1.7848797142505646e-05, 1.8477439880371094e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 4.0, 9.0, 9.0, 12.0, 11.0, 19.0, 19.0, 22.0, 26.0, 36.0, 58.0, 75.0, 159.0, 320.0, 1236.0, 5798.0, 52760.0, 680480.0, 283511.0, 19864.0, 2858.0, 643.0, 220.0, 114.0, 61.0, 38.0, 27.0, 31.0, 21.0, 19.0, 17.0, 11.0, 11.0, 9.0, 4.0, 7.0, 8.0, 7.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1099853515625, -0.10652637481689453, -0.10306739807128906, -0.0996084213256836, -0.09614944458007812, -0.09269046783447266, -0.08923149108886719, -0.08577251434326172, -0.08231353759765625, -0.07885456085205078, -0.07539558410644531, -0.07193660736083984, -0.06847763061523438, -0.0650186538696289, -0.06155967712402344, -0.05810070037841797, -0.0546417236328125, -0.05118274688720703, -0.04772377014160156, -0.044264793395996094, -0.040805816650390625, -0.037346839904785156, -0.03388786315917969, -0.03042888641357422, -0.02696990966796875, -0.02351093292236328, -0.020051956176757812, -0.016592979431152344, -0.013134002685546875, -0.009675025939941406, -0.0062160491943359375, -0.0027570724487304688, 0.000701904296875, 0.004160881042480469, 0.0076198577880859375, 0.011078834533691406, 0.014537811279296875, 0.017996788024902344, 0.021455764770507812, 0.02491474151611328, 0.02837371826171875, 0.03183269500732422, 0.03529167175292969, 0.038750648498535156, 0.042209625244140625, 0.045668601989746094, 0.04912757873535156, 0.05258655548095703, 0.0560455322265625, 0.05950450897216797, 0.06296348571777344, 0.0664224624633789, 0.06988143920898438, 0.07334041595458984, 0.07679939270019531, 0.08025836944580078, 0.08371734619140625, 0.08717632293701172, 0.09063529968261719, 0.09409427642822266, 0.09755325317382812, 0.1010122299194336, 0.10447120666503906, 0.10793018341064453, 0.11138916015625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 1.0, 1.0, 6.0, 8.0, 10.0, 9.0, 14.0, 17.0, 19.0, 22.0, 24.0, 28.0, 39.0, 34.0, 33.0, 59.0, 47.0, 52.0, 56.0, 61.0, 40.0, 48.0, 40.0, 45.0, 50.0, 24.0, 26.0, 31.0, 30.0, 24.0, 18.0, 10.0, 10.0, 11.0, 11.0, 8.0, 6.0, 5.0, 8.0, 3.0, 4.0, 0.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.023956298828125, -0.02321314811706543, -0.02246999740600586, -0.02172684669494629, -0.02098369598388672, -0.02024054527282715, -0.019497394561767578, -0.018754243850708008, -0.018011093139648438, -0.017267942428588867, -0.016524791717529297, -0.015781641006469727, -0.015038490295410156, -0.014295339584350586, -0.013552188873291016, -0.012809038162231445, -0.012065887451171875, -0.011322736740112305, -0.010579586029052734, -0.009836435317993164, -0.009093284606933594, -0.008350133895874023, -0.007606983184814453, -0.006863832473754883, -0.0061206817626953125, -0.005377531051635742, -0.004634380340576172, -0.0038912296295166016, -0.0031480789184570312, -0.002404928207397461, -0.0016617774963378906, -0.0009186267852783203, -0.00017547607421875, 0.0005676746368408203, 0.0013108253479003906, 0.002053976058959961, 0.0027971267700195312, 0.0035402774810791016, 0.004283428192138672, 0.005026578903198242, 0.0057697296142578125, 0.006512880325317383, 0.007256031036376953, 0.007999181747436523, 0.008742332458496094, 0.009485483169555664, 0.010228633880615234, 0.010971784591674805, 0.011714935302734375, 0.012458086013793945, 0.013201236724853516, 0.013944387435913086, 0.014687538146972656, 0.015430688858032227, 0.016173839569091797, 0.016916990280151367, 0.017660140991210938, 0.018403291702270508, 0.019146442413330078, 0.01988959312438965, 0.02063274383544922, 0.02137589454650879, 0.02211904525756836, 0.02286219596862793, 0.0236053466796875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 78.0, 829.0, 104.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.753880500793457, -1.6248242855072021, -1.4957681894302368, -1.366711974143982, -1.2376558780670166, -1.1085996627807617, -0.9795434474945068, -0.8504872918128967, -0.7214311361312866, -0.5923749804496765, -0.463318794965744, -0.3342626094818115, -0.20520645380020142, -0.07615029811859131, 0.052905917167663574, 0.18196207284927368, 0.3110182285308838, 0.4400743842124939, 0.569130539894104, 0.6981867551803589, 0.827242910861969, 0.9562990665435791, 1.085355281829834, 1.2144114971160889, 1.3434675931930542, 1.472523808479309, 1.6015799045562744, 1.7306361198425293, 1.8596923351287842, 1.9887484312057495, 2.117804527282715, 2.2468607425689697, 2.3759169578552246, 2.5049731731414795, 2.6340293884277344, 2.76308536529541, 2.892141580581665, 3.02119779586792, 3.150254011154175, 3.2793102264404297, 3.4083662033081055, 3.5374224185943604, 3.6664786338806152, 3.795534610748291, 3.924590826034546, 4.053647041320801, 4.182703018188477, 4.3117594718933105, 4.4408159255981445, 4.56987190246582, 4.698928356170654, 4.82798433303833, 4.957040786743164, 5.08609676361084, 5.215152740478516, 5.34420919418335, 5.473265171051025, 5.602321147918701, 5.731377601623535, 5.860433578491211, 5.989490032196045, 6.118546009063721, 6.247602462768555, 6.3766584396362305, 6.505714416503906]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 7.0, 1.0, 6.0, 10.0, 4.0, 3.0, 13.0, 18.0, 19.0, 19.0, 18.0, 22.0, 41.0, 24.0, 34.0, 35.0, 29.0, 52.0, 40.0, 30.0, 46.0, 44.0, 41.0, 55.0, 51.0, 46.0, 42.0, 29.0, 32.0, 26.0, 20.0, 28.0, 31.0, 14.0, 16.0, 13.0, 15.0, 9.0, 8.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.37379348278045654, -0.36203163862228394, -0.35026979446411133, -0.3385079503059387, -0.3267461061477661, -0.3149842619895935, -0.3032224178314209, -0.2914605736732483, -0.2796987295150757, -0.2679368853569031, -0.25617504119873047, -0.24441319704055786, -0.23265135288238525, -0.22088950872421265, -0.20912766456604004, -0.19736582040786743, -0.18560396134853363, -0.17384211719036102, -0.16208027303218842, -0.1503184288740158, -0.1385565847158432, -0.1267947405576706, -0.11503288894891739, -0.10327104479074478, -0.09150920063257217, -0.07974735647439957, -0.06798551231622696, -0.05622366443276405, -0.044461820274591446, -0.03269997611641884, -0.020938128232955933, -0.009176284074783325, 0.0025855600833892822, 0.014347405172884464, 0.026109250262379646, 0.0378710962831974, 0.04963294044137001, 0.06139478459954262, 0.07315663248300552, 0.08491847664117813, 0.09668032079935074, 0.10844216495752335, 0.12020400911569595, 0.13196586072444916, 0.14372770488262177, 0.15548954904079437, 0.16725139319896698, 0.1790132373571396, 0.1907750815153122, 0.2025369256734848, 0.2142987698316574, 0.22606061398983002, 0.23782245814800262, 0.24958430230617523, 0.26134616136550903, 0.27310800552368164, 0.28486984968185425, 0.29663169384002686, 0.30839353799819946, 0.32015538215637207, 0.3319172263145447, 0.3436790704727173, 0.3554409146308899, 0.3672027587890625, 0.3789646029472351]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 7.0, 10.0, 8.0, 18.0, 34.0, 51.0, 54.0, 101.0, 142.0, 222.0, 320.0, 477.0, 756.0, 1388.0, 2773.0, 6295.0, 17550.0, 67172.0, 740393.0, 3154858.0, 150400.0, 31327.0, 10306.0, 4357.0, 2172.0, 1117.0, 669.0, 423.0, 297.0, 171.0, 127.0, 76.0, 63.0, 42.0, 27.0, 20.0, 17.0, 8.0, 8.0, 6.0, 7.0, 7.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.14794921875, -0.14288711547851562, -0.13782501220703125, -0.13276290893554688, -0.1277008056640625, -0.12263870239257812, -0.11757659912109375, -0.11251449584960938, -0.107452392578125, -0.10239028930664062, -0.09732818603515625, -0.09226608276367188, -0.0872039794921875, -0.08214187622070312, -0.07707977294921875, -0.07201766967773438, -0.06695556640625, -0.061893463134765625, -0.05683135986328125, -0.051769256591796875, -0.0467071533203125, -0.041645050048828125, -0.03658294677734375, -0.031520843505859375, -0.026458740234375, -0.021396636962890625, -0.01633453369140625, -0.011272430419921875, -0.0062103271484375, -0.001148223876953125, 0.00391387939453125, 0.008975982666015625, 0.0140380859375, 0.019100189208984375, 0.02416229248046875, 0.029224395751953125, 0.0342864990234375, 0.039348602294921875, 0.04441070556640625, 0.049472808837890625, 0.054534912109375, 0.059597015380859375, 0.06465911865234375, 0.06972122192382812, 0.0747833251953125, 0.07984542846679688, 0.08490753173828125, 0.08996963500976562, 0.09503173828125, 0.10009384155273438, 0.10515594482421875, 0.11021804809570312, 0.1152801513671875, 0.12034225463867188, 0.12540435791015625, 0.13046646118164062, 0.135528564453125, 0.14059066772460938, 0.14565277099609375, 0.15071487426757812, 0.1557769775390625, 0.16083908081054688, 0.16590118408203125, 0.17096328735351562, 0.176025390625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 9.0, 5.0, 7.0, 14.0, 16.0, 10.0, 16.0, 30.0, 32.0, 44.0, 43.0, 45.0, 54.0, 45.0, 58.0, 55.0, 58.0, 51.0, 44.0, 57.0, 51.0, 36.0, 37.0, 29.0, 30.0, 22.0, 22.0, 12.0, 18.0, 12.0, 9.0, 10.0, 7.0, 3.0, 4.0, 5.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.046112060546875, -0.04465007781982422, -0.04318809509277344, -0.041726112365722656, -0.040264129638671875, -0.038802146911621094, -0.03734016418457031, -0.03587818145751953, -0.03441619873046875, -0.03295421600341797, -0.03149223327636719, -0.030030250549316406, -0.028568267822265625, -0.027106285095214844, -0.025644302368164062, -0.02418231964111328, -0.0227203369140625, -0.02125835418701172, -0.019796371459960938, -0.018334388732910156, -0.016872406005859375, -0.015410423278808594, -0.013948440551757812, -0.012486457824707031, -0.01102447509765625, -0.009562492370605469, -0.008100509643554688, -0.006638526916503906, -0.005176544189453125, -0.0037145614624023438, -0.0022525787353515625, -0.0007905960083007812, 0.00067138671875, 0.0021333694458007812, 0.0035953521728515625, 0.005057334899902344, 0.006519317626953125, 0.007981300354003906, 0.009443283081054688, 0.010905265808105469, 0.01236724853515625, 0.013829231262207031, 0.015291213989257812, 0.016753196716308594, 0.018215179443359375, 0.019677162170410156, 0.021139144897460938, 0.02260112762451172, 0.0240631103515625, 0.02552509307861328, 0.026987075805664062, 0.028449058532714844, 0.029911041259765625, 0.031373023986816406, 0.03283500671386719, 0.03429698944091797, 0.03575897216796875, 0.03722095489501953, 0.03868293762207031, 0.040144920349121094, 0.041606903076171875, 0.043068885803222656, 0.04453086853027344, 0.04599285125732422, 0.047454833984375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 6.0, 17.0, 17.0, 30.0, 60.0, 127.0, 207.0, 438.0, 1035.0, 3183.0, 13497.0, 97532.0, 2294823.0, 1685202.0, 81399.0, 11888.0, 2972.0, 942.0, 459.0, 181.0, 107.0, 63.0, 39.0, 20.0, 13.0, 9.0, 6.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.203125, -0.19611167907714844, -0.18909835815429688, -0.1820850372314453, -0.17507171630859375, -0.1680583953857422, -0.16104507446289062, -0.15403175354003906, -0.1470184326171875, -0.14000511169433594, -0.13299179077148438, -0.1259784698486328, -0.11896514892578125, -0.11195182800292969, -0.10493850708007812, -0.09792518615722656, -0.090911865234375, -0.08389854431152344, -0.07688522338867188, -0.06987190246582031, -0.06285858154296875, -0.05584526062011719, -0.048831939697265625, -0.04181861877441406, -0.0348052978515625, -0.027791976928710938, -0.020778656005859375, -0.013765335083007812, -0.00675201416015625, 0.0002613067626953125, 0.007274627685546875, 0.014287948608398438, 0.02130126953125, 0.028314590454101562, 0.035327911376953125, 0.04234123229980469, 0.04935455322265625, 0.05636787414550781, 0.06338119506835938, 0.07039451599121094, 0.0774078369140625, 0.08442115783691406, 0.09143447875976562, 0.09844779968261719, 0.10546112060546875, 0.11247444152832031, 0.11948776245117188, 0.12650108337402344, 0.133514404296875, 0.14052772521972656, 0.14754104614257812, 0.1545543670654297, 0.16156768798828125, 0.1685810089111328, 0.17559432983398438, 0.18260765075683594, 0.1896209716796875, 0.19663429260253906, 0.20364761352539062, 0.2106609344482422, 0.21767425537109375, 0.2246875762939453, 0.23170089721679688, 0.23871421813964844, 0.2457275390625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 7.0, 4.0, 13.0, 8.0, 13.0, 16.0, 41.0, 39.0, 66.0, 103.0, 151.0, 274.0, 512.0, 1005.0, 771.0, 407.0, 219.0, 128.0, 78.0, 73.0, 49.0, 35.0, 18.0, 13.0, 8.0, 6.0, 6.0, 2.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.110107421875, -0.1069498062133789, -0.10379219055175781, -0.10063457489013672, -0.09747695922851562, -0.09431934356689453, -0.09116172790527344, -0.08800411224365234, -0.08484649658203125, -0.08168888092041016, -0.07853126525878906, -0.07537364959716797, -0.07221603393554688, -0.06905841827392578, -0.06590080261230469, -0.0627431869506836, -0.0595855712890625, -0.056427955627441406, -0.05327033996582031, -0.05011272430419922, -0.046955108642578125, -0.04379749298095703, -0.04063987731933594, -0.037482261657714844, -0.03432464599609375, -0.031167030334472656, -0.028009414672851562, -0.02485179901123047, -0.021694183349609375, -0.01853656768798828, -0.015378952026367188, -0.012221336364746094, -0.009063720703125, -0.005906105041503906, -0.0027484893798828125, 0.00040912628173828125, 0.003566741943359375, 0.006724357604980469, 0.009881973266601562, 0.013039588928222656, 0.01619720458984375, 0.019354820251464844, 0.022512435913085938, 0.02567005157470703, 0.028827667236328125, 0.03198528289794922, 0.03514289855957031, 0.038300514221191406, 0.0414581298828125, 0.044615745544433594, 0.04777336120605469, 0.05093097686767578, 0.054088592529296875, 0.05724620819091797, 0.06040382385253906, 0.06356143951416016, 0.06671905517578125, 0.06987667083740234, 0.07303428649902344, 0.07619190216064453, 0.07934951782226562, 0.08250713348388672, 0.08566474914550781, 0.0888223648071289, 0.09197998046875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 44.0, 249.0, 489.0, 188.0, 33.0, 8.0, 2.0], "bins": [-2.690913438796997, -2.6455609798431396, -2.6002087593078613, -2.554856300354004, -2.5095038414001465, -2.464151620864868, -2.4187991619110107, -2.3734469413757324, -2.328094482421875, -2.2827420234680176, -2.2373898029327393, -2.192037343978882, -2.1466851234436035, -2.101332664489746, -2.0559802055358887, -2.0106279850006104, -1.965275526046753, -1.919923186302185, -1.8745708465576172, -1.8292183876037598, -1.783866047859192, -1.738513708114624, -1.6931612491607666, -1.6478089094161987, -1.6024565696716309, -1.557104229927063, -1.5117518901824951, -1.4663994312286377, -1.4210470914840698, -1.375694751739502, -1.3303422927856445, -1.2849899530410767, -1.2396376132965088, -1.194285273551941, -1.148932933807373, -1.1035804748535156, -1.0582281351089478, -1.0128757953643799, -0.9675233960151672, -0.9221709966659546, -0.8768185973167419, -0.8314661979675293, -0.7861138582229614, -0.7407615184783936, -0.6954091191291809, -0.6500567197799683, -0.6047043800354004, -0.5593520402908325, -0.5139996409416199, -0.4686472713947296, -0.42329490184783936, -0.3779425323009491, -0.33259016275405884, -0.2872377932071686, -0.24188542366027832, -0.19653305411338806, -0.151180699467659, -0.10582832992076874, -0.06047596037387848, -0.01512359082698822, 0.03022877871990204, 0.0755811482667923, 0.12093351781368256, 0.16628588736057281, 0.21163825690746307]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 1.0, 13.0, 9.0, 13.0, 15.0, 13.0, 18.0, 23.0, 28.0, 28.0, 31.0, 42.0, 37.0, 43.0, 37.0, 44.0, 40.0, 55.0, 32.0, 53.0, 41.0, 55.0, 40.0, 47.0, 31.0, 30.0, 32.0, 29.0, 24.0, 17.0, 12.0, 9.0, 11.0, 12.0, 8.0, 4.0, 8.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.2684650421142578, -0.2606029808521271, -0.2527409493923187, -0.24487890303134918, -0.23701685667037964, -0.2291547954082489, -0.22129274904727936, -0.21343070268630981, -0.20556865632534027, -0.19770660996437073, -0.18984456360340118, -0.18198251724243164, -0.1741204559803009, -0.16625842452049255, -0.15839636325836182, -0.15053431689739227, -0.14267227053642273, -0.13481022417545319, -0.12694817781448364, -0.1190861240029335, -0.11122407764196396, -0.10336203128099442, -0.09549997746944427, -0.08763793110847473, -0.07977588474750519, -0.07191383838653564, -0.0640517920255661, -0.05618973821401596, -0.04832769185304642, -0.040465645492076874, -0.03260359540581703, -0.02474154531955719, -0.016879498958587646, -0.009017450734972954, -0.001155402511358261, 0.006706645712256432, 0.014568693935871124, 0.022430740296840668, 0.03029279038310051, 0.03815484046936035, 0.046016886830329895, 0.05387893319129944, 0.06174098327755928, 0.06960303336381912, 0.07746507972478867, 0.08532712608575821, 0.09318917989730835, 0.1010512262582779, 0.10891327261924744, 0.11677531898021698, 0.12463736534118652, 0.13249941170215607, 0.1403614580631256, 0.14822351932525635, 0.1560855656862259, 0.16394761204719543, 0.17180965840816498, 0.17967170476913452, 0.18753375113010406, 0.1953957974910736, 0.20325785875320435, 0.2111198902130127, 0.21898195147514343, 0.22684399783611298, 0.23470604419708252]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 7.0, 16.0, 26.0, 40.0, 57.0, 97.0, 137.0, 250.0, 508.0, 995.0, 2089.0, 4444.0, 10035.0, 24745.0, 65562.0, 184709.0, 370059.0, 240386.0, 88408.0, 32220.0, 12820.0, 5718.0, 2542.0, 1263.0, 638.0, 308.0, 191.0, 94.0, 58.0, 42.0, 29.0, 20.0, 8.0, 8.0, 6.0, 6.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.12396240234375, -0.1204843521118164, -0.11700630187988281, -0.11352825164794922, -0.11005020141601562, -0.10657215118408203, -0.10309410095214844, -0.09961605072021484, -0.09613800048828125, -0.09265995025634766, -0.08918190002441406, -0.08570384979248047, -0.08222579956054688, -0.07874774932861328, -0.07526969909667969, -0.0717916488647461, -0.0683135986328125, -0.0648355484008789, -0.06135749816894531, -0.05787944793701172, -0.054401397705078125, -0.05092334747314453, -0.04744529724121094, -0.043967247009277344, -0.04048919677734375, -0.037011146545410156, -0.03353309631347656, -0.03005504608154297, -0.026576995849609375, -0.02309894561767578, -0.019620895385742188, -0.016142845153808594, -0.012664794921875, -0.009186744689941406, -0.0057086944580078125, -0.0022306442260742188, 0.001247406005859375, 0.004725456237792969, 0.008203506469726562, 0.011681556701660156, 0.01515960693359375, 0.018637657165527344, 0.022115707397460938, 0.02559375762939453, 0.029071807861328125, 0.03254985809326172, 0.03602790832519531, 0.039505958557128906, 0.0429840087890625, 0.046462059020996094, 0.04994010925292969, 0.05341815948486328, 0.056896209716796875, 0.06037425994873047, 0.06385231018066406, 0.06733036041259766, 0.07080841064453125, 0.07428646087646484, 0.07776451110839844, 0.08124256134033203, 0.08472061157226562, 0.08819866180419922, 0.09167671203613281, 0.0951547622680664, 0.0986328125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 7.0, 4.0, 5.0, 11.0, 9.0, 10.0, 18.0, 18.0, 24.0, 40.0, 36.0, 38.0, 48.0, 57.0, 49.0, 51.0, 58.0, 44.0, 55.0, 54.0, 41.0, 48.0, 48.0, 31.0, 32.0, 25.0, 35.0, 18.0, 22.0, 23.0, 15.0, 7.0, 6.0, 9.0, 3.0, 2.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03387451171875, -0.03250455856323242, -0.031134605407714844, -0.029764652252197266, -0.028394699096679688, -0.02702474594116211, -0.02565479278564453, -0.024284839630126953, -0.022914886474609375, -0.021544933319091797, -0.02017498016357422, -0.01880502700805664, -0.017435073852539062, -0.016065120697021484, -0.014695167541503906, -0.013325214385986328, -0.01195526123046875, -0.010585308074951172, -0.009215354919433594, -0.007845401763916016, -0.0064754486083984375, -0.005105495452880859, -0.0037355422973632812, -0.002365589141845703, -0.000995635986328125, 0.0003743171691894531, 0.0017442703247070312, 0.0031142234802246094, 0.0044841766357421875, 0.005854129791259766, 0.007224082946777344, 0.008594036102294922, 0.0099639892578125, 0.011333942413330078, 0.012703895568847656, 0.014073848724365234, 0.015443801879882812, 0.01681375503540039, 0.01818370819091797, 0.019553661346435547, 0.020923614501953125, 0.022293567657470703, 0.02366352081298828, 0.02503347396850586, 0.026403427124023438, 0.027773380279541016, 0.029143333435058594, 0.030513286590576172, 0.03188323974609375, 0.03325319290161133, 0.034623146057128906, 0.035993099212646484, 0.03736305236816406, 0.03873300552368164, 0.04010295867919922, 0.0414729118347168, 0.042842864990234375, 0.04421281814575195, 0.04558277130126953, 0.04695272445678711, 0.04832267761230469, 0.049692630767822266, 0.051062583923339844, 0.05243253707885742, 0.053802490234375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 6.0, 5.0, 7.0, 11.0, 8.0, 19.0, 29.0, 17.0, 19.0, 29.0, 44.0, 39.0, 67.0, 99.0, 153.0, 269.0, 616.0, 1646.0, 5045.0, 17805.0, 74930.0, 353575.0, 453948.0, 106032.0, 23863.0, 6525.0, 2080.0, 741.0, 292.0, 170.0, 102.0, 79.0, 58.0, 51.0, 31.0, 33.0, 19.0, 28.0, 18.0, 6.0, 14.0, 4.0, 11.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16357421875, -0.15795516967773438, -0.15233612060546875, -0.14671707153320312, -0.1410980224609375, -0.13547897338867188, -0.12985992431640625, -0.12424087524414062, -0.118621826171875, -0.11300277709960938, -0.10738372802734375, -0.10176467895507812, -0.0961456298828125, -0.09052658081054688, -0.08490753173828125, -0.07928848266601562, -0.07366943359375, -0.06805038452148438, -0.06243133544921875, -0.056812286376953125, -0.0511932373046875, -0.045574188232421875, -0.03995513916015625, -0.034336090087890625, -0.028717041015625, -0.023097991943359375, -0.01747894287109375, -0.011859893798828125, -0.0062408447265625, -0.000621795654296875, 0.00499725341796875, 0.010616302490234375, 0.0162353515625, 0.021854400634765625, 0.02747344970703125, 0.033092498779296875, 0.0387115478515625, 0.044330596923828125, 0.04994964599609375, 0.055568695068359375, 0.061187744140625, 0.06680679321289062, 0.07242584228515625, 0.07804489135742188, 0.0836639404296875, 0.08928298950195312, 0.09490203857421875, 0.10052108764648438, 0.10614013671875, 0.11175918579101562, 0.11737823486328125, 0.12299728393554688, 0.1286163330078125, 0.13423538208007812, 0.13985443115234375, 0.14547348022460938, 0.151092529296875, 0.15671157836914062, 0.16233062744140625, 0.16794967651367188, 0.1735687255859375, 0.17918777465820312, 0.18480682373046875, 0.19042587280273438, 0.196044921875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 6.0, 4.0, 7.0, 4.0, 9.0, 8.0, 9.0, 10.0, 13.0, 17.0, 19.0, 26.0, 20.0, 29.0, 27.0, 38.0, 28.0, 44.0, 28.0, 40.0, 37.0, 49.0, 41.0, 34.0, 35.0, 36.0, 33.0, 28.0, 24.0, 33.0, 27.0, 27.0, 30.0, 27.0, 22.0, 30.0, 19.0, 11.0, 14.0, 12.0, 11.0, 6.0, 8.0, 7.0, 1.0, 5.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08367919921875, -0.08101081848144531, -0.07834243774414062, -0.07567405700683594, -0.07300567626953125, -0.07033729553222656, -0.06766891479492188, -0.06500053405761719, -0.0623321533203125, -0.05966377258300781, -0.056995391845703125, -0.05432701110839844, -0.05165863037109375, -0.04899024963378906, -0.046321868896484375, -0.04365348815917969, -0.040985107421875, -0.03831672668457031, -0.035648345947265625, -0.03297996520996094, -0.03031158447265625, -0.027643203735351562, -0.024974822998046875, -0.022306442260742188, -0.0196380615234375, -0.016969680786132812, -0.014301300048828125, -0.011632919311523438, -0.00896453857421875, -0.0062961578369140625, -0.003627777099609375, -0.0009593963623046875, 0.001708984375, 0.0043773651123046875, 0.007045745849609375, 0.009714126586914062, 0.01238250732421875, 0.015050888061523438, 0.017719268798828125, 0.020387649536132812, 0.0230560302734375, 0.025724411010742188, 0.028392791748046875, 0.031061172485351562, 0.03372955322265625, 0.03639793395996094, 0.039066314697265625, 0.04173469543457031, 0.044403076171875, 0.04707145690917969, 0.049739837646484375, 0.05240821838378906, 0.05507659912109375, 0.05774497985839844, 0.060413360595703125, 0.06308174133300781, 0.0657501220703125, 0.06841850280761719, 0.07108688354492188, 0.07375526428222656, 0.07642364501953125, 0.07909202575683594, 0.08176040649414062, 0.08442878723144531, 0.08709716796875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 6.0, 4.0, 14.0, 29.0, 26.0, 47.0, 52.0, 81.0, 136.0, 204.0, 374.0, 665.0, 1217.0, 2285.0, 4492.0, 11164.0, 76323.0, 876950.0, 55552.0, 9843.0, 4252.0, 2086.0, 1156.0, 615.0, 375.0, 220.0, 108.0, 95.0, 50.0, 33.0, 21.0, 17.0, 17.0, 6.0, 11.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.3662109375, -0.35616302490234375, -0.3461151123046875, -0.33606719970703125, -0.326019287109375, -0.31597137451171875, -0.3059234619140625, -0.29587554931640625, -0.28582763671875, -0.27577972412109375, -0.2657318115234375, -0.25568389892578125, -0.245635986328125, -0.23558807373046875, -0.2255401611328125, -0.21549224853515625, -0.2054443359375, -0.19539642333984375, -0.1853485107421875, -0.17530059814453125, -0.165252685546875, -0.15520477294921875, -0.1451568603515625, -0.13510894775390625, -0.12506103515625, -0.11501312255859375, -0.1049652099609375, -0.09491729736328125, -0.084869384765625, -0.07482147216796875, -0.0647735595703125, -0.05472564697265625, -0.044677734375, -0.03462982177734375, -0.0245819091796875, -0.01453399658203125, -0.004486083984375, 0.00556182861328125, 0.0156097412109375, 0.02565765380859375, 0.03570556640625, 0.04575347900390625, 0.0558013916015625, 0.06584930419921875, 0.075897216796875, 0.08594512939453125, 0.0959930419921875, 0.10604095458984375, 0.1160888671875, 0.12613677978515625, 0.1361846923828125, 0.14623260498046875, 0.156280517578125, 0.16632843017578125, 0.1763763427734375, 0.18642425537109375, 0.19647216796875, 0.20652008056640625, 0.2165679931640625, 0.22661590576171875, 0.236663818359375, 0.24671173095703125, 0.2567596435546875, 0.26680755615234375, 0.27685546875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 3.0, 3.0, 3.0, 11.0, 21.0, 43.0, 76.0, 174.0, 302.0, 195.0, 79.0, 42.0, 17.0, 16.0, 6.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.314018249511719e-05, -3.193877637386322e-05, -3.073737025260925e-05, -2.9535964131355286e-05, -2.833455801010132e-05, -2.713315188884735e-05, -2.5931745767593384e-05, -2.4730339646339417e-05, -2.352893352508545e-05, -2.2327527403831482e-05, -2.1126121282577515e-05, -1.9924715161323547e-05, -1.872330904006958e-05, -1.7521902918815613e-05, -1.6320496797561646e-05, -1.5119090676307678e-05, -1.3917684555053711e-05, -1.2716278433799744e-05, -1.1514872312545776e-05, -1.0313466191291809e-05, -9.112060070037842e-06, -7.910653948783875e-06, -6.709247827529907e-06, -5.50784170627594e-06, -4.306435585021973e-06, -3.1050294637680054e-06, -1.903623342514038e-06, -7.022172212600708e-07, 4.991888999938965e-07, 1.7005950212478638e-06, 2.902001142501831e-06, 4.103407263755798e-06, 5.304813385009766e-06, 6.506219506263733e-06, 7.7076256275177e-06, 8.909031748771667e-06, 1.0110437870025635e-05, 1.1311843991279602e-05, 1.251325011253357e-05, 1.3714656233787537e-05, 1.4916062355041504e-05, 1.611746847629547e-05, 1.731887459754944e-05, 1.8520280718803406e-05, 1.9721686840057373e-05, 2.092309296131134e-05, 2.2124499082565308e-05, 2.3325905203819275e-05, 2.4527311325073242e-05, 2.572871744632721e-05, 2.6930123567581177e-05, 2.8131529688835144e-05, 2.933293581008911e-05, 3.053434193134308e-05, 3.1735748052597046e-05, 3.293715417385101e-05, 3.413856029510498e-05, 3.533996641635895e-05, 3.6541372537612915e-05, 3.774277865886688e-05, 3.894418478012085e-05, 4.014559090137482e-05, 4.1346997022628784e-05, 4.254840314388275e-05, 4.374980926513672e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 3.0, 9.0, 8.0, 14.0, 35.0, 54.0, 167.0, 511.0, 1701.0, 8776.0, 392724.0, 630643.0, 11012.0, 1963.0, 573.0, 184.0, 69.0, 31.0, 18.0, 13.0, 8.0, 5.0, 7.0, 2.0, 1.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.348388671875, -0.33815765380859375, -0.3279266357421875, -0.31769561767578125, -0.307464599609375, -0.29723358154296875, -0.2870025634765625, -0.27677154541015625, -0.26654052734375, -0.25630950927734375, -0.2460784912109375, -0.23584747314453125, -0.225616455078125, -0.21538543701171875, -0.2051544189453125, -0.19492340087890625, -0.1846923828125, -0.17446136474609375, -0.1642303466796875, -0.15399932861328125, -0.143768310546875, -0.13353729248046875, -0.1233062744140625, -0.11307525634765625, -0.10284423828125, -0.09261322021484375, -0.0823822021484375, -0.07215118408203125, -0.061920166015625, -0.05168914794921875, -0.0414581298828125, -0.03122711181640625, -0.02099609375, -0.01076507568359375, -0.0005340576171875, 0.00969696044921875, 0.019927978515625, 0.03015899658203125, 0.0403900146484375, 0.05062103271484375, 0.06085205078125, 0.07108306884765625, 0.0813140869140625, 0.09154510498046875, 0.101776123046875, 0.11200714111328125, 0.1222381591796875, 0.13246917724609375, 0.1427001953125, 0.15293121337890625, 0.1631622314453125, 0.17339324951171875, 0.183624267578125, 0.19385528564453125, 0.2040863037109375, 0.21431732177734375, 0.22454833984375, 0.23477935791015625, 0.2450103759765625, 0.25524139404296875, 0.265472412109375, 0.27570343017578125, 0.2859344482421875, 0.29616546630859375, 0.306396484375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 8.0, 9.0, 18.0, 33.0, 58.0, 117.0, 216.0, 216.0, 152.0, 67.0, 38.0, 17.0, 12.0, 10.0, 4.0, 5.0, 1.0, 0.0, 2.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1014404296875, -0.0980682373046875, -0.094696044921875, -0.0913238525390625, -0.08795166015625, -0.0845794677734375, -0.081207275390625, -0.0778350830078125, -0.074462890625, -0.0710906982421875, -0.067718505859375, -0.0643463134765625, -0.06097412109375, -0.0576019287109375, -0.054229736328125, -0.0508575439453125, -0.0474853515625, -0.0441131591796875, -0.040740966796875, -0.0373687744140625, -0.03399658203125, -0.0306243896484375, -0.027252197265625, -0.0238800048828125, -0.0205078125, -0.0171356201171875, -0.013763427734375, -0.0103912353515625, -0.00701904296875, -0.0036468505859375, -0.000274658203125, 0.0030975341796875, 0.0064697265625, 0.0098419189453125, 0.013214111328125, 0.0165863037109375, 0.01995849609375, 0.0233306884765625, 0.026702880859375, 0.0300750732421875, 0.033447265625, 0.0368194580078125, 0.040191650390625, 0.0435638427734375, 0.04693603515625, 0.0503082275390625, 0.053680419921875, 0.0570526123046875, 0.0604248046875, 0.0637969970703125, 0.067169189453125, 0.0705413818359375, 0.07391357421875, 0.0772857666015625, 0.080657958984375, 0.0840301513671875, 0.08740234375, 0.0907745361328125, 0.094146728515625, 0.0975189208984375, 0.10089111328125, 0.1042633056640625, 0.107635498046875, 0.1110076904296875, 0.1143798828125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 22.0, 360.0, 580.0, 47.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.158783435821533, -5.066802501678467, -4.974821090698242, -4.882840156555176, -4.790859222412109, -4.698877811431885, -4.606896877288818, -4.514915943145752, -4.422934532165527, -4.330953598022461, -4.238972187042236, -4.14699125289917, -4.0550103187561035, -3.963029146194458, -3.8710479736328125, -3.779067039489746, -3.6870861053466797, -3.595104932785034, -3.5031239986419678, -3.4111428260803223, -3.3191616535186768, -3.2271807193756104, -3.135199546813965, -3.0432186126708984, -2.951237201690674, -2.8592560291290283, -2.767275094985962, -2.6752939224243164, -2.583312749862671, -2.4913318157196045, -2.399350643157959, -2.3073697090148926, -2.215388298034668, -2.1234071254730225, -2.031426191329956, -1.9394450187683105, -1.8474639654159546, -1.7554829120635986, -1.6635017395019531, -1.5715206861495972, -1.4795396327972412, -1.3875585794448853, -1.2955774068832397, -1.2035963535308838, -1.1116153001785278, -1.0196342468261719, -0.9276530742645264, -0.8356720209121704, -0.7436909675598145, -0.6517098546028137, -0.5597288012504578, -0.46774768829345703, -0.3757666051387787, -0.28378552198410034, -0.1918044090270996, -0.09982335567474365, -0.00784224271774292, 0.08413884788751602, 0.17611993849277496, 0.2681010365486145, 0.36008211970329285, 0.4520632028579712, 0.5440443158149719, 0.6360253691673279, 0.7280064821243286]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 9.0, 16.0, 18.0, 18.0, 31.0, 35.0, 58.0, 41.0, 44.0, 52.0, 64.0, 66.0, 76.0, 66.0, 74.0, 65.0, 62.0, 34.0, 41.0, 31.0, 13.0, 18.0, 17.0, 18.0, 8.0, 12.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4894716143608093, -0.4751549959182739, -0.4608383774757385, -0.4465217590332031, -0.4322051405906677, -0.4178885221481323, -0.4035719037055969, -0.3892552852630615, -0.3749386668205261, -0.3606220483779907, -0.3463054299354553, -0.3319888114929199, -0.3176721930503845, -0.3033555746078491, -0.2890389561653137, -0.2747223377227783, -0.2604057192802429, -0.24608910083770752, -0.23177248239517212, -0.21745586395263672, -0.20313924551010132, -0.18882262706756592, -0.17450600862503052, -0.16018939018249512, -0.1458728015422821, -0.1315561830997467, -0.1172395646572113, -0.1029229462146759, -0.0886063277721405, -0.0742897167801857, -0.0599730983376503, -0.0456564798951149, -0.0313398540019989, -0.0170232355594635, -0.00270661897957325, 0.011609997600317001, 0.0259266160428524, 0.040243230760097504, 0.054559849202632904, 0.0688764676451683, 0.0831930860877037, 0.0975097045302391, 0.1118263229727745, 0.1261429339647293, 0.1404595524072647, 0.1547761708498001, 0.1690927892923355, 0.1834094077348709, 0.1977260261774063, 0.2120426446199417, 0.2263592630624771, 0.2406758815050125, 0.2549924850463867, 0.2693091034889221, 0.2836257219314575, 0.2979423403739929, 0.3122589588165283, 0.3265755772590637, 0.3408921957015991, 0.3552088141441345, 0.3695254325866699, 0.3838420510292053, 0.3981586694717407, 0.4124752879142761, 0.4267919063568115]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 8.0, 8.0, 16.0, 12.0, 28.0, 41.0, 36.0, 77.0, 101.0, 161.0, 260.0, 398.0, 644.0, 1323.0, 2730.0, 6947.0, 21934.0, 94963.0, 864242.0, 2782390.0, 341681.0, 52253.0, 13947.0, 5023.0, 2236.0, 1062.0, 644.0, 370.0, 227.0, 165.0, 104.0, 76.0, 53.0, 28.0, 26.0, 22.0, 14.0, 7.0, 7.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.10321044921875, -0.09943294525146484, -0.09565544128417969, -0.09187793731689453, -0.08810043334960938, -0.08432292938232422, -0.08054542541503906, -0.0767679214477539, -0.07299041748046875, -0.0692129135131836, -0.06543540954589844, -0.06165790557861328, -0.057880401611328125, -0.05410289764404297, -0.05032539367675781, -0.046547889709472656, -0.0427703857421875, -0.038992881774902344, -0.03521537780761719, -0.03143787384033203, -0.027660369873046875, -0.02388286590576172, -0.020105361938476562, -0.016327857971191406, -0.01255035400390625, -0.008772850036621094, -0.0049953460693359375, -0.0012178421020507812, 0.002559661865234375, 0.006337165832519531, 0.010114669799804688, 0.013892173767089844, 0.017669677734375, 0.021447181701660156, 0.025224685668945312, 0.02900218963623047, 0.032779693603515625, 0.03655719757080078, 0.04033470153808594, 0.044112205505371094, 0.04788970947265625, 0.051667213439941406, 0.05544471740722656, 0.05922222137451172, 0.06299972534179688, 0.06677722930908203, 0.07055473327636719, 0.07433223724365234, 0.0781097412109375, 0.08188724517822266, 0.08566474914550781, 0.08944225311279297, 0.09321975708007812, 0.09699726104736328, 0.10077476501464844, 0.1045522689819336, 0.10832977294921875, 0.1121072769165039, 0.11588478088378906, 0.11966228485107422, 0.12343978881835938, 0.12721729278564453, 0.1309947967529297, 0.13477230072021484, 0.1385498046875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 9.0, 12.0, 11.0, 9.0, 27.0, 33.0, 30.0, 39.0, 64.0, 40.0, 60.0, 76.0, 57.0, 81.0, 67.0, 62.0, 59.0, 67.0, 39.0, 42.0, 29.0, 24.0, 23.0, 16.0, 12.0, 5.0, 2.0, 6.0, 2.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055084228515625, -0.05321645736694336, -0.05134868621826172, -0.04948091506958008, -0.04761314392089844, -0.0457453727722168, -0.043877601623535156, -0.042009830474853516, -0.040142059326171875, -0.038274288177490234, -0.036406517028808594, -0.03453874588012695, -0.03267097473144531, -0.030803203582763672, -0.02893543243408203, -0.02706766128540039, -0.02519989013671875, -0.02333211898803711, -0.02146434783935547, -0.019596576690673828, -0.017728805541992188, -0.015861034393310547, -0.013993263244628906, -0.012125492095947266, -0.010257720947265625, -0.008389949798583984, -0.006522178649902344, -0.004654407501220703, -0.0027866363525390625, -0.0009188652038574219, 0.0009489059448242188, 0.0028166770935058594, 0.0046844482421875, 0.006552219390869141, 0.008419990539550781, 0.010287761688232422, 0.012155532836914062, 0.014023303985595703, 0.015891075134277344, 0.017758846282958984, 0.019626617431640625, 0.021494388580322266, 0.023362159729003906, 0.025229930877685547, 0.027097702026367188, 0.028965473175048828, 0.03083324432373047, 0.03270101547241211, 0.03456878662109375, 0.03643655776977539, 0.03830432891845703, 0.04017210006713867, 0.04203987121582031, 0.04390764236450195, 0.045775413513183594, 0.047643184661865234, 0.049510955810546875, 0.051378726959228516, 0.053246498107910156, 0.0551142692565918, 0.05698204040527344, 0.05884981155395508, 0.06071758270263672, 0.06258535385131836, 0.064453125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 11.0, 8.0, 35.0, 74.0, 219.0, 498.0, 1347.0, 8566.0, 3118570.0, 1058056.0, 5104.0, 1111.0, 389.0, 167.0, 75.0, 35.0, 11.0, 2.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.57373046875, -0.5562973022460938, -0.5388641357421875, -0.5214309692382812, -0.503997802734375, -0.48656463623046875, -0.4691314697265625, -0.45169830322265625, -0.43426513671875, -0.41683197021484375, -0.3993988037109375, -0.38196563720703125, -0.364532470703125, -0.34709930419921875, -0.3296661376953125, -0.31223297119140625, -0.2947998046875, -0.27736663818359375, -0.2599334716796875, -0.24250030517578125, -0.225067138671875, -0.20763397216796875, -0.1902008056640625, -0.17276763916015625, -0.15533447265625, -0.13790130615234375, -0.1204681396484375, -0.10303497314453125, -0.085601806640625, -0.06816864013671875, -0.0507354736328125, -0.03330230712890625, -0.015869140625, 0.00156402587890625, 0.0189971923828125, 0.03643035888671875, 0.053863525390625, 0.07129669189453125, 0.0887298583984375, 0.10616302490234375, 0.12359619140625, 0.14102935791015625, 0.1584625244140625, 0.17589569091796875, 0.193328857421875, 0.21076202392578125, 0.2281951904296875, 0.24562835693359375, 0.2630615234375, 0.28049468994140625, 0.2979278564453125, 0.31536102294921875, 0.332794189453125, 0.35022735595703125, 0.3676605224609375, 0.38509368896484375, 0.40252685546875, 0.41996002197265625, 0.4373931884765625, 0.45482635498046875, 0.472259521484375, 0.48969268798828125, 0.5071258544921875, 0.5245590209960938, 0.5419921875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 22.0, 43.0, 98.0, 226.0, 578.0, 1234.0, 1100.0, 458.0, 196.0, 79.0, 19.0, 11.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.269287109375, -0.26134300231933594, -0.2533988952636719, -0.2454547882080078, -0.23751068115234375, -0.2295665740966797, -0.22162246704101562, -0.21367835998535156, -0.2057342529296875, -0.19779014587402344, -0.18984603881835938, -0.1819019317626953, -0.17395782470703125, -0.1660137176513672, -0.15806961059570312, -0.15012550354003906, -0.142181396484375, -0.13423728942871094, -0.12629318237304688, -0.11834907531738281, -0.11040496826171875, -0.10246086120605469, -0.09451675415039062, -0.08657264709472656, -0.0786285400390625, -0.07068443298339844, -0.06274032592773438, -0.05479621887207031, -0.04685211181640625, -0.03890800476074219, -0.030963897705078125, -0.023019790649414062, -0.01507568359375, -0.0071315765380859375, 0.000812530517578125, 0.008756637573242188, 0.01670074462890625, 0.024644851684570312, 0.032588958740234375, 0.04053306579589844, 0.0484771728515625, 0.05642127990722656, 0.06436538696289062, 0.07230949401855469, 0.08025360107421875, 0.08819770812988281, 0.09614181518554688, 0.10408592224121094, 0.112030029296875, 0.11997413635253906, 0.12791824340820312, 0.1358623504638672, 0.14380645751953125, 0.1517505645751953, 0.15969467163085938, 0.16763877868652344, 0.1755828857421875, 0.18352699279785156, 0.19147109985351562, 0.1994152069091797, 0.20735931396484375, 0.2153034210205078, 0.22324752807617188, 0.23119163513183594, 0.2391357421875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 22.0, 73.0, 231.0, 367.0, 192.0, 82.0, 25.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.7819647789001465, -2.7267701625823975, -2.6715757846832275, -2.6163811683654785, -2.5611867904663086, -2.5059921741485596, -2.4507975578308105, -2.3956031799316406, -2.3404085636138916, -2.2852139472961426, -2.2300195693969727, -2.1748249530792236, -2.1196305751800537, -2.0644359588623047, -2.0092415809631348, -1.9540469646453857, -1.8988524675369263, -1.8436579704284668, -1.7884634733200073, -1.7332689762115479, -1.6780743598937988, -1.6228798627853394, -1.5676853656768799, -1.5124908685684204, -1.457296371459961, -1.4021018743515015, -1.346907377243042, -1.291712760925293, -1.2365182638168335, -1.181323766708374, -1.1261292695999146, -1.070934772491455, -1.015740156173706, -0.9605456590652466, -0.9053511023521423, -0.8501566052436829, -0.7949620485305786, -0.7397675514221191, -0.6845730543136597, -0.6293785572052002, -0.5741840600967407, -0.5189895629882812, -0.463795006275177, -0.40860050916671753, -0.35340598225593567, -0.2982114553451538, -0.24301695823669434, -0.18782243132591248, -0.13262790441513062, -0.07743338495492935, -0.02223886549472809, 0.03295564651489258, 0.08815017342567444, 0.1433447003364563, 0.19853919744491577, 0.25373372435569763, 0.3089282512664795, 0.36412277817726135, 0.4193173050880432, 0.4745118021965027, 0.5297063589096069, 0.5849008560180664, 0.6400953531265259, 0.6952898502349854, 0.7504844069480896]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 7.0, 4.0, 6.0, 12.0, 21.0, 17.0, 24.0, 37.0, 34.0, 37.0, 61.0, 61.0, 62.0, 70.0, 80.0, 60.0, 68.0, 52.0, 59.0, 54.0, 40.0, 28.0, 29.0, 24.0, 14.0, 14.0, 15.0, 8.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5269758105278015, -0.5072430968284607, -0.4875103831291199, -0.46777766942977905, -0.44804495573043823, -0.4283122420310974, -0.4085795283317566, -0.38884681463241577, -0.36911410093307495, -0.34938138723373413, -0.3296486735343933, -0.3099159598350525, -0.29018324613571167, -0.27045053243637085, -0.25071781873703003, -0.2309851050376892, -0.2112523913383484, -0.19151967763900757, -0.17178696393966675, -0.15205425024032593, -0.1323215365409851, -0.11258882284164429, -0.09285610914230347, -0.07312339544296265, -0.053390681743621826, -0.033657968044281006, -0.013925254344940186, 0.005807459354400635, 0.025540173053741455, 0.045272886753082275, 0.0650056004524231, 0.08473831415176392, 0.10447108745574951, 0.12420380115509033, 0.14393651485443115, 0.16366922855377197, 0.1834019422531128, 0.2031346559524536, 0.22286736965179443, 0.24260008335113525, 0.2623327970504761, 0.2820655107498169, 0.3017982244491577, 0.32153093814849854, 0.34126365184783936, 0.3609963655471802, 0.380729079246521, 0.4004617929458618, 0.42019450664520264, 0.43992722034454346, 0.4596599340438843, 0.4793926477432251, 0.4991253614425659, 0.5188580751419067, 0.5385907888412476, 0.5583235025405884, 0.5780562162399292, 0.59778892993927, 0.6175216436386108, 0.6372543573379517, 0.6569870710372925, 0.6767197847366333, 0.6964524984359741, 0.7161852121353149, 0.7359179258346558]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 3.0, 2.0, 9.0, 7.0, 14.0, 14.0, 21.0, 33.0, 30.0, 59.0, 81.0, 110.0, 197.0, 331.0, 621.0, 1143.0, 2213.0, 4631.0, 10561.0, 24732.0, 58843.0, 137470.0, 264935.0, 277728.0, 150797.0, 64686.0, 27147.0, 11689.0, 5265.0, 2417.0, 1160.0, 668.0, 359.0, 199.0, 121.0, 78.0, 48.0, 44.0, 27.0, 17.0, 18.0, 6.0, 9.0, 4.0, 3.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.106689453125, -0.10301780700683594, -0.09934616088867188, -0.09567451477050781, -0.09200286865234375, -0.08833122253417969, -0.08465957641601562, -0.08098793029785156, -0.0773162841796875, -0.07364463806152344, -0.06997299194335938, -0.06630134582519531, -0.06262969970703125, -0.05895805358886719, -0.055286407470703125, -0.05161476135253906, -0.047943115234375, -0.04427146911621094, -0.040599822998046875, -0.03692817687988281, -0.03325653076171875, -0.029584884643554688, -0.025913238525390625, -0.022241592407226562, -0.0185699462890625, -0.014898300170898438, -0.011226654052734375, -0.0075550079345703125, -0.00388336181640625, -0.0002117156982421875, 0.003459930419921875, 0.0071315765380859375, 0.01080322265625, 0.014474868774414062, 0.018146514892578125, 0.021818161010742188, 0.02548980712890625, 0.029161453247070312, 0.032833099365234375, 0.03650474548339844, 0.0401763916015625, 0.04384803771972656, 0.047519683837890625, 0.05119132995605469, 0.05486297607421875, 0.05853462219238281, 0.062206268310546875, 0.06587791442871094, 0.069549560546875, 0.07322120666503906, 0.07689285278320312, 0.08056449890136719, 0.08423614501953125, 0.08790779113769531, 0.09157943725585938, 0.09525108337402344, 0.0989227294921875, 0.10259437561035156, 0.10626602172851562, 0.10993766784667969, 0.11360931396484375, 0.11728096008300781, 0.12095260620117188, 0.12462425231933594, 0.1282958984375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 4.0, 12.0, 11.0, 11.0, 20.0, 27.0, 26.0, 38.0, 45.0, 55.0, 65.0, 53.0, 62.0, 59.0, 75.0, 81.0, 52.0, 80.0, 51.0, 49.0, 29.0, 29.0, 19.0, 23.0, 13.0, 9.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059906005859375, -0.05775880813598633, -0.055611610412597656, -0.053464412689208984, -0.05131721496582031, -0.04917001724243164, -0.04702281951904297, -0.0448756217956543, -0.042728424072265625, -0.04058122634887695, -0.03843402862548828, -0.03628683090209961, -0.03413963317871094, -0.031992435455322266, -0.029845237731933594, -0.027698040008544922, -0.02555084228515625, -0.023403644561767578, -0.021256446838378906, -0.019109249114990234, -0.016962051391601562, -0.01481485366821289, -0.012667655944824219, -0.010520458221435547, -0.008373260498046875, -0.006226062774658203, -0.004078865051269531, -0.0019316673278808594, 0.0002155303955078125, 0.0023627281188964844, 0.004509925842285156, 0.006657123565673828, 0.0088043212890625, 0.010951519012451172, 0.013098716735839844, 0.015245914459228516, 0.017393112182617188, 0.01954030990600586, 0.02168750762939453, 0.023834705352783203, 0.025981903076171875, 0.028129100799560547, 0.03027629852294922, 0.03242349624633789, 0.03457069396972656, 0.036717891693115234, 0.038865089416503906, 0.04101228713989258, 0.04315948486328125, 0.04530668258666992, 0.047453880310058594, 0.049601078033447266, 0.05174827575683594, 0.05389547348022461, 0.05604267120361328, 0.05818986892700195, 0.060337066650390625, 0.0624842643737793, 0.06463146209716797, 0.06677865982055664, 0.06892585754394531, 0.07107305526733398, 0.07322025299072266, 0.07536745071411133, 0.0775146484375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 8.0, 10.0, 7.0, 14.0, 16.0, 17.0, 28.0, 21.0, 37.0, 72.0, 92.0, 164.0, 340.0, 767.0, 1905.0, 5771.0, 20659.0, 92705.0, 380869.0, 407631.0, 104223.0, 23078.0, 6350.0, 2027.0, 829.0, 382.0, 189.0, 100.0, 54.0, 39.0, 36.0, 26.0, 17.0, 14.0, 14.0, 14.0, 8.0, 6.0, 4.0, 2.0, 0.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2073974609375, -0.20092391967773438, -0.19445037841796875, -0.18797683715820312, -0.1815032958984375, -0.17502975463867188, -0.16855621337890625, -0.16208267211914062, -0.155609130859375, -0.14913558959960938, -0.14266204833984375, -0.13618850708007812, -0.1297149658203125, -0.12324142456054688, -0.11676788330078125, -0.11029434204101562, -0.10382080078125, -0.09734725952148438, -0.09087371826171875, -0.08440017700195312, -0.0779266357421875, -0.07145309448242188, -0.06497955322265625, -0.058506011962890625, -0.052032470703125, -0.045558929443359375, -0.03908538818359375, -0.032611846923828125, -0.0261383056640625, -0.019664764404296875, -0.01319122314453125, -0.006717681884765625, -0.000244140625, 0.006229400634765625, 0.01270294189453125, 0.019176483154296875, 0.0256500244140625, 0.032123565673828125, 0.03859710693359375, 0.045070648193359375, 0.051544189453125, 0.058017730712890625, 0.06449127197265625, 0.07096481323242188, 0.0774383544921875, 0.08391189575195312, 0.09038543701171875, 0.09685897827148438, 0.10333251953125, 0.10980606079101562, 0.11627960205078125, 0.12275314331054688, 0.1292266845703125, 0.13570022583007812, 0.14217376708984375, 0.14864730834960938, 0.155120849609375, 0.16159439086914062, 0.16806793212890625, 0.17454147338867188, 0.1810150146484375, 0.18748855590820312, 0.19396209716796875, 0.20043563842773438, 0.2069091796875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 6.0, 6.0, 12.0, 20.0, 13.0, 12.0, 22.0, 26.0, 22.0, 29.0, 28.0, 29.0, 36.0, 38.0, 47.0, 40.0, 49.0, 36.0, 37.0, 48.0, 52.0, 39.0, 41.0, 42.0, 23.0, 27.0, 31.0, 31.0, 29.0, 24.0, 13.0, 16.0, 21.0, 17.0, 8.0, 6.0, 8.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.1339111328125, -0.13003253936767578, -0.12615394592285156, -0.12227535247802734, -0.11839675903320312, -0.1145181655883789, -0.11063957214355469, -0.10676097869873047, -0.10288238525390625, -0.09900379180908203, -0.09512519836425781, -0.0912466049194336, -0.08736801147460938, -0.08348941802978516, -0.07961082458496094, -0.07573223114013672, -0.0718536376953125, -0.06797504425048828, -0.06409645080566406, -0.060217857360839844, -0.056339263916015625, -0.052460670471191406, -0.04858207702636719, -0.04470348358154297, -0.04082489013671875, -0.03694629669189453, -0.03306770324707031, -0.029189109802246094, -0.025310516357421875, -0.021431922912597656, -0.017553329467773438, -0.013674736022949219, -0.009796142578125, -0.005917549133300781, -0.0020389556884765625, 0.0018396377563476562, 0.005718231201171875, 0.009596824645996094, 0.013475418090820312, 0.01735401153564453, 0.02123260498046875, 0.02511119842529297, 0.028989791870117188, 0.032868385314941406, 0.036746978759765625, 0.040625572204589844, 0.04450416564941406, 0.04838275909423828, 0.0522613525390625, 0.05613994598388672, 0.06001853942871094, 0.06389713287353516, 0.06777572631835938, 0.0716543197631836, 0.07553291320800781, 0.07941150665283203, 0.08329010009765625, 0.08716869354248047, 0.09104728698730469, 0.0949258804321289, 0.09880447387695312, 0.10268306732177734, 0.10656166076660156, 0.11044025421142578, 0.11431884765625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 12.0, 14.0, 13.0, 36.0, 56.0, 83.0, 157.0, 221.0, 384.0, 772.0, 1532.0, 3211.0, 8953.0, 992903.0, 30914.0, 4814.0, 2203.0, 1015.0, 513.0, 269.0, 179.0, 115.0, 60.0, 44.0, 18.0, 20.0, 11.0, 2.0, 11.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.021484375, -0.989288330078125, -0.95709228515625, -0.924896240234375, -0.8927001953125, -0.860504150390625, -0.82830810546875, -0.796112060546875, -0.763916015625, -0.731719970703125, -0.69952392578125, -0.667327880859375, -0.6351318359375, -0.602935791015625, -0.57073974609375, -0.538543701171875, -0.50634765625, -0.474151611328125, -0.44195556640625, -0.409759521484375, -0.3775634765625, -0.345367431640625, -0.31317138671875, -0.280975341796875, -0.248779296875, -0.216583251953125, -0.18438720703125, -0.152191162109375, -0.1199951171875, -0.087799072265625, -0.05560302734375, -0.023406982421875, 0.0087890625, 0.040985107421875, 0.07318115234375, 0.105377197265625, 0.1375732421875, 0.169769287109375, 0.20196533203125, 0.234161376953125, 0.266357421875, 0.298553466796875, 0.33074951171875, 0.362945556640625, 0.3951416015625, 0.427337646484375, 0.45953369140625, 0.491729736328125, 0.52392578125, 0.556121826171875, 0.58831787109375, 0.620513916015625, 0.6527099609375, 0.684906005859375, 0.71710205078125, 0.749298095703125, 0.781494140625, 0.813690185546875, 0.84588623046875, 0.878082275390625, 0.9102783203125, 0.942474365234375, 0.97467041015625, 1.006866455078125, 1.0390625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 64.0, 386.0, 464.0, 60.0, 9.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014507770538330078, -0.00014170538634061813, -0.00013833306729793549, -0.00013496074825525284, -0.0001315884292125702, -0.00012821611016988754, -0.0001248437911272049, -0.00012147147208452225, -0.0001180991530418396, -0.00011472683399915695, -0.0001113545149564743, -0.00010798219591379166, -0.00010460987687110901, -0.00010123755782842636, -9.786523878574371e-05, -9.449291974306107e-05, -9.112060070037842e-05, -8.774828165769577e-05, -8.437596261501312e-05, -8.100364357233047e-05, -7.763132452964783e-05, -7.425900548696518e-05, -7.088668644428253e-05, -6.751436740159988e-05, -6.414204835891724e-05, -6.076972931623459e-05, -5.739741027355194e-05, -5.402509123086929e-05, -5.0652772188186646e-05, -4.7280453145504e-05, -4.390813410282135e-05, -4.05358150601387e-05, -3.7163496017456055e-05, -3.379117697477341e-05, -3.041885793209076e-05, -2.704653888940811e-05, -2.3674219846725464e-05, -2.0301900804042816e-05, -1.692958176136017e-05, -1.355726271867752e-05, -1.0184943675994873e-05, -6.812624633312225e-06, -3.4403055906295776e-06, -6.798654794692993e-08, 3.3043324947357178e-06, 6.6766515374183655e-06, 1.0048970580101013e-05, 1.3421289622783661e-05, 1.679360866546631e-05, 2.0165927708148956e-05, 2.3538246750831604e-05, 2.6910565793514252e-05, 3.02828848361969e-05, 3.365520387887955e-05, 3.7027522921562195e-05, 4.039984196424484e-05, 4.377216100692749e-05, 4.714448004961014e-05, 5.0516799092292786e-05, 5.388911813497543e-05, 5.726143717765808e-05, 6.063375622034073e-05, 6.400607526302338e-05, 6.737839430570602e-05, 7.075071334838867e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 8.0, 9.0, 11.0, 15.0, 19.0, 41.0, 44.0, 59.0, 92.0, 156.0, 228.0, 355.0, 600.0, 1080.0, 2074.0, 4197.0, 8801.0, 21454.0, 58008.0, 157316.0, 311881.0, 279115.0, 125132.0, 45891.0, 17252.0, 7310.0, 3356.0, 1658.0, 940.0, 520.0, 331.0, 184.0, 132.0, 82.0, 62.0, 30.0, 35.0, 25.0, 15.0, 8.0, 10.0, 6.0, 4.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0653076171875, -0.06325912475585938, -0.06121063232421875, -0.059162139892578125, -0.0571136474609375, -0.055065155029296875, -0.05301666259765625, -0.050968170166015625, -0.048919677734375, -0.046871185302734375, -0.04482269287109375, -0.042774200439453125, -0.0407257080078125, -0.038677215576171875, -0.03662872314453125, -0.034580230712890625, -0.03253173828125, -0.030483245849609375, -0.02843475341796875, -0.026386260986328125, -0.0243377685546875, -0.022289276123046875, -0.02024078369140625, -0.018192291259765625, -0.016143798828125, -0.014095306396484375, -0.01204681396484375, -0.009998321533203125, -0.0079498291015625, -0.005901336669921875, -0.00385284423828125, -0.001804351806640625, 0.000244140625, 0.002292633056640625, 0.00434112548828125, 0.006389617919921875, 0.0084381103515625, 0.010486602783203125, 0.01253509521484375, 0.014583587646484375, 0.016632080078125, 0.018680572509765625, 0.02072906494140625, 0.022777557373046875, 0.0248260498046875, 0.026874542236328125, 0.02892303466796875, 0.030971527099609375, 0.03302001953125, 0.035068511962890625, 0.03711700439453125, 0.039165496826171875, 0.0412139892578125, 0.043262481689453125, 0.04531097412109375, 0.047359466552734375, 0.049407958984375, 0.051456451416015625, 0.05350494384765625, 0.055553436279296875, 0.0576019287109375, 0.059650421142578125, 0.06169891357421875, 0.06374740600585938, 0.0657958984375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 8.0, 10.0, 14.0, 15.0, 26.0, 26.0, 23.0, 25.0, 36.0, 34.0, 54.0, 48.0, 42.0, 47.0, 45.0, 56.0, 70.0, 43.0, 50.0, 44.0, 46.0, 33.0, 44.0, 27.0, 26.0, 18.0, 15.0, 19.0, 10.0, 7.0, 8.0, 9.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03375244140625, -0.03260231018066406, -0.031452178955078125, -0.030302047729492188, -0.02915191650390625, -0.028001785278320312, -0.026851654052734375, -0.025701522827148438, -0.0245513916015625, -0.023401260375976562, -0.022251129150390625, -0.021100997924804688, -0.01995086669921875, -0.018800735473632812, -0.017650604248046875, -0.016500473022460938, -0.015350341796875, -0.014200210571289062, -0.013050079345703125, -0.011899948120117188, -0.01074981689453125, -0.009599685668945312, -0.008449554443359375, -0.0072994232177734375, -0.0061492919921875, -0.0049991607666015625, -0.003849029541015625, -0.0026988983154296875, -0.00154876708984375, -0.0003986358642578125, 0.000751495361328125, 0.0019016265869140625, 0.0030517578125, 0.0042018890380859375, 0.005352020263671875, 0.0065021514892578125, 0.00765228271484375, 0.008802413940429688, 0.009952545166015625, 0.011102676391601562, 0.0122528076171875, 0.013402938842773438, 0.014553070068359375, 0.015703201293945312, 0.01685333251953125, 0.018003463745117188, 0.019153594970703125, 0.020303726196289062, 0.021453857421875, 0.022603988647460938, 0.023754119873046875, 0.024904251098632812, 0.02605438232421875, 0.027204513549804688, 0.028354644775390625, 0.029504776000976562, 0.0306549072265625, 0.03180503845214844, 0.032955169677734375, 0.03410530090332031, 0.03525543212890625, 0.03640556335449219, 0.037555694580078125, 0.03870582580566406, 0.03985595703125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 8.0, 93.0, 384.0, 407.0, 96.0, 21.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1925667524337769, -1.1134214401245117, -1.0342762470245361, -0.955130934715271, -0.8759857416152954, -0.7968404293060303, -0.7176951766014099, -0.6385499238967896, -0.5594046711921692, -0.48025941848754883, -0.40111416578292847, -0.3219688832759857, -0.24282363057136536, -0.163678377866745, -0.08453309535980225, -0.005387842655181885, 0.07375741004943848, 0.15290266275405884, 0.2320479303598404, 0.31119319796562195, 0.3903384506702423, 0.46948370337486267, 0.5486289858818054, 0.6277742385864258, 0.7069194912910461, 0.7860647439956665, 0.8652099967002869, 0.9443552494049072, 1.0235005617141724, 1.102645754814148, 1.181791067123413, 1.2609362602233887, 1.3400814533233643, 1.4192267656326294, 1.498371958732605, 1.5775172710418701, 1.6566624641418457, 1.7358077764511108, 1.814953088760376, 1.8940982818603516, 1.9732434749603271, 2.0523886680603027, 2.1315340995788574, 2.210679292678833, 2.2898244857788086, 2.368969678878784, 2.448115110397339, 2.5272603034973145, 2.606405735015869, 2.6855509281158447, 2.7646963596343994, 2.843841552734375, 2.9229867458343506, 3.002131938934326, 3.081277370452881, 3.1604225635528564, 3.239567756652832, 3.3187129497528076, 3.3978583812713623, 3.477003574371338, 3.5561487674713135, 3.635293960571289, 3.7144393920898438, 3.7935845851898193, 3.872729778289795]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 4.0, 11.0, 11.0, 13.0, 13.0, 13.0, 28.0, 26.0, 31.0, 22.0, 29.0, 31.0, 32.0, 40.0, 46.0, 51.0, 45.0, 36.0, 52.0, 40.0, 35.0, 35.0, 45.0, 40.0, 41.0, 30.0, 43.0, 16.0, 17.0, 20.0, 14.0, 17.0, 16.0, 9.0, 10.0, 10.0, 3.0, 5.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.4607633948326111, -0.4480655789375305, -0.43536776304244995, -0.4226699471473694, -0.4099721312522888, -0.39727431535720825, -0.3845764994621277, -0.3718786835670471, -0.35918086767196655, -0.346483051776886, -0.3337852358818054, -0.32108741998672485, -0.3083896040916443, -0.2956917881965637, -0.28299397230148315, -0.2702961564064026, -0.2575983703136444, -0.24490055441856384, -0.23220273852348328, -0.2195049226284027, -0.20680710673332214, -0.19410929083824158, -0.1814114898443222, -0.16871367394924164, -0.15601585805416107, -0.1433180421590805, -0.13062022626399994, -0.11792241781949997, -0.1052246019244194, -0.09252678602933884, -0.07982897758483887, -0.0671311616897583, -0.054433345794677734, -0.04173552989959717, -0.0290377177298069, -0.016339905560016632, -0.0036420896649360657, 0.0090557262301445, 0.02175353467464447, 0.03445135056972504, 0.0471491664648056, 0.05984698235988617, 0.07254479825496674, 0.0852426066994667, 0.09794042259454727, 0.11063823848962784, 0.12333604693412781, 0.13603386282920837, 0.14873167872428894, 0.1614294946193695, 0.17412731051445007, 0.18682512640953064, 0.1995229423046112, 0.21222075819969177, 0.22491855919361115, 0.2376163750886917, 0.2503141760826111, 0.26301199197769165, 0.2757098078727722, 0.2884076237678528, 0.30110543966293335, 0.3138032555580139, 0.3265010714530945, 0.33919888734817505, 0.3518967032432556]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 7.0, 6.0, 6.0, 14.0, 8.0, 14.0, 29.0, 23.0, 33.0, 40.0, 58.0, 107.0, 165.0, 299.0, 654.0, 2243.0, 13358.0, 177025.0, 3698021.0, 282231.0, 15695.0, 2489.0, 765.0, 381.0, 196.0, 131.0, 79.0, 62.0, 36.0, 28.0, 22.0, 15.0, 12.0, 5.0, 5.0, 5.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.300537109375, -0.2923164367675781, -0.28409576416015625, -0.2758750915527344, -0.2676544189453125, -0.2594337463378906, -0.25121307373046875, -0.24299240112304688, -0.234771728515625, -0.22655105590820312, -0.21833038330078125, -0.21010971069335938, -0.2018890380859375, -0.19366836547851562, -0.18544769287109375, -0.17722702026367188, -0.16900634765625, -0.16078567504882812, -0.15256500244140625, -0.14434432983398438, -0.1361236572265625, -0.12790298461914062, -0.11968231201171875, -0.11146163940429688, -0.103240966796875, -0.09502029418945312, -0.08679962158203125, -0.07857894897460938, -0.0703582763671875, -0.062137603759765625, -0.05391693115234375, -0.045696258544921875, -0.0374755859375, -0.029254913330078125, -0.02103424072265625, -0.012813568115234375, -0.0045928955078125, 0.003627777099609375, 0.01184844970703125, 0.020069122314453125, 0.028289794921875, 0.036510467529296875, 0.04473114013671875, 0.052951812744140625, 0.0611724853515625, 0.06939315795898438, 0.07761383056640625, 0.08583450317382812, 0.09405517578125, 0.10227584838867188, 0.11049652099609375, 0.11871719360351562, 0.1269378662109375, 0.13515853881835938, 0.14337921142578125, 0.15159988403320312, 0.159820556640625, 0.16804122924804688, 0.17626190185546875, 0.18448257446289062, 0.1927032470703125, 0.20092391967773438, 0.20914459228515625, 0.21736526489257812, 0.2255859375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 14.0, 11.0, 14.0, 16.0, 14.0, 34.0, 40.0, 46.0, 42.0, 55.0, 68.0, 65.0, 72.0, 75.0, 58.0, 69.0, 63.0, 48.0, 42.0, 38.0, 38.0, 29.0, 17.0, 14.0, 8.0, 6.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0689697265625, -0.06650352478027344, -0.06403732299804688, -0.06157112121582031, -0.05910491943359375, -0.05663871765136719, -0.054172515869140625, -0.05170631408691406, -0.0492401123046875, -0.04677391052246094, -0.044307708740234375, -0.04184150695800781, -0.03937530517578125, -0.03690910339355469, -0.034442901611328125, -0.03197669982910156, -0.029510498046875, -0.027044296264648438, -0.024578094482421875, -0.022111892700195312, -0.01964569091796875, -0.017179489135742188, -0.014713287353515625, -0.012247085571289062, -0.0097808837890625, -0.0073146820068359375, -0.004848480224609375, -0.0023822784423828125, 8.392333984375e-05, 0.0025501251220703125, 0.005016326904296875, 0.0074825286865234375, 0.00994873046875, 0.012414932250976562, 0.014881134033203125, 0.017347335815429688, 0.01981353759765625, 0.022279739379882812, 0.024745941162109375, 0.027212142944335938, 0.0296783447265625, 0.03214454650878906, 0.034610748291015625, 0.03707695007324219, 0.03954315185546875, 0.04200935363769531, 0.044475555419921875, 0.04694175720214844, 0.049407958984375, 0.05187416076660156, 0.054340362548828125, 0.05680656433105469, 0.05927276611328125, 0.06173896789550781, 0.06420516967773438, 0.06667137145996094, 0.0691375732421875, 0.07160377502441406, 0.07406997680664062, 0.07653617858886719, 0.07900238037109375, 0.08146858215332031, 0.08393478393554688, 0.08640098571777344, 0.0888671875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 7.0, 20.0, 17.0, 35.0, 56.0, 103.0, 240.0, 646.0, 2804.0, 48495.0, 3682898.0, 449317.0, 7881.0, 1126.0, 354.0, 151.0, 66.0, 30.0, 16.0, 8.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3076171875, -0.2940826416015625, -0.280548095703125, -0.2670135498046875, -0.25347900390625, -0.2399444580078125, -0.226409912109375, -0.2128753662109375, -0.1993408203125, -0.1858062744140625, -0.172271728515625, -0.1587371826171875, -0.14520263671875, -0.1316680908203125, -0.118133544921875, -0.1045989990234375, -0.091064453125, -0.0775299072265625, -0.063995361328125, -0.0504608154296875, -0.03692626953125, -0.0233917236328125, -0.009857177734375, 0.0036773681640625, 0.0172119140625, 0.0307464599609375, 0.044281005859375, 0.0578155517578125, 0.07135009765625, 0.0848846435546875, 0.098419189453125, 0.1119537353515625, 0.12548828125, 0.1390228271484375, 0.152557373046875, 0.1660919189453125, 0.17962646484375, 0.1931610107421875, 0.206695556640625, 0.2202301025390625, 0.2337646484375, 0.2472991943359375, 0.260833740234375, 0.2743682861328125, 0.28790283203125, 0.3014373779296875, 0.314971923828125, 0.3285064697265625, 0.342041015625, 0.3555755615234375, 0.369110107421875, 0.3826446533203125, 0.39617919921875, 0.4097137451171875, 0.423248291015625, 0.4367828369140625, 0.4503173828125, 0.4638519287109375, 0.477386474609375, 0.4909210205078125, 0.50445556640625, 0.5179901123046875, 0.531524658203125, 0.5450592041015625, 0.55859375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 5.0, 13.0, 22.0, 25.0, 39.0, 78.0, 106.0, 238.0, 389.0, 608.0, 908.0, 665.0, 354.0, 230.0, 132.0, 90.0, 51.0, 50.0, 19.0, 20.0, 14.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2171630859375, -0.21138763427734375, -0.2056121826171875, -0.19983673095703125, -0.194061279296875, -0.18828582763671875, -0.1825103759765625, -0.17673492431640625, -0.17095947265625, -0.16518402099609375, -0.1594085693359375, -0.15363311767578125, -0.147857666015625, -0.14208221435546875, -0.1363067626953125, -0.13053131103515625, -0.124755859375, -0.11898040771484375, -0.1132049560546875, -0.10742950439453125, -0.101654052734375, -0.09587860107421875, -0.0901031494140625, -0.08432769775390625, -0.07855224609375, -0.07277679443359375, -0.0670013427734375, -0.06122589111328125, -0.055450439453125, -0.04967498779296875, -0.0438995361328125, -0.03812408447265625, -0.0323486328125, -0.02657318115234375, -0.0207977294921875, -0.01502227783203125, -0.009246826171875, -0.00347137451171875, 0.0023040771484375, 0.00807952880859375, 0.01385498046875, 0.01963043212890625, 0.0254058837890625, 0.03118133544921875, 0.036956787109375, 0.04273223876953125, 0.0485076904296875, 0.05428314208984375, 0.06005859375, 0.06583404541015625, 0.0716094970703125, 0.07738494873046875, 0.083160400390625, 0.08893585205078125, 0.0947113037109375, 0.10048675537109375, 0.10626220703125, 0.11203765869140625, 0.1178131103515625, 0.12358856201171875, 0.129364013671875, 0.13513946533203125, 0.1409149169921875, 0.14669036865234375, 0.1524658203125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 9.0, 8.0, 15.0, 20.0, 32.0, 59.0, 71.0, 103.0, 120.0, 149.0, 117.0, 106.0, 70.0, 40.0, 34.0, 17.0, 5.0, 6.0, 7.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7012661695480347, -0.6824561953544617, -0.6636462211608887, -0.6448361873626709, -0.6260262131690979, -0.6072162389755249, -0.5884062647819519, -0.5695962905883789, -0.5507862567901611, -0.5319762825965881, -0.5131663084030151, -0.49435630440711975, -0.47554630041122437, -0.45673632621765137, -0.43792635202407837, -0.41911637783050537, -0.4003064036369324, -0.3814964294433594, -0.362686425447464, -0.343876451253891, -0.3250664472579956, -0.3062564730644226, -0.2874464988708496, -0.2686365246772766, -0.24982652068138123, -0.23101653158664703, -0.21220654249191284, -0.19339656829833984, -0.17458657920360565, -0.15577659010887146, -0.13696661591529846, -0.11815662682056427, -0.09934669733047485, -0.08053670823574066, -0.06172672659158707, -0.04291674122214317, -0.02410675585269928, -0.005296766757965088, 0.013513214886188507, 0.0323231965303421, 0.051133185625076294, 0.06994317471981049, 0.08875315636396408, 0.10756313800811768, 0.12637312710285187, 0.14518311619758606, 0.16399309039115906, 0.18280307948589325, 0.20161306858062744, 0.22042305767536163, 0.23923304677009583, 0.2580430209636688, 0.2768530249595642, 0.2956629991531372, 0.3144729733467102, 0.3332829475402832, 0.3520929515361786, 0.3709029257297516, 0.389712929725647, 0.40852290391921997, 0.42733287811279297, 0.44614288210868835, 0.46495285630226135, 0.48376286029815674, 0.5025728344917297]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 6.0, 10.0, 7.0, 13.0, 24.0, 20.0, 21.0, 27.0, 30.0, 20.0, 36.0, 38.0, 35.0, 38.0, 31.0, 46.0, 50.0, 56.0, 41.0, 43.0, 37.0, 47.0, 49.0, 32.0, 31.0, 33.0, 25.0, 21.0, 35.0, 13.0, 13.0, 9.0, 19.0, 10.0, 6.0, 4.0, 10.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3198435306549072, -0.30688780546188354, -0.2939320504665375, -0.2809763252735138, -0.2680205702781677, -0.25506484508514404, -0.24210911989212036, -0.22915337979793549, -0.2161976397037506, -0.20324189960956573, -0.19028615951538086, -0.17733043432235718, -0.1643746942281723, -0.15141895413398743, -0.13846322894096375, -0.12550748884677887, -0.112551748752594, -0.09959600865840912, -0.08664027601480484, -0.07368454337120056, -0.060728803277015686, -0.04777306318283081, -0.03481733053922653, -0.021861597895622253, -0.008905857801437378, 0.004049878567457199, 0.017005614936351776, 0.029961351305246353, 0.04291708767414093, 0.055872827768325806, 0.06882856041193008, 0.08178429305553436, 0.09474003314971924, 0.10769577324390411, 0.12065150588750839, 0.13360723853111267, 0.14656297862529755, 0.15951871871948242, 0.1724744439125061, 0.18543018400669098, 0.19838592410087585, 0.21134166419506073, 0.2242974042892456, 0.2372531294822693, 0.25020885467529297, 0.26316460967063904, 0.2761203348636627, 0.2890760898590088, 0.30203181505203247, 0.31498754024505615, 0.3279432952404022, 0.3408990204334259, 0.353854775428772, 0.36681050062179565, 0.37976622581481934, 0.392721951007843, 0.4056777060031891, 0.41863343119621277, 0.43158918619155884, 0.4445449113845825, 0.4575006365776062, 0.47045639157295227, 0.48341211676597595, 0.496367871761322, 0.5093235969543457]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 5.0, 8.0, 4.0, 20.0, 15.0, 24.0, 31.0, 39.0, 47.0, 83.0, 148.0, 242.0, 407.0, 776.0, 1620.0, 3236.0, 6736.0, 14486.0, 31071.0, 69336.0, 148760.0, 258348.0, 252075.0, 140532.0, 64902.0, 29469.0, 13352.0, 6444.0, 2973.0, 1516.0, 793.0, 419.0, 222.0, 134.0, 77.0, 61.0, 39.0, 29.0, 24.0, 14.0, 7.0, 5.0, 6.0, 4.0, 3.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.1263427734375, -0.12262248992919922, -0.11890220642089844, -0.11518192291259766, -0.11146163940429688, -0.1077413558959961, -0.10402107238769531, -0.10030078887939453, -0.09658050537109375, -0.09286022186279297, -0.08913993835449219, -0.0854196548461914, -0.08169937133789062, -0.07797908782958984, -0.07425880432128906, -0.07053852081298828, -0.0668182373046875, -0.06309795379638672, -0.05937767028808594, -0.055657386779785156, -0.051937103271484375, -0.048216819763183594, -0.04449653625488281, -0.04077625274658203, -0.03705596923828125, -0.03333568572998047, -0.029615402221679688, -0.025895118713378906, -0.022174835205078125, -0.018454551696777344, -0.014734268188476562, -0.011013984680175781, -0.007293701171875, -0.0035734176635742188, 0.0001468658447265625, 0.0038671493530273438, 0.007587432861328125, 0.011307716369628906, 0.015027999877929688, 0.01874828338623047, 0.02246856689453125, 0.02618885040283203, 0.029909133911132812, 0.033629417419433594, 0.037349700927734375, 0.041069984436035156, 0.04479026794433594, 0.04851055145263672, 0.0522308349609375, 0.05595111846923828, 0.05967140197753906, 0.06339168548583984, 0.06711196899414062, 0.0708322525024414, 0.07455253601074219, 0.07827281951904297, 0.08199310302734375, 0.08571338653564453, 0.08943367004394531, 0.0931539535522461, 0.09687423706054688, 0.10059452056884766, 0.10431480407714844, 0.10803508758544922, 0.11175537109375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 7.0, 8.0, 15.0, 14.0, 23.0, 38.0, 40.0, 30.0, 48.0, 44.0, 56.0, 47.0, 68.0, 56.0, 85.0, 68.0, 65.0, 56.0, 50.0, 51.0, 46.0, 18.0, 19.0, 15.0, 14.0, 6.0, 4.0, 12.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05255126953125, -0.050327301025390625, -0.04810333251953125, -0.045879364013671875, -0.0436553955078125, -0.041431427001953125, -0.03920745849609375, -0.036983489990234375, -0.034759521484375, -0.032535552978515625, -0.03031158447265625, -0.028087615966796875, -0.0258636474609375, -0.023639678955078125, -0.02141571044921875, -0.019191741943359375, -0.0169677734375, -0.014743804931640625, -0.01251983642578125, -0.010295867919921875, -0.0080718994140625, -0.005847930908203125, -0.00362396240234375, -0.001399993896484375, 0.000823974609375, 0.003047943115234375, 0.00527191162109375, 0.007495880126953125, 0.0097198486328125, 0.011943817138671875, 0.01416778564453125, 0.016391754150390625, 0.01861572265625, 0.020839691162109375, 0.02306365966796875, 0.025287628173828125, 0.0275115966796875, 0.029735565185546875, 0.03195953369140625, 0.034183502197265625, 0.036407470703125, 0.038631439208984375, 0.04085540771484375, 0.043079376220703125, 0.0453033447265625, 0.047527313232421875, 0.04975128173828125, 0.051975250244140625, 0.05419921875, 0.056423187255859375, 0.05864715576171875, 0.060871124267578125, 0.0630950927734375, 0.06531906127929688, 0.06754302978515625, 0.06976699829101562, 0.071990966796875, 0.07421493530273438, 0.07643890380859375, 0.07866287231445312, 0.0808868408203125, 0.08311080932617188, 0.08533477783203125, 0.08755874633789062, 0.08978271484375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 6.0, 5.0, 10.0, 12.0, 18.0, 26.0, 36.0, 46.0, 75.0, 88.0, 192.0, 313.0, 603.0, 1280.0, 3649.0, 13867.0, 79460.0, 439179.0, 417425.0, 73275.0, 12956.0, 3371.0, 1259.0, 552.0, 325.0, 193.0, 105.0, 62.0, 55.0, 35.0, 28.0, 13.0, 9.0, 8.0, 3.0, 4.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2490234375, -0.2414722442626953, -0.23392105102539062, -0.22636985778808594, -0.21881866455078125, -0.21126747131347656, -0.20371627807617188, -0.1961650848388672, -0.1886138916015625, -0.1810626983642578, -0.17351150512695312, -0.16596031188964844, -0.15840911865234375, -0.15085792541503906, -0.14330673217773438, -0.1357555389404297, -0.128204345703125, -0.12065315246582031, -0.11310195922851562, -0.10555076599121094, -0.09799957275390625, -0.09044837951660156, -0.08289718627929688, -0.07534599304199219, -0.0677947998046875, -0.06024360656738281, -0.052692413330078125, -0.04514122009277344, -0.03759002685546875, -0.030038833618164062, -0.022487640380859375, -0.014936447143554688, -0.00738525390625, 0.0001659393310546875, 0.007717132568359375, 0.015268325805664062, 0.02281951904296875, 0.030370712280273438, 0.037921905517578125, 0.04547309875488281, 0.0530242919921875, 0.06057548522949219, 0.06812667846679688, 0.07567787170410156, 0.08322906494140625, 0.09078025817871094, 0.09833145141601562, 0.10588264465332031, 0.113433837890625, 0.12098503112792969, 0.12853622436523438, 0.13608741760253906, 0.14363861083984375, 0.15118980407714844, 0.15874099731445312, 0.1662921905517578, 0.1738433837890625, 0.1813945770263672, 0.18894577026367188, 0.19649696350097656, 0.20404815673828125, 0.21159934997558594, 0.21915054321289062, 0.2267017364501953, 0.2342529296875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 3.0, 5.0, 9.0, 15.0, 18.0, 18.0, 20.0, 11.0, 35.0, 27.0, 32.0, 49.0, 47.0, 37.0, 47.0, 39.0, 54.0, 50.0, 57.0, 52.0, 47.0, 29.0, 50.0, 42.0, 35.0, 26.0, 21.0, 24.0, 24.0, 16.0, 5.0, 11.0, 8.0, 7.0, 10.0, 4.0, 4.0, 5.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1439208984375, -0.13925743103027344, -0.13459396362304688, -0.1299304962158203, -0.12526702880859375, -0.12060356140136719, -0.11594009399414062, -0.11127662658691406, -0.1066131591796875, -0.10194969177246094, -0.09728622436523438, -0.09262275695800781, -0.08795928955078125, -0.08329582214355469, -0.07863235473632812, -0.07396888732910156, -0.069305419921875, -0.06464195251464844, -0.059978485107421875, -0.05531501770019531, -0.05065155029296875, -0.04598808288574219, -0.041324615478515625, -0.03666114807128906, -0.0319976806640625, -0.027334213256835938, -0.022670745849609375, -0.018007278442382812, -0.01334381103515625, -0.008680343627929688, -0.004016876220703125, 0.0006465911865234375, 0.00531005859375, 0.009973526000976562, 0.014636993408203125, 0.019300460815429688, 0.02396392822265625, 0.028627395629882812, 0.033290863037109375, 0.03795433044433594, 0.0426177978515625, 0.04728126525878906, 0.051944732666015625, 0.05660820007324219, 0.06127166748046875, 0.06593513488769531, 0.07059860229492188, 0.07526206970214844, 0.079925537109375, 0.08458900451660156, 0.08925247192382812, 0.09391593933105469, 0.09857940673828125, 0.10324287414550781, 0.10790634155273438, 0.11256980895996094, 0.1172332763671875, 0.12189674377441406, 0.12656021118164062, 0.1312236785888672, 0.13588714599609375, 0.1405506134033203, 0.14521408081054688, 0.14987754821777344, 0.154541015625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 2.0, 3.0, 5.0, 10.0, 10.0, 16.0, 37.0, 66.0, 100.0, 197.0, 401.0, 843.0, 2220.0, 9678.0, 65850.0, 407188.0, 462135.0, 83444.0, 11917.0, 2617.0, 937.0, 384.0, 211.0, 127.0, 56.0, 42.0, 18.0, 17.0, 5.0, 6.0, 4.0, 5.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08056640625, -0.07769489288330078, -0.07482337951660156, -0.07195186614990234, -0.06908035278320312, -0.0662088394165039, -0.06333732604980469, -0.06046581268310547, -0.05759429931640625, -0.05472278594970703, -0.05185127258300781, -0.048979759216308594, -0.046108245849609375, -0.043236732482910156, -0.04036521911621094, -0.03749370574951172, -0.0346221923828125, -0.03175067901611328, -0.028879165649414062, -0.026007652282714844, -0.023136138916015625, -0.020264625549316406, -0.017393112182617188, -0.014521598815917969, -0.01165008544921875, -0.008778572082519531, -0.0059070587158203125, -0.0030355453491210938, -0.000164031982421875, 0.0027074813842773438, 0.0055789947509765625, 0.008450508117675781, 0.011322021484375, 0.014193534851074219, 0.017065048217773438, 0.019936561584472656, 0.022808074951171875, 0.025679588317871094, 0.028551101684570312, 0.03142261505126953, 0.03429412841796875, 0.03716564178466797, 0.04003715515136719, 0.042908668518066406, 0.045780181884765625, 0.048651695251464844, 0.05152320861816406, 0.05439472198486328, 0.0572662353515625, 0.06013774871826172, 0.06300926208496094, 0.06588077545166016, 0.06875228881835938, 0.0716238021850586, 0.07449531555175781, 0.07736682891845703, 0.08023834228515625, 0.08310985565185547, 0.08598136901855469, 0.0888528823852539, 0.09172439575195312, 0.09459590911865234, 0.09746742248535156, 0.10033893585205078, 0.10321044921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 2.0, 4.0, 5.0, 12.0, 8.0, 9.0, 14.0, 16.0, 25.0, 32.0, 26.0, 42.0, 43.0, 64.0, 62.0, 68.0, 67.0, 62.0, 55.0, 69.0, 59.0, 50.0, 46.0, 30.0, 24.0, 16.0, 12.0, 17.0, 10.0, 10.0, 10.0, 8.0, 6.0, 3.0, 2.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-9.417533874511719e-06, -9.10833477973938e-06, -8.799135684967041e-06, -8.489936590194702e-06, -8.180737495422363e-06, -7.871538400650024e-06, -7.5623393058776855e-06, -7.253140211105347e-06, -6.943941116333008e-06, -6.634742021560669e-06, -6.32554292678833e-06, -6.016343832015991e-06, -5.707144737243652e-06, -5.3979456424713135e-06, -5.088746547698975e-06, -4.779547452926636e-06, -4.470348358154297e-06, -4.161149263381958e-06, -3.851950168609619e-06, -3.5427510738372803e-06, -3.2335519790649414e-06, -2.9243528842926025e-06, -2.6151537895202637e-06, -2.305954694747925e-06, -1.996755599975586e-06, -1.687556505203247e-06, -1.3783574104309082e-06, -1.0691583156585693e-06, -7.599592208862305e-07, -4.507601261138916e-07, -1.4156103134155273e-07, 1.6763806343078613e-07, 4.76837158203125e-07, 7.860362529754639e-07, 1.0952353477478027e-06, 1.4044344425201416e-06, 1.7136335372924805e-06, 2.0228326320648193e-06, 2.332031726837158e-06, 2.641230821609497e-06, 2.950429916381836e-06, 3.259629011154175e-06, 3.5688281059265137e-06, 3.8780272006988525e-06, 4.187226295471191e-06, 4.49642539024353e-06, 4.805624485015869e-06, 5.114823579788208e-06, 5.424022674560547e-06, 5.733221769332886e-06, 6.042420864105225e-06, 6.3516199588775635e-06, 6.660819053649902e-06, 6.970018148422241e-06, 7.27921724319458e-06, 7.588416337966919e-06, 7.897615432739258e-06, 8.206814527511597e-06, 8.516013622283936e-06, 8.825212717056274e-06, 9.134411811828613e-06, 9.443610906600952e-06, 9.752810001373291e-06, 1.006200909614563e-05, 1.0371208190917969e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 12.0, 3.0, 12.0, 16.0, 24.0, 35.0, 64.0, 111.0, 184.0, 314.0, 695.0, 1405.0, 3704.0, 13422.0, 70896.0, 351577.0, 457528.0, 119113.0, 20720.0, 5107.0, 1806.0, 791.0, 425.0, 260.0, 135.0, 69.0, 44.0, 28.0, 16.0, 14.0, 14.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09210205078125, -0.0895538330078125, -0.087005615234375, -0.0844573974609375, -0.0819091796875, -0.0793609619140625, -0.076812744140625, -0.0742645263671875, -0.07171630859375, -0.0691680908203125, -0.066619873046875, -0.0640716552734375, -0.0615234375, -0.0589752197265625, -0.056427001953125, -0.0538787841796875, -0.05133056640625, -0.0487823486328125, -0.046234130859375, -0.0436859130859375, -0.0411376953125, -0.0385894775390625, -0.036041259765625, -0.0334930419921875, -0.03094482421875, -0.0283966064453125, -0.025848388671875, -0.0233001708984375, -0.020751953125, -0.0182037353515625, -0.015655517578125, -0.0131072998046875, -0.01055908203125, -0.0080108642578125, -0.005462646484375, -0.0029144287109375, -0.0003662109375, 0.0021820068359375, 0.004730224609375, 0.0072784423828125, 0.00982666015625, 0.0123748779296875, 0.014923095703125, 0.0174713134765625, 0.02001953125, 0.0225677490234375, 0.025115966796875, 0.0276641845703125, 0.03021240234375, 0.0327606201171875, 0.035308837890625, 0.0378570556640625, 0.0404052734375, 0.0429534912109375, 0.045501708984375, 0.0480499267578125, 0.05059814453125, 0.0531463623046875, 0.055694580078125, 0.0582427978515625, 0.060791015625, 0.0633392333984375, 0.065887451171875, 0.0684356689453125, 0.07098388671875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 6.0, 7.0, 21.0, 24.0, 33.0, 43.0, 47.0, 77.0, 96.0, 107.0, 123.0, 108.0, 88.0, 65.0, 47.0, 31.0, 22.0, 18.0, 16.0, 6.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08184814453125, -0.07981538772583008, -0.07778263092041016, -0.07574987411499023, -0.07371711730957031, -0.07168436050415039, -0.06965160369873047, -0.06761884689331055, -0.06558609008789062, -0.0635533332824707, -0.06152057647705078, -0.05948781967163086, -0.05745506286621094, -0.055422306060791016, -0.053389549255371094, -0.05135679244995117, -0.04932403564453125, -0.04729127883911133, -0.045258522033691406, -0.043225765228271484, -0.04119300842285156, -0.03916025161743164, -0.03712749481201172, -0.0350947380065918, -0.033061981201171875, -0.031029224395751953, -0.02899646759033203, -0.02696371078491211, -0.024930953979492188, -0.022898197174072266, -0.020865440368652344, -0.018832683563232422, -0.0167999267578125, -0.014767169952392578, -0.012734413146972656, -0.010701656341552734, -0.008668899536132812, -0.006636142730712891, -0.004603385925292969, -0.002570629119873047, -0.000537872314453125, 0.0014948844909667969, 0.0035276412963867188, 0.005560398101806641, 0.0075931549072265625, 0.009625911712646484, 0.011658668518066406, 0.013691425323486328, 0.01572418212890625, 0.017756938934326172, 0.019789695739746094, 0.021822452545166016, 0.023855209350585938, 0.02588796615600586, 0.02792072296142578, 0.029953479766845703, 0.031986236572265625, 0.03401899337768555, 0.03605175018310547, 0.03808450698852539, 0.04011726379394531, 0.042150020599365234, 0.044182777404785156, 0.04621553421020508, 0.048248291015625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 14.0, 35.0, 112.0, 318.0, 308.0, 132.0, 54.0, 16.0, 9.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7392715811729431, -0.7006892561912537, -0.6621068716049194, -0.62352454662323, -0.5849422216415405, -0.5463598370552063, -0.5077775120735168, -0.469195157289505, -0.43061280250549316, -0.3920304477214813, -0.3534480929374695, -0.31486576795578003, -0.2762834131717682, -0.23770105838775635, -0.1991187185049057, -0.16053637862205505, -0.12195402383804321, -0.08337167650461197, -0.044789329171180725, -0.006206981837749481, 0.03237536549568176, 0.0709577202796936, 0.10954006016254425, 0.1481224000453949, 0.18670475482940674, 0.22528710961341858, 0.2638694643974304, 0.3024517893791199, 0.3410341441631317, 0.37961649894714355, 0.418198823928833, 0.45678117871284485, 0.4953634738922119, 0.5339457988739014, 0.5725281834602356, 0.611110508441925, 0.6496928930282593, 0.6882752180099487, 0.7268575429916382, 0.7654398679733276, 0.8040222525596619, 0.8426045775413513, 0.8811869621276855, 0.919769287109375, 0.9583516120910645, 0.9969339966773987, 1.035516381263733, 1.0740987062454224, 1.1126810312271118, 1.1512633562088013, 1.1898456811904907, 1.2284281253814697, 1.2670104503631592, 1.3055927753448486, 1.344175100326538, 1.3827574253082275, 1.421339750289917, 1.4599220752716064, 1.498504400253296, 1.537086844444275, 1.5756691694259644, 1.6142514944076538, 1.6528338193893433, 1.6914161443710327, 1.7299985885620117]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 10.0, 6.0, 2.0, 18.0, 11.0, 12.0, 15.0, 20.0, 20.0, 18.0, 20.0, 27.0, 28.0, 32.0, 34.0, 32.0, 35.0, 30.0, 38.0, 37.0, 34.0, 36.0, 51.0, 32.0, 46.0, 25.0, 39.0, 28.0, 33.0, 27.0, 29.0, 22.0, 33.0, 20.0, 14.0, 11.0, 18.0, 4.0, 7.0, 10.0, 9.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.38444089889526367, -0.3723489046096802, -0.3602568805217743, -0.3481648564338684, -0.3360728621482849, -0.3239808678627014, -0.31188884377479553, -0.29979681968688965, -0.28770482540130615, -0.27561283111572266, -0.2635208070278168, -0.2514287829399109, -0.2393367886543274, -0.2272447794675827, -0.215152770280838, -0.20306076109409332, -0.19096875190734863, -0.17887674272060394, -0.16678473353385925, -0.15469272434711456, -0.14260071516036987, -0.13050870597362518, -0.1184166967868805, -0.1063246876001358, -0.09423267841339111, -0.08214066922664642, -0.07004866003990173, -0.05795665085315704, -0.045864641666412354, -0.033772632479667664, -0.021680623292922974, -0.009588614106178284, 0.0025033950805664062, 0.014595404267311096, 0.026687413454055786, 0.038779422640800476, 0.050871431827545166, 0.06296344101428986, 0.07505545020103455, 0.08714745938777924, 0.09923946857452393, 0.11133147776126862, 0.1234234869480133, 0.135515496134758, 0.14760750532150269, 0.15969951450824738, 0.17179152369499207, 0.18388353288173676, 0.19597554206848145, 0.20806755125522614, 0.22015956044197083, 0.23225156962871552, 0.2443435788154602, 0.2564355731010437, 0.2685275971889496, 0.28061962127685547, 0.29271161556243896, 0.30480360984802246, 0.31689563393592834, 0.32898765802383423, 0.3410796523094177, 0.3531716465950012, 0.3652636706829071, 0.377355694770813, 0.3894476890563965]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 3.0, 7.0, 2.0, 6.0, 11.0, 16.0, 36.0, 61.0, 94.0, 138.0, 215.0, 442.0, 686.0, 1398.0, 2746.0, 5803.0, 14342.0, 39724.0, 136415.0, 961500.0, 2439696.0, 459521.0, 82540.0, 27095.0, 10984.0, 4957.0, 2459.0, 1317.0, 742.0, 457.0, 279.0, 184.0, 124.0, 84.0, 56.0, 40.0, 32.0, 19.0, 17.0, 11.0, 8.0, 8.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.10211181640625, -0.09850788116455078, -0.09490394592285156, -0.09130001068115234, -0.08769607543945312, -0.0840921401977539, -0.08048820495605469, -0.07688426971435547, -0.07328033447265625, -0.06967639923095703, -0.06607246398925781, -0.062468528747558594, -0.058864593505859375, -0.055260658264160156, -0.05165672302246094, -0.04805278778076172, -0.0444488525390625, -0.04084491729736328, -0.03724098205566406, -0.033637046813964844, -0.030033111572265625, -0.026429176330566406, -0.022825241088867188, -0.01922130584716797, -0.01561737060546875, -0.012013435363769531, -0.008409500122070312, -0.004805564880371094, -0.001201629638671875, 0.0024023056030273438, 0.0060062408447265625, 0.009610176086425781, 0.013214111328125, 0.01681804656982422, 0.020421981811523438, 0.024025917053222656, 0.027629852294921875, 0.031233787536621094, 0.03483772277832031, 0.03844165802001953, 0.04204559326171875, 0.04564952850341797, 0.04925346374511719, 0.052857398986816406, 0.056461334228515625, 0.060065269470214844, 0.06366920471191406, 0.06727313995361328, 0.0708770751953125, 0.07448101043701172, 0.07808494567871094, 0.08168888092041016, 0.08529281616210938, 0.0888967514038086, 0.09250068664550781, 0.09610462188720703, 0.09970855712890625, 0.10331249237060547, 0.10691642761230469, 0.1105203628540039, 0.11412429809570312, 0.11772823333740234, 0.12133216857910156, 0.12493610382080078, 0.1285400390625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 2.0, 5.0, 6.0, 12.0, 11.0, 16.0, 20.0, 34.0, 29.0, 38.0, 51.0, 60.0, 65.0, 52.0, 55.0, 64.0, 73.0, 56.0, 53.0, 61.0, 44.0, 36.0, 34.0, 30.0, 22.0, 17.0, 17.0, 10.0, 8.0, 5.0, 5.0, 8.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.068603515625, -0.06621074676513672, -0.06381797790527344, -0.061425209045410156, -0.059032440185546875, -0.056639671325683594, -0.05424690246582031, -0.05185413360595703, -0.04946136474609375, -0.04706859588623047, -0.04467582702636719, -0.042283058166503906, -0.039890289306640625, -0.037497520446777344, -0.03510475158691406, -0.03271198272705078, -0.0303192138671875, -0.02792644500732422, -0.025533676147460938, -0.023140907287597656, -0.020748138427734375, -0.018355369567871094, -0.015962600708007812, -0.013569831848144531, -0.01117706298828125, -0.008784294128417969, -0.0063915252685546875, -0.003998756408691406, -0.001605987548828125, 0.0007867813110351562, 0.0031795501708984375, 0.005572319030761719, 0.007965087890625, 0.010357856750488281, 0.012750625610351562, 0.015143394470214844, 0.017536163330078125, 0.019928932189941406, 0.022321701049804688, 0.02471446990966797, 0.02710723876953125, 0.02950000762939453, 0.03189277648925781, 0.034285545349121094, 0.036678314208984375, 0.039071083068847656, 0.04146385192871094, 0.04385662078857422, 0.0462493896484375, 0.04864215850830078, 0.05103492736816406, 0.053427696228027344, 0.055820465087890625, 0.058213233947753906, 0.06060600280761719, 0.06299877166748047, 0.06539154052734375, 0.06778430938720703, 0.07017707824707031, 0.0725698471069336, 0.07496261596679688, 0.07735538482666016, 0.07974815368652344, 0.08214092254638672, 0.08453369140625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 17.0, 24.0, 52.0, 143.0, 397.0, 2329.0, 1459260.0, 2728699.0, 2657.0, 423.0, 169.0, 60.0, 30.0, 18.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1767578125, -1.1500320434570312, -1.1233062744140625, -1.0965805053710938, -1.069854736328125, -1.0431289672851562, -1.0164031982421875, -0.9896774291992188, -0.96295166015625, -0.9362258911132812, -0.9095001220703125, -0.8827743530273438, -0.856048583984375, -0.8293228149414062, -0.8025970458984375, -0.7758712768554688, -0.7491455078125, -0.7224197387695312, -0.6956939697265625, -0.6689682006835938, -0.642242431640625, -0.6155166625976562, -0.5887908935546875, -0.5620651245117188, -0.53533935546875, -0.5086135864257812, -0.4818878173828125, -0.45516204833984375, -0.428436279296875, -0.40171051025390625, -0.3749847412109375, -0.34825897216796875, -0.321533203125, -0.29480743408203125, -0.2680816650390625, -0.24135589599609375, -0.214630126953125, -0.18790435791015625, -0.1611785888671875, -0.13445281982421875, -0.10772705078125, -0.08100128173828125, -0.0542755126953125, -0.02754974365234375, -0.000823974609375, 0.02590179443359375, 0.0526275634765625, 0.07935333251953125, 0.1060791015625, 0.13280487060546875, 0.1595306396484375, 0.18625640869140625, 0.212982177734375, 0.23970794677734375, 0.2664337158203125, 0.29315948486328125, 0.31988525390625, 0.34661102294921875, 0.3733367919921875, 0.40006256103515625, 0.426788330078125, 0.45351409912109375, 0.4802398681640625, 0.5069656372070312, 0.53369140625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 12.0, 20.0, 41.0, 74.0, 151.0, 315.0, 712.0, 1315.0, 798.0, 319.0, 144.0, 91.0, 40.0, 17.0, 8.0, 11.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1844482421875, -0.1758861541748047, -0.16732406616210938, -0.15876197814941406, -0.15019989013671875, -0.14163780212402344, -0.13307571411132812, -0.12451362609863281, -0.1159515380859375, -0.10738945007324219, -0.09882736206054688, -0.09026527404785156, -0.08170318603515625, -0.07314109802246094, -0.06457901000976562, -0.05601692199707031, -0.047454833984375, -0.03889274597167969, -0.030330657958984375, -0.021768569946289062, -0.01320648193359375, -0.0046443939208984375, 0.003917694091796875, 0.012479782104492188, 0.0210418701171875, 0.029603958129882812, 0.038166046142578125, 0.04672813415527344, 0.05529022216796875, 0.06385231018066406, 0.07241439819335938, 0.08097648620605469, 0.08953857421875, 0.09810066223144531, 0.10666275024414062, 0.11522483825683594, 0.12378692626953125, 0.13234901428222656, 0.14091110229492188, 0.1494731903076172, 0.1580352783203125, 0.1665973663330078, 0.17515945434570312, 0.18372154235839844, 0.19228363037109375, 0.20084571838378906, 0.20940780639648438, 0.2179698944091797, 0.226531982421875, 0.2350940704345703, 0.24365615844726562, 0.25221824645996094, 0.26078033447265625, 0.26934242248535156, 0.2779045104980469, 0.2864665985107422, 0.2950286865234375, 0.3035907745361328, 0.3121528625488281, 0.32071495056152344, 0.32927703857421875, 0.33783912658691406, 0.3464012145996094, 0.3549633026123047, 0.363525390625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 16.0, 18.0, 79.0, 164.0, 299.0, 255.0, 115.0, 50.0, 8.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7479544281959534, -0.7035009264945984, -0.6590474247932434, -0.6145938634872437, -0.5701403617858887, -0.5256868600845337, -0.4812333583831787, -0.43677985668182373, -0.39232635498046875, -0.34787285327911377, -0.3034193515777588, -0.2589658200740814, -0.21451231837272644, -0.17005881667137146, -0.1256052851676941, -0.08115178346633911, -0.03669828176498413, 0.0077552273869514465, 0.052208736538887024, 0.0966622531414032, 0.14111575484275818, 0.18556925654411316, 0.23002278804779053, 0.2744762897491455, 0.3189297914505005, 0.36338329315185547, 0.40783679485321045, 0.4522903263568878, 0.4967438280582428, 0.5411972999572754, 0.5856508612632751, 0.6301043629646301, 0.6745579242706299, 0.7190114259719849, 0.7634649276733398, 0.8079184293746948, 0.8523719310760498, 0.8968254327774048, 0.9412789940834045, 0.9857324957847595, 1.0301859378814697, 1.0746394395828247, 1.1190929412841797, 1.1635464429855347, 1.2079999446868896, 1.2524534463882446, 1.2969069480895996, 1.3413605690002441, 1.3858140707015991, 1.430267572402954, 1.474721074104309, 1.519174575805664, 1.563628077507019, 1.608081579208374, 1.6525352001190186, 1.696988582611084, 1.7414422035217285, 1.7858957052230835, 1.8303492069244385, 1.8748027086257935, 1.9192562103271484, 1.9637097120285034, 2.0081632137298584, 2.052616834640503, 2.0970702171325684]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 7.0, 8.0, 8.0, 11.0, 16.0, 25.0, 24.0, 27.0, 43.0, 35.0, 34.0, 47.0, 59.0, 58.0, 69.0, 53.0, 58.0, 67.0, 55.0, 49.0, 48.0, 27.0, 31.0, 25.0, 26.0, 19.0, 15.0, 12.0, 13.0, 10.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4012495279312134, -0.38445669412612915, -0.3676638603210449, -0.3508710265159607, -0.33407819271087646, -0.31728535890579224, -0.300492525100708, -0.2836996912956238, -0.26690685749053955, -0.2501140236854553, -0.2333211898803711, -0.21652835607528687, -0.19973552227020264, -0.1829426884651184, -0.16614986956119537, -0.14935703575611115, -0.1325642168521881, -0.11577138304710388, -0.09897854924201965, -0.08218572288751602, -0.0653928890824318, -0.048600055277347565, -0.03180722892284393, -0.015014395117759705, 0.001778438687324524, 0.018571270629763603, 0.03536410257220268, 0.05215693265199661, 0.06894976645708084, 0.08574260026216507, 0.1025354266166687, 0.11932826042175293, 0.13612109422683716, 0.1529139280319214, 0.16970676183700562, 0.18649959564208984, 0.20329242944717407, 0.2200852632522583, 0.23687808215618134, 0.25367093086242676, 0.270463764667511, 0.2872565984725952, 0.30404943227767944, 0.32084226608276367, 0.3376350998878479, 0.35442793369293213, 0.37122076749801636, 0.3880136013031006, 0.4048064053058624, 0.42159923911094666, 0.4383920729160309, 0.4551849067211151, 0.47197774052619934, 0.48877057433128357, 0.5055633783340454, 0.5223562121391296, 0.5391490459442139, 0.5559418797492981, 0.5727347135543823, 0.5895275473594666, 0.6063203811645508, 0.623113214969635, 0.6399060487747192, 0.6566988825798035, 0.6734917163848877]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 6.0, 3.0, 6.0, 6.0, 16.0, 21.0, 23.0, 32.0, 31.0, 53.0, 71.0, 107.0, 172.0, 203.0, 346.0, 554.0, 868.0, 1525.0, 2828.0, 5867.0, 12258.0, 27556.0, 63375.0, 149841.0, 284198.0, 266330.0, 130914.0, 55392.0, 23908.0, 10674.0, 5114.0, 2564.0, 1374.0, 822.0, 486.0, 328.0, 209.0, 142.0, 91.0, 75.0, 57.0, 33.0, 27.0, 14.0, 13.0, 5.0, 9.0, 6.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.107421875, -0.10405635833740234, -0.10069084167480469, -0.09732532501220703, -0.09395980834960938, -0.09059429168701172, -0.08722877502441406, -0.0838632583618164, -0.08049774169921875, -0.0771322250366211, -0.07376670837402344, -0.07040119171142578, -0.06703567504882812, -0.06367015838623047, -0.06030464172363281, -0.056939125061035156, -0.0535736083984375, -0.050208091735839844, -0.04684257507324219, -0.04347705841064453, -0.040111541748046875, -0.03674602508544922, -0.03338050842285156, -0.030014991760253906, -0.02664947509765625, -0.023283958435058594, -0.019918441772460938, -0.01655292510986328, -0.013187408447265625, -0.009821891784667969, -0.0064563751220703125, -0.0030908584594726562, 0.000274658203125, 0.0036401748657226562, 0.0070056915283203125, 0.010371208190917969, 0.013736724853515625, 0.01710224151611328, 0.020467758178710938, 0.023833274841308594, 0.02719879150390625, 0.030564308166503906, 0.03392982482910156, 0.03729534149169922, 0.040660858154296875, 0.04402637481689453, 0.04739189147949219, 0.050757408142089844, 0.0541229248046875, 0.057488441467285156, 0.06085395812988281, 0.06421947479248047, 0.06758499145507812, 0.07095050811767578, 0.07431602478027344, 0.0776815414428711, 0.08104705810546875, 0.0844125747680664, 0.08777809143066406, 0.09114360809326172, 0.09450912475585938, 0.09787464141845703, 0.10124015808105469, 0.10460567474365234, 0.10797119140625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 5.0, 6.0, 4.0, 10.0, 19.0, 21.0, 34.0, 43.0, 44.0, 61.0, 52.0, 71.0, 99.0, 69.0, 48.0, 60.0, 66.0, 66.0, 42.0, 30.0, 41.0, 26.0, 22.0, 28.0, 11.0, 9.0, 8.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06561279296875, -0.06318378448486328, -0.06075477600097656, -0.058325767517089844, -0.055896759033203125, -0.053467750549316406, -0.05103874206542969, -0.04860973358154297, -0.04618072509765625, -0.04375171661376953, -0.04132270812988281, -0.038893699645996094, -0.036464691162109375, -0.034035682678222656, -0.03160667419433594, -0.02917766571044922, -0.0267486572265625, -0.02431964874267578, -0.021890640258789062, -0.019461631774902344, -0.017032623291015625, -0.014603614807128906, -0.012174606323242188, -0.009745597839355469, -0.00731658935546875, -0.004887580871582031, -0.0024585723876953125, -2.956390380859375e-05, 0.002399444580078125, 0.004828453063964844, 0.0072574615478515625, 0.009686470031738281, 0.012115478515625, 0.014544486999511719, 0.016973495483398438, 0.019402503967285156, 0.021831512451171875, 0.024260520935058594, 0.026689529418945312, 0.02911853790283203, 0.03154754638671875, 0.03397655487060547, 0.03640556335449219, 0.038834571838378906, 0.041263580322265625, 0.043692588806152344, 0.04612159729003906, 0.04855060577392578, 0.0509796142578125, 0.05340862274169922, 0.05583763122558594, 0.058266639709472656, 0.060695648193359375, 0.0631246566772461, 0.06555366516113281, 0.06798267364501953, 0.07041168212890625, 0.07284069061279297, 0.07526969909667969, 0.0776987075805664, 0.08012771606445312, 0.08255672454833984, 0.08498573303222656, 0.08741474151611328, 0.08984375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 4.0, 6.0, 8.0, 10.0, 10.0, 13.0, 13.0, 24.0, 23.0, 24.0, 33.0, 44.0, 55.0, 81.0, 216.0, 531.0, 1889.0, 7583.0, 39831.0, 278600.0, 577075.0, 117610.0, 18838.0, 4164.0, 1073.0, 364.0, 128.0, 65.0, 47.0, 43.0, 27.0, 22.0, 9.0, 18.0, 13.0, 11.0, 7.0, 10.0, 8.0, 4.0, 3.0, 2.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2342529296875, -0.22721481323242188, -0.22017669677734375, -0.21313858032226562, -0.2061004638671875, -0.19906234741210938, -0.19202423095703125, -0.18498611450195312, -0.177947998046875, -0.17090988159179688, -0.16387176513671875, -0.15683364868164062, -0.1497955322265625, -0.14275741577148438, -0.13571929931640625, -0.12868118286132812, -0.12164306640625, -0.11460494995117188, -0.10756683349609375, -0.10052871704101562, -0.0934906005859375, -0.08645248413085938, -0.07941436767578125, -0.07237625122070312, -0.065338134765625, -0.058300018310546875, -0.05126190185546875, -0.044223785400390625, -0.0371856689453125, -0.030147552490234375, -0.02310943603515625, -0.016071319580078125, -0.009033203125, -0.001995086669921875, 0.00504302978515625, 0.012081146240234375, 0.0191192626953125, 0.026157379150390625, 0.03319549560546875, 0.040233612060546875, 0.047271728515625, 0.054309844970703125, 0.06134796142578125, 0.06838607788085938, 0.0754241943359375, 0.08246231079101562, 0.08950042724609375, 0.09653854370117188, 0.10357666015625, 0.11061477661132812, 0.11765289306640625, 0.12469100952148438, 0.1317291259765625, 0.13876724243164062, 0.14580535888671875, 0.15284347534179688, 0.159881591796875, 0.16691970825195312, 0.17395782470703125, 0.18099594116210938, 0.1880340576171875, 0.19507217407226562, 0.20211029052734375, 0.20914840698242188, 0.2161865234375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 2.0, 1.0, 6.0, 9.0, 7.0, 8.0, 11.0, 10.0, 16.0, 11.0, 21.0, 19.0, 34.0, 28.0, 30.0, 24.0, 31.0, 39.0, 45.0, 49.0, 44.0, 38.0, 34.0, 53.0, 45.0, 42.0, 29.0, 36.0, 28.0, 33.0, 39.0, 29.0, 21.0, 24.0, 27.0, 14.0, 10.0, 13.0, 9.0, 11.0, 5.0, 5.0, 0.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1312255859375, -0.1269989013671875, -0.122772216796875, -0.1185455322265625, -0.11431884765625, -0.1100921630859375, -0.105865478515625, -0.1016387939453125, -0.097412109375, -0.0931854248046875, -0.088958740234375, -0.0847320556640625, -0.08050537109375, -0.0762786865234375, -0.072052001953125, -0.0678253173828125, -0.0635986328125, -0.0593719482421875, -0.055145263671875, -0.0509185791015625, -0.04669189453125, -0.0424652099609375, -0.038238525390625, -0.0340118408203125, -0.02978515625, -0.0255584716796875, -0.021331787109375, -0.0171051025390625, -0.01287841796875, -0.0086517333984375, -0.004425048828125, -0.0001983642578125, 0.0040283203125, 0.0082550048828125, 0.012481689453125, 0.0167083740234375, 0.02093505859375, 0.0251617431640625, 0.029388427734375, 0.0336151123046875, 0.037841796875, 0.0420684814453125, 0.046295166015625, 0.0505218505859375, 0.05474853515625, 0.0589752197265625, 0.063201904296875, 0.0674285888671875, 0.0716552734375, 0.0758819580078125, 0.080108642578125, 0.0843353271484375, 0.08856201171875, 0.0927886962890625, 0.097015380859375, 0.1012420654296875, 0.10546875, 0.1096954345703125, 0.113922119140625, 0.1181488037109375, 0.12237548828125, 0.1266021728515625, 0.130828857421875, 0.1350555419921875, 0.1392822265625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 4.0, 1.0, 3.0, 10.0, 12.0, 21.0, 25.0, 43.0, 74.0, 91.0, 174.0, 251.0, 440.0, 677.0, 1395.0, 2864.0, 6690.0, 17253.0, 48316.0, 131475.0, 274093.0, 301540.0, 163548.0, 61730.0, 22124.0, 8389.0, 3504.0, 1700.0, 852.0, 488.0, 287.0, 177.0, 98.0, 70.0, 47.0, 19.0, 24.0, 16.0, 14.0, 4.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03350830078125, -0.03235769271850586, -0.03120708465576172, -0.030056476593017578, -0.028905868530273438, -0.027755260467529297, -0.026604652404785156, -0.025454044342041016, -0.024303436279296875, -0.023152828216552734, -0.022002220153808594, -0.020851612091064453, -0.019701004028320312, -0.018550395965576172, -0.01739978790283203, -0.01624917984008789, -0.01509857177734375, -0.01394796371459961, -0.012797355651855469, -0.011646747589111328, -0.010496139526367188, -0.009345531463623047, -0.008194923400878906, -0.007044315338134766, -0.005893707275390625, -0.004743099212646484, -0.0035924911499023438, -0.002441883087158203, -0.0012912750244140625, -0.00014066696166992188, 0.0010099411010742188, 0.0021605491638183594, 0.0033111572265625, 0.004461765289306641, 0.005612373352050781, 0.006762981414794922, 0.007913589477539062, 0.009064197540283203, 0.010214805603027344, 0.011365413665771484, 0.012516021728515625, 0.013666629791259766, 0.014817237854003906, 0.015967845916748047, 0.017118453979492188, 0.018269062042236328, 0.01941967010498047, 0.02057027816772461, 0.02172088623046875, 0.02287149429321289, 0.02402210235595703, 0.025172710418701172, 0.026323318481445312, 0.027473926544189453, 0.028624534606933594, 0.029775142669677734, 0.030925750732421875, 0.032076358795166016, 0.033226966857910156, 0.0343775749206543, 0.03552818298339844, 0.03667879104614258, 0.03782939910888672, 0.03898000717163086, 0.040130615234375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 8.0, 7.0, 11.0, 9.0, 8.0, 6.0, 19.0, 24.0, 21.0, 18.0, 42.0, 33.0, 33.0, 44.0, 37.0, 64.0, 69.0, 51.0, 58.0, 60.0, 30.0, 51.0, 48.0, 37.0, 46.0, 34.0, 23.0, 15.0, 22.0, 9.0, 13.0, 6.0, 5.0, 9.0, 8.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.3909759521484375e-06, -7.1721151471138e-06, -6.953254342079163e-06, -6.734393537044525e-06, -6.515532732009888e-06, -6.29667192697525e-06, -6.077811121940613e-06, -5.858950316905975e-06, -5.640089511871338e-06, -5.4212287068367004e-06, -5.202367901802063e-06, -4.9835070967674255e-06, -4.764646291732788e-06, -4.545785486698151e-06, -4.326924681663513e-06, -4.108063876628876e-06, -3.889203071594238e-06, -3.670342266559601e-06, -3.4514814615249634e-06, -3.232620656490326e-06, -3.0137598514556885e-06, -2.794899046421051e-06, -2.5760382413864136e-06, -2.357177436351776e-06, -2.1383166313171387e-06, -1.9194558262825012e-06, -1.7005950212478638e-06, -1.4817342162132263e-06, -1.2628734111785889e-06, -1.0440126061439514e-06, -8.25151801109314e-07, -6.062909960746765e-07, -3.8743019104003906e-07, -1.685693860054016e-07, 5.029141902923584e-08, 2.691522240638733e-07, 4.880130290985107e-07, 7.068738341331482e-07, 9.257346391677856e-07, 1.144595444202423e-06, 1.3634562492370605e-06, 1.582317054271698e-06, 1.8011778593063354e-06, 2.020038664340973e-06, 2.2388994693756104e-06, 2.457760274410248e-06, 2.6766210794448853e-06, 2.8954818844795227e-06, 3.11434268951416e-06, 3.3332034945487976e-06, 3.552064299583435e-06, 3.7709251046180725e-06, 3.98978590965271e-06, 4.208646714687347e-06, 4.427507519721985e-06, 4.646368324756622e-06, 4.86522912979126e-06, 5.084089934825897e-06, 5.302950739860535e-06, 5.521811544895172e-06, 5.7406723499298096e-06, 5.959533154964447e-06, 6.1783939599990845e-06, 6.397254765033722e-06, 6.616115570068359e-06]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 7.0, 8.0, 6.0, 8.0, 24.0, 27.0, 36.0, 48.0, 67.0, 131.0, 233.0, 520.0, 1098.0, 2908.0, 8565.0, 30747.0, 114980.0, 317440.0, 358420.0, 153196.0, 42245.0, 11497.0, 3656.0, 1378.0, 575.0, 297.0, 164.0, 82.0, 58.0, 47.0, 26.0, 17.0, 21.0, 10.0, 7.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043609619140625, -0.042208194732666016, -0.04080677032470703, -0.03940534591674805, -0.03800392150878906, -0.03660249710083008, -0.035201072692871094, -0.03379964828491211, -0.032398223876953125, -0.03099679946899414, -0.029595375061035156, -0.028193950653076172, -0.026792526245117188, -0.025391101837158203, -0.02398967742919922, -0.022588253021240234, -0.02118682861328125, -0.019785404205322266, -0.01838397979736328, -0.016982555389404297, -0.015581130981445312, -0.014179706573486328, -0.012778282165527344, -0.01137685775756836, -0.009975433349609375, -0.00857400894165039, -0.007172584533691406, -0.005771160125732422, -0.0043697357177734375, -0.002968311309814453, -0.0015668869018554688, -0.00016546249389648438, 0.0012359619140625, 0.0026373863220214844, 0.004038810729980469, 0.005440235137939453, 0.0068416595458984375, 0.008243083953857422, 0.009644508361816406, 0.01104593276977539, 0.012447357177734375, 0.01384878158569336, 0.015250205993652344, 0.016651630401611328, 0.018053054809570312, 0.019454479217529297, 0.02085590362548828, 0.022257328033447266, 0.02365875244140625, 0.025060176849365234, 0.02646160125732422, 0.027863025665283203, 0.029264450073242188, 0.030665874481201172, 0.032067298889160156, 0.03346872329711914, 0.034870147705078125, 0.03627157211303711, 0.037672996520996094, 0.03907442092895508, 0.04047584533691406, 0.04187726974487305, 0.04327869415283203, 0.044680118560791016, 0.04608154296875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 7.0, 8.0, 16.0, 20.0, 22.0, 28.0, 27.0, 32.0, 42.0, 50.0, 54.0, 53.0, 62.0, 69.0, 66.0, 73.0, 50.0, 67.0, 56.0, 51.0, 29.0, 22.0, 18.0, 20.0, 13.0, 14.0, 7.0, 6.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0281524658203125, -0.027207136154174805, -0.02626180648803711, -0.025316476821899414, -0.02437114715576172, -0.023425817489624023, -0.022480487823486328, -0.021535158157348633, -0.020589828491210938, -0.019644498825073242, -0.018699169158935547, -0.01775383949279785, -0.016808509826660156, -0.01586318016052246, -0.014917850494384766, -0.01397252082824707, -0.013027191162109375, -0.01208186149597168, -0.011136531829833984, -0.010191202163696289, -0.009245872497558594, -0.008300542831420898, -0.007355213165283203, -0.006409883499145508, -0.0054645538330078125, -0.004519224166870117, -0.003573894500732422, -0.0026285648345947266, -0.0016832351684570312, -0.0007379055023193359, 0.00020742416381835938, 0.0011527538299560547, 0.00209808349609375, 0.0030434131622314453, 0.003988742828369141, 0.004934072494506836, 0.005879402160644531, 0.0068247318267822266, 0.007770061492919922, 0.008715391159057617, 0.009660720825195312, 0.010606050491333008, 0.011551380157470703, 0.012496709823608398, 0.013442039489746094, 0.014387369155883789, 0.015332698822021484, 0.01627802848815918, 0.017223358154296875, 0.01816868782043457, 0.019114017486572266, 0.02005934715270996, 0.021004676818847656, 0.02195000648498535, 0.022895336151123047, 0.023840665817260742, 0.024785995483398438, 0.025731325149536133, 0.026676654815673828, 0.027621984481811523, 0.02856731414794922, 0.029512643814086914, 0.03045797348022461, 0.031403303146362305, 0.0323486328125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 18.0, 80.0, 572.0, 303.0, 25.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6038464307785034, -1.5304702520370483, -1.4570940732955933, -1.3837178945541382, -1.310341715812683, -1.236965537071228, -1.1635892391204834, -1.0902130603790283, -1.0168368816375732, -0.9434607028961182, -0.8700845241546631, -0.796708345413208, -0.7233321666717529, -0.6499559879302979, -0.576579749584198, -0.5032035708427429, -0.4298274517059326, -0.35645127296447754, -0.28307509422302246, -0.209698885679245, -0.13632270693778992, -0.06294652819633484, 0.010429680347442627, 0.0838058590888977, 0.15718203783035278, 0.23055821657180786, 0.30393439531326294, 0.3773106038570404, 0.4506867825984955, 0.524062991142273, 0.597439169883728, 0.6708153486251831, 0.7441916465759277, 0.8175678253173828, 0.8909440040588379, 0.964320182800293, 1.037696361541748, 1.1110725402832031, 1.1844487190246582, 1.2578248977661133, 1.3312010765075684, 1.4045772552490234, 1.4779534339904785, 1.5513296127319336, 1.6247057914733887, 1.6980819702148438, 1.7714581489562988, 1.844834327697754, 1.9182106256484985, 1.9915868043899536, 2.0649631023406982, 2.1383392810821533, 2.2117154598236084, 2.2850916385650635, 2.3584678173065186, 2.4318439960479736, 2.5052201747894287, 2.578596353530884, 2.651972532272339, 2.725348711013794, 2.798724889755249, 2.872101068496704, 2.945477247238159, 3.0188534259796143, 3.0922296047210693]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 5.0, 6.0, 6.0, 10.0, 9.0, 17.0, 16.0, 14.0, 19.0, 20.0, 33.0, 36.0, 25.0, 41.0, 40.0, 57.0, 47.0, 51.0, 48.0, 45.0, 44.0, 32.0, 52.0, 34.0, 35.0, 30.0, 34.0, 28.0, 26.0, 19.0, 19.0, 24.0, 12.0, 15.0, 9.0, 15.0, 4.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.48203420639038086, -0.4675138294696808, -0.4529934525489807, -0.43847307562828064, -0.42395269870758057, -0.4094323515892029, -0.3949119746685028, -0.38039159774780273, -0.36587122082710266, -0.3513508439064026, -0.3368304669857025, -0.32231009006500244, -0.30778974294662476, -0.2932693362236023, -0.2787489891052246, -0.26422861218452454, -0.24970823526382446, -0.2351878583431244, -0.22066748142242432, -0.20614711940288544, -0.19162674248218536, -0.1771063655614853, -0.1625860035419464, -0.14806562662124634, -0.13354524970054626, -0.11902487277984619, -0.10450450330972672, -0.08998413383960724, -0.07546375691890717, -0.06094337999820709, -0.046423010528087616, -0.03190264105796814, -0.017382264137268066, -0.0028618909418582916, 0.011658482253551483, 0.026178855448961258, 0.04069922864437103, 0.055219605565071106, 0.06973997503519058, 0.08426034450531006, 0.09878072142601013, 0.1133010983467102, 0.12782147526741028, 0.14234183728694916, 0.15686221420764923, 0.1713825911283493, 0.18590295314788818, 0.20042333006858826, 0.21494370698928833, 0.2294640839099884, 0.24398446083068848, 0.25850483775138855, 0.2730252146720886, 0.2875455617904663, 0.3020659387111664, 0.31658631563186646, 0.33110669255256653, 0.3456270694732666, 0.3601474463939667, 0.37466782331466675, 0.38918817043304443, 0.4037085771560669, 0.4182289242744446, 0.43274930119514465, 0.4472696781158447]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 8.0, 8.0, 11.0, 10.0, 26.0, 35.0, 69.0, 89.0, 142.0, 255.0, 488.0, 837.0, 1677.0, 3259.0, 7110.0, 17336.0, 47803.0, 173721.0, 1084054.0, 2204814.0, 511700.0, 90399.0, 28506.0, 11292.0, 5002.0, 2428.0, 1295.0, 696.0, 452.0, 267.0, 130.0, 114.0, 70.0, 53.0, 32.0, 24.0, 15.0, 14.0, 16.0, 5.0, 7.0, 3.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0997314453125, -0.09654521942138672, -0.09335899353027344, -0.09017276763916016, -0.08698654174804688, -0.0838003158569336, -0.08061408996582031, -0.07742786407470703, -0.07424163818359375, -0.07105541229248047, -0.06786918640136719, -0.0646829605102539, -0.061496734619140625, -0.058310508728027344, -0.05512428283691406, -0.05193805694580078, -0.0487518310546875, -0.04556560516357422, -0.04237937927246094, -0.039193153381347656, -0.036006927490234375, -0.032820701599121094, -0.029634475708007812, -0.02644824981689453, -0.02326202392578125, -0.02007579803466797, -0.016889572143554688, -0.013703346252441406, -0.010517120361328125, -0.007330894470214844, -0.0041446685791015625, -0.0009584426879882812, 0.002227783203125, 0.005414009094238281, 0.008600234985351562, 0.011786460876464844, 0.014972686767578125, 0.018158912658691406, 0.021345138549804688, 0.02453136444091797, 0.02771759033203125, 0.03090381622314453, 0.03409004211425781, 0.037276268005371094, 0.040462493896484375, 0.043648719787597656, 0.04683494567871094, 0.05002117156982422, 0.0532073974609375, 0.05639362335205078, 0.05957984924316406, 0.06276607513427734, 0.06595230102539062, 0.0691385269165039, 0.07232475280761719, 0.07551097869873047, 0.07869720458984375, 0.08188343048095703, 0.08506965637207031, 0.0882558822631836, 0.09144210815429688, 0.09462833404541016, 0.09781455993652344, 0.10100078582763672, 0.10418701171875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 8.0, 11.0, 13.0, 12.0, 23.0, 35.0, 47.0, 52.0, 47.0, 67.0, 71.0, 73.0, 75.0, 69.0, 56.0, 63.0, 58.0, 55.0, 38.0, 25.0, 23.0, 22.0, 18.0, 10.0, 12.0, 4.0, 6.0, 3.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07745361328125, -0.07475948333740234, -0.07206535339355469, -0.06937122344970703, -0.06667709350585938, -0.06398296356201172, -0.06128883361816406, -0.058594703674316406, -0.05590057373046875, -0.053206443786621094, -0.05051231384277344, -0.04781818389892578, -0.045124053955078125, -0.04242992401123047, -0.03973579406738281, -0.037041664123535156, -0.0343475341796875, -0.031653404235839844, -0.028959274291992188, -0.02626514434814453, -0.023571014404296875, -0.02087688446044922, -0.018182754516601562, -0.015488624572753906, -0.01279449462890625, -0.010100364685058594, -0.0074062347412109375, -0.004712104797363281, -0.002017974853515625, 0.0006761550903320312, 0.0033702850341796875, 0.006064414978027344, 0.008758544921875, 0.011452674865722656, 0.014146804809570312, 0.01684093475341797, 0.019535064697265625, 0.02222919464111328, 0.024923324584960938, 0.027617454528808594, 0.03031158447265625, 0.033005714416503906, 0.03569984436035156, 0.03839397430419922, 0.041088104248046875, 0.04378223419189453, 0.04647636413574219, 0.049170494079589844, 0.0518646240234375, 0.054558753967285156, 0.05725288391113281, 0.05994701385498047, 0.06264114379882812, 0.06533527374267578, 0.06802940368652344, 0.0707235336303711, 0.07341766357421875, 0.0761117935180664, 0.07880592346191406, 0.08150005340576172, 0.08419418334960938, 0.08688831329345703, 0.08958244323730469, 0.09227657318115234, 0.094970703125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 8.0, 14.0, 23.0, 18.0, 32.0, 34.0, 44.0, 89.0, 126.0, 220.0, 596.0, 2107.0, 24687.0, 3174840.0, 977582.0, 11402.0, 1478.0, 445.0, 213.0, 100.0, 68.0, 47.0, 35.0, 16.0, 20.0, 10.0, 7.0, 4.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3447265625, -0.3327903747558594, -0.32085418701171875, -0.3089179992675781, -0.2969818115234375, -0.2850456237792969, -0.27310943603515625, -0.2611732482910156, -0.249237060546875, -0.23730087280273438, -0.22536468505859375, -0.21342849731445312, -0.2014923095703125, -0.18955612182617188, -0.17761993408203125, -0.16568374633789062, -0.15374755859375, -0.14181137084960938, -0.12987518310546875, -0.11793899536132812, -0.1060028076171875, -0.09406661987304688, -0.08213043212890625, -0.07019424438476562, -0.058258056640625, -0.046321868896484375, -0.03438568115234375, -0.022449493408203125, -0.0105133056640625, 0.001422882080078125, 0.01335906982421875, 0.025295257568359375, 0.0372314453125, 0.049167633056640625, 0.06110382080078125, 0.07304000854492188, 0.0849761962890625, 0.09691238403320312, 0.10884857177734375, 0.12078475952148438, 0.132720947265625, 0.14465713500976562, 0.15659332275390625, 0.16852951049804688, 0.1804656982421875, 0.19240188598632812, 0.20433807373046875, 0.21627426147460938, 0.22821044921875, 0.24014663696289062, 0.25208282470703125, 0.2640190124511719, 0.2759552001953125, 0.2878913879394531, 0.29982757568359375, 0.3117637634277344, 0.323699951171875, 0.3356361389160156, 0.34757232666015625, 0.3595085144042969, 0.3714447021484375, 0.3833808898925781, 0.39531707763671875, 0.4072532653808594, 0.419189453125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 9.0, 9.0, 3.0, 9.0, 22.0, 25.0, 33.0, 53.0, 66.0, 92.0, 152.0, 241.0, 360.0, 592.0, 635.0, 608.0, 388.0, 237.0, 153.0, 110.0, 73.0, 47.0, 38.0, 38.0, 30.0, 14.0, 13.0, 8.0, 10.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14453125, -0.14057350158691406, -0.13661575317382812, -0.1326580047607422, -0.12870025634765625, -0.12474250793457031, -0.12078475952148438, -0.11682701110839844, -0.1128692626953125, -0.10891151428222656, -0.10495376586914062, -0.10099601745605469, -0.09703826904296875, -0.09308052062988281, -0.08912277221679688, -0.08516502380371094, -0.081207275390625, -0.07724952697753906, -0.07329177856445312, -0.06933403015136719, -0.06537628173828125, -0.06141853332519531, -0.057460784912109375, -0.05350303649902344, -0.0495452880859375, -0.04558753967285156, -0.041629791259765625, -0.03767204284667969, -0.03371429443359375, -0.029756546020507812, -0.025798797607421875, -0.021841049194335938, -0.01788330078125, -0.013925552368164062, -0.009967803955078125, -0.0060100555419921875, -0.00205230712890625, 0.0019054412841796875, 0.005863189697265625, 0.009820938110351562, 0.0137786865234375, 0.017736434936523438, 0.021694183349609375, 0.025651931762695312, 0.02960968017578125, 0.03356742858886719, 0.037525177001953125, 0.04148292541503906, 0.045440673828125, 0.04939842224121094, 0.053356170654296875, 0.05731391906738281, 0.06127166748046875, 0.06522941589355469, 0.06918716430664062, 0.07314491271972656, 0.0771026611328125, 0.08106040954589844, 0.08501815795898438, 0.08897590637207031, 0.09293365478515625, 0.09689140319824219, 0.10084915161132812, 0.10480690002441406, 0.1087646484375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 11.0, 26.0, 80.0, 211.0, 281.0, 230.0, 101.0, 29.0, 14.0, 7.0, 7.0, 5.0, 3.0, 0.0, 2.0, 1.0], "bins": [-1.9772794246673584, -1.9394958019256592, -1.9017120599746704, -1.8639284372329712, -1.8261446952819824, -1.7883610725402832, -1.7505773305892944, -1.7127937078475952, -1.6750099658966064, -1.6372263431549072, -1.5994426012039185, -1.5616589784622192, -1.5238752365112305, -1.4860916137695312, -1.4483078718185425, -1.4105242490768433, -1.3727405071258545, -1.3349568843841553, -1.2971731424331665, -1.2593895196914673, -1.2216057777404785, -1.1838221549987793, -1.1460384130477905, -1.1082547903060913, -1.070471167564392, -1.0326875448226929, -0.9949038028717041, -0.9571201205253601, -0.9193364381790161, -0.8815527558326721, -0.8437690734863281, -0.8059854507446289, -0.7682017683982849, -0.7304180860519409, -0.6926344037055969, -0.6548507213592529, -0.6170670390129089, -0.5792833566665649, -0.5414997339248657, -0.503715991973877, -0.46593233942985535, -0.42814865708351135, -0.39036497473716736, -0.35258132219314575, -0.31479763984680176, -0.27701395750045776, -0.23923027515411377, -0.20144659280776978, -0.16366291046142578, -0.1258792281150818, -0.08809555321931839, -0.05031187832355499, -0.012528195977210999, 0.025255486369132996, 0.0630391538143158, 0.10082283616065979, 0.13860651850700378, 0.17639020085334778, 0.21417388319969177, 0.2519575357437134, 0.2897412180900574, 0.32752490043640137, 0.36530858278274536, 0.40309226512908936, 0.44087594747543335]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 3.0, 4.0, 10.0, 9.0, 11.0, 8.0, 13.0, 13.0, 24.0, 15.0, 18.0, 24.0, 37.0, 48.0, 35.0, 36.0, 34.0, 38.0, 36.0, 38.0, 43.0, 54.0, 47.0, 40.0, 38.0, 41.0, 35.0, 42.0, 20.0, 42.0, 32.0, 24.0, 17.0, 8.0, 12.0, 8.0, 16.0, 6.0, 6.0, 3.0, 2.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.41162818670272827, -0.4003381133079529, -0.3890480101108551, -0.3777579367160797, -0.3664678633213043, -0.35517776012420654, -0.34388768672943115, -0.33259761333465576, -0.321307510137558, -0.3100174367427826, -0.2987273335456848, -0.2874372601509094, -0.27614718675613403, -0.26485708355903625, -0.25356701016426086, -0.24227692186832428, -0.2309868484735489, -0.2196967601776123, -0.20840668678283691, -0.19711659848690033, -0.18582651019096375, -0.17453643679618835, -0.16324634850025177, -0.15195626020431519, -0.1406661868095398, -0.1293760985136032, -0.11808601766824722, -0.10679593682289124, -0.09550584852695465, -0.08421576768159866, -0.07292568683624268, -0.06163559854030609, -0.05034551024436951, -0.03905542567372322, -0.027765342965722084, -0.016475260257720947, -0.005185175687074661, 0.006104908883571625, 0.017394989728927612, 0.028685078024864197, 0.039975158870220184, 0.05126524344086647, 0.06255532801151276, 0.07384540885686874, 0.08513548970222473, 0.09642557799816132, 0.1077156588435173, 0.11900574713945389, 0.13029582798480988, 0.14158591628074646, 0.15287598967552185, 0.16416607797145844, 0.17545616626739502, 0.1867462396621704, 0.198036327958107, 0.20932641625404358, 0.22061648964881897, 0.23190657794475555, 0.24319665133953094, 0.25448673963546753, 0.2657768130302429, 0.2770669162273407, 0.2883569896221161, 0.29964709281921387, 0.31093716621398926]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 2.0, 3.0, 11.0, 14.0, 20.0, 18.0, 39.0, 61.0, 76.0, 129.0, 217.0, 379.0, 568.0, 1126.0, 2317.0, 5099.0, 12617.0, 35594.0, 109705.0, 299995.0, 352434.0, 150102.0, 48675.0, 17107.0, 6268.0, 2785.0, 1337.0, 782.0, 406.0, 252.0, 140.0, 72.0, 69.0, 38.0, 31.0, 23.0, 15.0, 18.0, 3.0, 4.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1541748046875, -0.14905929565429688, -0.14394378662109375, -0.13882827758789062, -0.1337127685546875, -0.12859725952148438, -0.12348175048828125, -0.11836624145507812, -0.113250732421875, -0.10813522338867188, -0.10301971435546875, -0.09790420532226562, -0.0927886962890625, -0.08767318725585938, -0.08255767822265625, -0.07744216918945312, -0.07232666015625, -0.06721115112304688, -0.06209564208984375, -0.056980133056640625, -0.0518646240234375, -0.046749114990234375, -0.04163360595703125, -0.036518096923828125, -0.031402587890625, -0.026287078857421875, -0.02117156982421875, -0.016056060791015625, -0.0109405517578125, -0.005825042724609375, -0.00070953369140625, 0.004405975341796875, 0.009521484375, 0.014636993408203125, 0.01975250244140625, 0.024868011474609375, 0.0299835205078125, 0.035099029541015625, 0.04021453857421875, 0.045330047607421875, 0.050445556640625, 0.055561065673828125, 0.06067657470703125, 0.06579208374023438, 0.0709075927734375, 0.07602310180664062, 0.08113861083984375, 0.08625411987304688, 0.09136962890625, 0.09648513793945312, 0.10160064697265625, 0.10671615600585938, 0.1118316650390625, 0.11694717407226562, 0.12206268310546875, 0.12717819213867188, 0.132293701171875, 0.13740921020507812, 0.14252471923828125, 0.14764022827148438, 0.1527557373046875, 0.15787124633789062, 0.16298675537109375, 0.16810226440429688, 0.1732177734375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 8.0, 9.0, 27.0, 22.0, 32.0, 39.0, 57.0, 49.0, 63.0, 66.0, 84.0, 74.0, 68.0, 83.0, 64.0, 63.0, 56.0, 34.0, 27.0, 20.0, 22.0, 14.0, 5.0, 4.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08087158203125, -0.07813072204589844, -0.07538986206054688, -0.07264900207519531, -0.06990814208984375, -0.06716728210449219, -0.06442642211914062, -0.06168556213378906, -0.0589447021484375, -0.05620384216308594, -0.053462982177734375, -0.05072212219238281, -0.04798126220703125, -0.04524040222167969, -0.042499542236328125, -0.03975868225097656, -0.037017822265625, -0.03427696228027344, -0.031536102294921875, -0.028795242309570312, -0.02605438232421875, -0.023313522338867188, -0.020572662353515625, -0.017831802368164062, -0.0150909423828125, -0.012350082397460938, -0.009609222412109375, -0.0068683624267578125, -0.00412750244140625, -0.0013866424560546875, 0.001354217529296875, 0.0040950775146484375, 0.0068359375, 0.009576797485351562, 0.012317657470703125, 0.015058517456054688, 0.01779937744140625, 0.020540237426757812, 0.023281097412109375, 0.026021957397460938, 0.0287628173828125, 0.03150367736816406, 0.034244537353515625, 0.03698539733886719, 0.03972625732421875, 0.04246711730957031, 0.045207977294921875, 0.04794883728027344, 0.050689697265625, 0.05343055725097656, 0.056171417236328125, 0.05891227722167969, 0.06165313720703125, 0.06439399719238281, 0.06713485717773438, 0.06987571716308594, 0.0726165771484375, 0.07535743713378906, 0.07809829711914062, 0.08083915710449219, 0.08358001708984375, 0.08632087707519531, 0.08906173706054688, 0.09180259704589844, 0.09454345703125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 10.0, 10.0, 8.0, 9.0, 21.0, 27.0, 42.0, 61.0, 86.0, 142.0, 258.0, 461.0, 941.0, 2320.0, 7897.0, 37736.0, 227311.0, 566796.0, 166616.0, 27886.0, 6307.0, 1805.0, 820.0, 386.0, 206.0, 109.0, 89.0, 49.0, 29.0, 30.0, 15.0, 16.0, 14.0, 11.0, 10.0, 7.0, 5.0, 5.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2451171875, -0.23819541931152344, -0.23127365112304688, -0.2243518829345703, -0.21743011474609375, -0.2105083465576172, -0.20358657836914062, -0.19666481018066406, -0.1897430419921875, -0.18282127380371094, -0.17589950561523438, -0.1689777374267578, -0.16205596923828125, -0.1551342010498047, -0.14821243286132812, -0.14129066467285156, -0.134368896484375, -0.12744712829589844, -0.12052536010742188, -0.11360359191894531, -0.10668182373046875, -0.09976005554199219, -0.09283828735351562, -0.08591651916503906, -0.0789947509765625, -0.07207298278808594, -0.06515121459960938, -0.05822944641113281, -0.05130767822265625, -0.04438591003417969, -0.037464141845703125, -0.030542373657226562, -0.02362060546875, -0.016698837280273438, -0.009777069091796875, -0.0028553009033203125, 0.00406646728515625, 0.010988235473632812, 0.017910003662109375, 0.024831771850585938, 0.0317535400390625, 0.03867530822753906, 0.045597076416015625, 0.05251884460449219, 0.05944061279296875, 0.06636238098144531, 0.07328414916992188, 0.08020591735839844, 0.087127685546875, 0.09404945373535156, 0.10097122192382812, 0.10789299011230469, 0.11481475830078125, 0.12173652648925781, 0.12865829467773438, 0.13558006286621094, 0.1425018310546875, 0.14942359924316406, 0.15634536743164062, 0.1632671356201172, 0.17018890380859375, 0.1771106719970703, 0.18403244018554688, 0.19095420837402344, 0.1978759765625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 4.0, 4.0, 12.0, 10.0, 10.0, 11.0, 14.0, 11.0, 23.0, 16.0, 31.0, 23.0, 24.0, 40.0, 28.0, 39.0, 30.0, 50.0, 41.0, 55.0, 40.0, 44.0, 44.0, 43.0, 48.0, 30.0, 47.0, 43.0, 32.0, 32.0, 30.0, 21.0, 21.0, 15.0, 7.0, 9.0, 5.0, 8.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1280517578125, -0.12350654602050781, -0.11896133422851562, -0.11441612243652344, -0.10987091064453125, -0.10532569885253906, -0.10078048706054688, -0.09623527526855469, -0.0916900634765625, -0.08714485168457031, -0.08259963989257812, -0.07805442810058594, -0.07350921630859375, -0.06896400451660156, -0.06441879272460938, -0.05987358093261719, -0.055328369140625, -0.05078315734863281, -0.046237945556640625, -0.04169273376464844, -0.03714752197265625, -0.03260231018066406, -0.028057098388671875, -0.023511886596679688, -0.0189666748046875, -0.014421463012695312, -0.009876251220703125, -0.0053310394287109375, -0.00078582763671875, 0.0037593841552734375, 0.008304595947265625, 0.012849807739257812, 0.01739501953125, 0.021940231323242188, 0.026485443115234375, 0.031030654907226562, 0.03557586669921875, 0.04012107849121094, 0.044666290283203125, 0.04921150207519531, 0.0537567138671875, 0.05830192565917969, 0.06284713745117188, 0.06739234924316406, 0.07193756103515625, 0.07648277282714844, 0.08102798461914062, 0.08557319641113281, 0.090118408203125, 0.09466361999511719, 0.09920883178710938, 0.10375404357910156, 0.10829925537109375, 0.11284446716308594, 0.11738967895507812, 0.12193489074707031, 0.1264801025390625, 0.1310253143310547, 0.13557052612304688, 0.14011573791503906, 0.14466094970703125, 0.14920616149902344, 0.15375137329101562, 0.1582965850830078, 0.162841796875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 10.0, 6.0, 10.0, 20.0, 30.0, 44.0, 60.0, 119.0, 175.0, 322.0, 674.0, 1575.0, 4150.0, 12834.0, 51686.0, 253220.0, 492821.0, 179428.0, 36108.0, 9459.0, 3267.0, 1257.0, 551.0, 293.0, 161.0, 85.0, 74.0, 43.0, 23.0, 17.0, 6.0, 9.0, 8.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049224853515625, -0.04728555679321289, -0.04534626007080078, -0.04340696334838867, -0.04146766662597656, -0.03952836990356445, -0.037589073181152344, -0.035649776458740234, -0.033710479736328125, -0.031771183013916016, -0.029831886291503906, -0.027892589569091797, -0.025953292846679688, -0.024013996124267578, -0.02207469940185547, -0.02013540267944336, -0.01819610595703125, -0.01625680923461914, -0.014317512512207031, -0.012378215789794922, -0.010438919067382812, -0.008499622344970703, -0.006560325622558594, -0.004621028900146484, -0.002681732177734375, -0.0007424354553222656, 0.0011968612670898438, 0.003136157989501953, 0.0050754547119140625, 0.007014751434326172, 0.008954048156738281, 0.01089334487915039, 0.0128326416015625, 0.01477193832397461, 0.01671123504638672, 0.018650531768798828, 0.020589828491210938, 0.022529125213623047, 0.024468421936035156, 0.026407718658447266, 0.028347015380859375, 0.030286312103271484, 0.032225608825683594, 0.0341649055480957, 0.03610420227050781, 0.03804349899291992, 0.03998279571533203, 0.04192209243774414, 0.04386138916015625, 0.04580068588256836, 0.04773998260498047, 0.04967927932739258, 0.05161857604980469, 0.0535578727722168, 0.055497169494628906, 0.057436466217041016, 0.059375762939453125, 0.061315059661865234, 0.06325435638427734, 0.06519365310668945, 0.06713294982910156, 0.06907224655151367, 0.07101154327392578, 0.07295083999633789, 0.07489013671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 8.0, 7.0, 15.0, 15.0, 22.0, 21.0, 35.0, 59.0, 35.0, 67.0, 85.0, 73.0, 96.0, 94.0, 55.0, 58.0, 49.0, 55.0, 32.0, 23.0, 26.0, 16.0, 9.0, 10.0, 5.0, 5.0, 7.0, 1.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.1563301086425781e-05, -1.1227093636989594e-05, -1.0890886187553406e-05, -1.0554678738117218e-05, -1.021847128868103e-05, -9.882263839244843e-06, -9.546056389808655e-06, -9.209848940372467e-06, -8.87364149093628e-06, -8.537434041500092e-06, -8.201226592063904e-06, -7.865019142627716e-06, -7.528811693191528e-06, -7.1926042437553406e-06, -6.856396794319153e-06, -6.520189344882965e-06, -6.183981895446777e-06, -5.84777444601059e-06, -5.511566996574402e-06, -5.175359547138214e-06, -4.839152097702026e-06, -4.502944648265839e-06, -4.166737198829651e-06, -3.830529749393463e-06, -3.4943222999572754e-06, -3.1581148505210876e-06, -2.8219074010849e-06, -2.485699951648712e-06, -2.1494925022125244e-06, -1.8132850527763367e-06, -1.477077603340149e-06, -1.1408701539039612e-06, -8.046627044677734e-07, -4.684552550315857e-07, -1.3224780559539795e-07, 2.039596438407898e-07, 5.401670932769775e-07, 8.763745427131653e-07, 1.212581992149353e-06, 1.5487894415855408e-06, 1.8849968910217285e-06, 2.2212043404579163e-06, 2.557411789894104e-06, 2.8936192393302917e-06, 3.2298266887664795e-06, 3.5660341382026672e-06, 3.902241587638855e-06, 4.238449037075043e-06, 4.5746564865112305e-06, 4.910863935947418e-06, 5.247071385383606e-06, 5.583278834819794e-06, 5.9194862842559814e-06, 6.255693733692169e-06, 6.591901183128357e-06, 6.928108632564545e-06, 7.264316082000732e-06, 7.60052353143692e-06, 7.936730980873108e-06, 8.272938430309296e-06, 8.609145879745483e-06, 8.945353329181671e-06, 9.281560778617859e-06, 9.617768228054047e-06, 9.953975677490234e-06]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 11.0, 18.0, 31.0, 28.0, 67.0, 125.0, 211.0, 474.0, 1260.0, 3626.0, 15060.0, 98765.0, 585607.0, 296878.0, 35625.0, 7302.0, 1989.0, 742.0, 338.0, 168.0, 86.0, 55.0, 40.0, 21.0, 7.0, 7.0, 6.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06793212890625, -0.06529426574707031, -0.06265640258789062, -0.06001853942871094, -0.05738067626953125, -0.05474281311035156, -0.052104949951171875, -0.04946708679199219, -0.0468292236328125, -0.04419136047363281, -0.041553497314453125, -0.03891563415527344, -0.03627777099609375, -0.03363990783691406, -0.031002044677734375, -0.028364181518554688, -0.025726318359375, -0.023088455200195312, -0.020450592041015625, -0.017812728881835938, -0.01517486572265625, -0.012537002563476562, -0.009899139404296875, -0.0072612762451171875, -0.0046234130859375, -0.0019855499267578125, 0.000652313232421875, 0.0032901763916015625, 0.00592803955078125, 0.008565902709960938, 0.011203765869140625, 0.013841629028320312, 0.0164794921875, 0.019117355346679688, 0.021755218505859375, 0.024393081665039062, 0.02703094482421875, 0.029668807983398438, 0.032306671142578125, 0.03494453430175781, 0.0375823974609375, 0.04022026062011719, 0.042858123779296875, 0.04549598693847656, 0.04813385009765625, 0.05077171325683594, 0.053409576416015625, 0.05604743957519531, 0.058685302734375, 0.06132316589355469, 0.06396102905273438, 0.06659889221191406, 0.06923675537109375, 0.07187461853027344, 0.07451248168945312, 0.07715034484863281, 0.0797882080078125, 0.08242607116699219, 0.08506393432617188, 0.08770179748535156, 0.09033966064453125, 0.09297752380371094, 0.09561538696289062, 0.09825325012207031, 0.10089111328125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 3.0, 6.0, 5.0, 6.0, 9.0, 8.0, 16.0, 17.0, 22.0, 19.0, 32.0, 39.0, 38.0, 66.0, 64.0, 66.0, 75.0, 71.0, 67.0, 62.0, 73.0, 36.0, 38.0, 42.0, 31.0, 23.0, 7.0, 14.0, 16.0, 13.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.04083251953125, -0.03970003128051758, -0.038567543029785156, -0.037435054779052734, -0.03630256652832031, -0.03517007827758789, -0.03403759002685547, -0.03290510177612305, -0.031772613525390625, -0.030640125274658203, -0.02950763702392578, -0.02837514877319336, -0.027242660522460938, -0.026110172271728516, -0.024977684020996094, -0.023845195770263672, -0.02271270751953125, -0.021580219268798828, -0.020447731018066406, -0.019315242767333984, -0.018182754516601562, -0.01705026626586914, -0.01591777801513672, -0.014785289764404297, -0.013652801513671875, -0.012520313262939453, -0.011387825012207031, -0.01025533676147461, -0.009122848510742188, -0.007990360260009766, -0.006857872009277344, -0.005725383758544922, -0.0045928955078125, -0.003460407257080078, -0.0023279190063476562, -0.0011954307556152344, -6.29425048828125e-05, 0.0010695457458496094, 0.0022020339965820312, 0.003334522247314453, 0.004467010498046875, 0.005599498748779297, 0.006731986999511719, 0.00786447525024414, 0.008996963500976562, 0.010129451751708984, 0.011261940002441406, 0.012394428253173828, 0.01352691650390625, 0.014659404754638672, 0.015791893005371094, 0.016924381256103516, 0.018056869506835938, 0.01918935775756836, 0.02032184600830078, 0.021454334259033203, 0.022586822509765625, 0.023719310760498047, 0.02485179901123047, 0.02598428726196289, 0.027116775512695312, 0.028249263763427734, 0.029381752014160156, 0.030514240264892578, 0.031646728515625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 21.0, 64.0, 221.0, 353.0, 221.0, 72.0, 24.0, 9.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.832862138748169, -0.792169988155365, -0.7514777779579163, -0.7107856273651123, -0.6700934171676636, -0.6294012665748596, -0.5887091159820557, -0.5480169057846069, -0.507324755191803, -0.46663257479667664, -0.4259403944015503, -0.38524824380874634, -0.34455606341362, -0.30386388301849365, -0.2631717324256897, -0.22247955203056335, -0.181787371635437, -0.14109519124031067, -0.10040302574634552, -0.059710852801799774, -0.01901867985725403, 0.021673500537872314, 0.06236566603183746, 0.10305783152580261, 0.14375001192092896, 0.1844421923160553, 0.22513435781002045, 0.2658265233039856, 0.30651870369911194, 0.3472108840942383, 0.38790303468704224, 0.4285952150821686, 0.4692875146865845, 0.5099796652793884, 0.5506718754768372, 0.5913640260696411, 0.6320562362670898, 0.6727483868598938, 0.7134405374526978, 0.7541327476501465, 0.7948248982429504, 0.8355170488357544, 0.8762092590332031, 0.9169014096260071, 0.957593560218811, 0.9982857704162598, 1.0389779806137085, 1.0796700716018677, 1.1203622817993164, 1.1610544919967651, 1.2017465829849243, 1.242438793182373, 1.2831310033798218, 1.3238232135772705, 1.3645153045654297, 1.4052075147628784, 1.4458997249603271, 1.4865919351577759, 1.527284026145935, 1.5679762363433838, 1.6086684465408325, 1.6493606567382812, 1.6900527477264404, 1.7307449579238892, 1.7714370489120483]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 8.0, 3.0, 6.0, 13.0, 13.0, 19.0, 20.0, 21.0, 16.0, 21.0, 22.0, 27.0, 19.0, 28.0, 28.0, 27.0, 46.0, 27.0, 42.0, 31.0, 43.0, 37.0, 28.0, 32.0, 41.0, 27.0, 29.0, 38.0, 31.0, 29.0, 25.0, 24.0, 24.0, 18.0, 19.0, 22.0, 17.0, 13.0, 11.0, 13.0, 3.0, 8.0, 0.0, 12.0, 2.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.38854140043258667, -0.376456618309021, -0.3643718361854553, -0.35228705406188965, -0.340202271938324, -0.3281174898147583, -0.3160327076911926, -0.30394789576530457, -0.2918631136417389, -0.2797783315181732, -0.26769354939460754, -0.25560876727104187, -0.243523970246315, -0.23143918812274933, -0.21935440599918365, -0.2072696089744568, -0.1951848417520523, -0.18310005962848663, -0.17101527750492096, -0.1589304804801941, -0.14684569835662842, -0.13476091623306274, -0.12267613410949707, -0.1105913445353508, -0.09850656241178513, -0.08642178028821945, -0.07433699071407318, -0.06225220859050751, -0.050167422741651535, -0.03808263689279556, -0.02599785476922989, -0.013913065195083618, -0.0018282830715179443, 0.010256501846015453, 0.02234128676354885, 0.034426070749759674, 0.046510856598615646, 0.05859564244747162, 0.07068042457103729, 0.08276521414518356, 0.09484999626874924, 0.10693477839231491, 0.11901956796646118, 0.13110435009002686, 0.14318913221359253, 0.1552739143371582, 0.16735869646072388, 0.17944349348545074, 0.19152827560901642, 0.2036130577325821, 0.21569783985614777, 0.22778263688087463, 0.2398674190044403, 0.251952201128006, 0.26403698325157166, 0.27612176537513733, 0.288206547498703, 0.3002913296222687, 0.31237611174583435, 0.3244608938694, 0.3365456759929657, 0.34863048791885376, 0.36071527004241943, 0.3728000521659851, 0.3848848342895508]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 9.0, 10.0, 15.0, 13.0, 24.0, 28.0, 64.0, 88.0, 181.0, 402.0, 872.0, 2465.0, 8177.0, 31018.0, 208813.0, 2474820.0, 1352483.0, 89463.0, 17401.0, 4850.0, 1670.0, 665.0, 308.0, 157.0, 100.0, 70.0, 42.0, 32.0, 24.0, 17.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11865234375, -0.11387252807617188, -0.10909271240234375, -0.10431289672851562, -0.0995330810546875, -0.09475326538085938, -0.08997344970703125, -0.08519363403320312, -0.080413818359375, -0.07563400268554688, -0.07085418701171875, -0.06607437133789062, -0.0612945556640625, -0.056514739990234375, -0.05173492431640625, -0.046955108642578125, -0.04217529296875, -0.037395477294921875, -0.03261566162109375, -0.027835845947265625, -0.0230560302734375, -0.018276214599609375, -0.01349639892578125, -0.008716583251953125, -0.003936767578125, 0.000843048095703125, 0.00562286376953125, 0.010402679443359375, 0.0151824951171875, 0.019962310791015625, 0.02474212646484375, 0.029521942138671875, 0.0343017578125, 0.039081573486328125, 0.04386138916015625, 0.048641204833984375, 0.0534210205078125, 0.058200836181640625, 0.06298065185546875, 0.06776046752929688, 0.072540283203125, 0.07732009887695312, 0.08209991455078125, 0.08687973022460938, 0.0916595458984375, 0.09643936157226562, 0.10121917724609375, 0.10599899291992188, 0.11077880859375, 0.11555862426757812, 0.12033843994140625, 0.12511825561523438, 0.1298980712890625, 0.13467788696289062, 0.13945770263671875, 0.14423751831054688, 0.149017333984375, 0.15379714965820312, 0.15857696533203125, 0.16335678100585938, 0.1681365966796875, 0.17291641235351562, 0.17769622802734375, 0.18247604370117188, 0.187255859375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 7.0, 8.0, 13.0, 15.0, 20.0, 18.0, 36.0, 38.0, 51.0, 55.0, 59.0, 76.0, 78.0, 69.0, 74.0, 61.0, 63.0, 54.0, 36.0, 44.0, 46.0, 25.0, 19.0, 17.0, 10.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09429931640625, -0.0909872055053711, -0.08767509460449219, -0.08436298370361328, -0.08105087280273438, -0.07773876190185547, -0.07442665100097656, -0.07111454010009766, -0.06780242919921875, -0.06449031829833984, -0.06117820739746094, -0.05786609649658203, -0.054553985595703125, -0.05124187469482422, -0.04792976379394531, -0.044617652893066406, -0.0413055419921875, -0.037993431091308594, -0.03468132019042969, -0.03136920928955078, -0.028057098388671875, -0.02474498748779297, -0.021432876586914062, -0.018120765686035156, -0.01480865478515625, -0.011496543884277344, -0.008184432983398438, -0.004872322082519531, -0.001560211181640625, 0.0017518997192382812, 0.0050640106201171875, 0.008376121520996094, 0.011688232421875, 0.015000343322753906, 0.018312454223632812, 0.02162456512451172, 0.024936676025390625, 0.02824878692626953, 0.03156089782714844, 0.034873008728027344, 0.03818511962890625, 0.041497230529785156, 0.04480934143066406, 0.04812145233154297, 0.051433563232421875, 0.05474567413330078, 0.05805778503417969, 0.061369895935058594, 0.0646820068359375, 0.0679941177368164, 0.07130622863769531, 0.07461833953857422, 0.07793045043945312, 0.08124256134033203, 0.08455467224121094, 0.08786678314208984, 0.09117889404296875, 0.09449100494384766, 0.09780311584472656, 0.10111522674560547, 0.10442733764648438, 0.10773944854736328, 0.11105155944824219, 0.1143636703491211, 0.11767578125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 2.0, 2.0, 7.0, 5.0, 11.0, 15.0, 14.0, 16.0, 33.0, 38.0, 70.0, 106.0, 211.0, 422.0, 1217.0, 4807.0, 36811.0, 1497920.0, 2592452.0, 51859.0, 5808.0, 1412.0, 493.0, 206.0, 101.0, 72.0, 42.0, 28.0, 27.0, 12.0, 12.0, 18.0, 10.0, 8.0, 6.0, 4.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.26318359375, -0.2547111511230469, -0.24623870849609375, -0.23776626586914062, -0.2292938232421875, -0.22082138061523438, -0.21234893798828125, -0.20387649536132812, -0.195404052734375, -0.18693161010742188, -0.17845916748046875, -0.16998672485351562, -0.1615142822265625, -0.15304183959960938, -0.14456939697265625, -0.13609695434570312, -0.12762451171875, -0.11915206909179688, -0.11067962646484375, -0.10220718383789062, -0.0937347412109375, -0.08526229858398438, -0.07678985595703125, -0.06831741333007812, -0.059844970703125, -0.051372528076171875, -0.04290008544921875, -0.034427642822265625, -0.0259552001953125, -0.017482757568359375, -0.00901031494140625, -0.000537872314453125, 0.0079345703125, 0.016407012939453125, 0.02487945556640625, 0.033351898193359375, 0.0418243408203125, 0.050296783447265625, 0.05876922607421875, 0.06724166870117188, 0.075714111328125, 0.08418655395507812, 0.09265899658203125, 0.10113143920898438, 0.1096038818359375, 0.11807632446289062, 0.12654876708984375, 0.13502120971679688, 0.14349365234375, 0.15196609497070312, 0.16043853759765625, 0.16891098022460938, 0.1773834228515625, 0.18585586547851562, 0.19432830810546875, 0.20280075073242188, 0.211273193359375, 0.21974563598632812, 0.22821807861328125, 0.23669052124023438, 0.2451629638671875, 0.2536354064941406, 0.26210784912109375, 0.2705802917480469, 0.279052734375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 9.0, 16.0, 13.0, 11.0, 13.0, 24.0, 20.0, 36.0, 45.0, 73.0, 103.0, 134.0, 255.0, 473.0, 698.0, 739.0, 546.0, 297.0, 177.0, 113.0, 81.0, 55.0, 33.0, 25.0, 18.0, 12.0, 19.0, 8.0, 4.0, 6.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1571044921875, -0.15250015258789062, -0.14789581298828125, -0.14329147338867188, -0.1386871337890625, -0.13408279418945312, -0.12947845458984375, -0.12487411499023438, -0.120269775390625, -0.11566543579101562, -0.11106109619140625, -0.10645675659179688, -0.1018524169921875, -0.09724807739257812, -0.09264373779296875, -0.08803939819335938, -0.08343505859375, -0.07883071899414062, -0.07422637939453125, -0.06962203979492188, -0.0650177001953125, -0.060413360595703125, -0.05580902099609375, -0.051204681396484375, -0.046600341796875, -0.041996002197265625, -0.03739166259765625, -0.032787322998046875, -0.0281829833984375, -0.023578643798828125, -0.01897430419921875, -0.014369964599609375, -0.009765625, -0.005161285400390625, -0.00055694580078125, 0.004047393798828125, 0.0086517333984375, 0.013256072998046875, 0.01786041259765625, 0.022464752197265625, 0.027069091796875, 0.031673431396484375, 0.03627777099609375, 0.040882110595703125, 0.0454864501953125, 0.050090789794921875, 0.05469512939453125, 0.059299468994140625, 0.06390380859375, 0.06850814819335938, 0.07311248779296875, 0.07771682739257812, 0.0823211669921875, 0.08692550659179688, 0.09152984619140625, 0.09613418579101562, 0.100738525390625, 0.10534286499023438, 0.10994720458984375, 0.11455154418945312, 0.1191558837890625, 0.12376022338867188, 0.12836456298828125, 0.13296890258789062, 0.1375732421875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 9.0, 4.0, 36.0, 132.0, 284.0, 365.0, 144.0, 21.0, 10.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3484253883361816, -1.298510193824768, -1.2485949993133545, -1.1986799240112305, -1.148764729499817, -1.0988495349884033, -1.0489343404769897, -0.999019205570221, -0.9491040706634521, -0.8991888761520386, -0.8492737412452698, -0.7993585467338562, -0.7494434118270874, -0.6995282173156738, -0.6496130228042603, -0.5996978878974915, -0.5497826933860779, -0.4998675286769867, -0.4499523639678955, -0.40003716945648193, -0.35012203454971313, -0.30020684003829956, -0.2502916753292084, -0.2003765106201172, -0.150461345911026, -0.10054618120193481, -0.05063100904226303, -0.0007158368825912476, 0.04919932782649994, 0.09911449253559113, 0.1490296721458435, 0.1989448368549347, 0.24886000156402588, 0.29877516627311707, 0.34869033098220825, 0.3986055254936218, 0.4485206604003906, 0.4984358549118042, 0.5483510494232178, 0.5982661843299866, 0.6481813192367554, 0.698096513748169, 0.7480116486549377, 0.7979268431663513, 0.8478419780731201, 0.8977571725845337, 0.9476723670959473, 0.9975875020027161, 1.0475027561187744, 1.097417950630188, 1.1473331451416016, 1.1972482204437256, 1.2471634149551392, 1.2970786094665527, 1.3469938039779663, 1.3969089984893799, 1.446824073791504, 1.4967392683029175, 1.546654462814331, 1.596569538116455, 1.6464847326278687, 1.6963999271392822, 1.7463151216506958, 1.7962303161621094, 1.8461453914642334]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 9.0, 14.0, 19.0, 30.0, 19.0, 30.0, 29.0, 45.0, 29.0, 53.0, 44.0, 48.0, 36.0, 58.0, 64.0, 47.0, 41.0, 45.0, 37.0, 50.0, 41.0, 37.0, 28.0, 32.0, 24.0, 22.0, 12.0, 17.0, 11.0, 4.0, 4.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3978846073150635, -0.3827719986438751, -0.36765938997268677, -0.3525467813014984, -0.33743417263031006, -0.3223215639591217, -0.30720895528793335, -0.2920963168144226, -0.27698373794555664, -0.2618711292743683, -0.24675852060317993, -0.23164591193199158, -0.21653330326080322, -0.20142069458961487, -0.18630807101726532, -0.17119546234607697, -0.15608283877372742, -0.14097023010253906, -0.1258576214313507, -0.11074500530958176, -0.0956323966383934, -0.08051978796720505, -0.0654071718454361, -0.05029456317424774, -0.03518195450305939, -0.020069343969225883, -0.00495673343539238, 0.010155878961086273, 0.025268487632274628, 0.04038109630346298, 0.055493712425231934, 0.07060632109642029, 0.08571892976760864, 0.100831538438797, 0.11594414710998535, 0.1310567557811737, 0.14616936445236206, 0.16128197312355042, 0.17639459669589996, 0.19150720536708832, 0.20661981403827667, 0.22173242270946503, 0.23684503138065338, 0.25195765495300293, 0.2670702636241913, 0.28218287229537964, 0.297295480966568, 0.31240808963775635, 0.3275206983089447, 0.34263330698013306, 0.3577459156513214, 0.37285852432250977, 0.3879711329936981, 0.4030837416648865, 0.4181963801383972, 0.4333089590072632, 0.4484215974807739, 0.4635342061519623, 0.47864681482315063, 0.493759423494339, 0.5088720321655273, 0.5239846706390381, 0.539097249507904, 0.5542098879814148, 0.5693224668502808]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 4.0, 11.0, 14.0, 6.0, 15.0, 16.0, 51.0, 33.0, 45.0, 95.0, 147.0, 226.0, 421.0, 732.0, 1449.0, 3076.0, 7590.0, 20731.0, 63453.0, 205654.0, 419281.0, 220683.0, 68465.0, 21792.0, 7916.0, 3268.0, 1484.0, 767.0, 401.0, 243.0, 148.0, 91.0, 79.0, 42.0, 38.0, 21.0, 19.0, 12.0, 9.0, 3.0, 7.0, 5.0, 7.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.146240234375, -0.14174461364746094, -0.13724899291992188, -0.1327533721923828, -0.12825775146484375, -0.12376213073730469, -0.11926651000976562, -0.11477088928222656, -0.1102752685546875, -0.10577964782714844, -0.10128402709960938, -0.09678840637207031, -0.09229278564453125, -0.08779716491699219, -0.08330154418945312, -0.07880592346191406, -0.074310302734375, -0.06981468200683594, -0.06531906127929688, -0.06082344055175781, -0.05632781982421875, -0.05183219909667969, -0.047336578369140625, -0.04284095764160156, -0.0383453369140625, -0.03384971618652344, -0.029354095458984375, -0.024858474731445312, -0.02036285400390625, -0.015867233276367188, -0.011371612548828125, -0.0068759918212890625, -0.00238037109375, 0.0021152496337890625, 0.006610870361328125, 0.011106491088867188, 0.01560211181640625, 0.020097732543945312, 0.024593353271484375, 0.029088973999023438, 0.0335845947265625, 0.03808021545410156, 0.042575836181640625, 0.04707145690917969, 0.05156707763671875, 0.05606269836425781, 0.060558319091796875, 0.06505393981933594, 0.069549560546875, 0.07404518127441406, 0.07854080200195312, 0.08303642272949219, 0.08753204345703125, 0.09202766418457031, 0.09652328491210938, 0.10101890563964844, 0.1055145263671875, 0.11001014709472656, 0.11450576782226562, 0.11900138854980469, 0.12349700927734375, 0.1279926300048828, 0.13248825073242188, 0.13698387145996094, 0.1414794921875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 6.0, 8.0, 8.0, 11.0, 26.0, 39.0, 40.0, 52.0, 57.0, 93.0, 86.0, 92.0, 116.0, 76.0, 75.0, 44.0, 68.0, 27.0, 27.0, 24.0, 12.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10040283203125, -0.09665393829345703, -0.09290504455566406, -0.0891561508178711, -0.08540725708007812, -0.08165836334228516, -0.07790946960449219, -0.07416057586669922, -0.07041168212890625, -0.06666278839111328, -0.06291389465332031, -0.059165000915527344, -0.055416107177734375, -0.051667213439941406, -0.04791831970214844, -0.04416942596435547, -0.0404205322265625, -0.03667163848876953, -0.03292274475097656, -0.029173851013183594, -0.025424957275390625, -0.021676063537597656, -0.017927169799804688, -0.014178276062011719, -0.01042938232421875, -0.006680488586425781, -0.0029315948486328125, 0.0008172988891601562, 0.004566192626953125, 0.008315086364746094, 0.012063980102539062, 0.01581287384033203, 0.019561767578125, 0.02331066131591797, 0.027059555053710938, 0.030808448791503906, 0.034557342529296875, 0.038306236267089844, 0.04205513000488281, 0.04580402374267578, 0.04955291748046875, 0.05330181121826172, 0.05705070495605469, 0.060799598693847656, 0.06454849243164062, 0.0682973861694336, 0.07204627990722656, 0.07579517364501953, 0.0795440673828125, 0.08329296112060547, 0.08704185485839844, 0.0907907485961914, 0.09453964233398438, 0.09828853607177734, 0.10203742980957031, 0.10578632354736328, 0.10953521728515625, 0.11328411102294922, 0.11703300476074219, 0.12078189849853516, 0.12453079223632812, 0.1282796859741211, 0.13202857971191406, 0.13577747344970703, 0.1395263671875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 0.0, 3.0, 3.0, 10.0, 7.0, 13.0, 25.0, 23.0, 32.0, 45.0, 79.0, 111.0, 192.0, 437.0, 1144.0, 4138.0, 22586.0, 228042.0, 692009.0, 85030.0, 10708.0, 2328.0, 786.0, 325.0, 166.0, 102.0, 56.0, 28.0, 28.0, 22.0, 15.0, 6.0, 17.0, 7.0, 7.0, 6.0, 4.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.27734375, -0.2690162658691406, -0.26068878173828125, -0.2523612976074219, -0.2440338134765625, -0.23570632934570312, -0.22737884521484375, -0.21905136108398438, -0.210723876953125, -0.20239639282226562, -0.19406890869140625, -0.18574142456054688, -0.1774139404296875, -0.16908645629882812, -0.16075897216796875, -0.15243148803710938, -0.14410400390625, -0.13577651977539062, -0.12744903564453125, -0.11912155151367188, -0.1107940673828125, -0.10246658325195312, -0.09413909912109375, -0.08581161499023438, -0.077484130859375, -0.06915664672851562, -0.06082916259765625, -0.052501678466796875, -0.0441741943359375, -0.035846710205078125, -0.02751922607421875, -0.019191741943359375, -0.0108642578125, -0.002536773681640625, 0.00579071044921875, 0.014118194580078125, 0.0224456787109375, 0.030773162841796875, 0.03910064697265625, 0.047428131103515625, 0.055755615234375, 0.06408309936523438, 0.07241058349609375, 0.08073806762695312, 0.0890655517578125, 0.09739303588867188, 0.10572052001953125, 0.11404800415039062, 0.12237548828125, 0.13070297241210938, 0.13903045654296875, 0.14735794067382812, 0.1556854248046875, 0.16401290893554688, 0.17234039306640625, 0.18066787719726562, 0.188995361328125, 0.19732284545898438, 0.20565032958984375, 0.21397781372070312, 0.2223052978515625, 0.23063278198242188, 0.23896026611328125, 0.24728775024414062, 0.255615234375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 7.0, 9.0, 16.0, 7.0, 11.0, 17.0, 28.0, 12.0, 25.0, 35.0, 35.0, 51.0, 34.0, 49.0, 53.0, 50.0, 61.0, 56.0, 54.0, 47.0, 45.0, 44.0, 32.0, 40.0, 38.0, 25.0, 23.0, 21.0, 17.0, 14.0, 10.0, 6.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1937255859375, -0.18761444091796875, -0.1815032958984375, -0.17539215087890625, -0.169281005859375, -0.16316986083984375, -0.1570587158203125, -0.15094757080078125, -0.14483642578125, -0.13872528076171875, -0.1326141357421875, -0.12650299072265625, -0.120391845703125, -0.11428070068359375, -0.1081695556640625, -0.10205841064453125, -0.095947265625, -0.08983612060546875, -0.0837249755859375, -0.07761383056640625, -0.071502685546875, -0.06539154052734375, -0.0592803955078125, -0.05316925048828125, -0.04705810546875, -0.04094696044921875, -0.0348358154296875, -0.02872467041015625, -0.022613525390625, -0.01650238037109375, -0.0103912353515625, -0.00428009033203125, 0.0018310546875, 0.00794219970703125, 0.0140533447265625, 0.02016448974609375, 0.026275634765625, 0.03238677978515625, 0.0384979248046875, 0.04460906982421875, 0.05072021484375, 0.05683135986328125, 0.0629425048828125, 0.06905364990234375, 0.075164794921875, 0.08127593994140625, 0.0873870849609375, 0.09349822998046875, 0.099609375, 0.10572052001953125, 0.1118316650390625, 0.11794281005859375, 0.124053955078125, 0.13016510009765625, 0.1362762451171875, 0.14238739013671875, 0.14849853515625, 0.15460968017578125, 0.1607208251953125, 0.16683197021484375, 0.172943115234375, 0.17905426025390625, 0.1851654052734375, 0.19127655029296875, 0.1973876953125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 3.0, 7.0, 9.0, 9.0, 17.0, 25.0, 37.0, 57.0, 94.0, 185.0, 484.0, 1151.0, 3615.0, 16125.0, 102440.0, 638354.0, 245507.0, 31198.0, 6311.0, 1661.0, 650.0, 279.0, 147.0, 67.0, 53.0, 18.0, 13.0, 9.0, 7.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.07623291015625, -0.07403564453125, -0.07183837890625, -0.06964111328125, -0.06744384765625, -0.06524658203125, -0.06304931640625, -0.06085205078125, -0.05865478515625, -0.05645751953125, -0.05426025390625, -0.05206298828125, -0.04986572265625, -0.04766845703125, -0.04547119140625, -0.04327392578125, -0.04107666015625, -0.03887939453125, -0.03668212890625, -0.03448486328125, -0.03228759765625, -0.03009033203125, -0.02789306640625, -0.02569580078125, -0.02349853515625, -0.02130126953125, -0.01910400390625, -0.01690673828125, -0.01470947265625, -0.01251220703125, -0.01031494140625, -0.00811767578125, -0.00592041015625, -0.00372314453125, -0.00152587890625, 0.00067138671875, 0.00286865234375, 0.00506591796875, 0.00726318359375, 0.00946044921875, 0.01165771484375, 0.01385498046875, 0.01605224609375, 0.01824951171875, 0.02044677734375, 0.02264404296875, 0.02484130859375, 0.02703857421875, 0.02923583984375, 0.03143310546875, 0.03363037109375, 0.03582763671875, 0.03802490234375, 0.04022216796875, 0.04241943359375, 0.04461669921875, 0.04681396484375, 0.04901123046875, 0.05120849609375, 0.05340576171875, 0.05560302734375, 0.05780029296875, 0.05999755859375, 0.06219482421875, 0.06439208984375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 2.0, 13.0, 11.0, 11.0, 16.0, 27.0, 25.0, 39.0, 33.0, 56.0, 62.0, 76.0, 81.0, 99.0, 83.0, 74.0, 49.0, 43.0, 34.0, 42.0, 32.0, 21.0, 11.0, 11.0, 8.0, 4.0, 9.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.225440979003906e-06, -7.934868335723877e-06, -7.644295692443848e-06, -7.353723049163818e-06, -7.063150405883789e-06, -6.77257776260376e-06, -6.4820051193237305e-06, -6.191432476043701e-06, -5.900859832763672e-06, -5.610287189483643e-06, -5.319714546203613e-06, -5.029141902923584e-06, -4.738569259643555e-06, -4.447996616363525e-06, -4.157423973083496e-06, -3.866851329803467e-06, -3.5762786865234375e-06, -3.285706043243408e-06, -2.995133399963379e-06, -2.7045607566833496e-06, -2.4139881134033203e-06, -2.123415470123291e-06, -1.8328428268432617e-06, -1.5422701835632324e-06, -1.2516975402832031e-06, -9.611248970031738e-07, -6.705522537231445e-07, -3.7997961044311523e-07, -8.940696716308594e-08, 2.0116567611694336e-07, 4.917383193969727e-07, 7.82310962677002e-07, 1.0728836059570312e-06, 1.3634562492370605e-06, 1.6540288925170898e-06, 1.944601535797119e-06, 2.2351741790771484e-06, 2.5257468223571777e-06, 2.816319465637207e-06, 3.1068921089172363e-06, 3.3974647521972656e-06, 3.688037395477295e-06, 3.978610038757324e-06, 4.2691826820373535e-06, 4.559755325317383e-06, 4.850327968597412e-06, 5.140900611877441e-06, 5.431473255157471e-06, 5.7220458984375e-06, 6.012618541717529e-06, 6.303191184997559e-06, 6.593763828277588e-06, 6.884336471557617e-06, 7.1749091148376465e-06, 7.465481758117676e-06, 7.756054401397705e-06, 8.046627044677734e-06, 8.337199687957764e-06, 8.627772331237793e-06, 8.918344974517822e-06, 9.208917617797852e-06, 9.499490261077881e-06, 9.79006290435791e-06, 1.008063554763794e-05, 1.0371208190917969e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 6.0, 8.0, 12.0, 19.0, 19.0, 29.0, 51.0, 85.0, 133.0, 305.0, 612.0, 1680.0, 5494.0, 25620.0, 209811.0, 669358.0, 112882.0, 16104.0, 3880.0, 1344.0, 525.0, 246.0, 118.0, 76.0, 41.0, 21.0, 13.0, 15.0, 10.0, 8.0, 8.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.067626953125, -0.06524276733398438, -0.06285858154296875, -0.060474395751953125, -0.0580902099609375, -0.055706024169921875, -0.05332183837890625, -0.050937652587890625, -0.048553466796875, -0.046169281005859375, -0.04378509521484375, -0.041400909423828125, -0.0390167236328125, -0.036632537841796875, -0.03424835205078125, -0.031864166259765625, -0.02947998046875, -0.027095794677734375, -0.02471160888671875, -0.022327423095703125, -0.0199432373046875, -0.017559051513671875, -0.01517486572265625, -0.012790679931640625, -0.010406494140625, -0.008022308349609375, -0.00563812255859375, -0.003253936767578125, -0.0008697509765625, 0.001514434814453125, 0.00389862060546875, 0.006282806396484375, 0.0086669921875, 0.011051177978515625, 0.01343536376953125, 0.015819549560546875, 0.0182037353515625, 0.020587921142578125, 0.02297210693359375, 0.025356292724609375, 0.027740478515625, 0.030124664306640625, 0.03250885009765625, 0.034893035888671875, 0.0372772216796875, 0.039661407470703125, 0.04204559326171875, 0.044429779052734375, 0.04681396484375, 0.049198150634765625, 0.05158233642578125, 0.053966522216796875, 0.0563507080078125, 0.058734893798828125, 0.06111907958984375, 0.06350326538085938, 0.065887451171875, 0.06827163696289062, 0.07065582275390625, 0.07304000854492188, 0.0754241943359375, 0.07780838012695312, 0.08019256591796875, 0.08257675170898438, 0.0849609375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 5.0, 4.0, 6.0, 6.0, 5.0, 12.0, 21.0, 21.0, 28.0, 32.0, 56.0, 69.0, 92.0, 102.0, 104.0, 103.0, 86.0, 65.0, 44.0, 22.0, 26.0, 22.0, 12.0, 7.0, 12.0, 10.0, 4.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.06793212890625, -0.06602764129638672, -0.06412315368652344, -0.062218666076660156, -0.060314178466796875, -0.058409690856933594, -0.05650520324707031, -0.05460071563720703, -0.05269622802734375, -0.05079174041748047, -0.04888725280761719, -0.046982765197753906, -0.045078277587890625, -0.043173789978027344, -0.04126930236816406, -0.03936481475830078, -0.0374603271484375, -0.03555583953857422, -0.03365135192871094, -0.031746864318847656, -0.029842376708984375, -0.027937889099121094, -0.026033401489257812, -0.02412891387939453, -0.02222442626953125, -0.02031993865966797, -0.018415451049804688, -0.016510963439941406, -0.014606475830078125, -0.012701988220214844, -0.010797500610351562, -0.008893013000488281, -0.006988525390625, -0.005084037780761719, -0.0031795501708984375, -0.0012750625610351562, 0.000629425048828125, 0.0025339126586914062, 0.0044384002685546875, 0.006342887878417969, 0.00824737548828125, 0.010151863098144531, 0.012056350708007812, 0.013960838317871094, 0.015865325927734375, 0.017769813537597656, 0.019674301147460938, 0.02157878875732422, 0.0234832763671875, 0.02538776397705078, 0.027292251586914062, 0.029196739196777344, 0.031101226806640625, 0.033005714416503906, 0.03491020202636719, 0.03681468963623047, 0.03871917724609375, 0.04062366485595703, 0.04252815246582031, 0.044432640075683594, 0.046337127685546875, 0.048241615295410156, 0.05014610290527344, 0.05205059051513672, 0.053955078125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 7.0, 28.0, 307.0, 525.0, 118.0, 19.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48746418952941895, -0.4088039994239807, -0.33014383912086487, -0.251483678817749, -0.1728234887123108, -0.09416329860687256, -0.015503138303756714, 0.06315702199935913, 0.14181721210479736, 0.2204773873090744, 0.29913756251335144, 0.3777977228164673, 0.4564579129219055, 0.5351181030273438, 0.6137782335281372, 0.6924384236335754, 0.7710986137390137, 0.8497588038444519, 0.9284189939498901, 1.0070791244506836, 1.0857393741607666, 1.16439950466156, 1.2430596351623535, 1.3217198848724365, 1.40038001537323, 1.4790401458740234, 1.5577003955841064, 1.6363605260849, 1.7150206565856934, 1.7936809062957764, 1.8723410367965698, 1.9510011672973633, 2.0296616554260254, 2.1083219051361084, 2.1869819164276123, 2.2656421661376953, 2.3443024158477783, 2.4229626655578613, 2.5016226768493652, 2.5802829265594482, 2.6589431762695312, 2.7376034259796143, 2.816263437271118, 2.894923686981201, 2.973583936691284, 3.052244186401367, 3.130904197692871, 3.209564447402954, 3.288224458694458, 3.366884708404541, 3.445544719696045, 3.524204969406128, 3.602865219116211, 3.681525230407715, 3.760185480117798, 3.838845729827881, 3.9175057411193848, 3.9961659908294678, 4.074826240539551, 4.153486251831055, 4.232146263122559, 4.310806751251221, 4.389466762542725, 4.4681267738342285, 4.546787261962891]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 8.0, 3.0, 10.0, 3.0, 9.0, 14.0, 11.0, 14.0, 11.0, 19.0, 21.0, 22.0, 35.0, 29.0, 37.0, 41.0, 53.0, 38.0, 36.0, 45.0, 47.0, 39.0, 46.0, 45.0, 40.0, 54.0, 37.0, 35.0, 31.0, 26.0, 22.0, 19.0, 17.0, 24.0, 19.0, 10.0, 10.0, 8.0, 3.0, 11.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5686251521110535, -0.5497246384620667, -0.5308240652084351, -0.5119235515594482, -0.49302300810813904, -0.47412246465682983, -0.455221951007843, -0.4363214075565338, -0.4174208641052246, -0.3985203206539154, -0.3796197772026062, -0.3607192635536194, -0.3418187201023102, -0.322918176651001, -0.30401766300201416, -0.28511711955070496, -0.26621657609939575, -0.24731603264808655, -0.22841550409793854, -0.20951497554779053, -0.19061443209648132, -0.17171388864517212, -0.1528133600950241, -0.1339128315448761, -0.1150122880935669, -0.09611175209283829, -0.07721121609210968, -0.05831068009138107, -0.039410144090652466, -0.02050960808992386, -0.0016090720891952515, 0.01729145646095276, 0.03619199991226196, 0.05509253591299057, 0.07399307191371918, 0.09289360791444778, 0.11179414391517639, 0.1306946873664856, 0.1495952159166336, 0.16849574446678162, 0.18739628791809082, 0.20629683136940002, 0.22519735991954803, 0.24409788846969604, 0.26299843192100525, 0.28189897537231445, 0.30079948902130127, 0.3197000324726105, 0.3386005759239197, 0.3575011193752289, 0.3764016628265381, 0.3953021764755249, 0.4142027199268341, 0.4331032633781433, 0.4520037770271301, 0.47090432047843933, 0.48980486392974854, 0.5087053775787354, 0.5276059508323669, 0.5465064644813538, 0.5654070377349854, 0.5843075513839722, 0.603208065032959, 0.6221085786819458, 0.6410091519355774]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 10.0, 12.0, 23.0, 38.0, 55.0, 107.0, 196.0, 419.0, 978.0, 3105.0, 8735.0, 35112.0, 309713.0, 2642224.0, 1092825.0, 78431.0, 15034.0, 4105.0, 1529.0, 656.0, 383.0, 187.0, 129.0, 84.0, 53.0, 36.0, 26.0, 19.0, 19.0, 10.0, 10.0, 5.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.124755859375, -0.12025642395019531, -0.11575698852539062, -0.11125755310058594, -0.10675811767578125, -0.10225868225097656, -0.09775924682617188, -0.09325981140136719, -0.0887603759765625, -0.08426094055175781, -0.07976150512695312, -0.07526206970214844, -0.07076263427734375, -0.06626319885253906, -0.061763763427734375, -0.05726432800292969, -0.052764892578125, -0.04826545715332031, -0.043766021728515625, -0.03926658630371094, -0.03476715087890625, -0.030267715454101562, -0.025768280029296875, -0.021268844604492188, -0.0167694091796875, -0.012269973754882812, -0.007770538330078125, -0.0032711029052734375, 0.00122833251953125, 0.0057277679443359375, 0.010227203369140625, 0.014726638793945312, 0.01922607421875, 0.023725509643554688, 0.028224945068359375, 0.03272438049316406, 0.03722381591796875, 0.04172325134277344, 0.046222686767578125, 0.05072212219238281, 0.0552215576171875, 0.05972099304199219, 0.06422042846679688, 0.06871986389160156, 0.07321929931640625, 0.07771873474121094, 0.08221817016601562, 0.08671760559082031, 0.091217041015625, 0.09571647644042969, 0.10021591186523438, 0.10471534729003906, 0.10921478271484375, 0.11371421813964844, 0.11821365356445312, 0.12271308898925781, 0.1272125244140625, 0.1317119598388672, 0.13621139526367188, 0.14071083068847656, 0.14521026611328125, 0.14970970153808594, 0.15420913696289062, 0.1587085723876953, 0.1632080078125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 8.0, 16.0, 21.0, 35.0, 30.0, 41.0, 53.0, 68.0, 84.0, 80.0, 64.0, 79.0, 82.0, 67.0, 66.0, 50.0, 45.0, 38.0, 21.0, 13.0, 14.0, 7.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1021728515625, -0.09805107116699219, -0.09392929077148438, -0.08980751037597656, -0.08568572998046875, -0.08156394958496094, -0.07744216918945312, -0.07332038879394531, -0.0691986083984375, -0.06507682800292969, -0.060955047607421875, -0.05683326721191406, -0.05271148681640625, -0.04858970642089844, -0.044467926025390625, -0.04034614562988281, -0.036224365234375, -0.03210258483886719, -0.027980804443359375, -0.023859024047851562, -0.01973724365234375, -0.015615463256835938, -0.011493682861328125, -0.0073719024658203125, -0.0032501220703125, 0.0008716583251953125, 0.004993438720703125, 0.009115219116210938, 0.01323699951171875, 0.017358779907226562, 0.021480560302734375, 0.025602340698242188, 0.02972412109375, 0.03384590148925781, 0.037967681884765625, 0.04208946228027344, 0.04621124267578125, 0.05033302307128906, 0.054454803466796875, 0.05857658386230469, 0.0626983642578125, 0.06682014465332031, 0.07094192504882812, 0.07506370544433594, 0.07918548583984375, 0.08330726623535156, 0.08742904663085938, 0.09155082702636719, 0.095672607421875, 0.09979438781738281, 0.10391616821289062, 0.10803794860839844, 0.11215972900390625, 0.11628150939941406, 0.12040328979492188, 0.12452507019042969, 0.1286468505859375, 0.1327686309814453, 0.13689041137695312, 0.14101219177246094, 0.14513397216796875, 0.14925575256347656, 0.15337753295898438, 0.1574993133544922, 0.16162109375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 10.0, 6.0, 20.0, 24.0, 49.0, 50.0, 101.0, 172.0, 374.0, 758.0, 1771.0, 5178.0, 19985.0, 130363.0, 2181839.0, 1719173.0, 109074.0, 17474.0, 4720.0, 1640.0, 704.0, 328.0, 160.0, 108.0, 71.0, 41.0, 31.0, 11.0, 13.0, 8.0, 9.0, 5.0, 3.0, 2.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1566162109375, -0.15138816833496094, -0.14616012573242188, -0.1409320831298828, -0.13570404052734375, -0.1304759979248047, -0.12524795532226562, -0.12001991271972656, -0.1147918701171875, -0.10956382751464844, -0.10433578491210938, -0.09910774230957031, -0.09387969970703125, -0.08865165710449219, -0.08342361450195312, -0.07819557189941406, -0.072967529296875, -0.06773948669433594, -0.06251144409179688, -0.05728340148925781, -0.05205535888671875, -0.04682731628417969, -0.041599273681640625, -0.03637123107910156, -0.0311431884765625, -0.025915145874023438, -0.020687103271484375, -0.015459060668945312, -0.01023101806640625, -0.0050029754638671875, 0.000225067138671875, 0.0054531097412109375, 0.01068115234375, 0.015909194946289062, 0.021137237548828125, 0.026365280151367188, 0.03159332275390625, 0.03682136535644531, 0.042049407958984375, 0.04727745056152344, 0.0525054931640625, 0.05773353576660156, 0.06296157836914062, 0.06818962097167969, 0.07341766357421875, 0.07864570617675781, 0.08387374877929688, 0.08910179138183594, 0.094329833984375, 0.09955787658691406, 0.10478591918945312, 0.11001396179199219, 0.11524200439453125, 0.12047004699707031, 0.12569808959960938, 0.13092613220214844, 0.1361541748046875, 0.14138221740722656, 0.14661026000976562, 0.1518383026123047, 0.15706634521484375, 0.1622943878173828, 0.16752243041992188, 0.17275047302246094, 0.177978515625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 10.0, 5.0, 9.0, 11.0, 20.0, 24.0, 26.0, 50.0, 65.0, 94.0, 118.0, 213.0, 329.0, 508.0, 683.0, 632.0, 425.0, 236.0, 144.0, 109.0, 76.0, 61.0, 59.0, 31.0, 33.0, 18.0, 24.0, 6.0, 8.0, 10.0, 13.0, 11.0, 3.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.12249755859375, -0.11809062957763672, -0.11368370056152344, -0.10927677154541016, -0.10486984252929688, -0.1004629135131836, -0.09605598449707031, -0.09164905548095703, -0.08724212646484375, -0.08283519744873047, -0.07842826843261719, -0.0740213394165039, -0.06961441040039062, -0.06520748138427734, -0.06080055236816406, -0.05639362335205078, -0.0519866943359375, -0.04757976531982422, -0.04317283630371094, -0.038765907287597656, -0.034358978271484375, -0.029952049255371094, -0.025545120239257812, -0.02113819122314453, -0.01673126220703125, -0.012324333190917969, -0.007917404174804688, -0.0035104751586914062, 0.000896453857421875, 0.005303382873535156, 0.009710311889648438, 0.014117240905761719, 0.018524169921875, 0.02293109893798828, 0.027338027954101562, 0.031744956970214844, 0.036151885986328125, 0.040558815002441406, 0.04496574401855469, 0.04937267303466797, 0.05377960205078125, 0.05818653106689453, 0.06259346008300781, 0.0670003890991211, 0.07140731811523438, 0.07581424713134766, 0.08022117614746094, 0.08462810516357422, 0.0890350341796875, 0.09344196319580078, 0.09784889221191406, 0.10225582122802734, 0.10666275024414062, 0.1110696792602539, 0.11547660827636719, 0.11988353729248047, 0.12429046630859375, 0.12869739532470703, 0.1331043243408203, 0.1375112533569336, 0.14191818237304688, 0.14632511138916016, 0.15073204040527344, 0.15513896942138672, 0.1595458984375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 10.0, 33.0, 71.0, 174.0, 269.0, 244.0, 112.0, 44.0, 24.0, 7.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6676065921783447, -0.6336123943328857, -0.5996181964874268, -0.5656239986419678, -0.5316298007965088, -0.4976356029510498, -0.4636414051055908, -0.42964720726013184, -0.39565300941467285, -0.36165881156921387, -0.3276646137237549, -0.2936704158782959, -0.2596762180328369, -0.22568202018737793, -0.19168782234191895, -0.15769362449645996, -0.12369942665100098, -0.08970522880554199, -0.05571103096008301, -0.021716833114624023, 0.012277364730834961, 0.046271562576293945, 0.08026576042175293, 0.11425995826721191, 0.1482541561126709, 0.18224835395812988, 0.21624255180358887, 0.25023674964904785, 0.28423094749450684, 0.3182251453399658, 0.3522193431854248, 0.3862135410308838, 0.4202076196670532, 0.4542018175125122, 0.4881960153579712, 0.5221902132034302, 0.5561844110488892, 0.5901786088943481, 0.6241728067398071, 0.6581670045852661, 0.6921612024307251, 0.7261554002761841, 0.7601495981216431, 0.794143795967102, 0.828137993812561, 0.86213219165802, 0.896126389503479, 0.930120587348938, 0.964114785194397, 0.998108983039856, 1.032103180885315, 1.066097378730774, 1.100091576576233, 1.134085774421692, 1.1680799722671509, 1.2020741701126099, 1.2360683679580688, 1.2700625658035278, 1.3040567636489868, 1.3380509614944458, 1.3720451593399048, 1.4060393571853638, 1.4400335550308228, 1.4740277528762817, 1.5080219507217407]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 8.0, 10.0, 13.0, 9.0, 12.0, 13.0, 11.0, 20.0, 16.0, 30.0, 33.0, 25.0, 33.0, 35.0, 40.0, 50.0, 27.0, 47.0, 41.0, 40.0, 38.0, 34.0, 30.0, 35.0, 42.0, 38.0, 25.0, 24.0, 30.0, 30.0, 22.0, 19.0, 21.0, 12.0, 8.0, 12.0, 12.0, 9.0, 11.0, 6.0, 9.0, 4.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.3876100778579712, -0.3756057620048523, -0.3636014461517334, -0.3515971302986145, -0.3395927846431732, -0.3275884687900543, -0.3155841529369354, -0.30357983708381653, -0.29157549142837524, -0.27957117557525635, -0.26756685972213745, -0.25556254386901855, -0.24355819821357727, -0.23155388236045837, -0.21954956650733948, -0.20754525065422058, -0.19554093480110168, -0.1835366189479828, -0.1715322881937027, -0.1595279723405838, -0.1475236415863037, -0.13551932573318481, -0.12351500988006592, -0.11151068657636642, -0.09950636327266693, -0.08750203996896744, -0.07549771666526794, -0.06349340081214905, -0.051489077508449554, -0.03948475420475006, -0.027480438351631165, -0.015476115047931671, -0.0034717917442321777, 0.008532529696822166, 0.02053685113787651, 0.032541170716285706, 0.0445454940199852, 0.05654981732368469, 0.06855413317680359, 0.08055845648050308, 0.09256277978420258, 0.10456710308790207, 0.11657142639160156, 0.12857574224472046, 0.14058005809783936, 0.15258438885211945, 0.16458870470523834, 0.17659303545951843, 0.18859735131263733, 0.20060166716575623, 0.21260599792003632, 0.2246103137731552, 0.2366146445274353, 0.2486189603805542, 0.2606232762336731, 0.272627592086792, 0.2846319079399109, 0.2966362237930298, 0.3086405396461487, 0.3206448554992676, 0.33264920115470886, 0.34465351700782776, 0.35665783286094666, 0.36866214871406555, 0.38066649436950684]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 6.0, 5.0, 3.0, 9.0, 8.0, 11.0, 16.0, 19.0, 29.0, 29.0, 60.0, 81.0, 107.0, 134.0, 171.0, 240.0, 427.0, 664.0, 1211.0, 2179.0, 4704.0, 10502.0, 25462.0, 65323.0, 161982.0, 304666.0, 264896.0, 122426.0, 48242.0, 18905.0, 7901.0, 3602.0, 1757.0, 973.0, 553.0, 388.0, 241.0, 166.0, 127.0, 92.0, 65.0, 49.0, 35.0, 26.0, 16.0, 15.0, 8.0, 12.0, 11.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0850830078125, -0.08223152160644531, -0.07938003540039062, -0.07652854919433594, -0.07367706298828125, -0.07082557678222656, -0.06797409057617188, -0.06512260437011719, -0.0622711181640625, -0.05941963195800781, -0.056568145751953125, -0.05371665954589844, -0.05086517333984375, -0.04801368713378906, -0.045162200927734375, -0.04231071472167969, -0.039459228515625, -0.03660774230957031, -0.033756256103515625, -0.030904769897460938, -0.02805328369140625, -0.025201797485351562, -0.022350311279296875, -0.019498825073242188, -0.0166473388671875, -0.013795852661132812, -0.010944366455078125, -0.008092880249023438, -0.00524139404296875, -0.0023899078369140625, 0.000461578369140625, 0.0033130645751953125, 0.00616455078125, 0.009016036987304688, 0.011867523193359375, 0.014719009399414062, 0.01757049560546875, 0.020421981811523438, 0.023273468017578125, 0.026124954223632812, 0.0289764404296875, 0.03182792663574219, 0.034679412841796875, 0.03753089904785156, 0.04038238525390625, 0.04323387145996094, 0.046085357666015625, 0.04893684387207031, 0.051788330078125, 0.05463981628417969, 0.057491302490234375, 0.06034278869628906, 0.06319427490234375, 0.06604576110839844, 0.06889724731445312, 0.07174873352050781, 0.0746002197265625, 0.07745170593261719, 0.08030319213867188, 0.08315467834472656, 0.08600616455078125, 0.08885765075683594, 0.09170913696289062, 0.09456062316894531, 0.097412109375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 12.0, 14.0, 23.0, 28.0, 39.0, 56.0, 79.0, 71.0, 75.0, 85.0, 77.0, 79.0, 84.0, 73.0, 60.0, 38.0, 40.0, 17.0, 9.0, 11.0, 15.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10479736328125, -0.10094928741455078, -0.09710121154785156, -0.09325313568115234, -0.08940505981445312, -0.0855569839477539, -0.08170890808105469, -0.07786083221435547, -0.07401275634765625, -0.07016468048095703, -0.06631660461425781, -0.062468528747558594, -0.058620452880859375, -0.054772377014160156, -0.05092430114746094, -0.04707622528076172, -0.0432281494140625, -0.03938007354736328, -0.03553199768066406, -0.031683921813964844, -0.027835845947265625, -0.023987770080566406, -0.020139694213867188, -0.01629161834716797, -0.01244354248046875, -0.008595466613769531, -0.0047473907470703125, -0.0008993148803710938, 0.002948760986328125, 0.006796836853027344, 0.010644912719726562, 0.014492988586425781, 0.018341064453125, 0.02218914031982422, 0.026037216186523438, 0.029885292053222656, 0.033733367919921875, 0.037581443786621094, 0.04142951965332031, 0.04527759552001953, 0.04912567138671875, 0.05297374725341797, 0.05682182312011719, 0.060669898986816406, 0.06451797485351562, 0.06836605072021484, 0.07221412658691406, 0.07606220245361328, 0.0799102783203125, 0.08375835418701172, 0.08760643005371094, 0.09145450592041016, 0.09530258178710938, 0.0991506576538086, 0.10299873352050781, 0.10684680938720703, 0.11069488525390625, 0.11454296112060547, 0.11839103698730469, 0.1222391128540039, 0.12608718872070312, 0.12993526458740234, 0.13378334045410156, 0.13763141632080078, 0.1414794921875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 3.0, 4.0, 3.0, 3.0, 9.0, 7.0, 9.0, 12.0, 13.0, 18.0, 22.0, 41.0, 38.0, 42.0, 55.0, 102.0, 210.0, 812.0, 4159.0, 36730.0, 563527.0, 412347.0, 25962.0, 3218.0, 661.0, 216.0, 91.0, 53.0, 31.0, 28.0, 31.0, 18.0, 22.0, 16.0, 12.0, 6.0, 9.0, 8.0, 4.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.306884765625, -0.2969627380371094, -0.28704071044921875, -0.2771186828613281, -0.2671966552734375, -0.2572746276855469, -0.24735260009765625, -0.23743057250976562, -0.227508544921875, -0.21758651733398438, -0.20766448974609375, -0.19774246215820312, -0.1878204345703125, -0.17789840698242188, -0.16797637939453125, -0.15805435180664062, -0.14813232421875, -0.13821029663085938, -0.12828826904296875, -0.11836624145507812, -0.1084442138671875, -0.09852218627929688, -0.08860015869140625, -0.07867813110351562, -0.068756103515625, -0.058834075927734375, -0.04891204833984375, -0.038990020751953125, -0.0290679931640625, -0.019145965576171875, -0.00922393798828125, 0.000698089599609375, 0.0106201171875, 0.020542144775390625, 0.03046417236328125, 0.040386199951171875, 0.0503082275390625, 0.060230255126953125, 0.07015228271484375, 0.08007431030273438, 0.089996337890625, 0.09991836547851562, 0.10984039306640625, 0.11976242065429688, 0.1296844482421875, 0.13960647583007812, 0.14952850341796875, 0.15945053100585938, 0.16937255859375, 0.17929458618164062, 0.18921661376953125, 0.19913864135742188, 0.2090606689453125, 0.21898269653320312, 0.22890472412109375, 0.23882675170898438, 0.248748779296875, 0.2586708068847656, 0.26859283447265625, 0.2785148620605469, 0.2884368896484375, 0.2983589172363281, 0.30828094482421875, 0.3182029724121094, 0.328125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 5.0, 8.0, 7.0, 13.0, 16.0, 14.0, 22.0, 26.0, 28.0, 33.0, 40.0, 38.0, 47.0, 62.0, 58.0, 60.0, 49.0, 59.0, 44.0, 51.0, 41.0, 42.0, 27.0, 46.0, 35.0, 35.0, 27.0, 13.0, 15.0, 8.0, 12.0, 9.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255859375, -0.2482318878173828, -0.24060440063476562, -0.23297691345214844, -0.22534942626953125, -0.21772193908691406, -0.21009445190429688, -0.2024669647216797, -0.1948394775390625, -0.1872119903564453, -0.17958450317382812, -0.17195701599121094, -0.16432952880859375, -0.15670204162597656, -0.14907455444335938, -0.1414470672607422, -0.133819580078125, -0.1261920928955078, -0.11856460571289062, -0.11093711853027344, -0.10330963134765625, -0.09568214416503906, -0.08805465698242188, -0.08042716979980469, -0.0727996826171875, -0.06517219543457031, -0.057544708251953125, -0.04991722106933594, -0.04228973388671875, -0.03466224670410156, -0.027034759521484375, -0.019407272338867188, -0.01177978515625, -0.0041522979736328125, 0.003475189208984375, 0.011102676391601562, 0.01873016357421875, 0.026357650756835938, 0.033985137939453125, 0.04161262512207031, 0.0492401123046875, 0.05686759948730469, 0.06449508666992188, 0.07212257385253906, 0.07975006103515625, 0.08737754821777344, 0.09500503540039062, 0.10263252258300781, 0.110260009765625, 0.11788749694824219, 0.12551498413085938, 0.13314247131347656, 0.14076995849609375, 0.14839744567871094, 0.15602493286132812, 0.1636524200439453, 0.1712799072265625, 0.1789073944091797, 0.18653488159179688, 0.19416236877441406, 0.20178985595703125, 0.20941734313964844, 0.21704483032226562, 0.2246723175048828, 0.2322998046875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 8.0, 9.0, 10.0, 13.0, 24.0, 37.0, 61.0, 95.0, 199.0, 360.0, 689.0, 1376.0, 3149.0, 7746.0, 21734.0, 65350.0, 188019.0, 353238.0, 257556.0, 97025.0, 32560.0, 11323.0, 4229.0, 1922.0, 862.0, 409.0, 216.0, 126.0, 69.0, 54.0, 24.0, 22.0, 11.0, 7.0, 8.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.02960205078125, -0.028696298599243164, -0.027790546417236328, -0.026884794235229492, -0.025979042053222656, -0.02507328987121582, -0.024167537689208984, -0.02326178550720215, -0.022356033325195312, -0.021450281143188477, -0.02054452896118164, -0.019638776779174805, -0.01873302459716797, -0.017827272415161133, -0.016921520233154297, -0.01601576805114746, -0.015110015869140625, -0.014204263687133789, -0.013298511505126953, -0.012392759323120117, -0.011487007141113281, -0.010581254959106445, -0.00967550277709961, -0.008769750595092773, -0.007863998413085938, -0.0069582462310791016, -0.006052494049072266, -0.00514674186706543, -0.004240989685058594, -0.003335237503051758, -0.002429485321044922, -0.001523733139038086, -0.00061798095703125, 0.00028777122497558594, 0.0011935234069824219, 0.002099275588989258, 0.0030050277709960938, 0.00391077995300293, 0.004816532135009766, 0.0057222843170166016, 0.0066280364990234375, 0.0075337886810302734, 0.00843954086303711, 0.009345293045043945, 0.010251045227050781, 0.011156797409057617, 0.012062549591064453, 0.012968301773071289, 0.013874053955078125, 0.014779806137084961, 0.015685558319091797, 0.016591310501098633, 0.01749706268310547, 0.018402814865112305, 0.01930856704711914, 0.020214319229125977, 0.021120071411132812, 0.02202582359313965, 0.022931575775146484, 0.02383732795715332, 0.024743080139160156, 0.025648832321166992, 0.026554584503173828, 0.027460336685180664, 0.0283660888671875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 8.0, 10.0, 12.0, 13.0, 14.0, 28.0, 23.0, 33.0, 34.0, 26.0, 55.0, 41.0, 67.0, 56.0, 51.0, 31.0, 59.0, 56.0, 61.0, 61.0, 53.0, 48.0, 18.0, 24.0, 22.0, 15.0, 16.0, 6.0, 5.0, 5.0, 9.0, 6.0, 4.0, 3.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.304813385009766e-06, -5.1353126764297485e-06, -4.9658119678497314e-06, -4.796311259269714e-06, -4.626810550689697e-06, -4.45730984210968e-06, -4.287809133529663e-06, -4.118308424949646e-06, -3.948807716369629e-06, -3.779307007789612e-06, -3.6098062992095947e-06, -3.4403055906295776e-06, -3.2708048820495605e-06, -3.1013041734695435e-06, -2.9318034648895264e-06, -2.7623027563095093e-06, -2.592802047729492e-06, -2.423301339149475e-06, -2.253800630569458e-06, -2.084299921989441e-06, -1.914799213409424e-06, -1.7452985048294067e-06, -1.5757977962493896e-06, -1.4062970876693726e-06, -1.2367963790893555e-06, -1.0672956705093384e-06, -8.977949619293213e-07, -7.282942533493042e-07, -5.587935447692871e-07, -3.8929283618927e-07, -2.1979212760925293e-07, -5.029141902923584e-08, 1.1920928955078125e-07, 2.8870999813079834e-07, 4.5821070671081543e-07, 6.277114152908325e-07, 7.972121238708496e-07, 9.667128324508667e-07, 1.1362135410308838e-06, 1.3057142496109009e-06, 1.475214958190918e-06, 1.644715666770935e-06, 1.8142163753509521e-06, 1.9837170839309692e-06, 2.1532177925109863e-06, 2.3227185010910034e-06, 2.4922192096710205e-06, 2.6617199182510376e-06, 2.8312206268310547e-06, 3.0007213354110718e-06, 3.170222043991089e-06, 3.339722752571106e-06, 3.509223461151123e-06, 3.67872416973114e-06, 3.848224878311157e-06, 4.017725586891174e-06, 4.187226295471191e-06, 4.3567270040512085e-06, 4.526227712631226e-06, 4.695728421211243e-06, 4.86522912979126e-06, 5.034729838371277e-06, 5.204230546951294e-06, 5.373731255531311e-06, 5.543231964111328e-06]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 10.0, 8.0, 11.0, 15.0, 26.0, 31.0, 71.0, 125.0, 249.0, 683.0, 2540.0, 15529.0, 139687.0, 640019.0, 220397.0, 23949.0, 3657.0, 925.0, 312.0, 116.0, 61.0, 52.0, 25.0, 13.0, 15.0, 9.0, 0.0, 6.0, 3.0, 1.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049652099609375, -0.04771280288696289, -0.04577350616455078, -0.04383420944213867, -0.04189491271972656, -0.03995561599731445, -0.038016319274902344, -0.036077022552490234, -0.034137725830078125, -0.032198429107666016, -0.030259132385253906, -0.028319835662841797, -0.026380538940429688, -0.024441242218017578, -0.02250194549560547, -0.02056264877319336, -0.01862335205078125, -0.01668405532836914, -0.014744758605957031, -0.012805461883544922, -0.010866165161132812, -0.008926868438720703, -0.006987571716308594, -0.005048274993896484, -0.003108978271484375, -0.0011696815490722656, 0.0007696151733398438, 0.002708911895751953, 0.0046482086181640625, 0.006587505340576172, 0.008526802062988281, 0.01046609878540039, 0.0124053955078125, 0.01434469223022461, 0.01628398895263672, 0.018223285675048828, 0.020162582397460938, 0.022101879119873047, 0.024041175842285156, 0.025980472564697266, 0.027919769287109375, 0.029859066009521484, 0.031798362731933594, 0.0337376594543457, 0.03567695617675781, 0.03761625289916992, 0.03955554962158203, 0.04149484634399414, 0.04343414306640625, 0.04537343978881836, 0.04731273651123047, 0.04925203323364258, 0.05119132995605469, 0.0531306266784668, 0.055069923400878906, 0.057009220123291016, 0.058948516845703125, 0.060887813568115234, 0.06282711029052734, 0.06476640701293945, 0.06670570373535156, 0.06864500045776367, 0.07058429718017578, 0.07252359390258789, 0.074462890625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 1.0, 2.0, 4.0, 4.0, 6.0, 10.0, 15.0, 23.0, 26.0, 25.0, 35.0, 35.0, 54.0, 63.0, 88.0, 81.0, 76.0, 77.0, 78.0, 67.0, 44.0, 51.0, 35.0, 30.0, 22.0, 11.0, 6.0, 13.0, 8.0, 7.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0572509765625, -0.055678367614746094, -0.05410575866699219, -0.05253314971923828, -0.050960540771484375, -0.04938793182373047, -0.04781532287597656, -0.046242713928222656, -0.04467010498046875, -0.043097496032714844, -0.04152488708496094, -0.03995227813720703, -0.038379669189453125, -0.03680706024169922, -0.03523445129394531, -0.033661842346191406, -0.0320892333984375, -0.030516624450683594, -0.028944015502929688, -0.02737140655517578, -0.025798797607421875, -0.02422618865966797, -0.022653579711914062, -0.021080970764160156, -0.01950836181640625, -0.017935752868652344, -0.016363143920898438, -0.014790534973144531, -0.013217926025390625, -0.011645317077636719, -0.010072708129882812, -0.008500099182128906, -0.006927490234375, -0.005354881286621094, -0.0037822723388671875, -0.0022096633911132812, -0.000637054443359375, 0.0009355545043945312, 0.0025081634521484375, 0.004080772399902344, 0.00565338134765625, 0.007225990295410156, 0.008798599243164062, 0.010371208190917969, 0.011943817138671875, 0.013516426086425781, 0.015089035034179688, 0.016661643981933594, 0.0182342529296875, 0.019806861877441406, 0.021379470825195312, 0.02295207977294922, 0.024524688720703125, 0.02609729766845703, 0.027669906616210938, 0.029242515563964844, 0.03081512451171875, 0.032387733459472656, 0.03396034240722656, 0.03553295135498047, 0.037105560302734375, 0.03867816925048828, 0.04025077819824219, 0.041823387145996094, 0.04339599609375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 11.0, 235.0, 728.0, 38.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5454102754592896, -0.41753071546554565, -0.28965112566947937, -0.16177153587341309, -0.03389197587966919, 0.09398758411407471, 0.22186720371246338, 0.3497467637062073, 0.47762632369995117, 0.6055058836936951, 0.733385443687439, 0.8612650632858276, 0.9891446232795715, 1.1170241832733154, 1.244903802871704, 1.3727834224700928, 1.500662922859192, 1.6285425424575806, 1.7564220428466797, 1.8843016624450684, 2.012181282043457, 2.1400609016418457, 2.2679405212402344, 2.395819902420044, 2.5236995220184326, 2.6515791416168213, 2.77945876121521, 2.9073381423950195, 3.035217761993408, 3.163097381591797, 3.2909770011901855, 3.418856620788574, 3.546736240386963, 3.6746158599853516, 3.8024954795837402, 3.930375099182129, 4.058254718780518, 4.186134338378906, 4.314013481140137, 4.441893100738525, 4.569772720336914, 4.697652339935303, 4.825531959533691, 4.95341157913208, 5.081291198730469, 5.209170341491699, 5.337050437927246, 5.464929580688477, 5.592809677124023, 5.720689296722412, 5.848568916320801, 5.9764485359191895, 6.104328155517578, 6.232207298278809, 6.3600873947143555, 6.487966537475586, 6.615846157073975, 6.743725776672363, 6.871605396270752, 6.999485015869141, 7.127364635467529, 7.255244255065918, 7.383123397827148, 7.511003017425537, 7.638882637023926]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 9.0, 11.0, 6.0, 8.0, 7.0, 5.0, 17.0, 14.0, 27.0, 24.0, 24.0, 30.0, 36.0, 41.0, 31.0, 40.0, 47.0, 39.0, 41.0, 43.0, 44.0, 50.0, 35.0, 29.0, 42.0, 30.0, 31.0, 29.0, 24.0, 26.0, 30.0, 14.0, 18.0, 27.0, 13.0, 8.0, 8.0, 10.0, 4.0, 7.0, 5.0, 3.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.536846399307251, -0.5196437835693359, -0.5024411678314209, -0.48523858189582825, -0.4680359661579132, -0.45083335041999817, -0.4336307644844055, -0.4164281487464905, -0.39922553300857544, -0.3820229172706604, -0.36482030153274536, -0.3476177155971527, -0.33041509985923767, -0.31321248412132263, -0.29600989818573, -0.27880728244781494, -0.2616046667098999, -0.24440205097198486, -0.22719945013523102, -0.20999684929847717, -0.19279423356056213, -0.1755916178226471, -0.15838901698589325, -0.1411864161491394, -0.12398380041122437, -0.10678119212388992, -0.08957858383655548, -0.07237597554922104, -0.0551733672618866, -0.037970758974552155, -0.020768150687217712, -0.0035655423998832703, 0.013637006282806396, 0.03083961457014084, 0.04804222285747528, 0.06524483114480972, 0.08244743943214417, 0.09965004771947861, 0.11685265600681305, 0.1340552568435669, 0.15125787258148193, 0.16846048831939697, 0.18566308915615082, 0.20286568999290466, 0.2200683057308197, 0.23727092146873474, 0.2544735074043274, 0.27167612314224243, 0.28887873888015747, 0.3060813546180725, 0.32328397035598755, 0.3404865562915802, 0.35768917202949524, 0.3748917877674103, 0.39209437370300293, 0.40929698944091797, 0.426499605178833, 0.44370222091674805, 0.4609048366546631, 0.47810742259025574, 0.4953100383281708, 0.5125126242637634, 0.5297152400016785, 0.5469178557395935, 0.5641204714775085]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 7.0, 8.0, 23.0, 31.0, 52.0, 94.0, 171.0, 490.0, 1251.0, 2521.0, 6867.0, 26417.0, 216400.0, 1658674.0, 1964349.0, 277523.0, 28688.0, 6616.0, 2239.0, 878.0, 427.0, 213.0, 129.0, 64.0, 47.0, 22.0, 20.0, 11.0, 7.0, 4.0, 9.0, 6.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09283447265625, -0.08952522277832031, -0.08621597290039062, -0.08290672302246094, -0.07959747314453125, -0.07628822326660156, -0.07297897338867188, -0.06966972351074219, -0.0663604736328125, -0.06305122375488281, -0.059741973876953125, -0.05643272399902344, -0.05312347412109375, -0.04981422424316406, -0.046504974365234375, -0.04319572448730469, -0.039886474609375, -0.03657722473144531, -0.033267974853515625, -0.029958724975585938, -0.02664947509765625, -0.023340225219726562, -0.020030975341796875, -0.016721725463867188, -0.0134124755859375, -0.010103225708007812, -0.006793975830078125, -0.0034847259521484375, -0.00017547607421875, 0.0031337738037109375, 0.006443023681640625, 0.009752273559570312, 0.0130615234375, 0.016370773315429688, 0.019680023193359375, 0.022989273071289062, 0.02629852294921875, 0.029607772827148438, 0.032917022705078125, 0.03622627258300781, 0.0395355224609375, 0.04284477233886719, 0.046154022216796875, 0.04946327209472656, 0.05277252197265625, 0.05608177185058594, 0.059391021728515625, 0.06270027160644531, 0.066009521484375, 0.06931877136230469, 0.07262802124023438, 0.07593727111816406, 0.07924652099609375, 0.08255577087402344, 0.08586502075195312, 0.08917427062988281, 0.0924835205078125, 0.09579277038574219, 0.09910202026367188, 0.10241127014160156, 0.10572052001953125, 0.10902976989746094, 0.11233901977539062, 0.11564826965332031, 0.11895751953125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 8.0, 12.0, 16.0, 16.0, 30.0, 37.0, 45.0, 66.0, 78.0, 78.0, 81.0, 95.0, 86.0, 71.0, 60.0, 64.0, 47.0, 33.0, 22.0, 17.0, 20.0, 9.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1270751953125, -0.12259292602539062, -0.11811065673828125, -0.11362838745117188, -0.1091461181640625, -0.10466384887695312, -0.10018157958984375, -0.09569931030273438, -0.091217041015625, -0.08673477172851562, -0.08225250244140625, -0.07777023315429688, -0.0732879638671875, -0.06880569458007812, -0.06432342529296875, -0.059841156005859375, -0.05535888671875, -0.050876617431640625, -0.04639434814453125, -0.041912078857421875, -0.0374298095703125, -0.032947540283203125, -0.02846527099609375, -0.023983001708984375, -0.019500732421875, -0.015018463134765625, -0.01053619384765625, -0.006053924560546875, -0.0015716552734375, 0.002910614013671875, 0.00739288330078125, 0.011875152587890625, 0.016357421875, 0.020839691162109375, 0.02532196044921875, 0.029804229736328125, 0.0342864990234375, 0.038768768310546875, 0.04325103759765625, 0.047733306884765625, 0.052215576171875, 0.056697845458984375, 0.06118011474609375, 0.06566238403320312, 0.0701446533203125, 0.07462692260742188, 0.07910919189453125, 0.08359146118164062, 0.08807373046875, 0.09255599975585938, 0.09703826904296875, 0.10152053833007812, 0.1060028076171875, 0.11048507690429688, 0.11496734619140625, 0.11944961547851562, 0.123931884765625, 0.12841415405273438, 0.13289642333984375, 0.13737869262695312, 0.1418609619140625, 0.14634323120117188, 0.15082550048828125, 0.15530776977539062, 0.1597900390625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 2.0, 4.0, 5.0, 11.0, 20.0, 35.0, 47.0, 113.0, 226.0, 418.0, 1219.0, 3835.0, 19317.0, 248496.0, 3690288.0, 206892.0, 17784.0, 3507.0, 1184.0, 444.0, 205.0, 101.0, 47.0, 21.0, 19.0, 14.0, 1.0, 6.0, 6.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1815185546875, -0.17556190490722656, -0.16960525512695312, -0.1636486053466797, -0.15769195556640625, -0.1517353057861328, -0.14577865600585938, -0.13982200622558594, -0.1338653564453125, -0.12790870666503906, -0.12195205688476562, -0.11599540710449219, -0.11003875732421875, -0.10408210754394531, -0.09812545776367188, -0.09216880798339844, -0.086212158203125, -0.08025550842285156, -0.07429885864257812, -0.06834220886230469, -0.06238555908203125, -0.05642890930175781, -0.050472259521484375, -0.04451560974121094, -0.0385589599609375, -0.03260231018066406, -0.026645660400390625, -0.020689010620117188, -0.01473236083984375, -0.008775711059570312, -0.002819061279296875, 0.0031375885009765625, 0.00909423828125, 0.015050888061523438, 0.021007537841796875, 0.026964187622070312, 0.03292083740234375, 0.03887748718261719, 0.044834136962890625, 0.05079078674316406, 0.0567474365234375, 0.06270408630371094, 0.06866073608398438, 0.07461738586425781, 0.08057403564453125, 0.08653068542480469, 0.09248733520507812, 0.09844398498535156, 0.104400634765625, 0.11035728454589844, 0.11631393432617188, 0.12227058410644531, 0.12822723388671875, 0.1341838836669922, 0.14014053344726562, 0.14609718322753906, 0.1520538330078125, 0.15801048278808594, 0.16396713256835938, 0.1699237823486328, 0.17588043212890625, 0.1818370819091797, 0.18779373168945312, 0.19375038146972656, 0.19970703125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 10.0, 14.0, 6.0, 19.0, 42.0, 30.0, 75.0, 126.0, 267.0, 719.0, 1056.0, 853.0, 376.0, 176.0, 103.0, 46.0, 37.0, 26.0, 25.0, 20.0, 5.0, 11.0, 7.0, 1.0, 2.0, 8.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.147705078125, -0.14288902282714844, -0.13807296752929688, -0.1332569122314453, -0.12844085693359375, -0.12362480163574219, -0.11880874633789062, -0.11399269104003906, -0.1091766357421875, -0.10436058044433594, -0.09954452514648438, -0.09472846984863281, -0.08991241455078125, -0.08509635925292969, -0.08028030395507812, -0.07546424865722656, -0.070648193359375, -0.06583213806152344, -0.061016082763671875, -0.05620002746582031, -0.05138397216796875, -0.04656791687011719, -0.041751861572265625, -0.03693580627441406, -0.0321197509765625, -0.027303695678710938, -0.022487640380859375, -0.017671585083007812, -0.01285552978515625, -0.008039474487304688, -0.003223419189453125, 0.0015926361083984375, 0.00640869140625, 0.011224746704101562, 0.016040802001953125, 0.020856857299804688, 0.02567291259765625, 0.030488967895507812, 0.035305023193359375, 0.04012107849121094, 0.0449371337890625, 0.04975318908691406, 0.054569244384765625, 0.05938529968261719, 0.06420135498046875, 0.06901741027832031, 0.07383346557617188, 0.07864952087402344, 0.083465576171875, 0.08828163146972656, 0.09309768676757812, 0.09791374206542969, 0.10272979736328125, 0.10754585266113281, 0.11236190795898438, 0.11717796325683594, 0.1219940185546875, 0.12681007385253906, 0.13162612915039062, 0.1364421844482422, 0.14125823974609375, 0.1460742950439453, 0.15089035034179688, 0.15570640563964844, 0.1605224609375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 8.0, 14.0, 11.0, 41.0, 78.0, 131.0, 187.0, 215.0, 143.0, 90.0, 44.0, 28.0, 10.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6549149751663208, -0.6368114352226257, -0.6187078952789307, -0.6006042957305908, -0.5825007557868958, -0.5643972158432007, -0.5462936162948608, -0.5281900763511658, -0.5100865364074707, -0.49198299646377563, -0.4738794267177582, -0.4557758569717407, -0.43767231702804565, -0.4195687770843506, -0.40146520733833313, -0.3833616375923157, -0.3652580976486206, -0.34715455770492554, -0.3290509879589081, -0.3109474182128906, -0.29284387826919556, -0.2747403383255005, -0.25663676857948303, -0.23853321373462677, -0.2204296588897705, -0.20232610404491425, -0.18422254920005798, -0.16611899435520172, -0.14801543951034546, -0.1299118846654892, -0.11180832982063293, -0.09370477497577667, -0.07560127973556519, -0.05749772489070892, -0.03939417004585266, -0.0212906152009964, -0.0031870603561401367, 0.014916494488716125, 0.03302004933357239, 0.05112360417842865, 0.06922715902328491, 0.08733071386814117, 0.10543426871299744, 0.1235378235578537, 0.14164137840270996, 0.15974493324756622, 0.17784848809242249, 0.19595204293727875, 0.214055597782135, 0.23215915262699127, 0.25026270747184753, 0.268366277217865, 0.28646981716156006, 0.3045733571052551, 0.3226769268512726, 0.34078049659729004, 0.3588840365409851, 0.3769875764846802, 0.39509114623069763, 0.4131947159767151, 0.43129825592041016, 0.4494017958641052, 0.4675053656101227, 0.48560893535614014, 0.5037124752998352]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 5.0, 1.0, 3.0, 1.0, 4.0, 7.0, 11.0, 3.0, 8.0, 18.0, 19.0, 15.0, 21.0, 25.0, 24.0, 25.0, 34.0, 40.0, 33.0, 42.0, 41.0, 25.0, 40.0, 43.0, 49.0, 42.0, 35.0, 29.0, 32.0, 41.0, 36.0, 29.0, 37.0, 32.0, 21.0, 23.0, 22.0, 11.0, 12.0, 13.0, 9.0, 9.0, 4.0, 6.0, 7.0, 7.0, 5.0, 3.0, 0.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2896244525909424, -0.2805178463459015, -0.271411269903183, -0.2623046636581421, -0.2531980872154236, -0.2440914809703827, -0.234984889626503, -0.2258782982826233, -0.2167717069387436, -0.2076651155948639, -0.1985585242509842, -0.1894519329071045, -0.1803453266620636, -0.1712387502193451, -0.1621321439743042, -0.1530255526304245, -0.1439189612865448, -0.1348123699426651, -0.1257057785987854, -0.1165991798043251, -0.1074925884604454, -0.0983859971165657, -0.08927939832210541, -0.08017280697822571, -0.07106621563434601, -0.06195962429046631, -0.05285302922129631, -0.04374643415212631, -0.03463984280824661, -0.025533251464366913, -0.016426656395196915, -0.0073200613260269165, 0.0017865300178527832, 0.010893123224377632, 0.01999971643090248, 0.02910630963742733, 0.03821290284395218, 0.04731949418783188, 0.05642608925700188, 0.06553268432617188, 0.07463927567005157, 0.08374586701393127, 0.09285245835781097, 0.10195905715227127, 0.11106564849615097, 0.12017223984003067, 0.12927883863449097, 0.13838542997837067, 0.14749202132225037, 0.15659861266613007, 0.16570520401000977, 0.17481179535388947, 0.18391838669776917, 0.19302499294281006, 0.20213158428668976, 0.21123817563056946, 0.22034476697444916, 0.22945135831832886, 0.23855794966220856, 0.24766454100608826, 0.25677114725112915, 0.26587772369384766, 0.27498432993888855, 0.28409093618392944, 0.29319751262664795]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 18.0, 9.0, 19.0, 22.0, 25.0, 47.0, 59.0, 68.0, 89.0, 115.0, 149.0, 214.0, 279.0, 472.0, 774.0, 1341.0, 2586.0, 5174.0, 10899.0, 24139.0, 56688.0, 130789.0, 265630.0, 284020.0, 148615.0, 64079.0, 27519.0, 12138.0, 5724.0, 2801.0, 1508.0, 801.0, 554.0, 339.0, 220.0, 155.0, 129.0, 96.0, 64.0, 51.0, 34.0, 24.0, 16.0, 17.0, 16.0, 5.0, 5.0, 7.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.07879638671875, -0.07641410827636719, -0.07403182983398438, -0.07164955139160156, -0.06926727294921875, -0.06688499450683594, -0.06450271606445312, -0.06212043762207031, -0.0597381591796875, -0.05735588073730469, -0.054973602294921875, -0.05259132385253906, -0.05020904541015625, -0.04782676696777344, -0.045444488525390625, -0.04306221008300781, -0.040679931640625, -0.03829765319824219, -0.035915374755859375, -0.03353309631347656, -0.03115081787109375, -0.028768539428710938, -0.026386260986328125, -0.024003982543945312, -0.0216217041015625, -0.019239425659179688, -0.016857147216796875, -0.014474868774414062, -0.01209259033203125, -0.009710311889648438, -0.007328033447265625, -0.0049457550048828125, -0.0025634765625, -0.0001811981201171875, 0.002201080322265625, 0.0045833587646484375, 0.00696563720703125, 0.009347915649414062, 0.011730194091796875, 0.014112472534179688, 0.0164947509765625, 0.018877029418945312, 0.021259307861328125, 0.023641586303710938, 0.02602386474609375, 0.028406143188476562, 0.030788421630859375, 0.03317070007324219, 0.035552978515625, 0.03793525695800781, 0.040317535400390625, 0.04269981384277344, 0.04508209228515625, 0.04746437072753906, 0.049846649169921875, 0.05222892761230469, 0.0546112060546875, 0.05699348449707031, 0.059375762939453125, 0.06175804138183594, 0.06414031982421875, 0.06652259826660156, 0.06890487670898438, 0.07128715515136719, 0.07366943359375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 14.0, 8.0, 19.0, 29.0, 25.0, 32.0, 48.0, 64.0, 78.0, 65.0, 97.0, 85.0, 84.0, 62.0, 66.0, 50.0, 55.0, 35.0, 26.0, 27.0, 11.0, 7.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11083984375, -0.10705757141113281, -0.10327529907226562, -0.09949302673339844, -0.09571075439453125, -0.09192848205566406, -0.08814620971679688, -0.08436393737792969, -0.0805816650390625, -0.07679939270019531, -0.07301712036132812, -0.06923484802246094, -0.06545257568359375, -0.06167030334472656, -0.057888031005859375, -0.05410575866699219, -0.050323486328125, -0.04654121398925781, -0.042758941650390625, -0.03897666931152344, -0.03519439697265625, -0.03141212463378906, -0.027629852294921875, -0.023847579956054688, -0.0200653076171875, -0.016283035278320312, -0.012500762939453125, -0.008718490600585938, -0.00493621826171875, -0.0011539459228515625, 0.002628326416015625, 0.0064105987548828125, 0.01019287109375, 0.013975143432617188, 0.017757415771484375, 0.021539688110351562, 0.02532196044921875, 0.029104232788085938, 0.032886505126953125, 0.03666877746582031, 0.0404510498046875, 0.04423332214355469, 0.048015594482421875, 0.05179786682128906, 0.05558013916015625, 0.05936241149902344, 0.06314468383789062, 0.06692695617675781, 0.070709228515625, 0.07449150085449219, 0.07827377319335938, 0.08205604553222656, 0.08583831787109375, 0.08962059020996094, 0.09340286254882812, 0.09718513488769531, 0.1009674072265625, 0.10474967956542969, 0.10853195190429688, 0.11231422424316406, 0.11609649658203125, 0.11987876892089844, 0.12366104125976562, 0.1274433135986328, 0.1312255859375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 7.0, 2.0, 9.0, 6.0, 8.0, 17.0, 12.0, 13.0, 14.0, 23.0, 17.0, 25.0, 18.0, 21.0, 36.0, 42.0, 83.0, 202.0, 731.0, 3688.0, 27512.0, 325924.0, 619742.0, 61440.0, 7051.0, 1202.0, 295.0, 92.0, 55.0, 47.0, 35.0, 31.0, 30.0, 23.0, 21.0, 14.0, 8.0, 11.0, 6.0, 10.0, 12.0, 8.0, 3.0, 5.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2125244140625, -0.20548057556152344, -0.19843673706054688, -0.1913928985595703, -0.18434906005859375, -0.1773052215576172, -0.17026138305664062, -0.16321754455566406, -0.1561737060546875, -0.14912986755371094, -0.14208602905273438, -0.1350421905517578, -0.12799835205078125, -0.12095451354980469, -0.11391067504882812, -0.10686683654785156, -0.099822998046875, -0.09277915954589844, -0.08573532104492188, -0.07869148254394531, -0.07164764404296875, -0.06460380554199219, -0.057559967041015625, -0.05051612854003906, -0.0434722900390625, -0.03642845153808594, -0.029384613037109375, -0.022340774536132812, -0.01529693603515625, -0.008253097534179688, -0.001209259033203125, 0.0058345794677734375, 0.01287841796875, 0.019922256469726562, 0.026966094970703125, 0.03400993347167969, 0.04105377197265625, 0.04809761047363281, 0.055141448974609375, 0.06218528747558594, 0.0692291259765625, 0.07627296447753906, 0.08331680297851562, 0.09036064147949219, 0.09740447998046875, 0.10444831848144531, 0.11149215698242188, 0.11853599548339844, 0.125579833984375, 0.13262367248535156, 0.13966751098632812, 0.1467113494873047, 0.15375518798828125, 0.1607990264892578, 0.16784286499023438, 0.17488670349121094, 0.1819305419921875, 0.18897438049316406, 0.19601821899414062, 0.2030620574951172, 0.21010589599609375, 0.2171497344970703, 0.22419357299804688, 0.23123741149902344, 0.23828125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 1.0, 4.0, 4.0, 6.0, 12.0, 12.0, 7.0, 11.0, 12.0, 14.0, 17.0, 21.0, 34.0, 27.0, 39.0, 27.0, 42.0, 41.0, 32.0, 43.0, 46.0, 29.0, 58.0, 46.0, 32.0, 43.0, 38.0, 32.0, 40.0, 24.0, 26.0, 20.0, 25.0, 22.0, 20.0, 14.0, 9.0, 15.0, 18.0, 10.0, 11.0, 7.0, 4.0, 2.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.173583984375, -0.16841888427734375, -0.1632537841796875, -0.15808868408203125, -0.152923583984375, -0.14775848388671875, -0.1425933837890625, -0.13742828369140625, -0.13226318359375, -0.12709808349609375, -0.1219329833984375, -0.11676788330078125, -0.111602783203125, -0.10643768310546875, -0.1012725830078125, -0.09610748291015625, -0.0909423828125, -0.08577728271484375, -0.0806121826171875, -0.07544708251953125, -0.070281982421875, -0.06511688232421875, -0.0599517822265625, -0.05478668212890625, -0.04962158203125, -0.04445648193359375, -0.0392913818359375, -0.03412628173828125, -0.028961181640625, -0.02379608154296875, -0.0186309814453125, -0.01346588134765625, -0.00830078125, -0.00313568115234375, 0.0020294189453125, 0.00719451904296875, 0.012359619140625, 0.01752471923828125, 0.0226898193359375, 0.02785491943359375, 0.03302001953125, 0.03818511962890625, 0.0433502197265625, 0.04851531982421875, 0.053680419921875, 0.05884552001953125, 0.0640106201171875, 0.06917572021484375, 0.0743408203125, 0.07950592041015625, 0.0846710205078125, 0.08983612060546875, 0.095001220703125, 0.10016632080078125, 0.1053314208984375, 0.11049652099609375, 0.11566162109375, 0.12082672119140625, 0.1259918212890625, 0.13115692138671875, 0.136322021484375, 0.14148712158203125, 0.1466522216796875, 0.15181732177734375, 0.156982421875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 5.0, 4.0, 6.0, 11.0, 24.0, 23.0, 38.0, 56.0, 100.0, 129.0, 251.0, 340.0, 574.0, 857.0, 1464.0, 2687.0, 4952.0, 9448.0, 19447.0, 40862.0, 85498.0, 166425.0, 245305.0, 218740.0, 128225.0, 62770.0, 29876.0, 14422.0, 7030.0, 3747.0, 2059.0, 1229.0, 706.0, 440.0, 313.0, 187.0, 98.0, 67.0, 40.0, 36.0, 17.0, 17.0, 11.0, 4.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0178375244140625, -0.017293453216552734, -0.01674938201904297, -0.016205310821533203, -0.015661239624023438, -0.015117168426513672, -0.014573097229003906, -0.01402902603149414, -0.013484954833984375, -0.01294088363647461, -0.012396812438964844, -0.011852741241455078, -0.011308670043945312, -0.010764598846435547, -0.010220527648925781, -0.009676456451416016, -0.00913238525390625, -0.008588314056396484, -0.008044242858886719, -0.007500171661376953, -0.0069561004638671875, -0.006412029266357422, -0.005867958068847656, -0.005323886871337891, -0.004779815673828125, -0.004235744476318359, -0.0036916732788085938, -0.003147602081298828, -0.0026035308837890625, -0.002059459686279297, -0.0015153884887695312, -0.0009713172912597656, -0.00042724609375, 0.00011682510375976562, 0.0006608963012695312, 0.0012049674987792969, 0.0017490386962890625, 0.002293109893798828, 0.0028371810913085938, 0.0033812522888183594, 0.003925323486328125, 0.004469394683837891, 0.005013465881347656, 0.005557537078857422, 0.0061016082763671875, 0.006645679473876953, 0.007189750671386719, 0.007733821868896484, 0.00827789306640625, 0.008821964263916016, 0.009366035461425781, 0.009910106658935547, 0.010454177856445312, 0.010998249053955078, 0.011542320251464844, 0.01208639144897461, 0.012630462646484375, 0.01317453384399414, 0.013718605041503906, 0.014262676239013672, 0.014806747436523438, 0.015350818634033203, 0.01589488983154297, 0.016438961029052734, 0.0169830322265625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 3.0, 5.0, 8.0, 6.0, 12.0, 21.0, 11.0, 28.0, 20.0, 36.0, 35.0, 39.0, 54.0, 64.0, 59.0, 44.0, 70.0, 82.0, 58.0, 53.0, 55.0, 39.0, 34.0, 31.0, 11.0, 25.0, 23.0, 14.0, 10.0, 11.0, 6.0, 10.0, 11.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.887580871582031e-06, -4.715286195278168e-06, -4.542991518974304e-06, -4.370696842670441e-06, -4.198402166366577e-06, -4.026107490062714e-06, -3.85381281375885e-06, -3.6815181374549866e-06, -3.509223461151123e-06, -3.3369287848472595e-06, -3.164634108543396e-06, -2.9923394322395325e-06, -2.820044755935669e-06, -2.6477500796318054e-06, -2.475455403327942e-06, -2.3031607270240784e-06, -2.130866050720215e-06, -1.9585713744163513e-06, -1.7862766981124878e-06, -1.6139820218086243e-06, -1.4416873455047607e-06, -1.2693926692008972e-06, -1.0970979928970337e-06, -9.248033165931702e-07, -7.525086402893066e-07, -5.802139639854431e-07, -4.079192876815796e-07, -2.3562461137771606e-07, -6.332993507385254e-08, 1.0896474123001099e-07, 2.812594175338745e-07, 4.5355409383773804e-07, 6.258487701416016e-07, 7.981434464454651e-07, 9.704381227493286e-07, 1.1427327990531921e-06, 1.3150274753570557e-06, 1.4873221516609192e-06, 1.6596168279647827e-06, 1.8319115042686462e-06, 2.0042061805725098e-06, 2.1765008568763733e-06, 2.348795533180237e-06, 2.5210902094841003e-06, 2.693384885787964e-06, 2.8656795620918274e-06, 3.037974238395691e-06, 3.2102689146995544e-06, 3.382563591003418e-06, 3.5548582673072815e-06, 3.727152943611145e-06, 3.8994476199150085e-06, 4.071742296218872e-06, 4.244036972522736e-06, 4.416331648826599e-06, 4.588626325130463e-06, 4.760921001434326e-06, 4.93321567773819e-06, 5.105510354042053e-06, 5.277805030345917e-06, 5.45009970664978e-06, 5.622394382953644e-06, 5.794689059257507e-06, 5.966983735561371e-06, 6.139278411865234e-06]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 4.0, 10.0, 14.0, 16.0, 32.0, 41.0, 68.0, 96.0, 161.0, 313.0, 560.0, 1377.0, 4136.0, 17803.0, 105526.0, 486392.0, 353496.0, 62151.0, 11360.0, 2897.0, 977.0, 453.0, 252.0, 154.0, 99.0, 55.0, 42.0, 18.0, 15.0, 12.0, 8.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04034423828125, -0.038992881774902344, -0.03764152526855469, -0.03629016876220703, -0.034938812255859375, -0.03358745574951172, -0.03223609924316406, -0.030884742736816406, -0.02953338623046875, -0.028182029724121094, -0.026830673217773438, -0.02547931671142578, -0.024127960205078125, -0.02277660369873047, -0.021425247192382812, -0.020073890686035156, -0.0187225341796875, -0.017371177673339844, -0.016019821166992188, -0.014668464660644531, -0.013317108154296875, -0.011965751647949219, -0.010614395141601562, -0.009263038635253906, -0.00791168212890625, -0.006560325622558594, -0.0052089691162109375, -0.0038576126098632812, -0.002506256103515625, -0.0011548995971679688, 0.0001964569091796875, 0.0015478134155273438, 0.002899169921875, 0.004250526428222656, 0.0056018829345703125, 0.006953239440917969, 0.008304595947265625, 0.009655952453613281, 0.011007308959960938, 0.012358665466308594, 0.01371002197265625, 0.015061378479003906, 0.016412734985351562, 0.01776409149169922, 0.019115447998046875, 0.02046680450439453, 0.021818161010742188, 0.023169517517089844, 0.0245208740234375, 0.025872230529785156, 0.027223587036132812, 0.02857494354248047, 0.029926300048828125, 0.03127765655517578, 0.03262901306152344, 0.033980369567871094, 0.03533172607421875, 0.036683082580566406, 0.03803443908691406, 0.03938579559326172, 0.040737152099609375, 0.04208850860595703, 0.04343986511230469, 0.044791221618652344, 0.046142578125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 7.0, 10.0, 8.0, 8.0, 25.0, 24.0, 22.0, 28.0, 34.0, 29.0, 57.0, 46.0, 57.0, 64.0, 66.0, 54.0, 56.0, 66.0, 64.0, 57.0, 39.0, 39.0, 26.0, 16.0, 22.0, 17.0, 11.0, 14.0, 12.0, 5.0, 6.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.029541015625, -0.028631210327148438, -0.027721405029296875, -0.026811599731445312, -0.02590179443359375, -0.024991989135742188, -0.024082183837890625, -0.023172378540039062, -0.0222625732421875, -0.021352767944335938, -0.020442962646484375, -0.019533157348632812, -0.01862335205078125, -0.017713546752929688, -0.016803741455078125, -0.015893936157226562, -0.014984130859375, -0.014074325561523438, -0.013164520263671875, -0.012254714965820312, -0.01134490966796875, -0.010435104370117188, -0.009525299072265625, -0.008615493774414062, -0.0077056884765625, -0.0067958831787109375, -0.005886077880859375, -0.0049762725830078125, -0.00406646728515625, -0.0031566619873046875, -0.002246856689453125, -0.0013370513916015625, -0.00042724609375, 0.0004825592041015625, 0.001392364501953125, 0.0023021697998046875, 0.00321197509765625, 0.0041217803955078125, 0.005031585693359375, 0.0059413909912109375, 0.0068511962890625, 0.0077610015869140625, 0.008670806884765625, 0.009580612182617188, 0.01049041748046875, 0.011400222778320312, 0.012310028076171875, 0.013219833374023438, 0.014129638671875, 0.015039443969726562, 0.015949249267578125, 0.016859054565429688, 0.01776885986328125, 0.018678665161132812, 0.019588470458984375, 0.020498275756835938, 0.0214080810546875, 0.022317886352539062, 0.023227691650390625, 0.024137496948242188, 0.02504730224609375, 0.025957107543945312, 0.026866912841796875, 0.027776718139648438, 0.0286865234375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 10.0, 60.0, 386.0, 462.0, 79.0, 12.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3410359025001526, -0.2860242426395416, -0.23101258277893066, -0.1760009378194809, -0.12098927795886993, -0.06597763299942017, -0.010965973138809204, 0.04404568672180176, 0.09905734658241272, 0.15406900644302368, 0.20908066630363464, 0.2640923261642456, 0.3191039562225342, 0.37411561608314514, 0.4291272759437561, 0.48413893580436707, 0.539150595664978, 0.5941622257232666, 0.6491739153862, 0.7041855454444885, 0.7591972351074219, 0.8142088651657104, 0.869220495223999, 0.9242321848869324, 0.9792438745498657, 1.0342555046081543, 1.0892671346664429, 1.144278883934021, 1.1992905139923096, 1.2543021440505981, 1.3093137741088867, 1.3643255233764648, 1.4193371534347534, 1.474348783493042, 1.5293604135513306, 1.5843721628189087, 1.6393837928771973, 1.6943954229354858, 1.7494070529937744, 1.8044188022613525, 1.8594304323196411, 1.9144420623779297, 1.9694536924362183, 2.024465322494507, 2.079477071762085, 2.134488582611084, 2.189500331878662, 2.2445120811462402, 2.2995235919952393, 2.3545353412628174, 2.4095468521118164, 2.4645586013793945, 2.5195701122283936, 2.5745818614959717, 2.62959361076355, 2.684605121612549, 2.739616870880127, 2.794628620147705, 2.849640130996704, 2.9046518802642822, 2.9596633911132812, 3.0146751403808594, 3.0696868896484375, 3.1246984004974365, 3.1797101497650146]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 8.0, 5.0, 7.0, 5.0, 7.0, 12.0, 14.0, 13.0, 10.0, 20.0, 16.0, 26.0, 34.0, 30.0, 25.0, 31.0, 34.0, 43.0, 40.0, 39.0, 51.0, 51.0, 53.0, 38.0, 39.0, 31.0, 35.0, 43.0, 37.0, 28.0, 20.0, 25.0, 24.0, 14.0, 15.0, 14.0, 12.0, 13.0, 12.0, 6.0, 9.0, 4.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.4288681745529175, -0.4158878028392792, -0.4029074013233185, -0.3899270296096802, -0.37694665789604187, -0.36396628618240356, -0.35098588466644287, -0.33800551295280457, -0.32502514123916626, -0.31204476952552795, -0.29906436800956726, -0.28608399629592896, -0.27310362458229065, -0.26012325286865234, -0.24714285135269165, -0.23416247963905334, -0.22118207812309265, -0.20820169150829315, -0.19522131979465485, -0.18224093317985535, -0.16926056146621704, -0.15628017485141754, -0.14329978823661804, -0.13031941652297974, -0.11733902990818024, -0.10435865074396133, -0.09137827157974243, -0.07839788496494293, -0.06541750580072403, -0.05243712663650513, -0.03945674002170563, -0.026476360857486725, -0.013495981693267822, -0.0005156006664037704, 0.012464780360460281, 0.025445163249969482, 0.038425542414188385, 0.05140592157840729, 0.06438630819320679, 0.07736668735742569, 0.09034706652164459, 0.1033274456858635, 0.1163078248500824, 0.1292882114648819, 0.1422685980796814, 0.1552489697933197, 0.1682293564081192, 0.1812097430229187, 0.194190114736557, 0.2071705013513565, 0.2201508730649948, 0.2331312596797943, 0.24611163139343262, 0.2590920329093933, 0.2720724046230316, 0.2850527763366699, 0.2980331778526306, 0.3110135495662689, 0.3239939510822296, 0.3369743227958679, 0.3499546945095062, 0.36293506622314453, 0.3759154677391052, 0.38889583945274353, 0.40187621116638184]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 11.0, 20.0, 30.0, 40.0, 58.0, 88.0, 286.0, 1447.0, 7604.0, 214075.0, 3695944.0, 264845.0, 8307.0, 891.0, 296.0, 128.0, 89.0, 33.0, 28.0, 22.0, 12.0, 9.0, 10.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.156494140625, -0.15059471130371094, -0.14469528198242188, -0.1387958526611328, -0.13289642333984375, -0.1269969940185547, -0.12109756469726562, -0.11519813537597656, -0.1092987060546875, -0.10339927673339844, -0.09749984741210938, -0.09160041809082031, -0.08570098876953125, -0.07980155944824219, -0.07390213012695312, -0.06800270080566406, -0.062103271484375, -0.05620384216308594, -0.050304412841796875, -0.04440498352050781, -0.03850555419921875, -0.03260612487792969, -0.026706695556640625, -0.020807266235351562, -0.0149078369140625, -0.009008407592773438, -0.003108978271484375, 0.0027904510498046875, 0.00868988037109375, 0.014589309692382812, 0.020488739013671875, 0.026388168334960938, 0.03228759765625, 0.03818702697753906, 0.044086456298828125, 0.04998588562011719, 0.05588531494140625, 0.06178474426269531, 0.06768417358398438, 0.07358360290527344, 0.0794830322265625, 0.08538246154785156, 0.09128189086914062, 0.09718132019042969, 0.10308074951171875, 0.10898017883300781, 0.11487960815429688, 0.12077903747558594, 0.126678466796875, 0.13257789611816406, 0.13847732543945312, 0.1443767547607422, 0.15027618408203125, 0.1561756134033203, 0.16207504272460938, 0.16797447204589844, 0.1738739013671875, 0.17977333068847656, 0.18567276000976562, 0.1915721893310547, 0.19747161865234375, 0.2033710479736328, 0.20927047729492188, 0.21516990661621094, 0.2210693359375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 18.0, 16.0, 21.0, 32.0, 47.0, 41.0, 72.0, 68.0, 89.0, 72.0, 89.0, 75.0, 69.0, 63.0, 58.0, 48.0, 29.0, 33.0, 21.0, 14.0, 7.0, 6.0, 6.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.101318359375, -0.09730339050292969, -0.09328842163085938, -0.08927345275878906, -0.08525848388671875, -0.08124351501464844, -0.07722854614257812, -0.07321357727050781, -0.0691986083984375, -0.06518363952636719, -0.061168670654296875, -0.05715370178222656, -0.05313873291015625, -0.04912376403808594, -0.045108795166015625, -0.04109382629394531, -0.037078857421875, -0.03306388854980469, -0.029048919677734375, -0.025033950805664062, -0.02101898193359375, -0.017004013061523438, -0.012989044189453125, -0.008974075317382812, -0.0049591064453125, -0.0009441375732421875, 0.003070831298828125, 0.0070858001708984375, 0.01110076904296875, 0.015115737915039062, 0.019130706787109375, 0.023145675659179688, 0.02716064453125, 0.031175613403320312, 0.035190582275390625, 0.03920555114746094, 0.04322052001953125, 0.04723548889160156, 0.051250457763671875, 0.05526542663574219, 0.0592803955078125, 0.06329536437988281, 0.06731033325195312, 0.07132530212402344, 0.07534027099609375, 0.07935523986816406, 0.08337020874023438, 0.08738517761230469, 0.091400146484375, 0.09541511535644531, 0.09943008422851562, 0.10344505310058594, 0.10746002197265625, 0.11147499084472656, 0.11548995971679688, 0.11950492858886719, 0.1235198974609375, 0.1275348663330078, 0.13154983520507812, 0.13556480407714844, 0.13957977294921875, 0.14359474182128906, 0.14760971069335938, 0.1516246795654297, 0.1556396484375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 13.0, 22.0, 48.0, 79.0, 121.0, 245.0, 562.0, 1266.0, 3950.0, 19444.0, 264547.0, 3655861.0, 224326.0, 17670.0, 3731.0, 1283.0, 530.0, 265.0, 122.0, 80.0, 39.0, 27.0, 19.0, 10.0, 5.0, 10.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1842041015625, -0.17965316772460938, -0.17510223388671875, -0.17055130004882812, -0.1660003662109375, -0.16144943237304688, -0.15689849853515625, -0.15234756469726562, -0.147796630859375, -0.14324569702148438, -0.13869476318359375, -0.13414382934570312, -0.1295928955078125, -0.12504196166992188, -0.12049102783203125, -0.11594009399414062, -0.11138916015625, -0.10683822631835938, -0.10228729248046875, -0.09773635864257812, -0.0931854248046875, -0.08863449096679688, -0.08408355712890625, -0.07953262329101562, -0.074981689453125, -0.07043075561523438, -0.06587982177734375, -0.061328887939453125, -0.0567779541015625, -0.052227020263671875, -0.04767608642578125, -0.043125152587890625, -0.03857421875, -0.034023284912109375, -0.02947235107421875, -0.024921417236328125, -0.0203704833984375, -0.015819549560546875, -0.01126861572265625, -0.006717681884765625, -0.002166748046875, 0.002384185791015625, 0.00693511962890625, 0.011486053466796875, 0.0160369873046875, 0.020587921142578125, 0.02513885498046875, 0.029689788818359375, 0.03424072265625, 0.038791656494140625, 0.04334259033203125, 0.047893524169921875, 0.0524444580078125, 0.056995391845703125, 0.06154632568359375, 0.06609725952148438, 0.070648193359375, 0.07519912719726562, 0.07975006103515625, 0.08430099487304688, 0.0888519287109375, 0.09340286254882812, 0.09795379638671875, 0.10250473022460938, 0.1070556640625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 3.0, 1.0, 8.0, 9.0, 15.0, 23.0, 45.0, 110.0, 308.0, 871.0, 1313.0, 770.0, 309.0, 142.0, 54.0, 31.0, 26.0, 14.0, 8.0, 2.0, 6.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08758544921875, -0.08351612091064453, -0.07944679260253906, -0.0753774642944336, -0.07130813598632812, -0.06723880767822266, -0.06316947937011719, -0.05910015106201172, -0.05503082275390625, -0.05096149444580078, -0.04689216613769531, -0.042822837829589844, -0.038753509521484375, -0.034684181213378906, -0.030614852905273438, -0.02654552459716797, -0.0224761962890625, -0.01840686798095703, -0.014337539672851562, -0.010268211364746094, -0.006198883056640625, -0.0021295547485351562, 0.0019397735595703125, 0.006009101867675781, 0.01007843017578125, 0.014147758483886719, 0.018217086791992188, 0.022286415100097656, 0.026355743408203125, 0.030425071716308594, 0.03449440002441406, 0.03856372833251953, 0.042633056640625, 0.04670238494873047, 0.05077171325683594, 0.054841041564941406, 0.058910369873046875, 0.06297969818115234, 0.06704902648925781, 0.07111835479736328, 0.07518768310546875, 0.07925701141357422, 0.08332633972167969, 0.08739566802978516, 0.09146499633789062, 0.0955343246459961, 0.09960365295410156, 0.10367298126220703, 0.1077423095703125, 0.11181163787841797, 0.11588096618652344, 0.1199502944946289, 0.12401962280273438, 0.12808895111083984, 0.1321582794189453, 0.13622760772705078, 0.14029693603515625, 0.14436626434326172, 0.1484355926513672, 0.15250492095947266, 0.15657424926757812, 0.1606435775756836, 0.16471290588378906, 0.16878223419189453, 0.1728515625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 15.0, 15.0, 36.0, 74.0, 143.0, 193.0, 192.0, 149.0, 97.0, 56.0, 17.0, 7.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45875707268714905, -0.4444212317466736, -0.4300854206085205, -0.41574957966804504, -0.4014137387275696, -0.3870779275894165, -0.37274208664894104, -0.3584062457084656, -0.3440704345703125, -0.32973459362983704, -0.31539878249168396, -0.3010629415512085, -0.2867271304130554, -0.27239128947257996, -0.2580554485321045, -0.24371962249279022, -0.22938379645347595, -0.21504797041416168, -0.2007121443748474, -0.18637630343437195, -0.17204047739505768, -0.1577046513557434, -0.14336881041526794, -0.12903298437595367, -0.1146971583366394, -0.10036133229732513, -0.08602549880743027, -0.0716896653175354, -0.05735383927822113, -0.04301801323890686, -0.028682179749011993, -0.014346346259117126, -1.049041748046875e-05, 0.0143253393471241, 0.028661169111728668, 0.04299699887633324, 0.057332828640937805, 0.07166865468025208, 0.08600448817014694, 0.10034032166004181, 0.11467614769935608, 0.12901197373867035, 0.14334779977798462, 0.15768364071846008, 0.17201946675777435, 0.18635529279708862, 0.2006911337375641, 0.21502695977687836, 0.22936278581619263, 0.2436986118555069, 0.25803443789482117, 0.27237027883529663, 0.2867060899734497, 0.30104193091392517, 0.31537777185440063, 0.3297135829925537, 0.3440494239330292, 0.35838526487350464, 0.3727210760116577, 0.3870569169521332, 0.40139275789260864, 0.4157285690307617, 0.4300644099712372, 0.44440025091171265, 0.4587360620498657]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 7.0, 6.0, 5.0, 11.0, 9.0, 17.0, 15.0, 22.0, 25.0, 19.0, 33.0, 39.0, 40.0, 41.0, 41.0, 47.0, 35.0, 39.0, 53.0, 53.0, 39.0, 52.0, 46.0, 48.0, 37.0, 26.0, 34.0, 31.0, 27.0, 23.0, 22.0, 8.0, 17.0, 17.0, 7.0, 10.0, 4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26183056831359863, -0.2539794147014618, -0.24612826108932495, -0.23827709257602692, -0.23042593896389008, -0.22257478535175323, -0.2147236168384552, -0.20687246322631836, -0.19902130961418152, -0.19117015600204468, -0.18331900238990784, -0.1754678338766098, -0.16761668026447296, -0.15976552665233612, -0.15191435813903809, -0.14406320452690125, -0.1362120509147644, -0.12836089730262756, -0.12050973623991013, -0.11265857517719269, -0.10480742156505585, -0.096956267952919, -0.08910510689020157, -0.08125394582748413, -0.07340279221534729, -0.06555163860321045, -0.05770047754049301, -0.04984932020306587, -0.04199816286563873, -0.034147005528211594, -0.026295848190784454, -0.018444690853357315, -0.010593533515930176, -0.0027423761785030365, 0.005108781158924103, 0.012959938496351242, 0.02081109583377838, 0.02866225317120552, 0.03651341050863266, 0.0443645678460598, 0.05221572518348694, 0.06006688252091408, 0.06791803985834122, 0.07576920092105865, 0.0836203545331955, 0.09147150814533234, 0.09932266920804977, 0.10717383027076721, 0.11502498388290405, 0.1228761374950409, 0.13072729110717773, 0.13857845962047577, 0.1464296132326126, 0.15428076684474945, 0.16213193535804749, 0.16998308897018433, 0.17783424258232117, 0.185685396194458, 0.19353654980659485, 0.20138771831989288, 0.20923887193202972, 0.21709002554416656, 0.2249411940574646, 0.23279234766960144, 0.24064350128173828]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 4.0, 9.0, 9.0, 2.0, 10.0, 16.0, 23.0, 31.0, 52.0, 77.0, 107.0, 175.0, 254.0, 374.0, 668.0, 1292.0, 2577.0, 5684.0, 14469.0, 42457.0, 135304.0, 377512.0, 313139.0, 101006.0, 32368.0, 11463.0, 4627.0, 2152.0, 1082.0, 587.0, 346.0, 206.0, 160.0, 91.0, 91.0, 43.0, 28.0, 20.0, 17.0, 13.0, 7.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10321044921875, -0.1002511978149414, -0.09729194641113281, -0.09433269500732422, -0.09137344360351562, -0.08841419219970703, -0.08545494079589844, -0.08249568939208984, -0.07953643798828125, -0.07657718658447266, -0.07361793518066406, -0.07065868377685547, -0.06769943237304688, -0.06474018096923828, -0.06178092956542969, -0.058821678161621094, -0.0558624267578125, -0.052903175354003906, -0.04994392395019531, -0.04698467254638672, -0.044025421142578125, -0.04106616973876953, -0.03810691833496094, -0.035147666931152344, -0.03218841552734375, -0.029229164123535156, -0.026269912719726562, -0.02331066131591797, -0.020351409912109375, -0.01739215850830078, -0.014432907104492188, -0.011473655700683594, -0.008514404296875, -0.005555152893066406, -0.0025959014892578125, 0.00036334991455078125, 0.003322601318359375, 0.006281852722167969, 0.009241104125976562, 0.012200355529785156, 0.01515960693359375, 0.018118858337402344, 0.021078109741210938, 0.02403736114501953, 0.026996612548828125, 0.02995586395263672, 0.03291511535644531, 0.035874366760253906, 0.0388336181640625, 0.041792869567871094, 0.04475212097167969, 0.04771137237548828, 0.050670623779296875, 0.05362987518310547, 0.05658912658691406, 0.059548377990722656, 0.06250762939453125, 0.06546688079833984, 0.06842613220214844, 0.07138538360595703, 0.07434463500976562, 0.07730388641357422, 0.08026313781738281, 0.0832223892211914, 0.086181640625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 14.0, 24.0, 21.0, 33.0, 47.0, 53.0, 63.0, 86.0, 80.0, 77.0, 92.0, 83.0, 78.0, 69.0, 55.0, 42.0, 21.0, 24.0, 11.0, 8.0, 3.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.115966796875, -0.11193656921386719, -0.10790634155273438, -0.10387611389160156, -0.09984588623046875, -0.09581565856933594, -0.09178543090820312, -0.08775520324707031, -0.0837249755859375, -0.07969474792480469, -0.07566452026367188, -0.07163429260253906, -0.06760406494140625, -0.06357383728027344, -0.059543609619140625, -0.05551338195800781, -0.051483154296875, -0.04745292663574219, -0.043422698974609375, -0.03939247131347656, -0.03536224365234375, -0.03133201599121094, -0.027301788330078125, -0.023271560668945312, -0.0192413330078125, -0.015211105346679688, -0.011180877685546875, -0.0071506500244140625, -0.00312042236328125, 0.0009098052978515625, 0.004940032958984375, 0.008970260620117188, 0.01300048828125, 0.017030715942382812, 0.021060943603515625, 0.025091171264648438, 0.02912139892578125, 0.03315162658691406, 0.037181854248046875, 0.04121208190917969, 0.0452423095703125, 0.04927253723144531, 0.053302764892578125, 0.05733299255371094, 0.06136322021484375, 0.06539344787597656, 0.06942367553710938, 0.07345390319824219, 0.077484130859375, 0.08151435852050781, 0.08554458618164062, 0.08957481384277344, 0.09360504150390625, 0.09763526916503906, 0.10166549682617188, 0.10569572448730469, 0.1097259521484375, 0.11375617980957031, 0.11778640747070312, 0.12181663513183594, 0.12584686279296875, 0.12987709045410156, 0.13390731811523438, 0.1379375457763672, 0.1419677734375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 2.0, 6.0, 6.0, 14.0, 11.0, 14.0, 28.0, 16.0, 25.0, 33.0, 41.0, 37.0, 46.0, 125.0, 320.0, 1555.0, 14385.0, 339491.0, 660823.0, 28148.0, 2530.0, 446.0, 136.0, 64.0, 51.0, 38.0, 31.0, 33.0, 20.0, 15.0, 12.0, 6.0, 14.0, 8.0, 8.0, 4.0, 4.0, 3.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.29248046875, -0.2841529846191406, -0.27582550048828125, -0.2674980163574219, -0.2591705322265625, -0.2508430480957031, -0.24251556396484375, -0.23418807983398438, -0.225860595703125, -0.21753311157226562, -0.20920562744140625, -0.20087814331054688, -0.1925506591796875, -0.18422317504882812, -0.17589569091796875, -0.16756820678710938, -0.15924072265625, -0.15091323852539062, -0.14258575439453125, -0.13425827026367188, -0.1259307861328125, -0.11760330200195312, -0.10927581787109375, -0.10094833374023438, -0.092620849609375, -0.08429336547851562, -0.07596588134765625, -0.06763839721679688, -0.0593109130859375, -0.050983428955078125, -0.04265594482421875, -0.034328460693359375, -0.0260009765625, -0.017673492431640625, -0.00934600830078125, -0.001018524169921875, 0.0073089599609375, 0.015636444091796875, 0.02396392822265625, 0.032291412353515625, 0.040618896484375, 0.048946380615234375, 0.05727386474609375, 0.06560134887695312, 0.0739288330078125, 0.08225631713867188, 0.09058380126953125, 0.09891128540039062, 0.10723876953125, 0.11556625366210938, 0.12389373779296875, 0.13222122192382812, 0.1405487060546875, 0.14887619018554688, 0.15720367431640625, 0.16553115844726562, 0.173858642578125, 0.18218612670898438, 0.19051361083984375, 0.19884109497070312, 0.2071685791015625, 0.21549606323242188, 0.22382354736328125, 0.23215103149414062, 0.240478515625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 5.0, 7.0, 9.0, 10.0, 10.0, 15.0, 23.0, 26.0, 27.0, 36.0, 44.0, 32.0, 48.0, 44.0, 51.0, 46.0, 57.0, 40.0, 51.0, 55.0, 49.0, 56.0, 26.0, 38.0, 37.0, 25.0, 27.0, 21.0, 17.0, 12.0, 18.0, 15.0, 4.0, 2.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.163818359375, -0.1577434539794922, -0.15166854858398438, -0.14559364318847656, -0.13951873779296875, -0.13344383239746094, -0.12736892700195312, -0.12129402160644531, -0.1152191162109375, -0.10914421081542969, -0.10306930541992188, -0.09699440002441406, -0.09091949462890625, -0.08484458923339844, -0.07876968383789062, -0.07269477844238281, -0.066619873046875, -0.06054496765136719, -0.054470062255859375, -0.04839515686035156, -0.04232025146484375, -0.03624534606933594, -0.030170440673828125, -0.024095535278320312, -0.0180206298828125, -0.011945724487304688, -0.005870819091796875, 0.0002040863037109375, 0.00627899169921875, 0.012353897094726562, 0.018428802490234375, 0.024503707885742188, 0.03057861328125, 0.03665351867675781, 0.042728424072265625, 0.04880332946777344, 0.05487823486328125, 0.06095314025878906, 0.06702804565429688, 0.07310295104980469, 0.0791778564453125, 0.08525276184082031, 0.09132766723632812, 0.09740257263183594, 0.10347747802734375, 0.10955238342285156, 0.11562728881835938, 0.12170219421386719, 0.127777099609375, 0.1338520050048828, 0.13992691040039062, 0.14600181579589844, 0.15207672119140625, 0.15815162658691406, 0.16422653198242188, 0.1703014373779297, 0.1763763427734375, 0.1824512481689453, 0.18852615356445312, 0.19460105895996094, 0.20067596435546875, 0.20675086975097656, 0.21282577514648438, 0.2189006805419922, 0.2249755859375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 11.0, 8.0, 11.0, 19.0, 20.0, 24.0, 36.0, 72.0, 91.0, 150.0, 278.0, 504.0, 1046.0, 2053.0, 4560.0, 11242.0, 31809.0, 105173.0, 356227.0, 369523.0, 111282.0, 33485.0, 11792.0, 4674.0, 2070.0, 1112.0, 505.0, 281.0, 147.0, 121.0, 60.0, 43.0, 21.0, 18.0, 21.0, 15.0, 12.0, 10.0, 8.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0251312255859375, -0.024370193481445312, -0.023609161376953125, -0.022848129272460938, -0.02208709716796875, -0.021326065063476562, -0.020565032958984375, -0.019804000854492188, -0.01904296875, -0.018281936645507812, -0.017520904541015625, -0.016759872436523438, -0.01599884033203125, -0.015237808227539062, -0.014476776123046875, -0.013715744018554688, -0.0129547119140625, -0.012193679809570312, -0.011432647705078125, -0.010671615600585938, -0.00991058349609375, -0.009149551391601562, -0.008388519287109375, -0.0076274871826171875, -0.006866455078125, -0.0061054229736328125, -0.005344390869140625, -0.0045833587646484375, -0.00382232666015625, -0.0030612945556640625, -0.002300262451171875, -0.0015392303466796875, -0.0007781982421875, -1.71661376953125e-05, 0.000743865966796875, 0.0015048980712890625, 0.00226593017578125, 0.0030269622802734375, 0.003787994384765625, 0.0045490264892578125, 0.00531005859375, 0.0060710906982421875, 0.006832122802734375, 0.0075931549072265625, 0.00835418701171875, 0.009115219116210938, 0.009876251220703125, 0.010637283325195312, 0.0113983154296875, 0.012159347534179688, 0.012920379638671875, 0.013681411743164062, 0.01444244384765625, 0.015203475952148438, 0.015964508056640625, 0.016725540161132812, 0.017486572265625, 0.018247604370117188, 0.019008636474609375, 0.019769668579101562, 0.02053070068359375, 0.021291732788085938, 0.022052764892578125, 0.022813796997070312, 0.0235748291015625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 4.0, 10.0, 6.0, 11.0, 13.0, 12.0, 21.0, 13.0, 43.0, 28.0, 47.0, 68.0, 60.0, 109.0, 82.0, 74.0, 68.0, 65.0, 65.0, 42.0, 32.0, 35.0, 16.0, 21.0, 12.0, 7.0, 7.0, 7.0, 10.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.900859832763672e-06, -5.709938704967499e-06, -5.519017577171326e-06, -5.328096449375153e-06, -5.1371753215789795e-06, -4.946254193782806e-06, -4.755333065986633e-06, -4.56441193819046e-06, -4.373490810394287e-06, -4.182569682598114e-06, -3.991648554801941e-06, -3.800727427005768e-06, -3.6098062992095947e-06, -3.4188851714134216e-06, -3.2279640436172485e-06, -3.0370429158210754e-06, -2.8461217880249023e-06, -2.6552006602287292e-06, -2.464279532432556e-06, -2.273358404636383e-06, -2.08243727684021e-06, -1.8915161490440369e-06, -1.7005950212478638e-06, -1.5096738934516907e-06, -1.3187527656555176e-06, -1.1278316378593445e-06, -9.369105100631714e-07, -7.459893822669983e-07, -5.550682544708252e-07, -3.641471266746521e-07, -1.73225998878479e-07, 1.7695128917694092e-08, 2.086162567138672e-07, 3.995373845100403e-07, 5.904585123062134e-07, 7.813796401023865e-07, 9.723007678985596e-07, 1.1632218956947327e-06, 1.3541430234909058e-06, 1.5450641512870789e-06, 1.735985279083252e-06, 1.926906406879425e-06, 2.117827534675598e-06, 2.3087486624717712e-06, 2.4996697902679443e-06, 2.6905909180641174e-06, 2.8815120458602905e-06, 3.0724331736564636e-06, 3.2633543014526367e-06, 3.45427542924881e-06, 3.645196557044983e-06, 3.836117684841156e-06, 4.027038812637329e-06, 4.217959940433502e-06, 4.408881068229675e-06, 4.599802196025848e-06, 4.7907233238220215e-06, 4.981644451618195e-06, 5.172565579414368e-06, 5.363486707210541e-06, 5.554407835006714e-06, 5.745328962802887e-06, 5.93625009059906e-06, 6.127171218395233e-06, 6.318092346191406e-06]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 3.0, 9.0, 4.0, 8.0, 16.0, 31.0, 68.0, 149.0, 269.0, 632.0, 1666.0, 5296.0, 21947.0, 124424.0, 585995.0, 253608.0, 41414.0, 8825.0, 2588.0, 864.0, 383.0, 148.0, 83.0, 37.0, 32.0, 19.0, 6.0, 10.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033843994140625, -0.03266429901123047, -0.03148460388183594, -0.030304908752441406, -0.029125213623046875, -0.027945518493652344, -0.026765823364257812, -0.02558612823486328, -0.02440643310546875, -0.02322673797607422, -0.022047042846679688, -0.020867347717285156, -0.019687652587890625, -0.018507957458496094, -0.017328262329101562, -0.01614856719970703, -0.0149688720703125, -0.013789176940917969, -0.012609481811523438, -0.011429786682128906, -0.010250091552734375, -0.009070396423339844, -0.007890701293945312, -0.006711006164550781, -0.00553131103515625, -0.004351615905761719, -0.0031719207763671875, -0.0019922256469726562, -0.000812530517578125, 0.00036716461181640625, 0.0015468597412109375, 0.0027265548706054688, 0.00390625, 0.005085945129394531, 0.0062656402587890625, 0.007445335388183594, 0.008625030517578125, 0.009804725646972656, 0.010984420776367188, 0.012164115905761719, 0.01334381103515625, 0.014523506164550781, 0.015703201293945312, 0.016882896423339844, 0.018062591552734375, 0.019242286682128906, 0.020421981811523438, 0.02160167694091797, 0.0227813720703125, 0.02396106719970703, 0.025140762329101562, 0.026320457458496094, 0.027500152587890625, 0.028679847717285156, 0.029859542846679688, 0.03103923797607422, 0.03221893310546875, 0.03339862823486328, 0.03457832336425781, 0.035758018493652344, 0.036937713623046875, 0.038117408752441406, 0.03929710388183594, 0.04047679901123047, 0.041656494140625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 7.0, 3.0, 6.0, 7.0, 16.0, 14.0, 12.0, 15.0, 24.0, 29.0, 37.0, 41.0, 47.0, 58.0, 76.0, 92.0, 79.0, 86.0, 75.0, 53.0, 37.0, 36.0, 26.0, 18.0, 13.0, 21.0, 15.0, 7.0, 15.0, 3.0, 4.0, 3.0, 4.0, 5.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.02557373046875, -0.024779319763183594, -0.023984909057617188, -0.02319049835205078, -0.022396087646484375, -0.02160167694091797, -0.020807266235351562, -0.020012855529785156, -0.01921844482421875, -0.018424034118652344, -0.017629623413085938, -0.01683521270751953, -0.016040802001953125, -0.015246391296386719, -0.014451980590820312, -0.013657569885253906, -0.0128631591796875, -0.012068748474121094, -0.011274337768554688, -0.010479927062988281, -0.009685516357421875, -0.008891105651855469, -0.008096694946289062, -0.007302284240722656, -0.00650787353515625, -0.005713462829589844, -0.0049190521240234375, -0.004124641418457031, -0.003330230712890625, -0.0025358200073242188, -0.0017414093017578125, -0.0009469985961914062, -0.000152587890625, 0.0006418228149414062, 0.0014362335205078125, 0.0022306442260742188, 0.003025054931640625, 0.0038194656372070312, 0.0046138763427734375, 0.005408287048339844, 0.00620269775390625, 0.006997108459472656, 0.0077915191650390625, 0.008585929870605469, 0.009380340576171875, 0.010174751281738281, 0.010969161987304688, 0.011763572692871094, 0.0125579833984375, 0.013352394104003906, 0.014146804809570312, 0.014941215515136719, 0.015735626220703125, 0.01653003692626953, 0.017324447631835938, 0.018118858337402344, 0.01891326904296875, 0.019707679748535156, 0.020502090454101562, 0.02129650115966797, 0.022090911865234375, 0.02288532257080078, 0.023679733276367188, 0.024474143981933594, 0.0252685546875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 10.0, 15.0, 22.0, 36.0, 54.0, 74.0, 111.0, 141.0, 174.0, 138.0, 89.0, 46.0, 40.0, 22.0, 11.0, 9.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5754420757293701, -0.5627127289772034, -0.5499834418296814, -0.5372540950775146, -0.5245248079299927, -0.5117954611778259, -0.49906617403030396, -0.4863368272781372, -0.47360754013061523, -0.4608782231807709, -0.4481489062309265, -0.43541958928108215, -0.4226902723312378, -0.40996095538139343, -0.3972316384315491, -0.3845022916793823, -0.37177297472953796, -0.3590436577796936, -0.34631434082984924, -0.3335850238800049, -0.3208557069301605, -0.30812638998031616, -0.2953970432281494, -0.28266775608062744, -0.2699384093284607, -0.25720909237861633, -0.24447977542877197, -0.2317504584789276, -0.21902114152908325, -0.2062918245792389, -0.19356249272823334, -0.18083317577838898, -0.168103888630867, -0.15537457168102264, -0.14264525473117828, -0.12991592288017273, -0.11718661338090897, -0.1044572964310646, -0.09172797203063965, -0.07899865508079529, -0.06626933813095093, -0.05354002118110657, -0.04081070050597191, -0.02808137983083725, -0.01535206288099289, -0.002622745931148529, 0.010106578469276428, 0.02283589541912079, 0.03556521236896515, 0.04829452931880951, 0.06102384999394417, 0.07375317066907883, 0.08648248761892319, 0.09921180456876755, 0.1119411289691925, 0.12467044591903687, 0.13739976286888123, 0.15012907981872559, 0.16285839676856995, 0.1755877137184143, 0.18831703066825867, 0.20104634761810303, 0.21377567946910858, 0.22650499641895294, 0.2392343133687973]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 7.0, 5.0, 5.0, 12.0, 9.0, 22.0, 22.0, 25.0, 19.0, 21.0, 32.0, 34.0, 30.0, 39.0, 41.0, 29.0, 36.0, 31.0, 49.0, 45.0, 46.0, 42.0, 43.0, 34.0, 32.0, 39.0, 39.0, 17.0, 32.0, 22.0, 28.0, 20.0, 15.0, 11.0, 14.0, 8.0, 11.0, 8.0, 7.0, 2.0, 4.0, 3.0, 1.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.4168620705604553, -0.40348106622695923, -0.39010006189346313, -0.37671905755996704, -0.36333802342414856, -0.34995701909065247, -0.33657601475715637, -0.3231950104236603, -0.3098139762878418, -0.2964329719543457, -0.2830519676208496, -0.2696709632873535, -0.25628992915153503, -0.24290892481803894, -0.22952792048454285, -0.21614691615104675, -0.20276591181755066, -0.18938490748405457, -0.17600388824939728, -0.16262288391590118, -0.1492418646812439, -0.1358608603477478, -0.12247985601425171, -0.10909884423017502, -0.09571783244609833, -0.08233682066202164, -0.06895580887794495, -0.05557480454444885, -0.04219379276037216, -0.02881278097629547, -0.015431776642799377, -0.0020507648587226868, 0.011330246925354004, 0.024711256846785545, 0.03809226676821709, 0.05147327482700348, 0.06485428661108017, 0.07823529839515686, 0.09161630272865295, 0.10499731451272964, 0.11837832629680634, 0.13175933063030243, 0.14514034986495972, 0.1585213541984558, 0.1719023585319519, 0.1852833777666092, 0.19866438210010529, 0.21204540133476257, 0.22542640566825867, 0.23880741000175476, 0.25218841433525085, 0.26556944847106934, 0.27895045280456543, 0.2923314571380615, 0.3057124614715576, 0.3190934658050537, 0.3324744701385498, 0.3458554744720459, 0.359236478805542, 0.3726174831390381, 0.38599851727485657, 0.39937952160835266, 0.41276052594184875, 0.42614153027534485, 0.43952256441116333]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 4.0, 14.0, 9.0, 24.0, 29.0, 91.0, 247.0, 610.0, 1130.0, 3035.0, 11932.0, 92342.0, 1079063.0, 2714329.0, 262004.0, 23429.0, 4311.0, 1031.0, 309.0, 145.0, 70.0, 43.0, 27.0, 16.0, 14.0, 7.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06939697265625, -0.06627178192138672, -0.06314659118652344, -0.060021400451660156, -0.056896209716796875, -0.053771018981933594, -0.05064582824707031, -0.04752063751220703, -0.04439544677734375, -0.04127025604248047, -0.03814506530761719, -0.035019874572753906, -0.031894683837890625, -0.028769493103027344, -0.025644302368164062, -0.02251911163330078, -0.0193939208984375, -0.01626873016357422, -0.013143539428710938, -0.010018348693847656, -0.006893157958984375, -0.0037679672241210938, -0.0006427764892578125, 0.0024824142456054688, 0.00560760498046875, 0.008732795715332031, 0.011857986450195312, 0.014983177185058594, 0.018108367919921875, 0.021233558654785156, 0.024358749389648438, 0.02748394012451172, 0.030609130859375, 0.03373432159423828, 0.03685951232910156, 0.039984703063964844, 0.043109893798828125, 0.046235084533691406, 0.04936027526855469, 0.05248546600341797, 0.05561065673828125, 0.05873584747314453, 0.06186103820800781, 0.0649862289428711, 0.06811141967773438, 0.07123661041259766, 0.07436180114746094, 0.07748699188232422, 0.0806121826171875, 0.08373737335205078, 0.08686256408691406, 0.08998775482177734, 0.09311294555664062, 0.0962381362915039, 0.09936332702636719, 0.10248851776123047, 0.10561370849609375, 0.10873889923095703, 0.11186408996582031, 0.1149892807006836, 0.11811447143554688, 0.12123966217041016, 0.12436485290527344, 0.12749004364013672, 0.130615234375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 8.0, 11.0, 8.0, 15.0, 35.0, 30.0, 47.0, 55.0, 65.0, 56.0, 85.0, 83.0, 89.0, 84.0, 62.0, 70.0, 52.0, 45.0, 28.0, 18.0, 17.0, 12.0, 12.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09869384765625, -0.0947275161743164, -0.09076118469238281, -0.08679485321044922, -0.08282852172851562, -0.07886219024658203, -0.07489585876464844, -0.07092952728271484, -0.06696319580078125, -0.06299686431884766, -0.05903053283691406, -0.05506420135498047, -0.051097869873046875, -0.04713153839111328, -0.04316520690917969, -0.039198875427246094, -0.0352325439453125, -0.031266212463378906, -0.027299880981445312, -0.02333354949951172, -0.019367218017578125, -0.015400886535644531, -0.011434555053710938, -0.007468223571777344, -0.00350189208984375, 0.00046443939208984375, 0.0044307708740234375, 0.008397102355957031, 0.012363433837890625, 0.01632976531982422, 0.020296096801757812, 0.024262428283691406, 0.028228759765625, 0.032195091247558594, 0.03616142272949219, 0.04012775421142578, 0.044094085693359375, 0.04806041717529297, 0.05202674865722656, 0.055993080139160156, 0.05995941162109375, 0.06392574310302734, 0.06789207458496094, 0.07185840606689453, 0.07582473754882812, 0.07979106903076172, 0.08375740051269531, 0.0877237319946289, 0.0916900634765625, 0.0956563949584961, 0.09962272644042969, 0.10358905792236328, 0.10755538940429688, 0.11152172088623047, 0.11548805236816406, 0.11945438385009766, 0.12342071533203125, 0.12738704681396484, 0.13135337829589844, 0.13531970977783203, 0.13928604125976562, 0.14325237274169922, 0.1472187042236328, 0.1511850357055664, 0.1551513671875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 5.0, 16.0, 15.0, 45.0, 60.0, 134.0, 297.0, 805.0, 2293.0, 11859.0, 385527.0, 3739371.0, 46868.0, 4748.0, 1264.0, 508.0, 213.0, 100.0, 59.0, 35.0, 25.0, 17.0, 13.0, 2.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.256103515625, -0.2498950958251953, -0.24368667602539062, -0.23747825622558594, -0.23126983642578125, -0.22506141662597656, -0.21885299682617188, -0.2126445770263672, -0.2064361572265625, -0.2002277374267578, -0.19401931762695312, -0.18781089782714844, -0.18160247802734375, -0.17539405822753906, -0.16918563842773438, -0.1629772186279297, -0.156768798828125, -0.1505603790283203, -0.14435195922851562, -0.13814353942871094, -0.13193511962890625, -0.12572669982910156, -0.11951828002929688, -0.11330986022949219, -0.1071014404296875, -0.10089302062988281, -0.09468460083007812, -0.08847618103027344, -0.08226776123046875, -0.07605934143066406, -0.06985092163085938, -0.06364250183105469, -0.05743408203125, -0.05122566223144531, -0.045017242431640625, -0.03880882263183594, -0.03260040283203125, -0.026391983032226562, -0.020183563232421875, -0.013975143432617188, -0.0077667236328125, -0.0015583038330078125, 0.004650115966796875, 0.010858535766601562, 0.01706695556640625, 0.023275375366210938, 0.029483795166015625, 0.03569221496582031, 0.041900634765625, 0.04810905456542969, 0.054317474365234375, 0.06052589416503906, 0.06673431396484375, 0.07294273376464844, 0.07915115356445312, 0.08535957336425781, 0.0915679931640625, 0.09777641296386719, 0.10398483276367188, 0.11019325256347656, 0.11640167236328125, 0.12261009216308594, 0.12881851196289062, 0.1350269317626953, 0.1412353515625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 14.0, 23.0, 62.0, 203.0, 828.0, 1807.0, 780.0, 203.0, 68.0, 33.0, 25.0, 8.0, 2.0, 6.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1077880859375, -0.1027679443359375, -0.097747802734375, -0.0927276611328125, -0.08770751953125, -0.0826873779296875, -0.077667236328125, -0.0726470947265625, -0.067626953125, -0.0626068115234375, -0.057586669921875, -0.0525665283203125, -0.04754638671875, -0.0425262451171875, -0.037506103515625, -0.0324859619140625, -0.0274658203125, -0.0224456787109375, -0.017425537109375, -0.0124053955078125, -0.00738525390625, -0.0023651123046875, 0.002655029296875, 0.0076751708984375, 0.0126953125, 0.0177154541015625, 0.022735595703125, 0.0277557373046875, 0.03277587890625, 0.0377960205078125, 0.042816162109375, 0.0478363037109375, 0.0528564453125, 0.0578765869140625, 0.062896728515625, 0.0679168701171875, 0.07293701171875, 0.0779571533203125, 0.082977294921875, 0.0879974365234375, 0.093017578125, 0.0980377197265625, 0.103057861328125, 0.1080780029296875, 0.11309814453125, 0.1181182861328125, 0.123138427734375, 0.1281585693359375, 0.1331787109375, 0.1381988525390625, 0.143218994140625, 0.1482391357421875, 0.15325927734375, 0.1582794189453125, 0.163299560546875, 0.1683197021484375, 0.17333984375, 0.1783599853515625, 0.183380126953125, 0.1884002685546875, 0.19342041015625, 0.1984405517578125, 0.203460693359375, 0.2084808349609375, 0.2135009765625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 7.0, 9.0, 29.0, 47.0, 80.0, 128.0, 169.0, 185.0, 141.0, 116.0, 46.0, 28.0, 12.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.5105319619178772, -0.500556230545044, -0.4905804395675659, -0.4806046783924103, -0.47062891721725464, -0.4606531858444214, -0.45067742466926575, -0.4407016634941101, -0.43072590231895447, -0.42075014114379883, -0.4107743799686432, -0.40079861879348755, -0.3908228874206543, -0.38084712624549866, -0.370871365070343, -0.3608956038951874, -0.35091984272003174, -0.3409440815448761, -0.33096832036972046, -0.3209925591945648, -0.3110167980194092, -0.3010410666465759, -0.2910653054714203, -0.28108954429626465, -0.271113783121109, -0.26113802194595337, -0.25116226077079773, -0.24118651449680328, -0.23121075332164764, -0.221234992146492, -0.21125924587249756, -0.20128348469734192, -0.19130770862102509, -0.18133194744586945, -0.171356201171875, -0.16138043999671936, -0.15140467882156372, -0.14142891764640808, -0.13145315647125244, -0.121477410197258, -0.11150164902210236, -0.10152588784694672, -0.09155013412237167, -0.08157438039779663, -0.07159861922264099, -0.06162286177277565, -0.05164710432291031, -0.041671350598335266, -0.031695589423179626, -0.021719831973314285, -0.011744074523448944, -0.001768317073583603, 0.008207440376281738, 0.01818319782614708, 0.02815895527601242, 0.03813470900058746, 0.0481104701757431, 0.058086227625608444, 0.06806198507547379, 0.07803773880004883, 0.08801349997520447, 0.09798926115036011, 0.10796501487493515, 0.11794076859951019, 0.12791652977466583]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 5.0, 7.0, 6.0, 8.0, 9.0, 11.0, 13.0, 19.0, 25.0, 11.0, 24.0, 20.0, 31.0, 37.0, 26.0, 30.0, 40.0, 37.0, 39.0, 44.0, 47.0, 45.0, 48.0, 30.0, 43.0, 31.0, 38.0, 26.0, 40.0, 32.0, 35.0, 22.0, 26.0, 20.0, 12.0, 13.0, 13.0, 9.0, 6.0, 6.0, 3.0, 1.0, 10.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14292824268341064, -0.13808299601078033, -0.13323773443698883, -0.12839248776435852, -0.12354724109172821, -0.1187019869685173, -0.1138567328453064, -0.10901148617267609, -0.10416623204946518, -0.09932097792625427, -0.09447573125362396, -0.08963047713041306, -0.08478522300720215, -0.07993997633457184, -0.07509472221136093, -0.07024946808815002, -0.06540422141551971, -0.060558971017599106, -0.0557137206196785, -0.05086846649646759, -0.04602321609854698, -0.04117796570062637, -0.036332711577415466, -0.03148746117949486, -0.02664221078157425, -0.02179696038365364, -0.016951708123087883, -0.0121064567938447, -0.007261205464601517, -0.002415955066680908, 0.0024292971938848495, 0.007274549454450607, 0.012119799852371216, 0.016965050250291824, 0.021810302510857582, 0.02665555477142334, 0.03150080516934395, 0.03634605556726456, 0.041191309690475464, 0.04603656008839607, 0.05088181048631668, 0.05572706088423729, 0.0605723112821579, 0.0654175654053688, 0.07026281952857971, 0.07510806620121002, 0.07995332032442093, 0.08479857444763184, 0.08964382112026215, 0.09448907524347305, 0.09933432191610336, 0.10417957603931427, 0.10902482271194458, 0.11387007683515549, 0.1187153309583664, 0.1235605776309967, 0.1284058392047882, 0.13325108587741852, 0.13809634745121002, 0.14294159412384033, 0.14778684079647064, 0.15263208746910095, 0.15747734904289246, 0.16232259571552277, 0.16716784238815308]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 3.0, 7.0, 11.0, 9.0, 27.0, 34.0, 38.0, 60.0, 64.0, 96.0, 130.0, 245.0, 345.0, 475.0, 841.0, 1499.0, 2986.0, 6183.0, 14801.0, 37997.0, 108053.0, 290875.0, 350160.0, 147252.0, 51086.0, 19174.0, 7942.0, 3603.0, 1823.0, 983.0, 587.0, 363.0, 250.0, 157.0, 106.0, 76.0, 54.0, 47.0, 34.0, 23.0, 15.0, 9.0, 7.0, 3.0, 8.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07470703125, -0.07238292694091797, -0.07005882263183594, -0.0677347183227539, -0.06541061401367188, -0.06308650970458984, -0.06076240539550781, -0.05843830108642578, -0.05611419677734375, -0.05379009246826172, -0.05146598815917969, -0.049141883850097656, -0.046817779541015625, -0.044493675231933594, -0.04216957092285156, -0.03984546661376953, -0.0375213623046875, -0.03519725799560547, -0.03287315368652344, -0.030549049377441406, -0.028224945068359375, -0.025900840759277344, -0.023576736450195312, -0.02125263214111328, -0.01892852783203125, -0.01660442352294922, -0.014280319213867188, -0.011956214904785156, -0.009632110595703125, -0.007308006286621094, -0.0049839019775390625, -0.0026597976684570312, -0.000335693359375, 0.0019884109497070312, 0.0043125152587890625, 0.006636619567871094, 0.008960723876953125, 0.011284828186035156, 0.013608932495117188, 0.01593303680419922, 0.01825714111328125, 0.02058124542236328, 0.022905349731445312, 0.025229454040527344, 0.027553558349609375, 0.029877662658691406, 0.03220176696777344, 0.03452587127685547, 0.0368499755859375, 0.03917407989501953, 0.04149818420410156, 0.043822288513183594, 0.046146392822265625, 0.048470497131347656, 0.05079460144042969, 0.05311870574951172, 0.05544281005859375, 0.05776691436767578, 0.06009101867675781, 0.062415122985839844, 0.06473922729492188, 0.0670633316040039, 0.06938743591308594, 0.07171154022216797, 0.07403564453125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 5.0, 12.0, 9.0, 25.0, 40.0, 50.0, 62.0, 71.0, 82.0, 104.0, 98.0, 73.0, 93.0, 68.0, 57.0, 41.0, 36.0, 21.0, 13.0, 9.0, 8.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11029052734375, -0.10612201690673828, -0.10195350646972656, -0.09778499603271484, -0.09361648559570312, -0.0894479751586914, -0.08527946472167969, -0.08111095428466797, -0.07694244384765625, -0.07277393341064453, -0.06860542297363281, -0.0644369125366211, -0.060268402099609375, -0.056099891662597656, -0.05193138122558594, -0.04776287078857422, -0.0435943603515625, -0.03942584991455078, -0.03525733947753906, -0.031088829040527344, -0.026920318603515625, -0.022751808166503906, -0.018583297729492188, -0.014414787292480469, -0.01024627685546875, -0.006077766418457031, -0.0019092559814453125, 0.0022592544555664062, 0.006427764892578125, 0.010596275329589844, 0.014764785766601562, 0.01893329620361328, 0.023101806640625, 0.02727031707763672, 0.03143882751464844, 0.035607337951660156, 0.039775848388671875, 0.043944358825683594, 0.04811286926269531, 0.05228137969970703, 0.05644989013671875, 0.06061840057373047, 0.06478691101074219, 0.0689554214477539, 0.07312393188476562, 0.07729244232177734, 0.08146095275878906, 0.08562946319580078, 0.0897979736328125, 0.09396648406982422, 0.09813499450683594, 0.10230350494384766, 0.10647201538085938, 0.1106405258178711, 0.11480903625488281, 0.11897754669189453, 0.12314605712890625, 0.12731456756591797, 0.1314830780029297, 0.1356515884399414, 0.13982009887695312, 0.14398860931396484, 0.14815711975097656, 0.15232563018798828, 0.156494140625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 7.0, 2.0, 1.0, 8.0, 7.0, 11.0, 14.0, 14.0, 24.0, 23.0, 21.0, 28.0, 29.0, 39.0, 54.0, 76.0, 246.0, 1035.0, 7049.0, 93976.0, 803427.0, 131547.0, 8966.0, 1234.0, 292.0, 111.0, 49.0, 49.0, 31.0, 29.0, 32.0, 30.0, 20.0, 14.0, 13.0, 14.0, 6.0, 7.0, 9.0, 3.0, 1.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2042236328125, -0.1973133087158203, -0.19040298461914062, -0.18349266052246094, -0.17658233642578125, -0.16967201232910156, -0.16276168823242188, -0.1558513641357422, -0.1489410400390625, -0.1420307159423828, -0.13512039184570312, -0.12821006774902344, -0.12129974365234375, -0.11438941955566406, -0.10747909545898438, -0.10056877136230469, -0.093658447265625, -0.08674812316894531, -0.07983779907226562, -0.07292747497558594, -0.06601715087890625, -0.05910682678222656, -0.052196502685546875, -0.04528617858886719, -0.0383758544921875, -0.03146553039550781, -0.024555206298828125, -0.017644882202148438, -0.01073455810546875, -0.0038242340087890625, 0.003086090087890625, 0.009996414184570312, 0.01690673828125, 0.023817062377929688, 0.030727386474609375, 0.03763771057128906, 0.04454803466796875, 0.05145835876464844, 0.058368682861328125, 0.06527900695800781, 0.0721893310546875, 0.07909965515136719, 0.08600997924804688, 0.09292030334472656, 0.09983062744140625, 0.10674095153808594, 0.11365127563476562, 0.12056159973144531, 0.127471923828125, 0.1343822479248047, 0.14129257202148438, 0.14820289611816406, 0.15511322021484375, 0.16202354431152344, 0.16893386840820312, 0.1758441925048828, 0.1827545166015625, 0.1896648406982422, 0.19657516479492188, 0.20348548889160156, 0.21039581298828125, 0.21730613708496094, 0.22421646118164062, 0.2311267852783203, 0.238037109375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 1.0, 1.0, 7.0, 8.0, 6.0, 5.0, 16.0, 18.0, 12.0, 25.0, 39.0, 33.0, 32.0, 33.0, 43.0, 39.0, 33.0, 47.0, 48.0, 44.0, 54.0, 46.0, 47.0, 38.0, 42.0, 38.0, 33.0, 38.0, 33.0, 21.0, 29.0, 18.0, 20.0, 13.0, 13.0, 5.0, 4.0, 6.0, 3.0, 6.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1873779296875, -0.18207359313964844, -0.17676925659179688, -0.1714649200439453, -0.16616058349609375, -0.1608562469482422, -0.15555191040039062, -0.15024757385253906, -0.1449432373046875, -0.13963890075683594, -0.13433456420898438, -0.1290302276611328, -0.12372589111328125, -0.11842155456542969, -0.11311721801757812, -0.10781288146972656, -0.102508544921875, -0.09720420837402344, -0.09189987182617188, -0.08659553527832031, -0.08129119873046875, -0.07598686218261719, -0.07068252563476562, -0.06537818908691406, -0.0600738525390625, -0.05476951599121094, -0.049465179443359375, -0.04416084289550781, -0.03885650634765625, -0.03355216979980469, -0.028247833251953125, -0.022943496704101562, -0.01763916015625, -0.012334823608398438, -0.007030487060546875, -0.0017261505126953125, 0.00357818603515625, 0.008882522583007812, 0.014186859130859375, 0.019491195678710938, 0.0247955322265625, 0.030099868774414062, 0.035404205322265625, 0.04070854187011719, 0.04601287841796875, 0.05131721496582031, 0.056621551513671875, 0.06192588806152344, 0.067230224609375, 0.07253456115722656, 0.07783889770507812, 0.08314323425292969, 0.08844757080078125, 0.09375190734863281, 0.09905624389648438, 0.10436058044433594, 0.1096649169921875, 0.11496925354003906, 0.12027359008789062, 0.1255779266357422, 0.13088226318359375, 0.1361865997314453, 0.14149093627929688, 0.14679527282714844, 0.152099609375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 1.0, 8.0, 5.0, 5.0, 23.0, 16.0, 32.0, 28.0, 52.0, 59.0, 110.0, 142.0, 246.0, 389.0, 588.0, 970.0, 1672.0, 3177.0, 6617.0, 15334.0, 43636.0, 159050.0, 413375.0, 280732.0, 78638.0, 24159.0, 9519.0, 4437.0, 2140.0, 1244.0, 752.0, 469.0, 317.0, 191.0, 145.0, 88.0, 52.0, 33.0, 31.0, 18.0, 18.0, 13.0, 6.0, 5.0, 7.0, 6.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0216827392578125, -0.020928144454956055, -0.02017354965209961, -0.019418954849243164, -0.01866436004638672, -0.017909765243530273, -0.017155170440673828, -0.016400575637817383, -0.015645980834960938, -0.014891386032104492, -0.014136791229248047, -0.013382196426391602, -0.012627601623535156, -0.011873006820678711, -0.011118412017822266, -0.01036381721496582, -0.009609222412109375, -0.00885462760925293, -0.008100032806396484, -0.007345438003540039, -0.006590843200683594, -0.0058362483978271484, -0.005081653594970703, -0.004327058792114258, -0.0035724639892578125, -0.002817869186401367, -0.002063274383544922, -0.0013086795806884766, -0.0005540847778320312, 0.00020051002502441406, 0.0009551048278808594, 0.0017096996307373047, 0.00246429443359375, 0.0032188892364501953, 0.003973484039306641, 0.004728078842163086, 0.005482673645019531, 0.0062372684478759766, 0.006991863250732422, 0.007746458053588867, 0.008501052856445312, 0.009255647659301758, 0.010010242462158203, 0.010764837265014648, 0.011519432067871094, 0.012274026870727539, 0.013028621673583984, 0.01378321647644043, 0.014537811279296875, 0.01529240608215332, 0.016047000885009766, 0.01680159568786621, 0.017556190490722656, 0.0183107852935791, 0.019065380096435547, 0.019819974899291992, 0.020574569702148438, 0.021329164505004883, 0.022083759307861328, 0.022838354110717773, 0.02359294891357422, 0.024347543716430664, 0.02510213851928711, 0.025856733322143555, 0.026611328125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 6.0, 1.0, 8.0, 2.0, 8.0, 20.0, 24.0, 23.0, 33.0, 44.0, 51.0, 83.0, 83.0, 92.0, 85.0, 97.0, 75.0, 55.0, 55.0, 41.0, 34.0, 18.0, 21.0, 15.0, 4.0, 2.0, 3.0, 6.0, 3.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.735324859619141e-06, -6.498768925666809e-06, -6.2622129917144775e-06, -6.025657057762146e-06, -5.7891011238098145e-06, -5.552545189857483e-06, -5.315989255905151e-06, -5.07943332195282e-06, -4.842877388000488e-06, -4.606321454048157e-06, -4.369765520095825e-06, -4.133209586143494e-06, -3.896653652191162e-06, -3.6600977182388306e-06, -3.423541784286499e-06, -3.1869858503341675e-06, -2.950429916381836e-06, -2.7138739824295044e-06, -2.477318048477173e-06, -2.2407621145248413e-06, -2.0042061805725098e-06, -1.7676502466201782e-06, -1.5310943126678467e-06, -1.2945383787155151e-06, -1.0579824447631836e-06, -8.21426510810852e-07, -5.848705768585205e-07, -3.4831464290618896e-07, -1.1175870895385742e-07, 1.2479722499847412e-07, 3.6135315895080566e-07, 5.979090929031372e-07, 8.344650268554688e-07, 1.0710209608078003e-06, 1.3075768947601318e-06, 1.5441328287124634e-06, 1.780688762664795e-06, 2.0172446966171265e-06, 2.253800630569458e-06, 2.4903565645217896e-06, 2.726912498474121e-06, 2.9634684324264526e-06, 3.200024366378784e-06, 3.4365803003311157e-06, 3.6731362342834473e-06, 3.909692168235779e-06, 4.14624810218811e-06, 4.382804036140442e-06, 4.6193599700927734e-06, 4.855915904045105e-06, 5.0924718379974365e-06, 5.329027771949768e-06, 5.5655837059021e-06, 5.802139639854431e-06, 6.038695573806763e-06, 6.275251507759094e-06, 6.511807441711426e-06, 6.748363375663757e-06, 6.984919309616089e-06, 7.22147524356842e-06, 7.458031177520752e-06, 7.694587111473083e-06, 7.931143045425415e-06, 8.167698979377747e-06, 8.404254913330078e-06]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 11.0, 19.0, 26.0, 54.0, 134.0, 491.0, 2956.0, 43674.0, 895646.0, 99715.0, 4830.0, 688.0, 159.0, 73.0, 36.0, 19.0, 13.0, 7.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058929443359375, -0.05620241165161133, -0.053475379943847656, -0.050748348236083984, -0.04802131652832031, -0.04529428482055664, -0.04256725311279297, -0.0398402214050293, -0.037113189697265625, -0.03438615798950195, -0.03165912628173828, -0.02893209457397461, -0.026205062866210938, -0.023478031158447266, -0.020750999450683594, -0.018023967742919922, -0.01529693603515625, -0.012569904327392578, -0.009842872619628906, -0.007115840911865234, -0.0043888092041015625, -0.0016617774963378906, 0.0010652542114257812, 0.003792285919189453, 0.006519317626953125, 0.009246349334716797, 0.011973381042480469, 0.01470041275024414, 0.017427444458007812, 0.020154476165771484, 0.022881507873535156, 0.025608539581298828, 0.0283355712890625, 0.031062602996826172, 0.033789634704589844, 0.036516666412353516, 0.03924369812011719, 0.04197072982788086, 0.04469776153564453, 0.0474247932434082, 0.050151824951171875, 0.05287885665893555, 0.05560588836669922, 0.05833292007446289, 0.06105995178222656, 0.06378698348999023, 0.0665140151977539, 0.06924104690551758, 0.07196807861328125, 0.07469511032104492, 0.0774221420288086, 0.08014917373657227, 0.08287620544433594, 0.08560323715209961, 0.08833026885986328, 0.09105730056762695, 0.09378433227539062, 0.0965113639831543, 0.09923839569091797, 0.10196542739868164, 0.10469245910644531, 0.10741949081420898, 0.11014652252197266, 0.11287355422973633, 0.1156005859375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 14.0, 13.0, 23.0, 24.0, 84.0, 117.0, 185.0, 191.0, 144.0, 90.0, 42.0, 27.0, 19.0, 10.0, 5.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08636474609375, -0.0843653678894043, -0.0823659896850586, -0.08036661148071289, -0.07836723327636719, -0.07636785507202148, -0.07436847686767578, -0.07236909866333008, -0.07036972045898438, -0.06837034225463867, -0.06637096405029297, -0.06437158584594727, -0.06237220764160156, -0.06037282943725586, -0.058373451232910156, -0.05637407302856445, -0.05437469482421875, -0.05237531661987305, -0.050375938415527344, -0.04837656021118164, -0.04637718200683594, -0.044377803802490234, -0.04237842559814453, -0.04037904739379883, -0.038379669189453125, -0.03638029098510742, -0.03438091278076172, -0.032381534576416016, -0.030382156372070312, -0.02838277816772461, -0.026383399963378906, -0.024384021759033203, -0.0223846435546875, -0.020385265350341797, -0.018385887145996094, -0.01638650894165039, -0.014387130737304688, -0.012387752532958984, -0.010388374328613281, -0.008388996124267578, -0.006389617919921875, -0.004390239715576172, -0.0023908615112304688, -0.0003914833068847656, 0.0016078948974609375, 0.0036072731018066406, 0.005606651306152344, 0.007606029510498047, 0.00960540771484375, 0.011604785919189453, 0.013604164123535156, 0.01560354232788086, 0.017602920532226562, 0.019602298736572266, 0.02160167694091797, 0.023601055145263672, 0.025600433349609375, 0.027599811553955078, 0.02959918975830078, 0.031598567962646484, 0.03359794616699219, 0.03559732437133789, 0.037596702575683594, 0.0395960807800293, 0.041595458984375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 1.0, 5.0, 11.0, 14.0, 18.0, 33.0, 52.0, 83.0, 100.0, 131.0, 139.0, 115.0, 95.0, 69.0, 36.0, 31.0, 12.0, 22.0, 12.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.4524803161621094, -0.442394882440567, -0.43230944871902466, -0.4222240149974823, -0.41213858127593994, -0.4020531177520752, -0.3919677138328552, -0.3818822503089905, -0.3717968165874481, -0.36171138286590576, -0.3516259491443634, -0.34154051542282104, -0.3314550817012787, -0.32136964797973633, -0.3112841844558716, -0.3011987507343292, -0.29111331701278687, -0.2810278832912445, -0.27094244956970215, -0.2608570158481598, -0.25077158212661743, -0.24068613350391388, -0.23060069978237152, -0.22051525115966797, -0.210429847240448, -0.20034441351890564, -0.19025897979736328, -0.18017354607582092, -0.17008809745311737, -0.160002663731575, -0.14991723001003265, -0.1398317813873291, -0.12974633276462555, -0.11966089904308319, -0.10957545787096024, -0.09949002414941788, -0.08940458297729492, -0.07931914925575256, -0.0692337155342102, -0.05914827436208725, -0.04906284064054489, -0.038977403193712234, -0.028891967609524727, -0.01880653202533722, -0.008721094578504562, 0.0013643428683280945, 0.011449776589870453, 0.021535217761993408, 0.03162065148353577, 0.04170608893036842, 0.05179152637720108, 0.06187696009874344, 0.0719624012708664, 0.08204783499240875, 0.09213326871395111, 0.10221870988607407, 0.11230414360761642, 0.12238957732915878, 0.13247501850128174, 0.1425604522228241, 0.15264588594436646, 0.1627313196659088, 0.17281675338745117, 0.18290220201015472, 0.19298763573169708]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 8.0, 8.0, 13.0, 14.0, 11.0, 9.0, 23.0, 24.0, 19.0, 23.0, 31.0, 31.0, 36.0, 37.0, 37.0, 43.0, 43.0, 41.0, 45.0, 43.0, 47.0, 39.0, 46.0, 47.0, 33.0, 40.0, 27.0, 20.0, 30.0, 30.0, 13.0, 19.0, 14.0, 12.0, 10.0, 8.0, 5.0, 6.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3890150785446167, -0.3772421181201935, -0.3654691278934479, -0.35369616746902466, -0.34192317724227905, -0.33015021681785583, -0.3183772563934326, -0.306604266166687, -0.2948313057422638, -0.2830583453178406, -0.27128535509109497, -0.25951239466667175, -0.24773941934108734, -0.23596644401550293, -0.2241934835910797, -0.2124205082654953, -0.2006475329399109, -0.18887455761432648, -0.17710158228874207, -0.16532862186431885, -0.15355564653873444, -0.14178267121315002, -0.1300097107887268, -0.1182367354631424, -0.10646376013755798, -0.09469078481197357, -0.08291781693696976, -0.07114484906196594, -0.05937187373638153, -0.04759890213608742, -0.035825930535793304, -0.02405296266078949, -0.012279987335205078, -0.000507015734910965, 0.011265955865383148, 0.02303892746567726, 0.034811899065971375, 0.04658487066626549, 0.0583578422665596, 0.07013081014156342, 0.08190378546714783, 0.09367676079273224, 0.10544972866773605, 0.11722269654273987, 0.12899567186832428, 0.1407686471939087, 0.1525416076183319, 0.16431458294391632, 0.17608755826950073, 0.18786053359508514, 0.19963350892066956, 0.21140646934509277, 0.22317944467067719, 0.2349524199962616, 0.24672538042068481, 0.2584983706474304, 0.27027133107185364, 0.28204429149627686, 0.29381728172302246, 0.3055902421474457, 0.3173632025718689, 0.3291361927986145, 0.3409091532230377, 0.35268211364746094, 0.36445510387420654]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 1.0, 1.0, 3.0, 8.0, 10.0, 20.0, 39.0, 48.0, 57.0, 98.0, 199.0, 994.0, 2596.0, 12403.0, 208654.0, 3235000.0, 704927.0, 24372.0, 3647.0, 611.0, 213.0, 138.0, 81.0, 52.0, 30.0, 35.0, 9.0, 13.0, 6.0, 6.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12322998046875, -0.11843013763427734, -0.11363029479980469, -0.10883045196533203, -0.10403060913085938, -0.09923076629638672, -0.09443092346191406, -0.0896310806274414, -0.08483123779296875, -0.0800313949584961, -0.07523155212402344, -0.07043170928955078, -0.06563186645507812, -0.06083202362060547, -0.05603218078613281, -0.051232337951660156, -0.0464324951171875, -0.041632652282714844, -0.03683280944824219, -0.03203296661376953, -0.027233123779296875, -0.02243328094482422, -0.017633438110351562, -0.012833595275878906, -0.00803375244140625, -0.0032339096069335938, 0.0015659332275390625, 0.006365776062011719, 0.011165618896484375, 0.01596546173095703, 0.020765304565429688, 0.025565147399902344, 0.030364990234375, 0.035164833068847656, 0.03996467590332031, 0.04476451873779297, 0.049564361572265625, 0.05436420440673828, 0.05916404724121094, 0.0639638900756836, 0.06876373291015625, 0.0735635757446289, 0.07836341857910156, 0.08316326141357422, 0.08796310424804688, 0.09276294708251953, 0.09756278991699219, 0.10236263275146484, 0.1071624755859375, 0.11196231842041016, 0.11676216125488281, 0.12156200408935547, 0.12636184692382812, 0.13116168975830078, 0.13596153259277344, 0.1407613754272461, 0.14556121826171875, 0.1503610610961914, 0.15516090393066406, 0.15996074676513672, 0.16476058959960938, 0.16956043243408203, 0.1743602752685547, 0.17916011810302734, 0.1839599609375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 10.0, 14.0, 28.0, 29.0, 46.0, 70.0, 62.0, 81.0, 92.0, 93.0, 89.0, 85.0, 92.0, 59.0, 50.0, 16.0, 21.0, 18.0, 20.0, 17.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12225341796875, -0.11784648895263672, -0.11343955993652344, -0.10903263092041016, -0.10462570190429688, -0.1002187728881836, -0.09581184387207031, -0.09140491485595703, -0.08699798583984375, -0.08259105682373047, -0.07818412780761719, -0.0737771987915039, -0.06937026977539062, -0.06496334075927734, -0.06055641174316406, -0.05614948272705078, -0.0517425537109375, -0.04733562469482422, -0.04292869567871094, -0.038521766662597656, -0.034114837646484375, -0.029707908630371094, -0.025300979614257812, -0.02089405059814453, -0.01648712158203125, -0.012080192565917969, -0.0076732635498046875, -0.0032663345336914062, 0.001140594482421875, 0.005547523498535156, 0.009954452514648438, 0.014361381530761719, 0.018768310546875, 0.02317523956298828, 0.027582168579101562, 0.031989097595214844, 0.036396026611328125, 0.040802955627441406, 0.04520988464355469, 0.04961681365966797, 0.05402374267578125, 0.05843067169189453, 0.06283760070800781, 0.0672445297241211, 0.07165145874023438, 0.07605838775634766, 0.08046531677246094, 0.08487224578857422, 0.0892791748046875, 0.09368610382080078, 0.09809303283691406, 0.10249996185302734, 0.10690689086914062, 0.1113138198852539, 0.11572074890136719, 0.12012767791748047, 0.12453460693359375, 0.12894153594970703, 0.1333484649658203, 0.1377553939819336, 0.14216232299804688, 0.14656925201416016, 0.15097618103027344, 0.15538311004638672, 0.1597900390625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 5.0, 4.0, 6.0, 11.0, 7.0, 9.0, 23.0, 17.0, 33.0, 48.0, 53.0, 57.0, 79.0, 117.0, 174.0, 242.0, 392.0, 711.0, 1428.0, 3183.0, 8575.0, 30751.0, 184627.0, 2963126.0, 901831.0, 72435.0, 16401.0, 5212.0, 2103.0, 1043.0, 526.0, 327.0, 183.0, 141.0, 100.0, 81.0, 47.0, 47.0, 32.0, 35.0, 23.0, 18.0, 11.0, 8.0, 5.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08868408203125, -0.08549022674560547, -0.08229637145996094, -0.0791025161743164, -0.07590866088867188, -0.07271480560302734, -0.06952095031738281, -0.06632709503173828, -0.06313323974609375, -0.05993938446044922, -0.05674552917480469, -0.053551673889160156, -0.050357818603515625, -0.047163963317871094, -0.04397010803222656, -0.04077625274658203, -0.0375823974609375, -0.03438854217529297, -0.031194686889648438, -0.028000831604003906, -0.024806976318359375, -0.021613121032714844, -0.018419265747070312, -0.015225410461425781, -0.01203155517578125, -0.008837699890136719, -0.0056438446044921875, -0.0024499893188476562, 0.000743865966796875, 0.003937721252441406, 0.0071315765380859375, 0.010325431823730469, 0.013519287109375, 0.01671314239501953, 0.019906997680664062, 0.023100852966308594, 0.026294708251953125, 0.029488563537597656, 0.03268241882324219, 0.03587627410888672, 0.03907012939453125, 0.04226398468017578, 0.04545783996582031, 0.048651695251464844, 0.051845550537109375, 0.055039405822753906, 0.05823326110839844, 0.06142711639404297, 0.0646209716796875, 0.06781482696533203, 0.07100868225097656, 0.0742025375366211, 0.07739639282226562, 0.08059024810791016, 0.08378410339355469, 0.08697795867919922, 0.09017181396484375, 0.09336566925048828, 0.09655952453613281, 0.09975337982177734, 0.10294723510742188, 0.1061410903930664, 0.10933494567871094, 0.11252880096435547, 0.11572265625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 6.0, 2.0, 5.0, 9.0, 15.0, 20.0, 33.0, 49.0, 67.0, 153.0, 378.0, 857.0, 1111.0, 751.0, 323.0, 120.0, 57.0, 32.0, 27.0, 13.0, 16.0, 5.0, 8.0, 8.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1365966796875, -0.1326150894165039, -0.1286334991455078, -0.12465190887451172, -0.12067031860351562, -0.11668872833251953, -0.11270713806152344, -0.10872554779052734, -0.10474395751953125, -0.10076236724853516, -0.09678077697753906, -0.09279918670654297, -0.08881759643554688, -0.08483600616455078, -0.08085441589355469, -0.0768728256225586, -0.0728912353515625, -0.0689096450805664, -0.06492805480957031, -0.06094646453857422, -0.056964874267578125, -0.05298328399658203, -0.04900169372558594, -0.045020103454589844, -0.04103851318359375, -0.037056922912597656, -0.03307533264160156, -0.02909374237060547, -0.025112152099609375, -0.02113056182861328, -0.017148971557617188, -0.013167381286621094, -0.009185791015625, -0.005204200744628906, -0.0012226104736328125, 0.0027589797973632812, 0.006740570068359375, 0.010722160339355469, 0.014703750610351562, 0.018685340881347656, 0.02266693115234375, 0.026648521423339844, 0.030630111694335938, 0.03461170196533203, 0.038593292236328125, 0.04257488250732422, 0.04655647277832031, 0.050538063049316406, 0.0545196533203125, 0.058501243591308594, 0.06248283386230469, 0.06646442413330078, 0.07044601440429688, 0.07442760467529297, 0.07840919494628906, 0.08239078521728516, 0.08637237548828125, 0.09035396575927734, 0.09433555603027344, 0.09831714630126953, 0.10229873657226562, 0.10628032684326172, 0.11026191711425781, 0.1142435073852539, 0.11822509765625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 11.0, 43.0, 335.0, 514.0, 97.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.1229145526885986, -3.067455530166626, -3.0119965076446533, -2.9565374851226807, -2.901078462600708, -2.8456194400787354, -2.7901604175567627, -2.73470139503479, -2.6792423725128174, -2.6237833499908447, -2.568324327468872, -2.5128653049468994, -2.4574062824249268, -2.401947259902954, -2.3464882373809814, -2.291029214859009, -2.235570192337036, -2.1801111698150635, -2.124652147293091, -2.069193124771118, -2.0137341022491455, -1.9582750797271729, -1.9028160572052002, -1.8473570346832275, -1.7918980121612549, -1.7364389896392822, -1.6809799671173096, -1.625520944595337, -1.5700619220733643, -1.5146028995513916, -1.459143877029419, -1.4036848545074463, -1.3482258319854736, -1.292766809463501, -1.2373077869415283, -1.1818487644195557, -1.126389741897583, -1.0709307193756104, -1.0154716968536377, -0.960012674331665, -0.9045536518096924, -0.8490946292877197, -0.7936356067657471, -0.7381765842437744, -0.6827175617218018, -0.6272585391998291, -0.5717995166778564, -0.5163404941558838, -0.46088147163391113, -0.4054224491119385, -0.3499634265899658, -0.29450440406799316, -0.2390453815460205, -0.18358635902404785, -0.1281273365020752, -0.07266831398010254, -0.017209291458129883, 0.03824973106384277, 0.09370875358581543, 0.14916777610778809, 0.20462679862976074, 0.2600858211517334, 0.31554484367370605, 0.3710038661956787, 0.42646288871765137]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 11.0, 8.0, 10.0, 15.0, 16.0, 26.0, 34.0, 28.0, 24.0, 39.0, 42.0, 47.0, 58.0, 42.0, 54.0, 48.0, 57.0, 56.0, 48.0, 56.0, 38.0, 49.0, 23.0, 24.0, 28.0, 32.0, 15.0, 13.0, 8.0, 13.0, 9.0, 6.0, 6.0, 3.0, 8.0, 1.0, 2.0, 1.0], "bins": [-0.42355990409851074, -0.4133116602897644, -0.4030633866786957, -0.39281514286994934, -0.3825668692588806, -0.3723186254501343, -0.36207035183906555, -0.3518221080303192, -0.3415738344192505, -0.33132559061050415, -0.3210773169994354, -0.3108290731906891, -0.30058079957962036, -0.290332555770874, -0.2800842821598053, -0.26983603835105896, -0.25958776473999023, -0.2493395060300827, -0.23909124732017517, -0.22884298861026764, -0.2185947299003601, -0.20834647119045258, -0.19809821248054504, -0.1878499686717987, -0.17760172486305237, -0.16735346615314484, -0.1571052074432373, -0.14685694873332977, -0.13660869002342224, -0.1263604313135147, -0.11611218005418777, -0.10586392134428024, -0.09561565518379211, -0.08536739647388458, -0.07511913776397705, -0.06487087905406952, -0.054622624069452286, -0.044374365359544754, -0.03412611037492752, -0.02387785166501999, -0.013629592955112457, -0.0033813351765275, 0.006866922602057457, 0.01711517944931984, 0.02736343815922737, 0.0376116968691349, 0.047859951853752136, 0.05810821056365967, 0.0683564692735672, 0.07860472798347473, 0.08885298669338226, 0.0991012454032898, 0.10934950411319733, 0.11959776282310486, 0.1298460066318512, 0.14009428024291992, 0.15034252405166626, 0.1605907827615738, 0.17083904147148132, 0.18108730018138885, 0.1913355588912964, 0.20158381760120392, 0.21183207631111145, 0.2220803201198578, 0.2323285937309265]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 4.0, 10.0, 18.0, 24.0, 30.0, 40.0, 40.0, 78.0, 118.0, 150.0, 247.0, 439.0, 745.0, 1328.0, 2837.0, 6135.0, 14773.0, 37073.0, 99851.0, 263621.0, 353019.0, 166682.0, 60567.0, 22866.0, 9379.0, 4045.0, 1890.0, 985.0, 553.0, 315.0, 209.0, 146.0, 96.0, 59.0, 46.0, 42.0, 31.0, 16.0, 17.0, 5.0, 9.0, 9.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0892333984375, -0.08662796020507812, -0.08402252197265625, -0.08141708374023438, -0.0788116455078125, -0.07620620727539062, -0.07360076904296875, -0.07099533081054688, -0.068389892578125, -0.06578445434570312, -0.06317901611328125, -0.060573577880859375, -0.0579681396484375, -0.055362701416015625, -0.05275726318359375, -0.050151824951171875, -0.04754638671875, -0.044940948486328125, -0.04233551025390625, -0.039730072021484375, -0.0371246337890625, -0.034519195556640625, -0.03191375732421875, -0.029308319091796875, -0.026702880859375, -0.024097442626953125, -0.02149200439453125, -0.018886566162109375, -0.0162811279296875, -0.013675689697265625, -0.01107025146484375, -0.008464813232421875, -0.005859375, -0.003253936767578125, -0.00064849853515625, 0.001956939697265625, 0.0045623779296875, 0.007167816162109375, 0.00977325439453125, 0.012378692626953125, 0.014984130859375, 0.017589569091796875, 0.02019500732421875, 0.022800445556640625, 0.0254058837890625, 0.028011322021484375, 0.03061676025390625, 0.033222198486328125, 0.03582763671875, 0.038433074951171875, 0.04103851318359375, 0.043643951416015625, 0.0462493896484375, 0.048854827880859375, 0.05146026611328125, 0.054065704345703125, 0.056671142578125, 0.059276580810546875, 0.06188201904296875, 0.06448745727539062, 0.0670928955078125, 0.06969833374023438, 0.07230377197265625, 0.07490921020507812, 0.0775146484375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 11.0, 12.0, 18.0, 34.0, 29.0, 30.0, 47.0, 54.0, 77.0, 80.0, 100.0, 89.0, 69.0, 54.0, 79.0, 70.0, 34.0, 28.0, 26.0, 24.0, 11.0, 7.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1138916015625, -0.11010932922363281, -0.10632705688476562, -0.10254478454589844, -0.09876251220703125, -0.09498023986816406, -0.09119796752929688, -0.08741569519042969, -0.0836334228515625, -0.07985115051269531, -0.07606887817382812, -0.07228660583496094, -0.06850433349609375, -0.06472206115722656, -0.060939788818359375, -0.05715751647949219, -0.053375244140625, -0.04959297180175781, -0.045810699462890625, -0.04202842712402344, -0.03824615478515625, -0.03446388244628906, -0.030681610107421875, -0.026899337768554688, -0.0231170654296875, -0.019334793090820312, -0.015552520751953125, -0.011770248413085938, -0.00798797607421875, -0.0042057037353515625, -0.000423431396484375, 0.0033588409423828125, 0.00714111328125, 0.010923385620117188, 0.014705657958984375, 0.018487930297851562, 0.02227020263671875, 0.026052474975585938, 0.029834747314453125, 0.03361701965332031, 0.0373992919921875, 0.04118156433105469, 0.044963836669921875, 0.04874610900878906, 0.05252838134765625, 0.05631065368652344, 0.060092926025390625, 0.06387519836425781, 0.067657470703125, 0.07143974304199219, 0.07522201538085938, 0.07900428771972656, 0.08278656005859375, 0.08656883239746094, 0.09035110473632812, 0.09413337707519531, 0.0979156494140625, 0.10169792175292969, 0.10548019409179688, 0.10926246643066406, 0.11304473876953125, 0.11682701110839844, 0.12060928344726562, 0.12439155578613281, 0.128173828125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 8.0, 4.0, 3.0, 7.0, 12.0, 12.0, 17.0, 18.0, 25.0, 21.0, 37.0, 47.0, 69.0, 110.0, 183.0, 372.0, 670.0, 1507.0, 3544.0, 9842.0, 29692.0, 99538.0, 331858.0, 388888.0, 125545.0, 36863.0, 11779.0, 4359.0, 1686.0, 817.0, 396.0, 213.0, 132.0, 83.0, 57.0, 35.0, 24.0, 17.0, 15.0, 9.0, 14.0, 6.0, 9.0, 6.0, 2.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10980224609375, -0.10615348815917969, -0.10250473022460938, -0.09885597229003906, -0.09520721435546875, -0.09155845642089844, -0.08790969848632812, -0.08426094055175781, -0.0806121826171875, -0.07696342468261719, -0.07331466674804688, -0.06966590881347656, -0.06601715087890625, -0.06236839294433594, -0.058719635009765625, -0.05507087707519531, -0.051422119140625, -0.04777336120605469, -0.044124603271484375, -0.04047584533691406, -0.03682708740234375, -0.03317832946777344, -0.029529571533203125, -0.025880813598632812, -0.0222320556640625, -0.018583297729492188, -0.014934539794921875, -0.011285781860351562, -0.00763702392578125, -0.0039882659912109375, -0.000339508056640625, 0.0033092498779296875, 0.0069580078125, 0.010606765747070312, 0.014255523681640625, 0.017904281616210938, 0.02155303955078125, 0.025201797485351562, 0.028850555419921875, 0.03249931335449219, 0.0361480712890625, 0.03979682922363281, 0.043445587158203125, 0.04709434509277344, 0.05074310302734375, 0.05439186096191406, 0.058040618896484375, 0.06168937683105469, 0.065338134765625, 0.06898689270019531, 0.07263565063476562, 0.07628440856933594, 0.07993316650390625, 0.08358192443847656, 0.08723068237304688, 0.09087944030761719, 0.0945281982421875, 0.09817695617675781, 0.10182571411132812, 0.10547447204589844, 0.10912322998046875, 0.11277198791503906, 0.11642074584960938, 0.12006950378417969, 0.12371826171875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 4.0, 3.0, 1.0, 9.0, 3.0, 8.0, 8.0, 9.0, 17.0, 11.0, 13.0, 22.0, 25.0, 20.0, 21.0, 34.0, 31.0, 28.0, 37.0, 28.0, 48.0, 34.0, 39.0, 45.0, 31.0, 38.0, 39.0, 26.0, 38.0, 30.0, 28.0, 28.0, 29.0, 25.0, 25.0, 22.0, 14.0, 19.0, 22.0, 14.0, 19.0, 10.0, 6.0, 6.0, 11.0, 5.0, 11.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1798095703125, -0.17461776733398438, -0.16942596435546875, -0.16423416137695312, -0.1590423583984375, -0.15385055541992188, -0.14865875244140625, -0.14346694946289062, -0.138275146484375, -0.13308334350585938, -0.12789154052734375, -0.12269973754882812, -0.1175079345703125, -0.11231613159179688, -0.10712432861328125, -0.10193252563476562, -0.09674072265625, -0.09154891967773438, -0.08635711669921875, -0.08116531372070312, -0.0759735107421875, -0.07078170776367188, -0.06558990478515625, -0.060398101806640625, -0.055206298828125, -0.050014495849609375, -0.04482269287109375, -0.039630889892578125, -0.0344390869140625, -0.029247283935546875, -0.02405548095703125, -0.018863677978515625, -0.013671875, -0.008480072021484375, -0.00328826904296875, 0.001903533935546875, 0.0070953369140625, 0.012287139892578125, 0.01747894287109375, 0.022670745849609375, 0.027862548828125, 0.033054351806640625, 0.03824615478515625, 0.043437957763671875, 0.0486297607421875, 0.053821563720703125, 0.05901336669921875, 0.06420516967773438, 0.06939697265625, 0.07458877563476562, 0.07978057861328125, 0.08497238159179688, 0.0901641845703125, 0.09535598754882812, 0.10054779052734375, 0.10573959350585938, 0.110931396484375, 0.11612319946289062, 0.12131500244140625, 0.12650680541992188, 0.1316986083984375, 0.13689041137695312, 0.14208221435546875, 0.14727401733398438, 0.1524658203125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 8.0, 7.0, 4.0, 12.0, 21.0, 25.0, 26.0, 43.0, 70.0, 93.0, 132.0, 191.0, 349.0, 686.0, 1125.0, 2185.0, 4656.0, 9393.0, 20852.0, 47882.0, 110091.0, 234167.0, 299690.0, 175991.0, 77406.0, 33818.0, 15375.0, 6962.0, 3313.0, 1699.0, 938.0, 514.0, 281.0, 170.0, 106.0, 82.0, 49.0, 32.0, 35.0, 23.0, 23.0, 14.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0185394287109375, -0.01792740821838379, -0.017315387725830078, -0.016703367233276367, -0.016091346740722656, -0.015479326248168945, -0.014867305755615234, -0.014255285263061523, -0.013643264770507812, -0.013031244277954102, -0.01241922378540039, -0.01180720329284668, -0.011195182800292969, -0.010583162307739258, -0.009971141815185547, -0.009359121322631836, -0.008747100830078125, -0.008135080337524414, -0.007523059844970703, -0.006911039352416992, -0.006299018859863281, -0.00568699836730957, -0.005074977874755859, -0.0044629573822021484, -0.0038509368896484375, -0.0032389163970947266, -0.0026268959045410156, -0.0020148754119873047, -0.0014028549194335938, -0.0007908344268798828, -0.00017881393432617188, 0.00043320655822753906, 0.00104522705078125, 0.001657247543334961, 0.002269268035888672, 0.002881288528442383, 0.0034933090209960938, 0.004105329513549805, 0.004717350006103516, 0.0053293704986572266, 0.0059413909912109375, 0.0065534114837646484, 0.007165431976318359, 0.00777745246887207, 0.008389472961425781, 0.009001493453979492, 0.009613513946533203, 0.010225534439086914, 0.010837554931640625, 0.011449575424194336, 0.012061595916748047, 0.012673616409301758, 0.013285636901855469, 0.01389765739440918, 0.01450967788696289, 0.015121698379516602, 0.015733718872070312, 0.016345739364624023, 0.016957759857177734, 0.017569780349731445, 0.018181800842285156, 0.018793821334838867, 0.019405841827392578, 0.02001786231994629, 0.0206298828125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 5.0, 2.0, 9.0, 6.0, 10.0, 15.0, 14.0, 26.0, 31.0, 33.0, 61.0, 49.0, 56.0, 77.0, 80.0, 72.0, 64.0, 71.0, 59.0, 57.0, 49.0, 26.0, 30.0, 23.0, 15.0, 17.0, 7.0, 17.0, 5.0, 4.0, 6.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.463859558105469e-06, -8.22450965642929e-06, -7.985159754753113e-06, -7.745809853076935e-06, -7.506459951400757e-06, -7.267110049724579e-06, -7.027760148048401e-06, -6.788410246372223e-06, -6.549060344696045e-06, -6.309710443019867e-06, -6.070360541343689e-06, -5.831010639667511e-06, -5.591660737991333e-06, -5.352310836315155e-06, -5.112960934638977e-06, -4.873611032962799e-06, -4.634261131286621e-06, -4.394911229610443e-06, -4.155561327934265e-06, -3.916211426258087e-06, -3.676861524581909e-06, -3.437511622905731e-06, -3.1981617212295532e-06, -2.9588118195533752e-06, -2.7194619178771973e-06, -2.4801120162010193e-06, -2.2407621145248413e-06, -2.0014122128486633e-06, -1.7620623111724854e-06, -1.5227124094963074e-06, -1.2833625078201294e-06, -1.0440126061439514e-06, -8.046627044677734e-07, -5.653128027915955e-07, -3.259629011154175e-07, -8.66129994392395e-08, 1.5273690223693848e-07, 3.9208680391311646e-07, 6.314367055892944e-07, 8.707866072654724e-07, 1.1101365089416504e-06, 1.3494864106178284e-06, 1.5888363122940063e-06, 1.8281862139701843e-06, 2.0675361156463623e-06, 2.3068860173225403e-06, 2.5462359189987183e-06, 2.7855858206748962e-06, 3.0249357223510742e-06, 3.264285624027252e-06, 3.50363552570343e-06, 3.742985427379608e-06, 3.982335329055786e-06, 4.221685230731964e-06, 4.461035132408142e-06, 4.70038503408432e-06, 4.939734935760498e-06, 5.179084837436676e-06, 5.418434739112854e-06, 5.657784640789032e-06, 5.89713454246521e-06, 6.136484444141388e-06, 6.375834345817566e-06, 6.615184247493744e-06, 6.854534149169922e-06]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 10.0, 8.0, 16.0, 24.0, 41.0, 48.0, 65.0, 120.0, 164.0, 320.0, 586.0, 1143.0, 2557.0, 5873.0, 14163.0, 37100.0, 100096.0, 252672.0, 345989.0, 178318.0, 66550.0, 25192.0, 9632.0, 4009.0, 1796.0, 935.0, 441.0, 276.0, 141.0, 96.0, 46.0, 48.0, 17.0, 22.0, 14.0, 7.0, 8.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.024505615234375, -0.023769617080688477, -0.023033618927001953, -0.02229762077331543, -0.021561622619628906, -0.020825624465942383, -0.02008962631225586, -0.019353628158569336, -0.018617630004882812, -0.01788163185119629, -0.017145633697509766, -0.016409635543823242, -0.01567363739013672, -0.014937639236450195, -0.014201641082763672, -0.013465642929077148, -0.012729644775390625, -0.011993646621704102, -0.011257648468017578, -0.010521650314331055, -0.009785652160644531, -0.009049654006958008, -0.008313655853271484, -0.007577657699584961, -0.0068416595458984375, -0.006105661392211914, -0.005369663238525391, -0.004633665084838867, -0.0038976669311523438, -0.0031616687774658203, -0.002425670623779297, -0.0016896724700927734, -0.00095367431640625, -0.00021767616271972656, 0.0005183219909667969, 0.0012543201446533203, 0.0019903182983398438, 0.002726316452026367, 0.0034623146057128906, 0.004198312759399414, 0.0049343109130859375, 0.005670309066772461, 0.006406307220458984, 0.007142305374145508, 0.007878303527832031, 0.008614301681518555, 0.009350299835205078, 0.010086297988891602, 0.010822296142578125, 0.011558294296264648, 0.012294292449951172, 0.013030290603637695, 0.013766288757324219, 0.014502286911010742, 0.015238285064697266, 0.01597428321838379, 0.016710281372070312, 0.017446279525756836, 0.01818227767944336, 0.018918275833129883, 0.019654273986816406, 0.02039027214050293, 0.021126270294189453, 0.021862268447875977, 0.0225982666015625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 4.0, 6.0, 5.0, 14.0, 19.0, 17.0, 24.0, 31.0, 37.0, 30.0, 65.0, 48.0, 57.0, 64.0, 73.0, 61.0, 57.0, 65.0, 51.0, 42.0, 43.0, 33.0, 36.0, 25.0, 14.0, 11.0, 13.0, 11.0, 6.0, 11.0, 8.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.032958984375, -0.03208208084106445, -0.031205177307128906, -0.03032827377319336, -0.029451370239257812, -0.028574466705322266, -0.02769756317138672, -0.026820659637451172, -0.025943756103515625, -0.025066852569580078, -0.02418994903564453, -0.023313045501708984, -0.022436141967773438, -0.02155923843383789, -0.020682334899902344, -0.019805431365966797, -0.01892852783203125, -0.018051624298095703, -0.017174720764160156, -0.01629781723022461, -0.015420913696289062, -0.014544010162353516, -0.013667106628417969, -0.012790203094482422, -0.011913299560546875, -0.011036396026611328, -0.010159492492675781, -0.009282588958740234, -0.008405685424804688, -0.007528781890869141, -0.006651878356933594, -0.005774974822998047, -0.0048980712890625, -0.004021167755126953, -0.0031442642211914062, -0.0022673606872558594, -0.0013904571533203125, -0.0005135536193847656, 0.00036334991455078125, 0.0012402534484863281, 0.002117156982421875, 0.002994060516357422, 0.0038709640502929688, 0.004747867584228516, 0.0056247711181640625, 0.006501674652099609, 0.007378578186035156, 0.008255481719970703, 0.00913238525390625, 0.010009288787841797, 0.010886192321777344, 0.01176309585571289, 0.012639999389648438, 0.013516902923583984, 0.014393806457519531, 0.015270709991455078, 0.016147613525390625, 0.017024517059326172, 0.01790142059326172, 0.018778324127197266, 0.019655227661132812, 0.02053213119506836, 0.021409034729003906, 0.022285938262939453, 0.023162841796875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 7.0, 12.0, 25.0, 78.0, 171.0, 361.0, 222.0, 86.0, 25.0, 15.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2730594873428345, -1.2362333536148071, -1.1994073390960693, -1.162581205368042, -1.1257550716400146, -1.0889289379119873, -1.05210280418396, -1.0152767896652222, -0.9784506559371948, -0.9416245222091675, -0.9047984480857849, -0.8679723739624023, -0.831146240234375, -0.7943201065063477, -0.7574940323829651, -0.7206679582595825, -0.6838418245315552, -0.6470156908035278, -0.6101896166801453, -0.5733635425567627, -0.5365374088287354, -0.4997113049030304, -0.46288520097732544, -0.4260590970516205, -0.3892329931259155, -0.35240688920021057, -0.3155807852745056, -0.27875468134880066, -0.2419285774230957, -0.20510247349739075, -0.1682763695716858, -0.13145026564598083, -0.09462404251098633, -0.05779793858528137, -0.020971834659576416, 0.01585426926612854, 0.052680373191833496, 0.08950647711753845, 0.1263325810432434, 0.16315868496894836, 0.19998478889465332, 0.23681089282035828, 0.27363699674606323, 0.3104631006717682, 0.34728920459747314, 0.3841153085231781, 0.42094141244888306, 0.457767516374588, 0.49459362030029297, 0.5314197540283203, 0.5682458281517029, 0.6050719022750854, 0.6418980360031128, 0.6787241697311401, 0.7155502438545227, 0.7523763179779053, 0.7892024517059326, 0.82602858543396, 0.8628546595573425, 0.8996807336807251, 0.9365068674087524, 0.9733330011367798, 1.0101590156555176, 1.046985149383545, 1.0838112831115723]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 5.0, 9.0, 9.0, 5.0, 4.0, 12.0, 14.0, 13.0, 13.0, 22.0, 20.0, 24.0, 20.0, 27.0, 25.0, 31.0, 32.0, 34.0, 38.0, 34.0, 37.0, 33.0, 35.0, 33.0, 33.0, 37.0, 34.0, 38.0, 31.0, 40.0, 31.0, 31.0, 26.0, 21.0, 14.0, 24.0, 21.0, 16.0, 15.0, 14.0, 13.0, 9.0, 12.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4522865414619446, -0.43807974457740784, -0.4238729476928711, -0.40966618061065674, -0.39545938372612, -0.38125258684158325, -0.3670458197593689, -0.35283902287483215, -0.3386322259902954, -0.32442542910575867, -0.3102186322212219, -0.29601186513900757, -0.2818050682544708, -0.2675982713699341, -0.2533915042877197, -0.23918470740318298, -0.22497791051864624, -0.2107711136341095, -0.19656433165073395, -0.1823575496673584, -0.16815075278282166, -0.1539439558982849, -0.13973717391490936, -0.1255303919315338, -0.11132359504699707, -0.09711680561304092, -0.08291001617908478, -0.06870322674512863, -0.054496437311172485, -0.04028964787721634, -0.026082858443260193, -0.011876069009304047, 0.0023307204246520996, 0.016537509858608246, 0.030744299292564392, 0.04495108872652054, 0.059157878160476685, 0.07336466759443283, 0.08757145702838898, 0.10177824646234512, 0.11598503589630127, 0.130191832780838, 0.14439861476421356, 0.1586053967475891, 0.17281219363212585, 0.1870189905166626, 0.20122577250003815, 0.2154325544834137, 0.22963935136795044, 0.24384614825248718, 0.2580529451370239, 0.2722597122192383, 0.286466509103775, 0.30067330598831177, 0.3148800730705261, 0.32908686995506287, 0.3432936668395996, 0.35750046372413635, 0.3717072606086731, 0.38591402769088745, 0.4001208245754242, 0.41432762145996094, 0.4285343885421753, 0.44274118542671204, 0.4569479823112488]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 12.0, 17.0, 39.0, 44.0, 136.0, 385.0, 1222.0, 3453.0, 13317.0, 80237.0, 805697.0, 2608030.0, 608303.0, 58722.0, 10406.0, 3020.0, 738.0, 236.0, 126.0, 54.0, 39.0, 14.0, 15.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0927734375, -0.08939170837402344, -0.08600997924804688, -0.08262825012207031, -0.07924652099609375, -0.07586479187011719, -0.07248306274414062, -0.06910133361816406, -0.0657196044921875, -0.06233787536621094, -0.058956146240234375, -0.05557441711425781, -0.05219268798828125, -0.04881095886230469, -0.045429229736328125, -0.04204750061035156, -0.038665771484375, -0.03528404235839844, -0.031902313232421875, -0.028520584106445312, -0.02513885498046875, -0.021757125854492188, -0.018375396728515625, -0.014993667602539062, -0.0116119384765625, -0.008230209350585938, -0.004848480224609375, -0.0014667510986328125, 0.00191497802734375, 0.0052967071533203125, 0.008678436279296875, 0.012060165405273438, 0.01544189453125, 0.018823623657226562, 0.022205352783203125, 0.025587081909179688, 0.02896881103515625, 0.03235054016113281, 0.035732269287109375, 0.03911399841308594, 0.0424957275390625, 0.04587745666503906, 0.049259185791015625, 0.05264091491699219, 0.05602264404296875, 0.05940437316894531, 0.06278610229492188, 0.06616783142089844, 0.069549560546875, 0.07293128967285156, 0.07631301879882812, 0.07969474792480469, 0.08307647705078125, 0.08645820617675781, 0.08983993530273438, 0.09322166442871094, 0.0966033935546875, 0.09998512268066406, 0.10336685180664062, 0.10674858093261719, 0.11013031005859375, 0.11351203918457031, 0.11689376831054688, 0.12027549743652344, 0.1236572265625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 9.0, 8.0, 12.0, 29.0, 35.0, 39.0, 53.0, 52.0, 70.0, 81.0, 74.0, 76.0, 76.0, 64.0, 74.0, 42.0, 43.0, 45.0, 34.0, 23.0, 18.0, 10.0, 15.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1239013671875, -0.11969947814941406, -0.11549758911132812, -0.11129570007324219, -0.10709381103515625, -0.10289192199707031, -0.09869003295898438, -0.09448814392089844, -0.0902862548828125, -0.08608436584472656, -0.08188247680664062, -0.07768058776855469, -0.07347869873046875, -0.06927680969238281, -0.06507492065429688, -0.06087303161621094, -0.056671142578125, -0.05246925354003906, -0.048267364501953125, -0.04406547546386719, -0.03986358642578125, -0.03566169738769531, -0.031459808349609375, -0.027257919311523438, -0.0230560302734375, -0.018854141235351562, -0.014652252197265625, -0.010450363159179688, -0.00624847412109375, -0.0020465850830078125, 0.002155303955078125, 0.0063571929931640625, 0.01055908203125, 0.014760971069335938, 0.018962860107421875, 0.023164749145507812, 0.02736663818359375, 0.03156852722167969, 0.035770416259765625, 0.03997230529785156, 0.0441741943359375, 0.04837608337402344, 0.052577972412109375, 0.05677986145019531, 0.06098175048828125, 0.06518363952636719, 0.06938552856445312, 0.07358741760253906, 0.077789306640625, 0.08199119567871094, 0.08619308471679688, 0.09039497375488281, 0.09459686279296875, 0.09879875183105469, 0.10300064086914062, 0.10720252990722656, 0.1114044189453125, 0.11560630798339844, 0.11980819702148438, 0.12401008605957031, 0.12821197509765625, 0.1324138641357422, 0.13661575317382812, 0.14081764221191406, 0.14501953125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 0.0, 10.0, 13.0, 13.0, 26.0, 38.0, 61.0, 105.0, 153.0, 201.0, 357.0, 561.0, 974.0, 2048.0, 4856.0, 13960.0, 53312.0, 344235.0, 3125125.0, 549225.0, 69866.0, 17935.0, 6006.0, 2424.0, 1130.0, 587.0, 410.0, 228.0, 139.0, 122.0, 55.0, 41.0, 33.0, 16.0, 10.0, 9.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09716796875, -0.0932159423828125, -0.089263916015625, -0.0853118896484375, -0.08135986328125, -0.0774078369140625, -0.073455810546875, -0.0695037841796875, -0.0655517578125, -0.0615997314453125, -0.057647705078125, -0.0536956787109375, -0.04974365234375, -0.0457916259765625, -0.041839599609375, -0.0378875732421875, -0.033935546875, -0.0299835205078125, -0.026031494140625, -0.0220794677734375, -0.01812744140625, -0.0141754150390625, -0.010223388671875, -0.0062713623046875, -0.0023193359375, 0.0016326904296875, 0.005584716796875, 0.0095367431640625, 0.01348876953125, 0.0174407958984375, 0.021392822265625, 0.0253448486328125, 0.029296875, 0.0332489013671875, 0.037200927734375, 0.0411529541015625, 0.04510498046875, 0.0490570068359375, 0.053009033203125, 0.0569610595703125, 0.0609130859375, 0.0648651123046875, 0.068817138671875, 0.0727691650390625, 0.07672119140625, 0.0806732177734375, 0.084625244140625, 0.0885772705078125, 0.092529296875, 0.0964813232421875, 0.100433349609375, 0.1043853759765625, 0.10833740234375, 0.1122894287109375, 0.116241455078125, 0.1201934814453125, 0.1241455078125, 0.1280975341796875, 0.132049560546875, 0.1360015869140625, 0.13995361328125, 0.1439056396484375, 0.147857666015625, 0.1518096923828125, 0.15576171875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 11.0, 21.0, 28.0, 40.0, 58.0, 124.0, 248.0, 599.0, 1120.0, 860.0, 453.0, 187.0, 90.0, 74.0, 35.0, 31.0, 20.0, 16.0, 18.0, 10.0, 7.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.202392578125, -0.197174072265625, -0.19195556640625, -0.186737060546875, -0.1815185546875, -0.176300048828125, -0.17108154296875, -0.165863037109375, -0.16064453125, -0.155426025390625, -0.15020751953125, -0.144989013671875, -0.1397705078125, -0.134552001953125, -0.12933349609375, -0.124114990234375, -0.118896484375, -0.113677978515625, -0.10845947265625, -0.103240966796875, -0.0980224609375, -0.092803955078125, -0.08758544921875, -0.082366943359375, -0.0771484375, -0.071929931640625, -0.06671142578125, -0.061492919921875, -0.0562744140625, -0.051055908203125, -0.04583740234375, -0.040618896484375, -0.035400390625, -0.030181884765625, -0.02496337890625, -0.019744873046875, -0.0145263671875, -0.009307861328125, -0.00408935546875, 0.001129150390625, 0.00634765625, 0.011566162109375, 0.01678466796875, 0.022003173828125, 0.0272216796875, 0.032440185546875, 0.03765869140625, 0.042877197265625, 0.048095703125, 0.053314208984375, 0.05853271484375, 0.063751220703125, 0.0689697265625, 0.074188232421875, 0.07940673828125, 0.084625244140625, 0.08984375, 0.095062255859375, 0.10028076171875, 0.105499267578125, 0.1107177734375, 0.115936279296875, 0.12115478515625, 0.126373291015625, 0.131591796875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 22.0, 133.0, 454.0, 330.0, 55.0, 8.0, 4.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.579484701156616, -3.5153255462646484, -3.4511666297912598, -3.387007713317871, -3.3228485584259033, -3.2586894035339355, -3.194530487060547, -3.130371570587158, -3.0662124156951904, -3.0020532608032227, -2.937894344329834, -2.8737354278564453, -2.8095762729644775, -2.7454171180725098, -2.681258201599121, -2.6170992851257324, -2.5529401302337646, -2.488780975341797, -2.424622058868408, -2.3604631423950195, -2.2963039875030518, -2.232144832611084, -2.1679859161376953, -2.1038269996643066, -2.039667844772339, -1.9755088090896606, -1.9113497734069824, -1.8471907377243042, -1.783031702041626, -1.7188726663589478, -1.6547136306762695, -1.5905545949935913, -1.5263954401016235, -1.4622364044189453, -1.398077368736267, -1.3339183330535889, -1.2697592973709106, -1.2056002616882324, -1.1414412260055542, -1.077282190322876, -1.0131231546401978, -0.9489641189575195, -0.8848050832748413, -0.8206460475921631, -0.7564870119094849, -0.6923279762268066, -0.6281689405441284, -0.5640099048614502, -0.499850869178772, -0.43569183349609375, -0.3715327978134155, -0.3073737621307373, -0.24321472644805908, -0.17905569076538086, -0.11489665508270264, -0.050737619400024414, 0.013421416282653809, 0.07758045196533203, 0.14173948764801025, 0.20589852333068848, 0.2700575590133667, 0.3342165946960449, 0.39837563037872314, 0.46253466606140137, 0.5266937017440796]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 5.0, 4.0, 7.0, 5.0, 10.0, 16.0, 14.0, 15.0, 15.0, 24.0, 27.0, 37.0, 45.0, 46.0, 41.0, 31.0, 45.0, 53.0, 54.0, 44.0, 46.0, 45.0, 42.0, 37.0, 42.0, 31.0, 30.0, 27.0, 31.0, 22.0, 19.0, 26.0, 12.0, 19.0, 10.0, 8.0, 5.0, 5.0, 3.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0], "bins": [-0.4235583543777466, -0.41212132573127747, -0.40068432688713074, -0.3892472982406616, -0.3778102993965149, -0.3663732707500458, -0.35493627190589905, -0.34349924325942993, -0.3320622444152832, -0.3206252157688141, -0.30918821692466736, -0.29775118827819824, -0.2863141894340515, -0.2748771607875824, -0.26344016194343567, -0.25200313329696655, -0.24056611955165863, -0.2291291058063507, -0.21769209206104279, -0.20625507831573486, -0.19481806457042694, -0.18338105082511902, -0.1719440221786499, -0.16050702333450317, -0.14906999468803406, -0.13763298094272614, -0.1261959671974182, -0.11475895345211029, -0.10332193970680237, -0.09188492596149445, -0.08044790476560593, -0.069010891020298, -0.05757388472557068, -0.046136870980262756, -0.034699857234954834, -0.023262839764356613, -0.01182582601904869, -0.00038881227374076843, 0.011048205196857452, 0.022485218942165375, 0.0339222326874733, 0.04535924643278122, 0.05679626017808914, 0.06823328137397766, 0.07967029511928558, 0.0911073088645935, 0.10254432260990143, 0.11398133635520935, 0.12541835010051727, 0.1368553638458252, 0.14829237759113312, 0.15972939133644104, 0.17116640508174896, 0.18260341882705688, 0.194040447473526, 0.20547744631767273, 0.21691447496414185, 0.22835148870944977, 0.2397885024547577, 0.2512255311012268, 0.26266252994537354, 0.27409955859184265, 0.2855365574359894, 0.2969735860824585, 0.3084105849266052]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 9.0, 8.0, 7.0, 6.0, 13.0, 17.0, 21.0, 28.0, 45.0, 78.0, 96.0, 186.0, 271.0, 360.0, 634.0, 1100.0, 2005.0, 4289.0, 9598.0, 23518.0, 60707.0, 161344.0, 340743.0, 267353.0, 106512.0, 40184.0, 15847.0, 6599.0, 3105.0, 1567.0, 799.0, 531.0, 303.0, 202.0, 146.0, 99.0, 65.0, 47.0, 45.0, 19.0, 19.0, 6.0, 4.0, 6.0, 3.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08660888671875, -0.08379554748535156, -0.08098220825195312, -0.07816886901855469, -0.07535552978515625, -0.07254219055175781, -0.06972885131835938, -0.06691551208496094, -0.0641021728515625, -0.06128883361816406, -0.058475494384765625, -0.05566215515136719, -0.05284881591796875, -0.05003547668457031, -0.047222137451171875, -0.04440879821777344, -0.041595458984375, -0.03878211975097656, -0.035968780517578125, -0.03315544128417969, -0.03034210205078125, -0.027528762817382812, -0.024715423583984375, -0.021902084350585938, -0.0190887451171875, -0.016275405883789062, -0.013462066650390625, -0.010648727416992188, -0.00783538818359375, -0.0050220489501953125, -0.002208709716796875, 0.0006046295166015625, 0.00341796875, 0.0062313079833984375, 0.009044647216796875, 0.011857986450195312, 0.01467132568359375, 0.017484664916992188, 0.020298004150390625, 0.023111343383789062, 0.0259246826171875, 0.028738021850585938, 0.031551361083984375, 0.03436470031738281, 0.03717803955078125, 0.03999137878417969, 0.042804718017578125, 0.04561805725097656, 0.048431396484375, 0.05124473571777344, 0.054058074951171875, 0.05687141418457031, 0.05968475341796875, 0.06249809265136719, 0.06531143188476562, 0.06812477111816406, 0.0709381103515625, 0.07375144958496094, 0.07656478881835938, 0.07937812805175781, 0.08219146728515625, 0.08500480651855469, 0.08781814575195312, 0.09063148498535156, 0.09344482421875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 10.0, 5.0, 11.0, 16.0, 26.0, 31.0, 41.0, 47.0, 66.0, 60.0, 71.0, 96.0, 83.0, 75.0, 72.0, 66.0, 56.0, 52.0, 36.0, 34.0, 15.0, 13.0, 7.0, 4.0, 3.0, 4.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13916015625, -0.1349773406982422, -0.13079452514648438, -0.12661170959472656, -0.12242889404296875, -0.11824607849121094, -0.11406326293945312, -0.10988044738769531, -0.1056976318359375, -0.10151481628417969, -0.09733200073242188, -0.09314918518066406, -0.08896636962890625, -0.08478355407714844, -0.08060073852539062, -0.07641792297363281, -0.072235107421875, -0.06805229187011719, -0.06386947631835938, -0.05968666076660156, -0.05550384521484375, -0.05132102966308594, -0.047138214111328125, -0.04295539855957031, -0.0387725830078125, -0.03458976745605469, -0.030406951904296875, -0.026224136352539062, -0.02204132080078125, -0.017858505249023438, -0.013675689697265625, -0.009492874145507812, -0.00531005859375, -0.0011272430419921875, 0.003055572509765625, 0.0072383880615234375, 0.01142120361328125, 0.015604019165039062, 0.019786834716796875, 0.023969650268554688, 0.0281524658203125, 0.03233528137207031, 0.036518096923828125, 0.04070091247558594, 0.04488372802734375, 0.04906654357910156, 0.053249359130859375, 0.05743217468261719, 0.061614990234375, 0.06579780578613281, 0.06998062133789062, 0.07416343688964844, 0.07834625244140625, 0.08252906799316406, 0.08671188354492188, 0.09089469909667969, 0.0950775146484375, 0.09926033020019531, 0.10344314575195312, 0.10762596130371094, 0.11180877685546875, 0.11599159240722656, 0.12017440795898438, 0.12435722351074219, 0.1285400390625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 0.0, 3.0, 2.0, 3.0, 10.0, 6.0, 7.0, 9.0, 12.0, 20.0, 25.0, 31.0, 39.0, 80.0, 172.0, 385.0, 1136.0, 4152.0, 18108.0, 110786.0, 634946.0, 235883.0, 33125.0, 6759.0, 1744.0, 589.0, 224.0, 108.0, 48.0, 38.0, 24.0, 21.0, 16.0, 8.0, 6.0, 7.0, 4.0, 5.0, 8.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2130126953125, -0.20668792724609375, -0.2003631591796875, -0.19403839111328125, -0.187713623046875, -0.18138885498046875, -0.1750640869140625, -0.16873931884765625, -0.16241455078125, -0.15608978271484375, -0.1497650146484375, -0.14344024658203125, -0.137115478515625, -0.13079071044921875, -0.1244659423828125, -0.11814117431640625, -0.11181640625, -0.10549163818359375, -0.0991668701171875, -0.09284210205078125, -0.086517333984375, -0.08019256591796875, -0.0738677978515625, -0.06754302978515625, -0.06121826171875, -0.05489349365234375, -0.0485687255859375, -0.04224395751953125, -0.035919189453125, -0.02959442138671875, -0.0232696533203125, -0.01694488525390625, -0.0106201171875, -0.00429534912109375, 0.0020294189453125, 0.00835418701171875, 0.014678955078125, 0.02100372314453125, 0.0273284912109375, 0.03365325927734375, 0.03997802734375, 0.04630279541015625, 0.0526275634765625, 0.05895233154296875, 0.065277099609375, 0.07160186767578125, 0.0779266357421875, 0.08425140380859375, 0.090576171875, 0.09690093994140625, 0.1032257080078125, 0.10955047607421875, 0.115875244140625, 0.12220001220703125, 0.1285247802734375, 0.13484954833984375, 0.14117431640625, 0.14749908447265625, 0.1538238525390625, 0.16014862060546875, 0.166473388671875, 0.17279815673828125, 0.1791229248046875, 0.18544769287109375, 0.1917724609375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 6.0, 9.0, 6.0, 15.0, 18.0, 18.0, 21.0, 20.0, 22.0, 37.0, 51.0, 46.0, 45.0, 54.0, 45.0, 59.0, 57.0, 53.0, 58.0, 52.0, 40.0, 37.0, 36.0, 33.0, 21.0, 22.0, 25.0, 14.0, 15.0, 13.0, 7.0, 8.0, 3.0, 6.0, 1.0, 4.0, 7.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2080078125, -0.20084381103515625, -0.1936798095703125, -0.18651580810546875, -0.179351806640625, -0.17218780517578125, -0.1650238037109375, -0.15785980224609375, -0.15069580078125, -0.14353179931640625, -0.1363677978515625, -0.12920379638671875, -0.122039794921875, -0.11487579345703125, -0.1077117919921875, -0.10054779052734375, -0.0933837890625, -0.08621978759765625, -0.0790557861328125, -0.07189178466796875, -0.064727783203125, -0.05756378173828125, -0.0503997802734375, -0.04323577880859375, -0.03607177734375, -0.02890777587890625, -0.0217437744140625, -0.01457977294921875, -0.007415771484375, -0.00025177001953125, 0.0069122314453125, 0.01407623291015625, 0.021240234375, 0.02840423583984375, 0.0355682373046875, 0.04273223876953125, 0.049896240234375, 0.05706024169921875, 0.0642242431640625, 0.07138824462890625, 0.07855224609375, 0.08571624755859375, 0.0928802490234375, 0.10004425048828125, 0.107208251953125, 0.11437225341796875, 0.1215362548828125, 0.12870025634765625, 0.1358642578125, 0.14302825927734375, 0.1501922607421875, 0.15735626220703125, 0.164520263671875, 0.17168426513671875, 0.1788482666015625, 0.18601226806640625, 0.19317626953125, 0.20034027099609375, 0.2075042724609375, 0.21466827392578125, 0.221832275390625, 0.22899627685546875, 0.2361602783203125, 0.24332427978515625, 0.25048828125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 8.0, 10.0, 28.0, 36.0, 66.0, 85.0, 145.0, 225.0, 380.0, 675.0, 1308.0, 2588.0, 5480.0, 11921.0, 26410.0, 61691.0, 152216.0, 310576.0, 268970.0, 117879.0, 48453.0, 20809.0, 9591.0, 4319.0, 2099.0, 1119.0, 592.0, 328.0, 201.0, 118.0, 65.0, 53.0, 33.0, 19.0, 24.0, 5.0, 7.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0234832763671875, -0.022722244262695312, -0.021961212158203125, -0.021200180053710938, -0.02043914794921875, -0.019678115844726562, -0.018917083740234375, -0.018156051635742188, -0.01739501953125, -0.016633987426757812, -0.015872955322265625, -0.015111923217773438, -0.01435089111328125, -0.013589859008789062, -0.012828826904296875, -0.012067794799804688, -0.0113067626953125, -0.010545730590820312, -0.009784698486328125, -0.009023666381835938, -0.00826263427734375, -0.0075016021728515625, -0.006740570068359375, -0.0059795379638671875, -0.005218505859375, -0.0044574737548828125, -0.003696441650390625, -0.0029354095458984375, -0.00217437744140625, -0.0014133453369140625, -0.000652313232421875, 0.0001087188720703125, 0.0008697509765625, 0.0016307830810546875, 0.002391815185546875, 0.0031528472900390625, 0.00391387939453125, 0.0046749114990234375, 0.005435943603515625, 0.0061969757080078125, 0.0069580078125, 0.0077190399169921875, 0.008480072021484375, 0.009241104125976562, 0.01000213623046875, 0.010763168334960938, 0.011524200439453125, 0.012285232543945312, 0.0130462646484375, 0.013807296752929688, 0.014568328857421875, 0.015329360961914062, 0.01609039306640625, 0.016851425170898438, 0.017612457275390625, 0.018373489379882812, 0.019134521484375, 0.019895553588867188, 0.020656585693359375, 0.021417617797851562, 0.02217864990234375, 0.022939682006835938, 0.023700714111328125, 0.024461746215820312, 0.0252227783203125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 6.0, 4.0, 4.0, 14.0, 9.0, 12.0, 30.0, 29.0, 33.0, 59.0, 51.0, 73.0, 100.0, 81.0, 105.0, 101.0, 63.0, 51.0, 47.0, 34.0, 24.0, 27.0, 12.0, 13.0, 8.0, 3.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.867813110351562e-06, -7.549300789833069e-06, -7.230788469314575e-06, -6.9122761487960815e-06, -6.593763828277588e-06, -6.275251507759094e-06, -5.956739187240601e-06, -5.638226866722107e-06, -5.319714546203613e-06, -5.00120222568512e-06, -4.682689905166626e-06, -4.364177584648132e-06, -4.045665264129639e-06, -3.727152943611145e-06, -3.4086406230926514e-06, -3.0901283025741577e-06, -2.771615982055664e-06, -2.4531036615371704e-06, -2.1345913410186768e-06, -1.816079020500183e-06, -1.4975666999816895e-06, -1.1790543794631958e-06, -8.605420589447021e-07, -5.420297384262085e-07, -2.2351741790771484e-07, 9.499490261077881e-08, 4.1350722312927246e-07, 7.320195436477661e-07, 1.0505318641662598e-06, 1.3690441846847534e-06, 1.687556505203247e-06, 2.0060688257217407e-06, 2.3245811462402344e-06, 2.643093466758728e-06, 2.9616057872772217e-06, 3.2801181077957153e-06, 3.598630428314209e-06, 3.917142748832703e-06, 4.235655069351196e-06, 4.55416738986969e-06, 4.872679710388184e-06, 5.191192030906677e-06, 5.509704351425171e-06, 5.8282166719436646e-06, 6.146728992462158e-06, 6.465241312980652e-06, 6.7837536334991455e-06, 7.102265954017639e-06, 7.420778274536133e-06, 7.739290595054626e-06, 8.05780291557312e-06, 8.376315236091614e-06, 8.694827556610107e-06, 9.013339877128601e-06, 9.331852197647095e-06, 9.650364518165588e-06, 9.968876838684082e-06, 1.0287389159202576e-05, 1.060590147972107e-05, 1.0924413800239563e-05, 1.1242926120758057e-05, 1.156143844127655e-05, 1.1879950761795044e-05, 1.2198463082313538e-05, 1.2516975402832031e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 8.0, 3.0, 10.0, 21.0, 31.0, 33.0, 79.0, 102.0, 188.0, 305.0, 585.0, 1318.0, 3759.0, 13317.0, 63017.0, 383711.0, 474643.0, 83280.0, 16600.0, 4522.0, 1581.0, 592.0, 358.0, 174.0, 123.0, 75.0, 50.0, 24.0, 16.0, 13.0, 9.0, 3.0, 6.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05096435546875, -0.04932451248168945, -0.047684669494628906, -0.04604482650756836, -0.04440498352050781, -0.042765140533447266, -0.04112529754638672, -0.03948545455932617, -0.037845611572265625, -0.03620576858520508, -0.03456592559814453, -0.032926082611083984, -0.03128623962402344, -0.02964639663696289, -0.028006553649902344, -0.026366710662841797, -0.02472686767578125, -0.023087024688720703, -0.021447181701660156, -0.01980733871459961, -0.018167495727539062, -0.016527652740478516, -0.014887809753417969, -0.013247966766357422, -0.011608123779296875, -0.009968280792236328, -0.008328437805175781, -0.006688594818115234, -0.0050487518310546875, -0.0034089088439941406, -0.0017690658569335938, -0.00012922286987304688, 0.0015106201171875, 0.003150463104248047, 0.004790306091308594, 0.006430149078369141, 0.008069992065429688, 0.009709835052490234, 0.011349678039550781, 0.012989521026611328, 0.014629364013671875, 0.016269207000732422, 0.01790904998779297, 0.019548892974853516, 0.021188735961914062, 0.02282857894897461, 0.024468421936035156, 0.026108264923095703, 0.02774810791015625, 0.029387950897216797, 0.031027793884277344, 0.03266763687133789, 0.03430747985839844, 0.035947322845458984, 0.03758716583251953, 0.03922700881958008, 0.040866851806640625, 0.04250669479370117, 0.04414653778076172, 0.045786380767822266, 0.04742622375488281, 0.04906606674194336, 0.050705909729003906, 0.05234575271606445, 0.053985595703125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 5.0, 4.0, 4.0, 8.0, 7.0, 9.0, 12.0, 9.0, 13.0, 14.0, 18.0, 30.0, 36.0, 46.0, 50.0, 56.0, 69.0, 89.0, 94.0, 84.0, 62.0, 57.0, 47.0, 40.0, 32.0, 17.0, 16.0, 15.0, 8.0, 8.0, 10.0, 6.0, 6.0, 2.0, 6.0, 4.0, 1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0303802490234375, -0.029306650161743164, -0.028233051300048828, -0.027159452438354492, -0.026085853576660156, -0.02501225471496582, -0.023938655853271484, -0.02286505699157715, -0.021791458129882812, -0.020717859268188477, -0.01964426040649414, -0.018570661544799805, -0.01749706268310547, -0.016423463821411133, -0.015349864959716797, -0.014276266098022461, -0.013202667236328125, -0.012129068374633789, -0.011055469512939453, -0.009981870651245117, -0.008908271789550781, -0.007834672927856445, -0.006761074066162109, -0.0056874752044677734, -0.0046138763427734375, -0.0035402774810791016, -0.0024666786193847656, -0.0013930797576904297, -0.00031948089599609375, 0.0007541179656982422, 0.0018277168273925781, 0.002901315689086914, 0.00397491455078125, 0.005048513412475586, 0.006122112274169922, 0.007195711135864258, 0.008269309997558594, 0.00934290885925293, 0.010416507720947266, 0.011490106582641602, 0.012563705444335938, 0.013637304306030273, 0.01471090316772461, 0.015784502029418945, 0.01685810089111328, 0.017931699752807617, 0.019005298614501953, 0.02007889747619629, 0.021152496337890625, 0.02222609519958496, 0.023299694061279297, 0.024373292922973633, 0.02544689178466797, 0.026520490646362305, 0.02759408950805664, 0.028667688369750977, 0.029741287231445312, 0.03081488609313965, 0.031888484954833984, 0.03296208381652832, 0.034035682678222656, 0.03510928153991699, 0.03618288040161133, 0.037256479263305664, 0.038330078125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 21.0, 26.0, 40.0, 103.0, 166.0, 202.0, 170.0, 122.0, 61.0, 46.0, 20.0, 3.0, 2.0, 4.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.6674562692642212, -0.6482077240943909, -0.6289592385292053, -0.609710693359375, -0.5904621481895447, -0.5712136030197144, -0.5519651174545288, -0.5327165722846985, -0.5134680271148682, -0.49421951174736023, -0.4749709665775299, -0.455722451210022, -0.43647390604019165, -0.4172253906726837, -0.3979768753051758, -0.37872833013534546, -0.3594798147678375, -0.3402312994003296, -0.32098275423049927, -0.30173423886299133, -0.282485693693161, -0.2632371783256531, -0.24398864805698395, -0.22474011778831482, -0.2054915875196457, -0.18624305725097656, -0.16699452698230743, -0.1477459967136383, -0.12849748134613037, -0.10924894362688065, -0.09000042080879211, -0.07075189054012299, -0.05150336027145386, -0.03225483000278473, -0.013006303459405899, 0.006242223083972931, 0.02549075335264206, 0.04473928362131119, 0.06398780643939972, 0.08323633670806885, 0.10248486697673798, 0.1217333972454071, 0.14098192751407623, 0.16023045778274536, 0.1794789731502533, 0.19872751832008362, 0.21797603368759155, 0.23722456395626068, 0.2564730942249298, 0.27572160959243774, 0.29497015476226807, 0.314218670129776, 0.3334672152996063, 0.35271573066711426, 0.3719642758369446, 0.3912127912044525, 0.41046130657196045, 0.4297098219394684, 0.4489583671092987, 0.46820688247680664, 0.48745542764663696, 0.5067039728164673, 0.5259524583816528, 0.5452010035514832, 0.5644495487213135]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 5.0, 12.0, 10.0, 14.0, 25.0, 22.0, 17.0, 28.0, 30.0, 30.0, 30.0, 37.0, 31.0, 41.0, 45.0, 31.0, 44.0, 36.0, 35.0, 35.0, 48.0, 41.0, 32.0, 34.0, 35.0, 33.0, 38.0, 23.0, 35.0, 23.0, 13.0, 15.0, 12.0, 9.0, 11.0, 8.0, 8.0, 2.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.4753671884536743, -0.46142375469207764, -0.44748032093048096, -0.4335368871688843, -0.41959348320961, -0.4056500494480133, -0.3917066156864166, -0.37776318192481995, -0.36381977796554565, -0.349876344203949, -0.3359329104423523, -0.3219894766807556, -0.3080460727214813, -0.29410263895988464, -0.28015920519828796, -0.2662157714366913, -0.2522723376750946, -0.23832890391349792, -0.22438548505306244, -0.21044205129146576, -0.19649863243103027, -0.1825551986694336, -0.16861176490783691, -0.15466833114624023, -0.14072491228580475, -0.12678147852420807, -0.11283805966377258, -0.0988946259021759, -0.08495119959115982, -0.07100777328014374, -0.05706433951854706, -0.043120913207530975, -0.029177486896514893, -0.01523405872285366, -0.0012906305491924286, 0.012652799487113953, 0.026596225798130035, 0.04053965210914612, 0.0544830858707428, 0.06842651218175888, 0.08236993849277496, 0.09631336480379105, 0.11025679111480713, 0.12420022487640381, 0.1381436586380005, 0.15208707749843597, 0.16603051126003265, 0.17997393012046814, 0.19391736388206482, 0.2078607976436615, 0.22180421650409698, 0.23574765026569366, 0.24969106912612915, 0.26363450288772583, 0.2775779366493225, 0.2915213704109192, 0.30546480417251587, 0.31940823793411255, 0.33335167169570923, 0.3472951054573059, 0.3612385094165802, 0.3751819431781769, 0.38912537693977356, 0.40306881070137024, 0.41701221466064453]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 7.0, 5.0, 2.0, 8.0, 10.0, 14.0, 26.0, 48.0, 60.0, 116.0, 199.0, 451.0, 1196.0, 3293.0, 9791.0, 38438.0, 276147.0, 2056055.0, 1586358.0, 182379.0, 27385.0, 7859.0, 2641.0, 913.0, 389.0, 177.0, 112.0, 70.0, 51.0, 31.0, 17.0, 13.0, 3.0, 5.0, 3.0, 6.0, 0.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1148681640625, -0.11137771606445312, -0.10788726806640625, -0.10439682006835938, -0.1009063720703125, -0.09741592407226562, -0.09392547607421875, -0.09043502807617188, -0.086944580078125, -0.08345413208007812, -0.07996368408203125, -0.07647323608398438, -0.0729827880859375, -0.06949234008789062, -0.06600189208984375, -0.06251144409179688, -0.05902099609375, -0.055530548095703125, -0.05204010009765625, -0.048549652099609375, -0.0450592041015625, -0.041568756103515625, -0.03807830810546875, -0.034587860107421875, -0.031097412109375, -0.027606964111328125, -0.02411651611328125, -0.020626068115234375, -0.0171356201171875, -0.013645172119140625, -0.01015472412109375, -0.006664276123046875, -0.003173828125, 0.000316619873046875, 0.00380706787109375, 0.007297515869140625, 0.0107879638671875, 0.014278411865234375, 0.01776885986328125, 0.021259307861328125, 0.024749755859375, 0.028240203857421875, 0.03173065185546875, 0.035221099853515625, 0.0387115478515625, 0.042201995849609375, 0.04569244384765625, 0.049182891845703125, 0.05267333984375, 0.056163787841796875, 0.05965423583984375, 0.06314468383789062, 0.0666351318359375, 0.07012557983398438, 0.07361602783203125, 0.07710647583007812, 0.080596923828125, 0.08408737182617188, 0.08757781982421875, 0.09106826782226562, 0.0945587158203125, 0.09804916381835938, 0.10153961181640625, 0.10503005981445312, 0.1085205078125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 12.0, 7.0, 16.0, 24.0, 31.0, 46.0, 56.0, 65.0, 86.0, 86.0, 80.0, 77.0, 67.0, 74.0, 71.0, 48.0, 38.0, 45.0, 32.0, 13.0, 11.0, 6.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1307373046875, -0.12637901306152344, -0.12202072143554688, -0.11766242980957031, -0.11330413818359375, -0.10894584655761719, -0.10458755493164062, -0.10022926330566406, -0.0958709716796875, -0.09151268005371094, -0.08715438842773438, -0.08279609680175781, -0.07843780517578125, -0.07407951354980469, -0.06972122192382812, -0.06536293029785156, -0.061004638671875, -0.05664634704589844, -0.052288055419921875, -0.04792976379394531, -0.04357147216796875, -0.03921318054199219, -0.034854888916015625, -0.030496597290039062, -0.0261383056640625, -0.021780014038085938, -0.017421722412109375, -0.013063430786132812, -0.00870513916015625, -0.0043468475341796875, 1.1444091796875e-05, 0.0043697357177734375, 0.00872802734375, 0.013086318969726562, 0.017444610595703125, 0.021802902221679688, 0.02616119384765625, 0.030519485473632812, 0.034877777099609375, 0.03923606872558594, 0.0435943603515625, 0.04795265197753906, 0.052310943603515625, 0.05666923522949219, 0.06102752685546875, 0.06538581848144531, 0.06974411010742188, 0.07410240173339844, 0.078460693359375, 0.08281898498535156, 0.08717727661132812, 0.09153556823730469, 0.09589385986328125, 0.10025215148925781, 0.10461044311523438, 0.10896873474121094, 0.1133270263671875, 0.11768531799316406, 0.12204360961914062, 0.1264019012451172, 0.13076019287109375, 0.1351184844970703, 0.13947677612304688, 0.14383506774902344, 0.148193359375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 12.0, 15.0, 11.0, 22.0, 20.0, 44.0, 70.0, 104.0, 176.0, 375.0, 803.0, 2064.0, 6316.0, 21767.0, 101741.0, 1246506.0, 2599452.0, 169213.0, 31853.0, 8769.0, 2855.0, 1079.0, 443.0, 217.0, 119.0, 86.0, 52.0, 15.0, 23.0, 22.0, 17.0, 6.0, 5.0, 2.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13330078125, -0.1287250518798828, -0.12414932250976562, -0.11957359313964844, -0.11499786376953125, -0.11042213439941406, -0.10584640502929688, -0.10127067565917969, -0.0966949462890625, -0.09211921691894531, -0.08754348754882812, -0.08296775817871094, -0.07839202880859375, -0.07381629943847656, -0.06924057006835938, -0.06466484069824219, -0.060089111328125, -0.05551338195800781, -0.050937652587890625, -0.04636192321777344, -0.04178619384765625, -0.03721046447753906, -0.032634735107421875, -0.028059005737304688, -0.0234832763671875, -0.018907546997070312, -0.014331817626953125, -0.009756088256835938, -0.00518035888671875, -0.0006046295166015625, 0.003971099853515625, 0.008546829223632812, 0.01312255859375, 0.017698287963867188, 0.022274017333984375, 0.026849746704101562, 0.03142547607421875, 0.03600120544433594, 0.040576934814453125, 0.04515266418457031, 0.0497283935546875, 0.05430412292480469, 0.058879852294921875, 0.06345558166503906, 0.06803131103515625, 0.07260704040527344, 0.07718276977539062, 0.08175849914550781, 0.086334228515625, 0.09090995788574219, 0.09548568725585938, 0.10006141662597656, 0.10463714599609375, 0.10921287536621094, 0.11378860473632812, 0.11836433410644531, 0.1229400634765625, 0.1275157928466797, 0.13209152221679688, 0.13666725158691406, 0.14124298095703125, 0.14581871032714844, 0.15039443969726562, 0.1549701690673828, 0.1595458984375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 7.0, 11.0, 3.0, 15.0, 25.0, 57.0, 59.0, 148.0, 349.0, 952.0, 1280.0, 655.0, 203.0, 126.0, 66.0, 37.0, 33.0, 17.0, 19.0, 7.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.274658203125, -0.26831626892089844, -0.2619743347167969, -0.2556324005126953, -0.24929046630859375, -0.2429485321044922, -0.23660659790039062, -0.23026466369628906, -0.2239227294921875, -0.21758079528808594, -0.21123886108398438, -0.2048969268798828, -0.19855499267578125, -0.1922130584716797, -0.18587112426757812, -0.17952919006347656, -0.173187255859375, -0.16684532165527344, -0.16050338745117188, -0.1541614532470703, -0.14781951904296875, -0.1414775848388672, -0.13513565063476562, -0.12879371643066406, -0.1224517822265625, -0.11610984802246094, -0.10976791381835938, -0.10342597961425781, -0.09708404541015625, -0.09074211120605469, -0.08440017700195312, -0.07805824279785156, -0.07171630859375, -0.06537437438964844, -0.059032440185546875, -0.05269050598144531, -0.04634857177734375, -0.04000663757324219, -0.033664703369140625, -0.027322769165039062, -0.0209808349609375, -0.014638900756835938, -0.008296966552734375, -0.0019550323486328125, 0.00438690185546875, 0.010728836059570312, 0.017070770263671875, 0.023412704467773438, 0.029754638671875, 0.03609657287597656, 0.042438507080078125, 0.04878044128417969, 0.05512237548828125, 0.06146430969238281, 0.06780624389648438, 0.07414817810058594, 0.0804901123046875, 0.08683204650878906, 0.09317398071289062, 0.09951591491699219, 0.10585784912109375, 0.11219978332519531, 0.11854171752929688, 0.12488365173339844, 0.1312255859375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 49.0, 229.0, 439.0, 235.0, 44.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3768868446350098, -2.322251796722412, -2.2676169872283936, -2.212981939315796, -2.1583468914031982, -2.1037120819091797, -2.049077033996582, -1.9944419860839844, -1.9398070573806763, -1.8851721286773682, -1.8305370807647705, -1.7759021520614624, -1.7212672233581543, -1.6666321754455566, -1.6119972467422485, -1.5573623180389404, -1.5027272701263428, -1.4480923414230347, -1.393457293510437, -1.338822364807129, -1.2841873168945312, -1.2295523881912231, -1.174917459487915, -1.1202824115753174, -1.0656474828720093, -1.0110125541687012, -0.9563775062561035, -0.9017425775527954, -0.8471075892448425, -0.7924726009368896, -0.7378376722335815, -0.6832026839256287, -0.6285678148269653, -0.5739328265190125, -0.5192978382110596, -0.46466290950775146, -0.4100279211997986, -0.3553929328918457, -0.3007579743862152, -0.24612301588058472, -0.19148802757263184, -0.13685305416584015, -0.08221808075904846, -0.027583107352256775, 0.027051866054534912, 0.08168685436248779, 0.1363218128681183, 0.19095677137374878, 0.24559175968170166, 0.30022674798965454, 0.35486170649528503, 0.4094966650009155, 0.4641316533088684, 0.5187666416168213, 0.5734015703201294, 0.6280365586280823, 0.6826715469360352, 0.737306535243988, 0.7919415235519409, 0.846576452255249, 0.9012114405632019, 0.9558464288711548, 1.010481357574463, 1.0651164054870605, 1.1197513341903687]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 11.0, 15.0, 29.0, 21.0, 27.0, 32.0, 34.0, 47.0, 43.0, 42.0, 54.0, 62.0, 77.0, 53.0, 69.0, 47.0, 52.0, 61.0, 40.0, 52.0, 32.0, 20.0, 23.0, 15.0, 16.0, 9.0, 7.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5519155859947205, -0.536873996257782, -0.5218324661254883, -0.5067908763885498, -0.4917493164539337, -0.4767077565193176, -0.46166619658470154, -0.44662463665008545, -0.431583046913147, -0.4165414869785309, -0.4014999270439148, -0.3864583373069763, -0.37141677737236023, -0.35637521743774414, -0.34133365750312805, -0.32629209756851196, -0.3112505078315735, -0.2962089478969574, -0.2811673879623413, -0.26612579822540283, -0.25108423829078674, -0.23604267835617065, -0.22100111842155457, -0.20595954358577728, -0.1909179985523224, -0.1758764386177063, -0.16083486378192902, -0.14579330384731293, -0.13075172901153564, -0.11571016907691956, -0.10066860169172287, -0.08562703430652618, -0.0705854594707489, -0.055543892085552216, -0.04050232470035553, -0.025460761040449142, -0.010419193655252457, 0.004622370004653931, 0.019663937389850616, 0.0347055047750473, 0.04974707216024399, 0.06478863954544067, 0.07983020693063736, 0.09487177431583405, 0.10991333425045013, 0.12495490163564682, 0.1399964690208435, 0.1550380289554596, 0.17007960379123688, 0.18512116372585297, 0.20016273856163025, 0.21520429849624634, 0.23024587333202362, 0.2452874332666397, 0.260329008102417, 0.2753705680370331, 0.29041212797164917, 0.30545368790626526, 0.32049524784088135, 0.3355368375778198, 0.3505783975124359, 0.365619957447052, 0.3806615173816681, 0.3957030773162842, 0.41074466705322266]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 16.0, 15.0, 14.0, 21.0, 27.0, 32.0, 54.0, 81.0, 115.0, 164.0, 232.0, 399.0, 591.0, 910.0, 1543.0, 2900.0, 5258.0, 10169.0, 21140.0, 47252.0, 109953.0, 231756.0, 293383.0, 177069.0, 77987.0, 34025.0, 15871.0, 7791.0, 4044.0, 2259.0, 1234.0, 800.0, 461.0, 286.0, 203.0, 117.0, 102.0, 68.0, 65.0, 37.0, 31.0, 22.0, 18.0, 7.0, 11.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0755615234375, -0.07322216033935547, -0.07088279724121094, -0.0685434341430664, -0.06620407104492188, -0.06386470794677734, -0.06152534484863281, -0.05918598175048828, -0.05684661865234375, -0.05450725555419922, -0.05216789245605469, -0.049828529357910156, -0.047489166259765625, -0.045149803161621094, -0.04281044006347656, -0.04047107696533203, -0.0381317138671875, -0.03579235076904297, -0.03345298767089844, -0.031113624572753906, -0.028774261474609375, -0.026434898376464844, -0.024095535278320312, -0.02175617218017578, -0.01941680908203125, -0.01707744598388672, -0.014738082885742188, -0.012398719787597656, -0.010059356689453125, -0.007719993591308594, -0.0053806304931640625, -0.0030412673950195312, -0.000701904296875, 0.0016374588012695312, 0.0039768218994140625, 0.006316184997558594, 0.008655548095703125, 0.010994911193847656, 0.013334274291992188, 0.01567363739013672, 0.01801300048828125, 0.02035236358642578, 0.022691726684570312, 0.025031089782714844, 0.027370452880859375, 0.029709815979003906, 0.03204917907714844, 0.03438854217529297, 0.0367279052734375, 0.03906726837158203, 0.04140663146972656, 0.043745994567871094, 0.046085357666015625, 0.048424720764160156, 0.05076408386230469, 0.05310344696044922, 0.05544281005859375, 0.05778217315673828, 0.06012153625488281, 0.062460899353027344, 0.06480026245117188, 0.0671396255493164, 0.06947898864746094, 0.07181835174560547, 0.07415771484375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 12.0, 15.0, 20.0, 27.0, 48.0, 48.0, 60.0, 65.0, 78.0, 85.0, 74.0, 78.0, 63.0, 83.0, 45.0, 45.0, 45.0, 26.0, 25.0, 17.0, 16.0, 11.0, 6.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11395263671875, -0.10996150970458984, -0.10597038269042969, -0.10197925567626953, -0.09798812866210938, -0.09399700164794922, -0.09000587463378906, -0.0860147476196289, -0.08202362060546875, -0.0780324935913086, -0.07404136657714844, -0.07005023956298828, -0.06605911254882812, -0.06206798553466797, -0.05807685852050781, -0.054085731506347656, -0.0500946044921875, -0.046103477478027344, -0.04211235046386719, -0.03812122344970703, -0.034130096435546875, -0.03013896942138672, -0.026147842407226562, -0.022156715393066406, -0.01816558837890625, -0.014174461364746094, -0.010183334350585938, -0.006192207336425781, -0.002201080322265625, 0.0017900466918945312, 0.0057811737060546875, 0.009772300720214844, 0.013763427734375, 0.017754554748535156, 0.021745681762695312, 0.02573680877685547, 0.029727935791015625, 0.03371906280517578, 0.03771018981933594, 0.041701316833496094, 0.04569244384765625, 0.049683570861816406, 0.05367469787597656, 0.05766582489013672, 0.061656951904296875, 0.06564807891845703, 0.06963920593261719, 0.07363033294677734, 0.0776214599609375, 0.08161258697509766, 0.08560371398925781, 0.08959484100341797, 0.09358596801757812, 0.09757709503173828, 0.10156822204589844, 0.1055593490600586, 0.10955047607421875, 0.1135416030883789, 0.11753273010253906, 0.12152385711669922, 0.12551498413085938, 0.12950611114501953, 0.1334972381591797, 0.13748836517333984, 0.1414794921875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 6.0, 10.0, 20.0, 25.0, 23.0, 32.0, 46.0, 74.0, 112.0, 176.0, 282.0, 382.0, 609.0, 1036.0, 1569.0, 2640.0, 4637.0, 8049.0, 14869.0, 28493.0, 56791.0, 114986.0, 216100.0, 258950.0, 166709.0, 83015.0, 41071.0, 20996.0, 11243.0, 6210.0, 3627.0, 2123.0, 1262.0, 765.0, 520.0, 378.0, 217.0, 148.0, 98.0, 81.0, 46.0, 31.0, 24.0, 15.0, 19.0, 10.0, 6.0, 6.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0635986328125, -0.06149768829345703, -0.05939674377441406, -0.057295799255371094, -0.055194854736328125, -0.053093910217285156, -0.05099296569824219, -0.04889202117919922, -0.04679107666015625, -0.04469013214111328, -0.04258918762207031, -0.040488243103027344, -0.038387298583984375, -0.036286354064941406, -0.03418540954589844, -0.03208446502685547, -0.0299835205078125, -0.02788257598876953, -0.025781631469726562, -0.023680686950683594, -0.021579742431640625, -0.019478797912597656, -0.017377853393554688, -0.015276908874511719, -0.01317596435546875, -0.011075019836425781, -0.008974075317382812, -0.006873130798339844, -0.004772186279296875, -0.0026712417602539062, -0.0005702972412109375, 0.0015306472778320312, 0.003631591796875, 0.005732536315917969, 0.007833480834960938, 0.009934425354003906, 0.012035369873046875, 0.014136314392089844, 0.016237258911132812, 0.01833820343017578, 0.02043914794921875, 0.02254009246826172, 0.024641036987304688, 0.026741981506347656, 0.028842926025390625, 0.030943870544433594, 0.03304481506347656, 0.03514575958251953, 0.0372467041015625, 0.03934764862060547, 0.04144859313964844, 0.043549537658691406, 0.045650482177734375, 0.047751426696777344, 0.04985237121582031, 0.05195331573486328, 0.05405426025390625, 0.05615520477294922, 0.05825614929199219, 0.060357093811035156, 0.062458038330078125, 0.0645589828491211, 0.06665992736816406, 0.06876087188720703, 0.07086181640625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 4.0, 4.0, 9.0, 6.0, 9.0, 11.0, 16.0, 15.0, 16.0, 27.0, 27.0, 26.0, 27.0, 34.0, 35.0, 36.0, 37.0, 45.0, 42.0, 45.0, 44.0, 42.0, 49.0, 53.0, 37.0, 33.0, 36.0, 34.0, 36.0, 20.0, 21.0, 28.0, 20.0, 18.0, 11.0, 7.0, 9.0, 5.0, 5.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.17431640625, -0.16877365112304688, -0.16323089599609375, -0.15768814086914062, -0.1521453857421875, -0.14660263061523438, -0.14105987548828125, -0.13551712036132812, -0.129974365234375, -0.12443161010742188, -0.11888885498046875, -0.11334609985351562, -0.1078033447265625, -0.10226058959960938, -0.09671783447265625, -0.09117507934570312, -0.08563232421875, -0.08008956909179688, -0.07454681396484375, -0.06900405883789062, -0.0634613037109375, -0.057918548583984375, -0.05237579345703125, -0.046833038330078125, -0.041290283203125, -0.035747528076171875, -0.03020477294921875, -0.024662017822265625, -0.0191192626953125, -0.013576507568359375, -0.00803375244140625, -0.002490997314453125, 0.0030517578125, 0.008594512939453125, 0.01413726806640625, 0.019680023193359375, 0.0252227783203125, 0.030765533447265625, 0.03630828857421875, 0.041851043701171875, 0.047393798828125, 0.052936553955078125, 0.05847930908203125, 0.06402206420898438, 0.0695648193359375, 0.07510757446289062, 0.08065032958984375, 0.08619308471679688, 0.09173583984375, 0.09727859497070312, 0.10282135009765625, 0.10836410522460938, 0.1139068603515625, 0.11944961547851562, 0.12499237060546875, 0.13053512573242188, 0.136077880859375, 0.14162063598632812, 0.14716339111328125, 0.15270614624023438, 0.1582489013671875, 0.16379165649414062, 0.16933441162109375, 0.17487716674804688, 0.180419921875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 11.0, 9.0, 17.0, 16.0, 46.0, 52.0, 115.0, 201.0, 324.0, 604.0, 1071.0, 2075.0, 3947.0, 8364.0, 19967.0, 52084.0, 147107.0, 318393.0, 293930.0, 124220.0, 43795.0, 17220.0, 7386.0, 3597.0, 1800.0, 906.0, 557.0, 289.0, 187.0, 107.0, 60.0, 30.0, 27.0, 17.0, 9.0, 10.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0267486572265625, -0.02588343620300293, -0.02501821517944336, -0.02415299415588379, -0.02328777313232422, -0.02242255210876465, -0.021557331085205078, -0.020692110061645508, -0.019826889038085938, -0.018961668014526367, -0.018096446990966797, -0.017231225967407227, -0.016366004943847656, -0.015500783920288086, -0.014635562896728516, -0.013770341873168945, -0.012905120849609375, -0.012039899826049805, -0.011174678802490234, -0.010309457778930664, -0.009444236755371094, -0.008579015731811523, -0.007713794708251953, -0.006848573684692383, -0.0059833526611328125, -0.005118131637573242, -0.004252910614013672, -0.0033876895904541016, -0.0025224685668945312, -0.001657247543334961, -0.0007920265197753906, 7.319450378417969e-05, 0.00093841552734375, 0.0018036365509033203, 0.0026688575744628906, 0.003534078598022461, 0.004399299621582031, 0.0052645206451416016, 0.006129741668701172, 0.006994962692260742, 0.007860183715820312, 0.008725404739379883, 0.009590625762939453, 0.010455846786499023, 0.011321067810058594, 0.012186288833618164, 0.013051509857177734, 0.013916730880737305, 0.014781951904296875, 0.015647172927856445, 0.016512393951416016, 0.017377614974975586, 0.018242835998535156, 0.019108057022094727, 0.019973278045654297, 0.020838499069213867, 0.021703720092773438, 0.022568941116333008, 0.023434162139892578, 0.02429938316345215, 0.02516460418701172, 0.02602982521057129, 0.02689504623413086, 0.02776026725769043, 0.02862548828125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 5.0, 10.0, 5.0, 16.0, 17.0, 29.0, 38.0, 55.0, 64.0, 89.0, 107.0, 101.0, 85.0, 88.0, 79.0, 48.0, 52.0, 28.0, 23.0, 14.0, 11.0, 5.0, 6.0, 9.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0013580322265625e-05, -9.673647582530975e-06, -9.333714842796326e-06, -8.993782103061676e-06, -8.653849363327026e-06, -8.313916623592377e-06, -7.973983883857727e-06, -7.634051144123077e-06, -7.294118404388428e-06, -6.954185664653778e-06, -6.614252924919128e-06, -6.274320185184479e-06, -5.934387445449829e-06, -5.5944547057151794e-06, -5.25452196598053e-06, -4.91458922624588e-06, -4.5746564865112305e-06, -4.234723746776581e-06, -3.894791007041931e-06, -3.5548582673072815e-06, -3.214925527572632e-06, -2.874992787837982e-06, -2.5350600481033325e-06, -2.195127308368683e-06, -1.8551945686340332e-06, -1.5152618288993835e-06, -1.1753290891647339e-06, -8.353963494300842e-07, -4.954636096954346e-07, -1.555308699607849e-07, 1.8440186977386475e-07, 5.243346095085144e-07, 8.642673492431641e-07, 1.2042000889778137e-06, 1.5441328287124634e-06, 1.884065568447113e-06, 2.2239983081817627e-06, 2.5639310479164124e-06, 2.903863787651062e-06, 3.2437965273857117e-06, 3.5837292671203613e-06, 3.923662006855011e-06, 4.263594746589661e-06, 4.60352748632431e-06, 4.94346022605896e-06, 5.28339296579361e-06, 5.623325705528259e-06, 5.963258445262909e-06, 6.303191184997559e-06, 6.643123924732208e-06, 6.983056664466858e-06, 7.3229894042015076e-06, 7.662922143936157e-06, 8.002854883670807e-06, 8.342787623405457e-06, 8.682720363140106e-06, 9.022653102874756e-06, 9.362585842609406e-06, 9.702518582344055e-06, 1.0042451322078705e-05, 1.0382384061813354e-05, 1.0722316801548004e-05, 1.1062249541282654e-05, 1.1402182281017303e-05, 1.1742115020751953e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 8.0, 10.0, 8.0, 8.0, 20.0, 49.0, 47.0, 106.0, 118.0, 206.0, 330.0, 565.0, 925.0, 1640.0, 2933.0, 5473.0, 11059.0, 23744.0, 53815.0, 121553.0, 231581.0, 271243.0, 173772.0, 81021.0, 35415.0, 16091.0, 7729.0, 4031.0, 2115.0, 1145.0, 667.0, 402.0, 249.0, 186.0, 99.0, 60.0, 40.0, 26.0, 25.0, 12.0, 6.0, 7.0, 8.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0198516845703125, -0.01917290687561035, -0.018494129180908203, -0.017815351486206055, -0.017136573791503906, -0.016457796096801758, -0.01577901840209961, -0.015100240707397461, -0.014421463012695312, -0.013742685317993164, -0.013063907623291016, -0.012385129928588867, -0.011706352233886719, -0.01102757453918457, -0.010348796844482422, -0.009670019149780273, -0.008991241455078125, -0.008312463760375977, -0.007633686065673828, -0.00695490837097168, -0.006276130676269531, -0.005597352981567383, -0.004918575286865234, -0.004239797592163086, -0.0035610198974609375, -0.002882242202758789, -0.0022034645080566406, -0.0015246868133544922, -0.0008459091186523438, -0.0001671314239501953, 0.0005116462707519531, 0.0011904239654541016, 0.00186920166015625, 0.0025479793548583984, 0.003226757049560547, 0.0039055347442626953, 0.004584312438964844, 0.005263090133666992, 0.005941867828369141, 0.006620645523071289, 0.0072994232177734375, 0.007978200912475586, 0.008656978607177734, 0.009335756301879883, 0.010014533996582031, 0.01069331169128418, 0.011372089385986328, 0.012050867080688477, 0.012729644775390625, 0.013408422470092773, 0.014087200164794922, 0.01476597785949707, 0.015444755554199219, 0.016123533248901367, 0.016802310943603516, 0.017481088638305664, 0.018159866333007812, 0.01883864402770996, 0.01951742172241211, 0.020196199417114258, 0.020874977111816406, 0.021553754806518555, 0.022232532501220703, 0.02291131019592285, 0.023590087890625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 4.0, 13.0, 15.0, 16.0, 18.0, 16.0, 26.0, 32.0, 37.0, 50.0, 53.0, 48.0, 62.0, 62.0, 82.0, 61.0, 58.0, 53.0, 59.0, 39.0, 34.0, 26.0, 25.0, 14.0, 23.0, 16.0, 5.0, 10.0, 10.0, 9.0, 7.0, 3.0, 1.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0247955322265625, -0.023877382278442383, -0.022959232330322266, -0.02204108238220215, -0.02112293243408203, -0.020204782485961914, -0.019286632537841797, -0.01836848258972168, -0.017450332641601562, -0.016532182693481445, -0.015614032745361328, -0.014695882797241211, -0.013777732849121094, -0.012859582901000977, -0.01194143295288086, -0.011023283004760742, -0.010105133056640625, -0.009186983108520508, -0.00826883316040039, -0.0073506832122802734, -0.006432533264160156, -0.005514383316040039, -0.004596233367919922, -0.0036780834197998047, -0.0027599334716796875, -0.0018417835235595703, -0.0009236335754394531, -5.4836273193359375e-06, 0.0009126663208007812, 0.0018308162689208984, 0.0027489662170410156, 0.003667116165161133, 0.00458526611328125, 0.005503416061401367, 0.006421566009521484, 0.0073397159576416016, 0.008257865905761719, 0.009176015853881836, 0.010094165802001953, 0.01101231575012207, 0.011930465698242188, 0.012848615646362305, 0.013766765594482422, 0.014684915542602539, 0.015603065490722656, 0.016521215438842773, 0.01743936538696289, 0.018357515335083008, 0.019275665283203125, 0.020193815231323242, 0.02111196517944336, 0.022030115127563477, 0.022948265075683594, 0.02386641502380371, 0.024784564971923828, 0.025702714920043945, 0.026620864868164062, 0.02753901481628418, 0.028457164764404297, 0.029375314712524414, 0.03029346466064453, 0.03121161460876465, 0.032129764556884766, 0.03304791450500488, 0.033966064453125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 13.0, 15.0, 28.0, 81.0, 123.0, 178.0, 207.0, 170.0, 105.0, 43.0, 22.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7778462767601013, -0.7558779716491699, -0.7339096069335938, -0.7119412422180176, -0.6899729371070862, -0.6680046319961548, -0.6460362672805786, -0.6240679025650024, -0.602099597454071, -0.5801312923431396, -0.5581629276275635, -0.5361945629119873, -0.5142262578010559, -0.4922579228878021, -0.47028958797454834, -0.44832125306129456, -0.42635291814804077, -0.404384583234787, -0.3824162483215332, -0.3604479134082794, -0.33847957849502563, -0.31651124358177185, -0.29454290866851807, -0.2725745737552643, -0.2506062388420105, -0.2286379039287567, -0.20666956901550293, -0.18470123410224915, -0.16273289918899536, -0.14076456427574158, -0.11879622936248779, -0.09682789444923401, -0.07485949993133545, -0.052891165018081665, -0.03092283010482788, -0.008954495191574097, 0.013013839721679688, 0.03498217463493347, 0.056950509548187256, 0.07891884446144104, 0.10088717937469482, 0.12285551428794861, 0.1448238492012024, 0.16679218411445618, 0.18876051902770996, 0.21072885394096375, 0.23269718885421753, 0.2546655237674713, 0.2766338586807251, 0.2986021935939789, 0.32057052850723267, 0.34253886342048645, 0.36450719833374023, 0.386475533246994, 0.4084438681602478, 0.4304122030735016, 0.45238053798675537, 0.47434887290000916, 0.49631720781326294, 0.5182855129241943, 0.5402538776397705, 0.5622222423553467, 0.5841905474662781, 0.6061588525772095, 0.6281272172927856]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 4.0, 3.0, 9.0, 3.0, 1.0, 11.0, 9.0, 9.0, 8.0, 17.0, 10.0, 20.0, 23.0, 20.0, 19.0, 37.0, 27.0, 24.0, 37.0, 45.0, 36.0, 44.0, 48.0, 39.0, 31.0, 40.0, 43.0, 36.0, 35.0, 26.0, 37.0, 34.0, 25.0, 27.0, 25.0, 29.0, 16.0, 23.0, 15.0, 14.0, 8.0, 8.0, 11.0, 5.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3515278100967407, -0.3385515511035919, -0.3255752921104431, -0.3125990033149719, -0.2996227443218231, -0.2866464853286743, -0.2736702263355255, -0.2606939673423767, -0.2477176934480667, -0.2347414344549179, -0.2217651605606079, -0.2087889015674591, -0.1958126425743103, -0.1828363686800003, -0.1698601096868515, -0.1568838357925415, -0.1439075767993927, -0.1309313178062439, -0.1179550439119339, -0.1049787849187851, -0.0920025184750557, -0.0790262520313263, -0.06604999303817749, -0.05307372659444809, -0.04009746015071869, -0.027121195569634438, -0.014144930988550186, -0.001168668270111084, 0.011807598173618317, 0.024783864617347717, 0.03776012361049652, 0.05073639005422592, 0.06371265649795532, 0.07668892294168472, 0.08966518938541412, 0.10264144837856293, 0.11561771482229233, 0.12859398126602173, 0.14157024025917053, 0.15454649925231934, 0.16752277314662933, 0.18049903213977814, 0.19347530603408813, 0.20645156502723694, 0.21942782402038574, 0.23240409791469574, 0.24538035690784454, 0.25835663080215454, 0.27133288979530334, 0.28430914878845215, 0.29728540778160095, 0.31026166677474976, 0.32323795557022095, 0.33621421456336975, 0.34919047355651855, 0.36216673254966736, 0.37514299154281616, 0.38811925053596497, 0.40109550952911377, 0.41407179832458496, 0.42704805731773376, 0.44002431631088257, 0.45300057530403137, 0.4659768342971802, 0.47895312309265137]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 7.0, 2.0, 6.0, 8.0, 16.0, 19.0, 22.0, 34.0, 32.0, 61.0, 89.0, 97.0, 154.0, 229.0, 370.0, 603.0, 1258.0, 2771.0, 7600.0, 22432.0, 109764.0, 723200.0, 2115563.0, 1006835.0, 158438.0, 28093.0, 9428.0, 3775.0, 1542.0, 672.0, 395.0, 233.0, 162.0, 105.0, 76.0, 44.0, 44.0, 25.0, 22.0, 21.0, 14.0, 9.0, 5.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10205078125, -0.09871578216552734, -0.09538078308105469, -0.09204578399658203, -0.08871078491210938, -0.08537578582763672, -0.08204078674316406, -0.0787057876586914, -0.07537078857421875, -0.0720357894897461, -0.06870079040527344, -0.06536579132080078, -0.062030792236328125, -0.05869579315185547, -0.05536079406738281, -0.052025794982910156, -0.0486907958984375, -0.045355796813964844, -0.04202079772949219, -0.03868579864501953, -0.035350799560546875, -0.03201580047607422, -0.028680801391601562, -0.025345802307128906, -0.02201080322265625, -0.018675804138183594, -0.015340805053710938, -0.012005805969238281, -0.008670806884765625, -0.005335807800292969, -0.0020008087158203125, 0.0013341903686523438, 0.004669189453125, 0.008004188537597656, 0.011339187622070312, 0.014674186706542969, 0.018009185791015625, 0.02134418487548828, 0.024679183959960938, 0.028014183044433594, 0.03134918212890625, 0.034684181213378906, 0.03801918029785156, 0.04135417938232422, 0.044689178466796875, 0.04802417755126953, 0.05135917663574219, 0.054694175720214844, 0.0580291748046875, 0.061364173889160156, 0.06469917297363281, 0.06803417205810547, 0.07136917114257812, 0.07470417022705078, 0.07803916931152344, 0.0813741683959961, 0.08470916748046875, 0.0880441665649414, 0.09137916564941406, 0.09471416473388672, 0.09804916381835938, 0.10138416290283203, 0.10471916198730469, 0.10805416107177734, 0.11138916015625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 7.0, 9.0, 10.0, 15.0, 26.0, 28.0, 37.0, 42.0, 57.0, 68.0, 73.0, 67.0, 70.0, 83.0, 71.0, 58.0, 65.0, 48.0, 35.0, 37.0, 30.0, 17.0, 13.0, 13.0, 14.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1395263671875, -0.1354045867919922, -0.13128280639648438, -0.12716102600097656, -0.12303924560546875, -0.11891746520996094, -0.11479568481445312, -0.11067390441894531, -0.1065521240234375, -0.10243034362792969, -0.09830856323242188, -0.09418678283691406, -0.09006500244140625, -0.08594322204589844, -0.08182144165039062, -0.07769966125488281, -0.073577880859375, -0.06945610046386719, -0.06533432006835938, -0.06121253967285156, -0.05709075927734375, -0.05296897888183594, -0.048847198486328125, -0.04472541809082031, -0.0406036376953125, -0.03648185729980469, -0.032360076904296875, -0.028238296508789062, -0.02411651611328125, -0.019994735717773438, -0.015872955322265625, -0.011751174926757812, -0.00762939453125, -0.0035076141357421875, 0.000614166259765625, 0.0047359466552734375, 0.00885772705078125, 0.012979507446289062, 0.017101287841796875, 0.021223068237304688, 0.0253448486328125, 0.029466629028320312, 0.033588409423828125, 0.03771018981933594, 0.04183197021484375, 0.04595375061035156, 0.050075531005859375, 0.05419731140136719, 0.058319091796875, 0.06244087219238281, 0.06656265258789062, 0.07068443298339844, 0.07480621337890625, 0.07892799377441406, 0.08304977416992188, 0.08717155456542969, 0.0912933349609375, 0.09541511535644531, 0.09953689575195312, 0.10365867614746094, 0.10778045654296875, 0.11190223693847656, 0.11602401733398438, 0.12014579772949219, 0.124267578125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 2.0, 6.0, 11.0, 14.0, 16.0, 34.0, 32.0, 37.0, 61.0, 107.0, 152.0, 206.0, 327.0, 508.0, 870.0, 1398.0, 2612.0, 4927.0, 10437.0, 23081.0, 59640.0, 183797.0, 970556.0, 2323028.0, 429980.0, 110590.0, 39409.0, 16057.0, 7493.0, 3745.0, 2000.0, 1166.0, 700.0, 430.0, 313.0, 160.0, 111.0, 72.0, 61.0, 34.0, 30.0, 22.0, 16.0, 6.0, 6.0, 10.0, 1.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08697509765625, -0.08419513702392578, -0.08141517639160156, -0.07863521575927734, -0.07585525512695312, -0.0730752944946289, -0.07029533386230469, -0.06751537322998047, -0.06473541259765625, -0.06195545196533203, -0.05917549133300781, -0.056395530700683594, -0.053615570068359375, -0.050835609436035156, -0.04805564880371094, -0.04527568817138672, -0.0424957275390625, -0.03971576690673828, -0.03693580627441406, -0.034155845642089844, -0.031375885009765625, -0.028595924377441406, -0.025815963745117188, -0.02303600311279297, -0.02025604248046875, -0.01747608184814453, -0.014696121215820312, -0.011916160583496094, -0.009136199951171875, -0.006356239318847656, -0.0035762786865234375, -0.0007963180541992188, 0.001983642578125, 0.004763603210449219, 0.0075435638427734375, 0.010323524475097656, 0.013103485107421875, 0.015883445739746094, 0.018663406372070312, 0.02144336700439453, 0.02422332763671875, 0.02700328826904297, 0.029783248901367188, 0.032563209533691406, 0.035343170166015625, 0.038123130798339844, 0.04090309143066406, 0.04368305206298828, 0.0464630126953125, 0.04924297332763672, 0.05202293395996094, 0.054802894592285156, 0.057582855224609375, 0.060362815856933594, 0.06314277648925781, 0.06592273712158203, 0.06870269775390625, 0.07148265838623047, 0.07426261901855469, 0.0770425796508789, 0.07982254028320312, 0.08260250091552734, 0.08538246154785156, 0.08816242218017578, 0.0909423828125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 2.0, 16.0, 7.0, 11.0, 24.0, 18.0, 30.0, 50.0, 78.0, 124.0, 209.0, 380.0, 732.0, 952.0, 648.0, 310.0, 146.0, 80.0, 81.0, 42.0, 31.0, 29.0, 22.0, 14.0, 7.0, 7.0, 7.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1610107421875, -0.15550613403320312, -0.15000152587890625, -0.14449691772460938, -0.1389923095703125, -0.13348770141601562, -0.12798309326171875, -0.12247848510742188, -0.116973876953125, -0.11146926879882812, -0.10596466064453125, -0.10046005249023438, -0.0949554443359375, -0.08945083618164062, -0.08394622802734375, -0.07844161987304688, -0.07293701171875, -0.06743240356445312, -0.06192779541015625, -0.056423187255859375, -0.0509185791015625, -0.045413970947265625, -0.03990936279296875, -0.034404754638671875, -0.028900146484375, -0.023395538330078125, -0.01789093017578125, -0.012386322021484375, -0.0068817138671875, -0.001377105712890625, 0.00412750244140625, 0.009632110595703125, 0.01513671875, 0.020641326904296875, 0.02614593505859375, 0.031650543212890625, 0.0371551513671875, 0.042659759521484375, 0.04816436767578125, 0.053668975830078125, 0.059173583984375, 0.06467819213867188, 0.07018280029296875, 0.07568740844726562, 0.0811920166015625, 0.08669662475585938, 0.09220123291015625, 0.09770584106445312, 0.10321044921875, 0.10871505737304688, 0.11421966552734375, 0.11972427368164062, 0.1252288818359375, 0.13073348999023438, 0.13623809814453125, 0.14174270629882812, 0.147247314453125, 0.15275192260742188, 0.15825653076171875, 0.16376113891601562, 0.1692657470703125, 0.17477035522460938, 0.18027496337890625, 0.18577957153320312, 0.1912841796875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 4.0, 5.0, 17.0, 26.0, 41.0, 88.0, 113.0, 169.0, 152.0, 138.0, 89.0, 73.0, 43.0, 15.0, 16.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8404838442802429, -0.8165222406387329, -0.7925606966018677, -0.7685990929603577, -0.7446374893188477, -0.7206758856773376, -0.6967143416404724, -0.6727527379989624, -0.6487911343574524, -0.6248295307159424, -0.6008679866790771, -0.5769063830375671, -0.5529447793960571, -0.5289831757545471, -0.5050216317176819, -0.4810600280761719, -0.45709845423698425, -0.43313688039779663, -0.4091752767562866, -0.385213702917099, -0.361252099275589, -0.33729052543640137, -0.31332892179489136, -0.28936734795570374, -0.2654057741165161, -0.2414441853761673, -0.21748259663581848, -0.19352102279663086, -0.16955941915512085, -0.14559784531593323, -0.12163625657558441, -0.0976746678352356, -0.07371306419372559, -0.04975147545337677, -0.025789890438318253, -0.001828305423259735, 0.02213328331708908, 0.0460948720574379, 0.07005645334720612, 0.09401804208755493, 0.11797963082790375, 0.14194121956825256, 0.16590280830860138, 0.1898643970489502, 0.21382597088813782, 0.23778757452964783, 0.26174914836883545, 0.28571075201034546, 0.3096723258495331, 0.3336338996887207, 0.3575955033302307, 0.38155707716941833, 0.40551868081092834, 0.42948025465011597, 0.453441858291626, 0.4774034321308136, 0.5013650059700012, 0.5253266096115112, 0.5492881536483765, 0.5732497572898865, 0.5972113609313965, 0.6211729645729065, 0.6451345086097717, 0.6690961122512817, 0.6930577158927917]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 5.0, 7.0, 12.0, 9.0, 21.0, 14.0, 23.0, 15.0, 23.0, 32.0, 34.0, 34.0, 37.0, 28.0, 38.0, 49.0, 36.0, 54.0, 36.0, 45.0, 54.0, 39.0, 37.0, 30.0, 38.0, 33.0, 24.0, 26.0, 18.0, 33.0, 24.0, 16.0, 14.0, 11.0, 18.0, 10.0, 8.0, 5.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.40573716163635254, -0.3925072252750397, -0.3792773187160492, -0.36604738235473633, -0.35281747579574585, -0.339587539434433, -0.3263576328754425, -0.31312769651412964, -0.29989778995513916, -0.2866678535938263, -0.2734379470348358, -0.26020801067352295, -0.24697810411453247, -0.2337481677532196, -0.22051826119422913, -0.20728832483291626, -0.1940584033727646, -0.18082848191261292, -0.16759856045246124, -0.15436863899230957, -0.1411387175321579, -0.12790879607200623, -0.11467886716127396, -0.10144894570112228, -0.08821902424097061, -0.07498910278081894, -0.06175918132066727, -0.048529256135225296, -0.035299334675073624, -0.022069409489631653, -0.00883948802947998, 0.004390433430671692, 0.017620354890823364, 0.030850276350975037, 0.04408019781112671, 0.05731012299656868, 0.07054004073143005, 0.08376996964216232, 0.096999891102314, 0.11022981256246567, 0.12345973402261734, 0.1366896629333496, 0.14991958439350128, 0.16314950585365295, 0.17637942731380463, 0.1896093487739563, 0.20283927023410797, 0.21606919169425964, 0.22929911315441132, 0.242529034614563, 0.25575897097587585, 0.26898887753486633, 0.2822188138961792, 0.2954487204551697, 0.30867865681648254, 0.321908563375473, 0.3351384997367859, 0.34836843609809875, 0.36159834265708923, 0.3748282790184021, 0.3880581855773926, 0.40128812193870544, 0.4145180284976959, 0.4277479648590088, 0.44097787141799927]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 6.0, 5.0, 8.0, 7.0, 10.0, 20.0, 24.0, 31.0, 52.0, 86.0, 113.0, 218.0, 317.0, 577.0, 1099.0, 2135.0, 4567.0, 10034.0, 22844.0, 54047.0, 135027.0, 306434.0, 294140.0, 126885.0, 50685.0, 21140.0, 9262.0, 4198.0, 2114.0, 1083.0, 497.0, 333.0, 209.0, 113.0, 79.0, 49.0, 30.0, 25.0, 17.0, 13.0, 12.0, 8.0, 6.0, 1.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0797119140625, -0.076385498046875, -0.07305908203125, -0.069732666015625, -0.06640625, -0.063079833984375, -0.05975341796875, -0.056427001953125, -0.0531005859375, -0.049774169921875, -0.04644775390625, -0.043121337890625, -0.039794921875, -0.036468505859375, -0.03314208984375, -0.029815673828125, -0.0264892578125, -0.023162841796875, -0.01983642578125, -0.016510009765625, -0.01318359375, -0.009857177734375, -0.00653076171875, -0.003204345703125, 0.0001220703125, 0.003448486328125, 0.00677490234375, 0.010101318359375, 0.013427734375, 0.016754150390625, 0.02008056640625, 0.023406982421875, 0.0267333984375, 0.030059814453125, 0.03338623046875, 0.036712646484375, 0.0400390625, 0.043365478515625, 0.04669189453125, 0.050018310546875, 0.0533447265625, 0.056671142578125, 0.05999755859375, 0.063323974609375, 0.066650390625, 0.069976806640625, 0.07330322265625, 0.076629638671875, 0.0799560546875, 0.083282470703125, 0.08660888671875, 0.089935302734375, 0.09326171875, 0.096588134765625, 0.09991455078125, 0.103240966796875, 0.1065673828125, 0.109893798828125, 0.11322021484375, 0.116546630859375, 0.119873046875, 0.123199462890625, 0.12652587890625, 0.129852294921875, 0.1331787109375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 7.0, 17.0, 21.0, 24.0, 35.0, 42.0, 48.0, 52.0, 67.0, 87.0, 82.0, 93.0, 76.0, 68.0, 75.0, 58.0, 37.0, 33.0, 24.0, 21.0, 14.0, 8.0, 3.0, 4.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12213134765625, -0.11778926849365234, -0.11344718933105469, -0.10910511016845703, -0.10476303100585938, -0.10042095184326172, -0.09607887268066406, -0.0917367935180664, -0.08739471435546875, -0.0830526351928711, -0.07871055603027344, -0.07436847686767578, -0.07002639770507812, -0.06568431854248047, -0.06134223937988281, -0.057000160217285156, -0.0526580810546875, -0.048316001892089844, -0.04397392272949219, -0.03963184356689453, -0.035289764404296875, -0.03094768524169922, -0.026605606079101562, -0.022263526916503906, -0.01792144775390625, -0.013579368591308594, -0.009237289428710938, -0.004895210266113281, -0.000553131103515625, 0.0037889480590820312, 0.008131027221679688, 0.012473106384277344, 0.016815185546875, 0.021157264709472656, 0.025499343872070312, 0.02984142303466797, 0.034183502197265625, 0.03852558135986328, 0.04286766052246094, 0.047209739685058594, 0.05155181884765625, 0.055893898010253906, 0.06023597717285156, 0.06457805633544922, 0.06892013549804688, 0.07326221466064453, 0.07760429382324219, 0.08194637298583984, 0.0862884521484375, 0.09063053131103516, 0.09497261047363281, 0.09931468963623047, 0.10365676879882812, 0.10799884796142578, 0.11234092712402344, 0.1166830062866211, 0.12102508544921875, 0.1253671646118164, 0.12970924377441406, 0.13405132293701172, 0.13839340209960938, 0.14273548126220703, 0.1470775604248047, 0.15141963958740234, 0.15576171875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 4.0, 3.0, 3.0, 8.0, 9.0, 13.0, 23.0, 38.0, 67.0, 83.0, 112.0, 200.0, 312.0, 485.0, 823.0, 1492.0, 2596.0, 4987.0, 9793.0, 20950.0, 47176.0, 116574.0, 287877.0, 319054.0, 134861.0, 53914.0, 23609.0, 11008.0, 5511.0, 2934.0, 1599.0, 907.0, 546.0, 345.0, 197.0, 129.0, 98.0, 63.0, 48.0, 26.0, 23.0, 18.0, 15.0, 6.0, 5.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1307373046875, -0.12701034545898438, -0.12328338623046875, -0.11955642700195312, -0.1158294677734375, -0.11210250854492188, -0.10837554931640625, -0.10464859008789062, -0.100921630859375, -0.09719467163085938, -0.09346771240234375, -0.08974075317382812, -0.0860137939453125, -0.08228683471679688, -0.07855987548828125, -0.07483291625976562, -0.07110595703125, -0.06737899780273438, -0.06365203857421875, -0.059925079345703125, -0.0561981201171875, -0.052471160888671875, -0.04874420166015625, -0.045017242431640625, -0.041290283203125, -0.037563323974609375, -0.03383636474609375, -0.030109405517578125, -0.0263824462890625, -0.022655487060546875, -0.01892852783203125, -0.015201568603515625, -0.011474609375, -0.007747650146484375, -0.00402069091796875, -0.000293731689453125, 0.0034332275390625, 0.007160186767578125, 0.01088714599609375, 0.014614105224609375, 0.018341064453125, 0.022068023681640625, 0.02579498291015625, 0.029521942138671875, 0.0332489013671875, 0.036975860595703125, 0.04070281982421875, 0.044429779052734375, 0.04815673828125, 0.051883697509765625, 0.05561065673828125, 0.059337615966796875, 0.0630645751953125, 0.06679153442382812, 0.07051849365234375, 0.07424545288085938, 0.077972412109375, 0.08169937133789062, 0.08542633056640625, 0.08915328979492188, 0.0928802490234375, 0.09660720825195312, 0.10033416748046875, 0.10406112670898438, 0.1077880859375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 9.0, 4.0, 6.0, 7.0, 6.0, 12.0, 14.0, 12.0, 11.0, 16.0, 20.0, 28.0, 32.0, 36.0, 40.0, 31.0, 48.0, 42.0, 49.0, 42.0, 51.0, 47.0, 50.0, 51.0, 34.0, 45.0, 47.0, 30.0, 25.0, 28.0, 25.0, 22.0, 15.0, 10.0, 17.0, 11.0, 5.0, 2.0, 4.0, 7.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.258056640625, -0.2508811950683594, -0.24370574951171875, -0.23653030395507812, -0.2293548583984375, -0.22217941284179688, -0.21500396728515625, -0.20782852172851562, -0.200653076171875, -0.19347763061523438, -0.18630218505859375, -0.17912673950195312, -0.1719512939453125, -0.16477584838867188, -0.15760040283203125, -0.15042495727539062, -0.14324951171875, -0.13607406616210938, -0.12889862060546875, -0.12172317504882812, -0.1145477294921875, -0.10737228393554688, -0.10019683837890625, -0.09302139282226562, -0.085845947265625, -0.07867050170898438, -0.07149505615234375, -0.06431961059570312, -0.0571441650390625, -0.049968719482421875, -0.04279327392578125, -0.035617828369140625, -0.0284423828125, -0.021266937255859375, -0.01409149169921875, -0.006916046142578125, 0.0002593994140625, 0.007434844970703125, 0.01461029052734375, 0.021785736083984375, 0.028961181640625, 0.036136627197265625, 0.04331207275390625, 0.050487518310546875, 0.0576629638671875, 0.06483840942382812, 0.07201385498046875, 0.07918930053710938, 0.08636474609375, 0.09354019165039062, 0.10071563720703125, 0.10789108276367188, 0.1150665283203125, 0.12224197387695312, 0.12941741943359375, 0.13659286499023438, 0.143768310546875, 0.15094375610351562, 0.15811920166015625, 0.16529464721679688, 0.1724700927734375, 0.17964553833007812, 0.18682098388671875, 0.19399642944335938, 0.201171875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 8.0, 12.0, 13.0, 10.0, 36.0, 51.0, 56.0, 85.0, 160.0, 207.0, 367.0, 651.0, 1110.0, 2032.0, 4220.0, 9061.0, 20870.0, 51696.0, 136349.0, 316934.0, 298229.0, 123578.0, 46979.0, 18939.0, 8341.0, 3942.0, 2017.0, 1093.0, 570.0, 341.0, 210.0, 134.0, 95.0, 47.0, 39.0, 30.0, 18.0, 10.0, 6.0, 6.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.033935546875, -0.03290557861328125, -0.0318756103515625, -0.03084564208984375, -0.029815673828125, -0.02878570556640625, -0.0277557373046875, -0.02672576904296875, -0.02569580078125, -0.02466583251953125, -0.0236358642578125, -0.02260589599609375, -0.021575927734375, -0.02054595947265625, -0.0195159912109375, -0.01848602294921875, -0.0174560546875, -0.01642608642578125, -0.0153961181640625, -0.01436614990234375, -0.013336181640625, -0.01230621337890625, -0.0112762451171875, -0.01024627685546875, -0.00921630859375, -0.00818634033203125, -0.0071563720703125, -0.00612640380859375, -0.005096435546875, -0.00406646728515625, -0.0030364990234375, -0.00200653076171875, -0.0009765625, 5.340576171875e-05, 0.0010833740234375, 0.00211334228515625, 0.003143310546875, 0.00417327880859375, 0.0052032470703125, 0.00623321533203125, 0.00726318359375, 0.00829315185546875, 0.0093231201171875, 0.01035308837890625, 0.011383056640625, 0.01241302490234375, 0.0134429931640625, 0.01447296142578125, 0.0155029296875, 0.01653289794921875, 0.0175628662109375, 0.01859283447265625, 0.019622802734375, 0.02065277099609375, 0.0216827392578125, 0.02271270751953125, 0.02374267578125, 0.02477264404296875, 0.0258026123046875, 0.02683258056640625, 0.027862548828125, 0.02889251708984375, 0.0299224853515625, 0.03095245361328125, 0.031982421875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 11.0, 17.0, 24.0, 34.0, 45.0, 57.0, 96.0, 114.0, 109.0, 128.0, 83.0, 83.0, 58.0, 31.0, 22.0, 22.0, 15.0, 16.0, 9.0, 8.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6689300537109375e-05, -1.6225501894950867e-05, -1.576170325279236e-05, -1.529790461063385e-05, -1.4834105968475342e-05, -1.4370307326316833e-05, -1.3906508684158325e-05, -1.3442710041999817e-05, -1.2978911399841309e-05, -1.25151127576828e-05, -1.2051314115524292e-05, -1.1587515473365784e-05, -1.1123716831207275e-05, -1.0659918189048767e-05, -1.0196119546890259e-05, -9.73232090473175e-06, -9.268522262573242e-06, -8.804723620414734e-06, -8.340924978256226e-06, -7.877126336097717e-06, -7.413327693939209e-06, -6.949529051780701e-06, -6.485730409622192e-06, -6.021931767463684e-06, -5.558133125305176e-06, -5.0943344831466675e-06, -4.630535840988159e-06, -4.166737198829651e-06, -3.7029385566711426e-06, -3.2391399145126343e-06, -2.775341272354126e-06, -2.3115426301956177e-06, -1.8477439880371094e-06, -1.383945345878601e-06, -9.201467037200928e-07, -4.5634806156158447e-07, 7.450580596923828e-09, 4.7124922275543213e-07, 9.350478649139404e-07, 1.3988465070724487e-06, 1.862645149230957e-06, 2.3264437913894653e-06, 2.7902424335479736e-06, 3.254041075706482e-06, 3.7178397178649902e-06, 4.1816383600234985e-06, 4.645437002182007e-06, 5.109235644340515e-06, 5.5730342864990234e-06, 6.036832928657532e-06, 6.50063157081604e-06, 6.964430212974548e-06, 7.428228855133057e-06, 7.892027497291565e-06, 8.355826139450073e-06, 8.819624781608582e-06, 9.28342342376709e-06, 9.747222065925598e-06, 1.0211020708084106e-05, 1.0674819350242615e-05, 1.1138617992401123e-05, 1.1602416634559631e-05, 1.206621527671814e-05, 1.2530013918876648e-05, 1.2993812561035156e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 7.0, 2.0, 7.0, 7.0, 13.0, 21.0, 26.0, 36.0, 70.0, 78.0, 146.0, 234.0, 438.0, 735.0, 1422.0, 2906.0, 6189.0, 14334.0, 36486.0, 101575.0, 270498.0, 352150.0, 164264.0, 57775.0, 21539.0, 9189.0, 4036.0, 1944.0, 1048.0, 535.0, 311.0, 189.0, 128.0, 82.0, 55.0, 26.0, 19.0, 12.0, 11.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.034271240234375, -0.03320789337158203, -0.03214454650878906, -0.031081199645996094, -0.030017852783203125, -0.028954505920410156, -0.027891159057617188, -0.02682781219482422, -0.02576446533203125, -0.02470111846923828, -0.023637771606445312, -0.022574424743652344, -0.021511077880859375, -0.020447731018066406, -0.019384384155273438, -0.01832103729248047, -0.0172576904296875, -0.01619434356689453, -0.015130996704101562, -0.014067649841308594, -0.013004302978515625, -0.011940956115722656, -0.010877609252929688, -0.009814262390136719, -0.00875091552734375, -0.007687568664550781, -0.0066242218017578125, -0.005560874938964844, -0.004497528076171875, -0.0034341812133789062, -0.0023708343505859375, -0.0013074874877929688, -0.000244140625, 0.0008192062377929688, 0.0018825531005859375, 0.0029458999633789062, 0.004009246826171875, 0.005072593688964844, 0.0061359405517578125, 0.007199287414550781, 0.00826263427734375, 0.009325981140136719, 0.010389328002929688, 0.011452674865722656, 0.012516021728515625, 0.013579368591308594, 0.014642715454101562, 0.01570606231689453, 0.0167694091796875, 0.01783275604248047, 0.018896102905273438, 0.019959449768066406, 0.021022796630859375, 0.022086143493652344, 0.023149490356445312, 0.02421283721923828, 0.02527618408203125, 0.02633953094482422, 0.027402877807617188, 0.028466224670410156, 0.029529571533203125, 0.030592918395996094, 0.03165626525878906, 0.03271961212158203, 0.033782958984375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 7.0, 12.0, 14.0, 14.0, 13.0, 14.0, 24.0, 33.0, 39.0, 39.0, 53.0, 67.0, 55.0, 67.0, 64.0, 65.0, 57.0, 56.0, 50.0, 37.0, 27.0, 31.0, 23.0, 24.0, 14.0, 14.0, 13.0, 12.0, 10.0, 3.0, 10.0, 8.0, 1.0, 9.0, 2.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0], "bins": [-0.03192138671875, -0.030843734741210938, -0.029766082763671875, -0.028688430786132812, -0.02761077880859375, -0.026533126831054688, -0.025455474853515625, -0.024377822875976562, -0.0233001708984375, -0.022222518920898438, -0.021144866943359375, -0.020067214965820312, -0.01898956298828125, -0.017911911010742188, -0.016834259033203125, -0.015756607055664062, -0.014678955078125, -0.013601303100585938, -0.012523651123046875, -0.011445999145507812, -0.01036834716796875, -0.009290695190429688, -0.008213043212890625, -0.0071353912353515625, -0.0060577392578125, -0.0049800872802734375, -0.003902435302734375, -0.0028247833251953125, -0.00174713134765625, -0.0006694793701171875, 0.000408172607421875, 0.0014858245849609375, 0.0025634765625, 0.0036411285400390625, 0.004718780517578125, 0.0057964324951171875, 0.00687408447265625, 0.007951736450195312, 0.009029388427734375, 0.010107040405273438, 0.0111846923828125, 0.012262344360351562, 0.013339996337890625, 0.014417648315429688, 0.01549530029296875, 0.016572952270507812, 0.017650604248046875, 0.018728256225585938, 0.019805908203125, 0.020883560180664062, 0.021961212158203125, 0.023038864135742188, 0.02411651611328125, 0.025194168090820312, 0.026271820068359375, 0.027349472045898438, 0.0284271240234375, 0.029504776000976562, 0.030582427978515625, 0.03166007995605469, 0.03273773193359375, 0.03381538391113281, 0.034893035888671875, 0.03597068786621094, 0.03704833984375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 6.0, 6.0, 8.0, 19.0, 36.0, 55.0, 108.0, 144.0, 191.0, 167.0, 118.0, 63.0, 41.0, 15.0, 10.0, 8.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.2346285581588745, -1.2082542181015015, -1.1818798780441284, -1.1555055379867554, -1.1291311979293823, -1.1027568578720093, -1.0763825178146362, -1.0500081777572632, -1.0236338376998901, -0.9972594976425171, -0.970885157585144, -0.944510817527771, -0.918136477470398, -0.8917621374130249, -0.8653877973556519, -0.8390134572982788, -0.8126391172409058, -0.7862647771835327, -0.7598904371261597, -0.7335160970687866, -0.7071417570114136, -0.6807674169540405, -0.6543930768966675, -0.6280187368392944, -0.6016444563865662, -0.5752701163291931, -0.5488957762718201, -0.522521436214447, -0.496147096157074, -0.4697727560997009, -0.4433984160423279, -0.41702407598495483, -0.3906497359275818, -0.36427539587020874, -0.3379010558128357, -0.31152671575546265, -0.2851523756980896, -0.25877803564071655, -0.2324037104845047, -0.20602937042713165, -0.1796550303697586, -0.15328069031238556, -0.1269063502550125, -0.10053201764822006, -0.07415767759084702, -0.047783344984054565, -0.02140900492668152, 0.004965335130691528, 0.031339675188064575, 0.05771401524543762, 0.08408835530281067, 0.11046268790960312, 0.13683703541755676, 0.16321136057376862, 0.18958570063114166, 0.2159600406885147, 0.24233438074588776, 0.2687087059020996, 0.29508304595947266, 0.3214573860168457, 0.34783172607421875, 0.3742060661315918, 0.40058040618896484, 0.4269547462463379, 0.45332908630371094]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 8.0, 8.0, 11.0, 7.0, 13.0, 17.0, 11.0, 12.0, 25.0, 34.0, 33.0, 42.0, 38.0, 46.0, 49.0, 40.0, 48.0, 50.0, 40.0, 47.0, 50.0, 42.0, 51.0, 44.0, 34.0, 34.0, 33.0, 25.0, 28.0, 18.0, 13.0, 9.0, 9.0, 7.0, 6.0, 4.0, 2.0, 1.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6699435114860535, -0.6488382816314697, -0.627733051776886, -0.6066278219223022, -0.5855225920677185, -0.5644173622131348, -0.5433120727539062, -0.5222068428993225, -0.5011016130447388, -0.47999638319015503, -0.4588911533355713, -0.43778592348098755, -0.4166806638240814, -0.3955754339694977, -0.37447020411491394, -0.3533649444580078, -0.33225974440574646, -0.3111545145511627, -0.290049284696579, -0.26894402503967285, -0.2478387951850891, -0.22673356533050537, -0.20562833547592163, -0.1845230907201767, -0.16341786086559296, -0.14231263101100922, -0.12120738625526428, -0.10010215640068054, -0.0789969190955162, -0.05789168179035187, -0.03678645193576813, -0.015681207180023193, 0.005424022674560547, 0.026529258117079735, 0.04763449355959892, 0.06873972713947296, 0.0898449644446373, 0.11095020174980164, 0.13205543160438538, 0.1531606763601303, 0.17426590621471405, 0.1953711360692978, 0.21647638082504272, 0.23758161067962646, 0.2586868405342102, 0.27979207038879395, 0.3008973002433777, 0.3220025599002838, 0.34310778975486755, 0.3642130196094513, 0.38531824946403503, 0.40642350912094116, 0.4275287389755249, 0.44863396883010864, 0.4697391986846924, 0.4908444285392761, 0.5119496583938599, 0.5330548882484436, 0.5541601181030273, 0.5752653479576111, 0.5963705778121948, 0.6174758672714233, 0.6385810375213623, 0.6596863269805908, 0.6807915568351746]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 4.0, 4.0, 10.0, 11.0, 21.0, 28.0, 39.0, 42.0, 74.0, 118.0, 132.0, 247.0, 411.0, 760.0, 1543.0, 3181.0, 6649.0, 16071.0, 47138.0, 180925.0, 638685.0, 1480382.0, 1237640.0, 427139.0, 101347.0, 27905.0, 11717.0, 6283.0, 2904.0, 1277.0, 645.0, 359.0, 185.0, 132.0, 86.0, 65.0, 40.0, 21.0, 21.0, 18.0, 10.0, 4.0, 9.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0885009765625, -0.08580493927001953, -0.08310890197753906, -0.0804128646850586, -0.07771682739257812, -0.07502079010009766, -0.07232475280761719, -0.06962871551513672, -0.06693267822265625, -0.06423664093017578, -0.06154060363769531, -0.058844566345214844, -0.056148529052734375, -0.053452491760253906, -0.05075645446777344, -0.04806041717529297, -0.0453643798828125, -0.04266834259033203, -0.03997230529785156, -0.037276268005371094, -0.034580230712890625, -0.031884193420410156, -0.029188156127929688, -0.02649211883544922, -0.02379608154296875, -0.02110004425048828, -0.018404006958007812, -0.015707969665527344, -0.013011932373046875, -0.010315895080566406, -0.0076198577880859375, -0.004923820495605469, -0.002227783203125, 0.00046825408935546875, 0.0031642913818359375, 0.005860328674316406, 0.008556365966796875, 0.011252403259277344, 0.013948440551757812, 0.01664447784423828, 0.01934051513671875, 0.02203655242919922, 0.024732589721679688, 0.027428627014160156, 0.030124664306640625, 0.032820701599121094, 0.03551673889160156, 0.03821277618408203, 0.0409088134765625, 0.04360485076904297, 0.04630088806152344, 0.048996925354003906, 0.051692962646484375, 0.054388999938964844, 0.05708503723144531, 0.05978107452392578, 0.06247711181640625, 0.06517314910888672, 0.06786918640136719, 0.07056522369384766, 0.07326126098632812, 0.0759572982788086, 0.07865333557128906, 0.08134937286376953, 0.08404541015625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 9.0, 7.0, 19.0, 18.0, 26.0, 37.0, 46.0, 51.0, 69.0, 55.0, 73.0, 77.0, 68.0, 75.0, 69.0, 55.0, 47.0, 38.0, 38.0, 32.0, 30.0, 18.0, 11.0, 10.0, 6.0, 9.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1527099609375, -0.1481189727783203, -0.14352798461914062, -0.13893699645996094, -0.13434600830078125, -0.12975502014160156, -0.12516403198242188, -0.12057304382324219, -0.1159820556640625, -0.11139106750488281, -0.10680007934570312, -0.10220909118652344, -0.09761810302734375, -0.09302711486816406, -0.08843612670898438, -0.08384513854980469, -0.079254150390625, -0.07466316223144531, -0.07007217407226562, -0.06548118591308594, -0.06089019775390625, -0.05629920959472656, -0.051708221435546875, -0.04711723327636719, -0.0425262451171875, -0.03793525695800781, -0.033344268798828125, -0.028753280639648438, -0.02416229248046875, -0.019571304321289062, -0.014980316162109375, -0.010389328002929688, -0.00579833984375, -0.0012073516845703125, 0.003383636474609375, 0.007974624633789062, 0.01256561279296875, 0.017156600952148438, 0.021747589111328125, 0.026338577270507812, 0.0309295654296875, 0.03552055358886719, 0.040111541748046875, 0.04470252990722656, 0.04929351806640625, 0.05388450622558594, 0.058475494384765625, 0.06306648254394531, 0.067657470703125, 0.07224845886230469, 0.07683944702148438, 0.08143043518066406, 0.08602142333984375, 0.09061241149902344, 0.09520339965820312, 0.09979438781738281, 0.1043853759765625, 0.10897636413574219, 0.11356735229492188, 0.11815834045410156, 0.12274932861328125, 0.12734031677246094, 0.13193130493164062, 0.1365222930908203, 0.14111328125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 9.0, 7.0, 13.0, 21.0, 48.0, 68.0, 103.0, 188.0, 333.0, 639.0, 1281.0, 2769.0, 6041.0, 14730.0, 42015.0, 138316.0, 718767.0, 2541420.0, 549652.0, 116665.0, 37023.0, 13665.0, 5473.0, 2520.0, 1116.0, 617.0, 306.0, 171.0, 113.0, 60.0, 49.0, 36.0, 21.0, 14.0, 3.0, 7.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1226806640625, -0.11911773681640625, -0.1155548095703125, -0.11199188232421875, -0.108428955078125, -0.10486602783203125, -0.1013031005859375, -0.09774017333984375, -0.09417724609375, -0.09061431884765625, -0.0870513916015625, -0.08348846435546875, -0.079925537109375, -0.07636260986328125, -0.0727996826171875, -0.06923675537109375, -0.065673828125, -0.06211090087890625, -0.0585479736328125, -0.05498504638671875, -0.051422119140625, -0.04785919189453125, -0.0442962646484375, -0.04073333740234375, -0.03717041015625, -0.03360748291015625, -0.0300445556640625, -0.02648162841796875, -0.022918701171875, -0.01935577392578125, -0.0157928466796875, -0.01222991943359375, -0.0086669921875, -0.00510406494140625, -0.0015411376953125, 0.00202178955078125, 0.005584716796875, 0.00914764404296875, 0.0127105712890625, 0.01627349853515625, 0.01983642578125, 0.02339935302734375, 0.0269622802734375, 0.03052520751953125, 0.034088134765625, 0.03765106201171875, 0.0412139892578125, 0.04477691650390625, 0.04833984375, 0.05190277099609375, 0.0554656982421875, 0.05902862548828125, 0.062591552734375, 0.06615447998046875, 0.0697174072265625, 0.07328033447265625, 0.07684326171875, 0.08040618896484375, 0.0839691162109375, 0.08753204345703125, 0.091094970703125, 0.09465789794921875, 0.0982208251953125, 0.10178375244140625, 0.1053466796875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 3.0, 6.0, 8.0, 5.0, 13.0, 6.0, 9.0, 23.0, 20.0, 34.0, 45.0, 53.0, 55.0, 100.0, 140.0, 235.0, 322.0, 481.0, 592.0, 503.0, 427.0, 285.0, 193.0, 110.0, 100.0, 54.0, 48.0, 33.0, 31.0, 28.0, 29.0, 17.0, 9.0, 9.0, 15.0, 15.0, 7.0, 8.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.129150390625, -0.12466812133789062, -0.12018585205078125, -0.11570358276367188, -0.1112213134765625, -0.10673904418945312, -0.10225677490234375, -0.09777450561523438, -0.093292236328125, -0.08880996704101562, -0.08432769775390625, -0.07984542846679688, -0.0753631591796875, -0.07088088989257812, -0.06639862060546875, -0.061916351318359375, -0.05743408203125, -0.052951812744140625, -0.04846954345703125, -0.043987274169921875, -0.0395050048828125, -0.035022735595703125, -0.03054046630859375, -0.026058197021484375, -0.021575927734375, -0.017093658447265625, -0.01261138916015625, -0.008129119873046875, -0.0036468505859375, 0.000835418701171875, 0.00531768798828125, 0.009799957275390625, 0.0142822265625, 0.018764495849609375, 0.02324676513671875, 0.027729034423828125, 0.0322113037109375, 0.036693572998046875, 0.04117584228515625, 0.045658111572265625, 0.050140380859375, 0.054622650146484375, 0.05910491943359375, 0.06358718872070312, 0.0680694580078125, 0.07255172729492188, 0.07703399658203125, 0.08151626586914062, 0.08599853515625, 0.09048080444335938, 0.09496307373046875, 0.09944534301757812, 0.1039276123046875, 0.10840988159179688, 0.11289215087890625, 0.11737442016601562, 0.121856689453125, 0.12633895874023438, 0.13082122802734375, 0.13530349731445312, 0.1397857666015625, 0.14426803588867188, 0.14875030517578125, 0.15323257446289062, 0.15771484375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 13.0, 32.0, 34.0, 51.0, 95.0, 116.0, 142.0, 145.0, 138.0, 90.0, 58.0, 37.0, 23.0, 8.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5300526022911072, -0.5054264068603516, -0.48080021142959595, -0.4561740458011627, -0.4315478503704071, -0.4069216549396515, -0.38229548931121826, -0.35766929388046265, -0.33304309844970703, -0.3084169030189514, -0.2837907075881958, -0.2591645419597626, -0.23453834652900696, -0.20991215109825134, -0.18528597056865692, -0.1606597900390625, -0.13603359460830688, -0.11140740662813187, -0.08678121864795685, -0.06215503066778183, -0.03752884268760681, -0.012902654707431793, 0.011723533272743225, 0.036349713802337646, 0.06097590923309326, 0.08560209721326828, 0.1102282851934433, 0.13485446572303772, 0.15948066115379333, 0.18410685658454895, 0.20873303711414337, 0.2333592176437378, 0.2579854726791382, 0.2826116681098938, 0.3072378635406494, 0.33186402916908264, 0.35649022459983826, 0.38111642003059387, 0.4057425856590271, 0.4303687810897827, 0.45499497652053833, 0.47962117195129395, 0.5042473673820496, 0.5288735628128052, 0.553499698638916, 0.5781258940696716, 0.6027520895004272, 0.6273782849311829, 0.6520044803619385, 0.6766306757926941, 0.7012568712234497, 0.7258830666542053, 0.7505092620849609, 0.7751353979110718, 0.7997615933418274, 0.824387788772583, 0.8490139842033386, 0.8736401796340942, 0.8982663750648499, 0.9228925704956055, 0.9475187063217163, 0.9721449017524719, 0.9967710971832275, 1.021397352218628, 1.0460234880447388]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 10.0, 9.0, 6.0, 10.0, 9.0, 11.0, 9.0, 22.0, 11.0, 23.0, 26.0, 25.0, 30.0, 30.0, 33.0, 33.0, 41.0, 33.0, 29.0, 49.0, 38.0, 41.0, 45.0, 40.0, 44.0, 38.0, 37.0, 31.0, 37.0, 33.0, 18.0, 25.0, 23.0, 14.0, 18.0, 12.0, 9.0, 4.0, 9.0, 5.0, 9.0, 4.0, 6.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4248574376106262, -0.4096784293651581, -0.39449945092201233, -0.3793204426765442, -0.36414146423339844, -0.3489624559879303, -0.33378344774246216, -0.3186044692993164, -0.30342546105384827, -0.2882464528083801, -0.2730674743652344, -0.25788846611976624, -0.2427094727754593, -0.22753047943115234, -0.2123514711856842, -0.19717247784137726, -0.1819934844970703, -0.16681449115276337, -0.15163549780845642, -0.13645648956298828, -0.12127749621868134, -0.10609850287437439, -0.09091950207948685, -0.0757405012845993, -0.06056150794029236, -0.045382510870695114, -0.03020351380109787, -0.015024516731500626, 0.00015448033809661865, 0.015333473682403564, 0.030512474477291107, 0.04569147527217865, 0.060870468616485596, 0.07604946196079254, 0.09122846275568008, 0.10640746355056763, 0.12158645689487457, 0.13676545023918152, 0.15194445848464966, 0.1671234518289566, 0.18230244517326355, 0.1974814385175705, 0.21266043186187744, 0.22783944010734558, 0.24301843345165253, 0.2581974267959595, 0.2733764350414276, 0.28855544328689575, 0.3037344217300415, 0.31891342997550964, 0.3340924084186554, 0.34927141666412354, 0.3644503951072693, 0.3796294033527374, 0.39480841159820557, 0.4099873900413513, 0.42516639828681946, 0.4403454065322876, 0.45552438497543335, 0.4707033932209015, 0.48588240146636963, 0.5010613799095154, 0.5162403583526611, 0.5314193964004517, 0.5465983748435974]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 8.0, 8.0, 11.0, 9.0, 22.0, 32.0, 67.0, 67.0, 103.0, 200.0, 296.0, 479.0, 852.0, 1497.0, 2639.0, 5093.0, 9605.0, 18950.0, 39313.0, 84226.0, 187664.0, 304730.0, 209880.0, 95005.0, 43612.0, 21103.0, 10707.0, 5552.0, 2891.0, 1628.0, 914.0, 502.0, 307.0, 210.0, 141.0, 86.0, 55.0, 31.0, 19.0, 16.0, 10.0, 5.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.12176513671875, -0.11843585968017578, -0.11510658264160156, -0.11177730560302734, -0.10844802856445312, -0.1051187515258789, -0.10178947448730469, -0.09846019744873047, -0.09513092041015625, -0.09180164337158203, -0.08847236633300781, -0.0851430892944336, -0.08181381225585938, -0.07848453521728516, -0.07515525817871094, -0.07182598114013672, -0.0684967041015625, -0.06516742706298828, -0.06183815002441406, -0.058508872985839844, -0.055179595947265625, -0.051850318908691406, -0.04852104187011719, -0.04519176483154297, -0.04186248779296875, -0.03853321075439453, -0.03520393371582031, -0.031874656677246094, -0.028545379638671875, -0.025216102600097656, -0.021886825561523438, -0.01855754852294922, -0.015228271484375, -0.011898994445800781, -0.008569717407226562, -0.005240440368652344, -0.001911163330078125, 0.0014181137084960938, 0.0047473907470703125, 0.008076667785644531, 0.01140594482421875, 0.014735221862792969, 0.018064498901367188, 0.021393775939941406, 0.024723052978515625, 0.028052330017089844, 0.03138160705566406, 0.03471088409423828, 0.0380401611328125, 0.04136943817138672, 0.04469871520996094, 0.048027992248535156, 0.051357269287109375, 0.054686546325683594, 0.05801582336425781, 0.06134510040283203, 0.06467437744140625, 0.06800365447998047, 0.07133293151855469, 0.0746622085571289, 0.07799148559570312, 0.08132076263427734, 0.08465003967285156, 0.08797931671142578, 0.09130859375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 5.0, 7.0, 11.0, 19.0, 29.0, 45.0, 31.0, 46.0, 45.0, 53.0, 55.0, 59.0, 75.0, 54.0, 62.0, 62.0, 63.0, 47.0, 45.0, 37.0, 35.0, 30.0, 22.0, 15.0, 14.0, 7.0, 7.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12060546875, -0.1168661117553711, -0.11312675476074219, -0.10938739776611328, -0.10564804077148438, -0.10190868377685547, -0.09816932678222656, -0.09442996978759766, -0.09069061279296875, -0.08695125579833984, -0.08321189880371094, -0.07947254180908203, -0.07573318481445312, -0.07199382781982422, -0.06825447082519531, -0.0645151138305664, -0.0607757568359375, -0.057036399841308594, -0.05329704284667969, -0.04955768585205078, -0.045818328857421875, -0.04207897186279297, -0.03833961486816406, -0.034600257873535156, -0.03086090087890625, -0.027121543884277344, -0.023382186889648438, -0.01964282989501953, -0.015903472900390625, -0.012164115905761719, -0.008424758911132812, -0.004685401916503906, -0.000946044921875, 0.0027933120727539062, 0.0065326690673828125, 0.010272026062011719, 0.014011383056640625, 0.01775074005126953, 0.021490097045898438, 0.025229454040527344, 0.02896881103515625, 0.032708168029785156, 0.03644752502441406, 0.04018688201904297, 0.043926239013671875, 0.04766559600830078, 0.05140495300292969, 0.055144309997558594, 0.0588836669921875, 0.0626230239868164, 0.06636238098144531, 0.07010173797607422, 0.07384109497070312, 0.07758045196533203, 0.08131980895996094, 0.08505916595458984, 0.08879852294921875, 0.09253787994384766, 0.09627723693847656, 0.10001659393310547, 0.10375595092773438, 0.10749530792236328, 0.11123466491699219, 0.1149740219116211, 0.11871337890625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 9.0, 7.0, 11.0, 13.0, 18.0, 34.0, 25.0, 47.0, 58.0, 77.0, 140.0, 165.0, 292.0, 458.0, 749.0, 1341.0, 2354.0, 4916.0, 10262.0, 23709.0, 59889.0, 178444.0, 417392.0, 223178.0, 72847.0, 27887.0, 12013.0, 5658.0, 2798.0, 1459.0, 805.0, 497.0, 316.0, 221.0, 130.0, 99.0, 62.0, 50.0, 32.0, 34.0, 12.0, 19.0, 8.0, 3.0, 7.0, 7.0, 7.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.158203125, -0.1530323028564453, -0.14786148071289062, -0.14269065856933594, -0.13751983642578125, -0.13234901428222656, -0.12717819213867188, -0.12200736999511719, -0.1168365478515625, -0.11166572570800781, -0.10649490356445312, -0.10132408142089844, -0.09615325927734375, -0.09098243713378906, -0.08581161499023438, -0.08064079284667969, -0.075469970703125, -0.07029914855957031, -0.06512832641601562, -0.05995750427246094, -0.05478668212890625, -0.04961585998535156, -0.044445037841796875, -0.03927421569824219, -0.0341033935546875, -0.028932571411132812, -0.023761749267578125, -0.018590927124023438, -0.01342010498046875, -0.008249282836914062, -0.003078460693359375, 0.0020923614501953125, 0.00726318359375, 0.012434005737304688, 0.017604827880859375, 0.022775650024414062, 0.02794647216796875, 0.03311729431152344, 0.038288116455078125, 0.04345893859863281, 0.0486297607421875, 0.05380058288574219, 0.058971405029296875, 0.06414222717285156, 0.06931304931640625, 0.07448387145996094, 0.07965469360351562, 0.08482551574707031, 0.089996337890625, 0.09516716003417969, 0.10033798217773438, 0.10550880432128906, 0.11067962646484375, 0.11585044860839844, 0.12102127075195312, 0.1261920928955078, 0.1313629150390625, 0.1365337371826172, 0.14170455932617188, 0.14687538146972656, 0.15204620361328125, 0.15721702575683594, 0.16238784790039062, 0.1675586700439453, 0.1727294921875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 7.0, 8.0, 11.0, 11.0, 14.0, 19.0, 36.0, 24.0, 31.0, 40.0, 48.0, 42.0, 55.0, 61.0, 50.0, 58.0, 58.0, 51.0, 34.0, 61.0, 46.0, 53.0, 44.0, 22.0, 23.0, 19.0, 12.0, 12.0, 12.0, 6.0, 7.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.380126953125, -0.3694877624511719, -0.35884857177734375, -0.3482093811035156, -0.3375701904296875, -0.3269309997558594, -0.31629180908203125, -0.3056526184082031, -0.295013427734375, -0.2843742370605469, -0.27373504638671875, -0.2630958557128906, -0.2524566650390625, -0.24181747436523438, -0.23117828369140625, -0.22053909301757812, -0.20989990234375, -0.19926071166992188, -0.18862152099609375, -0.17798233032226562, -0.1673431396484375, -0.15670394897460938, -0.14606475830078125, -0.13542556762695312, -0.124786376953125, -0.11414718627929688, -0.10350799560546875, -0.09286880493164062, -0.0822296142578125, -0.07159042358398438, -0.06095123291015625, -0.050312042236328125, -0.0396728515625, -0.029033660888671875, -0.01839447021484375, -0.007755279541015625, 0.0028839111328125, 0.013523101806640625, 0.02416229248046875, 0.034801483154296875, 0.045440673828125, 0.056079864501953125, 0.06671905517578125, 0.07735824584960938, 0.0879974365234375, 0.09863662719726562, 0.10927581787109375, 0.11991500854492188, 0.13055419921875, 0.14119338989257812, 0.15183258056640625, 0.16247177124023438, 0.1731109619140625, 0.18375015258789062, 0.19438934326171875, 0.20502853393554688, 0.215667724609375, 0.22630691528320312, 0.23694610595703125, 0.24758529663085938, 0.2582244873046875, 0.2688636779785156, 0.27950286865234375, 0.2901420593261719, 0.30078125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 10.0, 10.0, 32.0, 26.0, 44.0, 76.0, 105.0, 170.0, 390.0, 633.0, 1341.0, 2673.0, 6479.0, 18376.0, 67599.0, 364062.0, 460817.0, 89219.0, 22659.0, 7565.0, 3122.0, 1458.0, 755.0, 384.0, 207.0, 124.0, 75.0, 47.0, 30.0, 13.0, 18.0, 7.0, 6.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.073486328125, -0.0710439682006836, -0.06860160827636719, -0.06615924835205078, -0.06371688842773438, -0.06127452850341797, -0.05883216857910156, -0.056389808654785156, -0.05394744873046875, -0.051505088806152344, -0.04906272888183594, -0.04662036895751953, -0.044178009033203125, -0.04173564910888672, -0.03929328918457031, -0.036850929260253906, -0.0344085693359375, -0.031966209411621094, -0.029523849487304688, -0.02708148956298828, -0.024639129638671875, -0.02219676971435547, -0.019754409790039062, -0.017312049865722656, -0.01486968994140625, -0.012427330017089844, -0.009984970092773438, -0.007542610168457031, -0.005100250244140625, -0.0026578903198242188, -0.0002155303955078125, 0.0022268295288085938, 0.004669189453125, 0.007111549377441406, 0.009553909301757812, 0.011996269226074219, 0.014438629150390625, 0.01688098907470703, 0.019323348999023438, 0.021765708923339844, 0.02420806884765625, 0.026650428771972656, 0.029092788696289062, 0.03153514862060547, 0.033977508544921875, 0.03641986846923828, 0.03886222839355469, 0.041304588317871094, 0.0437469482421875, 0.046189308166503906, 0.04863166809082031, 0.05107402801513672, 0.053516387939453125, 0.05595874786376953, 0.05840110778808594, 0.060843467712402344, 0.06328582763671875, 0.06572818756103516, 0.06817054748535156, 0.07061290740966797, 0.07305526733398438, 0.07549762725830078, 0.07793998718261719, 0.0803823471069336, 0.08282470703125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 13.0, 10.0, 22.0, 38.0, 95.0, 156.0, 217.0, 200.0, 107.0, 58.0, 30.0, 19.0, 8.0, 8.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.165006637573242e-05, -3.042072057723999e-05, -2.919137477874756e-05, -2.7962028980255127e-05, -2.6732683181762695e-05, -2.5503337383270264e-05, -2.4273991584777832e-05, -2.30446457862854e-05, -2.181529998779297e-05, -2.0585954189300537e-05, -1.9356608390808105e-05, -1.8127262592315674e-05, -1.6897916793823242e-05, -1.566857099533081e-05, -1.4439225196838379e-05, -1.3209879398345947e-05, -1.1980533599853516e-05, -1.0751187801361084e-05, -9.521842002868652e-06, -8.29249620437622e-06, -7.063150405883789e-06, -5.833804607391357e-06, -4.604458808898926e-06, -3.375113010406494e-06, -2.1457672119140625e-06, -9.164214134216309e-07, 3.129243850708008e-07, 1.5422701835632324e-06, 2.771615982055664e-06, 4.000961780548096e-06, 5.230307579040527e-06, 6.459653377532959e-06, 7.68899917602539e-06, 8.918344974517822e-06, 1.0147690773010254e-05, 1.1377036571502686e-05, 1.2606382369995117e-05, 1.3835728168487549e-05, 1.506507396697998e-05, 1.6294419765472412e-05, 1.7523765563964844e-05, 1.8753111362457275e-05, 1.9982457160949707e-05, 2.121180295944214e-05, 2.244114875793457e-05, 2.3670494556427002e-05, 2.4899840354919434e-05, 2.6129186153411865e-05, 2.7358531951904297e-05, 2.858787775039673e-05, 2.981722354888916e-05, 3.104656934738159e-05, 3.2275915145874023e-05, 3.3505260944366455e-05, 3.473460674285889e-05, 3.596395254135132e-05, 3.719329833984375e-05, 3.842264413833618e-05, 3.965198993682861e-05, 4.0881335735321045e-05, 4.2110681533813477e-05, 4.334002733230591e-05, 4.456937313079834e-05, 4.579871892929077e-05, 4.70280647277832e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 1.0, 3.0, 6.0, 5.0, 5.0, 8.0, 17.0, 17.0, 30.0, 41.0, 83.0, 104.0, 193.0, 258.0, 470.0, 852.0, 1529.0, 2949.0, 6187.0, 15166.0, 41289.0, 140400.0, 442854.0, 278737.0, 73967.0, 24628.0, 9692.0, 4277.0, 2046.0, 1119.0, 615.0, 365.0, 205.0, 145.0, 95.0, 63.0, 50.0, 23.0, 15.0, 9.0, 14.0, 8.0, 10.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.058441162109375, -0.056656837463378906, -0.05487251281738281, -0.05308818817138672, -0.051303863525390625, -0.04951953887939453, -0.04773521423339844, -0.045950889587402344, -0.04416656494140625, -0.042382240295410156, -0.04059791564941406, -0.03881359100341797, -0.037029266357421875, -0.03524494171142578, -0.03346061706542969, -0.031676292419433594, -0.0298919677734375, -0.028107643127441406, -0.026323318481445312, -0.02453899383544922, -0.022754669189453125, -0.02097034454345703, -0.019186019897460938, -0.017401695251464844, -0.01561737060546875, -0.013833045959472656, -0.012048721313476562, -0.010264396667480469, -0.008480072021484375, -0.006695747375488281, -0.0049114227294921875, -0.0031270980834960938, -0.0013427734375, 0.00044155120849609375, 0.0022258758544921875, 0.004010200500488281, 0.005794525146484375, 0.007578849792480469, 0.009363174438476562, 0.011147499084472656, 0.01293182373046875, 0.014716148376464844, 0.016500473022460938, 0.01828479766845703, 0.020069122314453125, 0.02185344696044922, 0.023637771606445312, 0.025422096252441406, 0.0272064208984375, 0.028990745544433594, 0.030775070190429688, 0.03255939483642578, 0.034343719482421875, 0.03612804412841797, 0.03791236877441406, 0.039696693420410156, 0.04148101806640625, 0.043265342712402344, 0.04504966735839844, 0.04683399200439453, 0.048618316650390625, 0.05040264129638672, 0.05218696594238281, 0.053971290588378906, 0.055755615234375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 10.0, 3.0, 17.0, 9.0, 17.0, 17.0, 32.0, 41.0, 45.0, 55.0, 90.0, 114.0, 129.0, 111.0, 65.0, 64.0, 47.0, 33.0, 33.0, 15.0, 19.0, 18.0, 4.0, 8.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09912109375, -0.09640121459960938, -0.09368133544921875, -0.09096145629882812, -0.0882415771484375, -0.08552169799804688, -0.08280181884765625, -0.08008193969726562, -0.077362060546875, -0.07464218139648438, -0.07192230224609375, -0.06920242309570312, -0.0664825439453125, -0.06376266479492188, -0.06104278564453125, -0.058322906494140625, -0.05560302734375, -0.052883148193359375, -0.05016326904296875, -0.047443389892578125, -0.0447235107421875, -0.042003631591796875, -0.03928375244140625, -0.036563873291015625, -0.033843994140625, -0.031124114990234375, -0.02840423583984375, -0.025684356689453125, -0.0229644775390625, -0.020244598388671875, -0.01752471923828125, -0.014804840087890625, -0.0120849609375, -0.009365081787109375, -0.00664520263671875, -0.003925323486328125, -0.0012054443359375, 0.001514434814453125, 0.00423431396484375, 0.006954193115234375, 0.009674072265625, 0.012393951416015625, 0.01511383056640625, 0.017833709716796875, 0.0205535888671875, 0.023273468017578125, 0.02599334716796875, 0.028713226318359375, 0.03143310546875, 0.034152984619140625, 0.03687286376953125, 0.039592742919921875, 0.0423126220703125, 0.045032501220703125, 0.04775238037109375, 0.050472259521484375, 0.053192138671875, 0.055912017822265625, 0.05863189697265625, 0.061351776123046875, 0.0640716552734375, 0.06679153442382812, 0.06951141357421875, 0.07223129272460938, 0.074951171875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 12.0, 23.0, 46.0, 98.0, 163.0, 185.0, 175.0, 138.0, 69.0, 37.0, 15.0, 11.0, 3.0, 7.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2210484743118286, -1.1858855485916138, -1.1507225036621094, -1.1155595779418945, -1.0803966522216797, -1.0452337265014648, -1.0100706815719604, -0.9749077558517456, -0.939744770526886, -0.9045817852020264, -0.8694188594818115, -0.8342558741569519, -0.7990928888320923, -0.7639299631118774, -0.7287669777870178, -0.6936039924621582, -0.6584410667419434, -0.6232780814170837, -0.5881151556968689, -0.5529521703720093, -0.5177892446517944, -0.4826262593269348, -0.4474632740020752, -0.41230031847953796, -0.37713736295700073, -0.3419744074344635, -0.30681145191192627, -0.27164846658706665, -0.23648551106452942, -0.2013225555419922, -0.16615958511829376, -0.13099661469459534, -0.09583353996276855, -0.060670576989650726, -0.025507614016532898, 0.00965534895658493, 0.04481831192970276, 0.07998126745223999, 0.11514423787593842, 0.15030720829963684, 0.18547016382217407, 0.2206331193447113, 0.25579607486724854, 0.29095906019210815, 0.3261220157146454, 0.3612849712371826, 0.39644795656204224, 0.43161091208457947, 0.4667738676071167, 0.5019368529319763, 0.5370997786521912, 0.5722627639770508, 0.6074256896972656, 0.6425886750221252, 0.6777516603469849, 0.7129145860671997, 0.7480775713920593, 0.783240556716919, 0.8184034824371338, 0.8535664677619934, 0.888729453086853, 0.9238923788070679, 0.9590553641319275, 0.9942183494567871, 1.029381275177002]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 4.0, 5.0, 3.0, 7.0, 6.0, 8.0, 18.0, 16.0, 17.0, 19.0, 11.0, 26.0, 19.0, 29.0, 31.0, 28.0, 34.0, 41.0, 34.0, 36.0, 40.0, 50.0, 49.0, 50.0, 46.0, 37.0, 34.0, 40.0, 33.0, 30.0, 34.0, 18.0, 24.0, 21.0, 16.0, 13.0, 16.0, 8.0, 6.0, 14.0, 4.0, 6.0, 4.0, 4.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.7333589196205139, -0.711839497089386, -0.6903200149536133, -0.6688005924224854, -0.6472811698913574, -0.6257617473602295, -0.6042422652244568, -0.5827228426933289, -0.5612034201622009, -0.539683997631073, -0.5181645154953003, -0.49664509296417236, -0.47512567043304443, -0.4536062180995941, -0.4320867657661438, -0.41056734323501587, -0.38904789090156555, -0.36752843856811523, -0.3460090160369873, -0.324489563703537, -0.30297014117240906, -0.28145068883895874, -0.2599312663078308, -0.2384118139743805, -0.21689237654209137, -0.19537293910980225, -0.17385350167751312, -0.152334064245224, -0.13081461191177368, -0.10929518193006516, -0.08777573704719543, -0.06625629961490631, -0.04473686218261719, -0.023217422887682915, -0.001697983592748642, 0.01982145756483078, 0.041340894997119904, 0.06286033242940903, 0.08437977731227875, 0.10589921474456787, 0.127418652176857, 0.14893808960914612, 0.17045752704143524, 0.19197696447372437, 0.21349641680717468, 0.2350158393383026, 0.25653529167175293, 0.27805471420288086, 0.2995741665363312, 0.3210936188697815, 0.3426130414009094, 0.36413249373435974, 0.38565191626548767, 0.407171368598938, 0.4286907911300659, 0.45021024346351624, 0.47172969579696655, 0.49324914813041687, 0.5147686004638672, 0.5362880229949951, 0.557807445526123, 0.579326868057251, 0.6008463501930237, 0.6223657727241516, 0.6438851952552795]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 8.0, 9.0, 8.0, 24.0, 25.0, 28.0, 56.0, 79.0, 122.0, 214.0, 356.0, 628.0, 1260.0, 2818.0, 6851.0, 18436.0, 67588.0, 318030.0, 1211644.0, 1680126.0, 675366.0, 151993.0, 36078.0, 13148.0, 5478.0, 2159.0, 868.0, 409.0, 217.0, 117.0, 43.0, 36.0, 22.0, 10.0, 8.0, 5.0, 5.0, 4.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12152099609375, -0.11807441711425781, -0.11462783813476562, -0.11118125915527344, -0.10773468017578125, -0.10428810119628906, -0.10084152221679688, -0.09739494323730469, -0.0939483642578125, -0.09050178527832031, -0.08705520629882812, -0.08360862731933594, -0.08016204833984375, -0.07671546936035156, -0.07326889038085938, -0.06982231140136719, -0.066375732421875, -0.06292915344238281, -0.059482574462890625, -0.05603599548339844, -0.05258941650390625, -0.04914283752441406, -0.045696258544921875, -0.04224967956542969, -0.0388031005859375, -0.03535652160644531, -0.031909942626953125, -0.028463363647460938, -0.02501678466796875, -0.021570205688476562, -0.018123626708984375, -0.014677047729492188, -0.01123046875, -0.0077838897705078125, -0.004337310791015625, -0.0008907318115234375, 0.00255584716796875, 0.0060024261474609375, 0.009449005126953125, 0.012895584106445312, 0.0163421630859375, 0.019788742065429688, 0.023235321044921875, 0.026681900024414062, 0.03012847900390625, 0.03357505798339844, 0.037021636962890625, 0.04046821594238281, 0.043914794921875, 0.04736137390136719, 0.050807952880859375, 0.05425453186035156, 0.05770111083984375, 0.06114768981933594, 0.06459426879882812, 0.06804084777832031, 0.0714874267578125, 0.07493400573730469, 0.07838058471679688, 0.08182716369628906, 0.08527374267578125, 0.08872032165527344, 0.09216690063476562, 0.09561347961425781, 0.09906005859375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 5.0, 11.0, 17.0, 19.0, 22.0, 17.0, 25.0, 38.0, 47.0, 48.0, 62.0, 62.0, 61.0, 75.0, 78.0, 72.0, 64.0, 56.0, 52.0, 35.0, 25.0, 33.0, 20.0, 13.0, 14.0, 12.0, 7.0, 0.0, 8.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1610107421875, -0.15661144256591797, -0.15221214294433594, -0.1478128433227539, -0.14341354370117188, -0.13901424407958984, -0.1346149444580078, -0.13021564483642578, -0.12581634521484375, -0.12141704559326172, -0.11701774597167969, -0.11261844635009766, -0.10821914672851562, -0.1038198471069336, -0.09942054748535156, -0.09502124786376953, -0.0906219482421875, -0.08622264862060547, -0.08182334899902344, -0.0774240493774414, -0.07302474975585938, -0.06862545013427734, -0.06422615051269531, -0.05982685089111328, -0.05542755126953125, -0.05102825164794922, -0.04662895202636719, -0.042229652404785156, -0.037830352783203125, -0.033431053161621094, -0.029031753540039062, -0.02463245391845703, -0.020233154296875, -0.01583385467529297, -0.011434555053710938, -0.007035255432128906, -0.002635955810546875, 0.0017633438110351562, 0.0061626434326171875, 0.010561943054199219, 0.01496124267578125, 0.01936054229736328, 0.023759841918945312, 0.028159141540527344, 0.032558441162109375, 0.036957740783691406, 0.04135704040527344, 0.04575634002685547, 0.0501556396484375, 0.05455493927001953, 0.05895423889160156, 0.0633535385131836, 0.06775283813476562, 0.07215213775634766, 0.07655143737792969, 0.08095073699951172, 0.08535003662109375, 0.08974933624267578, 0.09414863586425781, 0.09854793548583984, 0.10294723510742188, 0.1073465347290039, 0.11174583435058594, 0.11614513397216797, 0.12054443359375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 4.0, 11.0, 19.0, 22.0, 36.0, 68.0, 98.0, 165.0, 241.0, 510.0, 936.0, 1822.0, 4522.0, 12358.0, 41901.0, 173663.0, 1134396.0, 2343215.0, 368621.0, 77285.0, 21501.0, 7192.0, 2788.0, 1332.0, 689.0, 331.0, 208.0, 120.0, 76.0, 47.0, 42.0, 28.0, 11.0, 10.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.117431640625, -0.11277580261230469, -0.10811996459960938, -0.10346412658691406, -0.09880828857421875, -0.09415245056152344, -0.08949661254882812, -0.08484077453613281, -0.0801849365234375, -0.07552909851074219, -0.07087326049804688, -0.06621742248535156, -0.06156158447265625, -0.05690574645996094, -0.052249908447265625, -0.04759407043457031, -0.042938232421875, -0.03828239440917969, -0.033626556396484375, -0.028970718383789062, -0.02431488037109375, -0.019659042358398438, -0.015003204345703125, -0.010347366333007812, -0.0056915283203125, -0.0010356903076171875, 0.003620147705078125, 0.008275985717773438, 0.01293182373046875, 0.017587661743164062, 0.022243499755859375, 0.026899337768554688, 0.03155517578125, 0.03621101379394531, 0.040866851806640625, 0.04552268981933594, 0.05017852783203125, 0.05483436584472656, 0.059490203857421875, 0.06414604187011719, 0.0688018798828125, 0.07345771789550781, 0.07811355590820312, 0.08276939392089844, 0.08742523193359375, 0.09208106994628906, 0.09673690795898438, 0.10139274597167969, 0.106048583984375, 0.11070442199707031, 0.11536026000976562, 0.12001609802246094, 0.12467193603515625, 0.12932777404785156, 0.13398361206054688, 0.1386394500732422, 0.1432952880859375, 0.1479511260986328, 0.15260696411132812, 0.15726280212402344, 0.16191864013671875, 0.16657447814941406, 0.17123031616210938, 0.1758861541748047, 0.1805419921875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 9.0, 3.0, 12.0, 12.0, 20.0, 30.0, 25.0, 37.0, 67.0, 83.0, 130.0, 195.0, 310.0, 494.0, 560.0, 589.0, 485.0, 285.0, 198.0, 125.0, 97.0, 84.0, 49.0, 53.0, 35.0, 20.0, 14.0, 15.0, 6.0, 7.0, 5.0, 10.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1517333984375, -0.14589691162109375, -0.1400604248046875, -0.13422393798828125, -0.128387451171875, -0.12255096435546875, -0.1167144775390625, -0.11087799072265625, -0.10504150390625, -0.09920501708984375, -0.0933685302734375, -0.08753204345703125, -0.081695556640625, -0.07585906982421875, -0.0700225830078125, -0.06418609619140625, -0.058349609375, -0.05251312255859375, -0.0466766357421875, -0.04084014892578125, -0.035003662109375, -0.02916717529296875, -0.0233306884765625, -0.01749420166015625, -0.01165771484375, -0.00582122802734375, 1.52587890625e-05, 0.00585174560546875, 0.011688232421875, 0.01752471923828125, 0.0233612060546875, 0.02919769287109375, 0.0350341796875, 0.04087066650390625, 0.0467071533203125, 0.05254364013671875, 0.058380126953125, 0.06421661376953125, 0.0700531005859375, 0.07588958740234375, 0.08172607421875, 0.08756256103515625, 0.0933990478515625, 0.09923553466796875, 0.105072021484375, 0.11090850830078125, 0.1167449951171875, 0.12258148193359375, 0.12841796875, 0.13425445556640625, 0.1400909423828125, 0.14592742919921875, 0.151763916015625, 0.15760040283203125, 0.1634368896484375, 0.16927337646484375, 0.17510986328125, 0.18094635009765625, 0.1867828369140625, 0.19261932373046875, 0.198455810546875, 0.20429229736328125, 0.2101287841796875, 0.21596527099609375, 0.2218017578125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 2.0, 4.0, 15.0, 34.0, 68.0, 119.0, 185.0, 198.0, 168.0, 101.0, 56.0, 24.0, 15.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.322247862815857, -1.2797709703445435, -1.23729407787323, -1.194817066192627, -1.1523401737213135, -1.10986328125, -1.0673863887786865, -1.024909496307373, -0.9824326038360596, -0.9399557113647461, -0.8974787592887878, -0.8550018668174744, -0.8125249743461609, -0.7700480222702026, -0.7275711297988892, -0.6850942373275757, -0.6426172852516174, -0.600140392780304, -0.5576634407043457, -0.5151865482330322, -0.47270965576171875, -0.4302327334880829, -0.387755811214447, -0.34527891874313354, -0.3028019964694977, -0.2603250741958618, -0.21784818172454834, -0.17537125945091248, -0.1328943520784378, -0.09041744470596313, -0.04794052243232727, -0.005463629961013794, 0.03701329231262207, 0.07949019968509674, 0.12196711450815201, 0.16444402933120728, 0.20692093670368195, 0.24939784407615662, 0.2918747663497925, 0.33435165882110596, 0.3768285810947418, 0.4193055033683777, 0.46178239583969116, 0.5042593479156494, 0.5467362403869629, 0.5892131328582764, 0.6316900253295898, 0.6741669178009033, 0.7166438698768616, 0.759120762348175, 0.8015977144241333, 0.8440746068954468, 0.8865514993667603, 0.9290283918380737, 0.971505343914032, 1.0139822959899902, 1.0564591884613037, 1.0989360809326172, 1.1414129734039307, 1.1838898658752441, 1.2263668775558472, 1.2688437700271606, 1.3113206624984741, 1.3537975549697876, 1.396274447441101]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 3.0, 9.0, 10.0, 12.0, 18.0, 10.0, 15.0, 14.0, 24.0, 35.0, 33.0, 27.0, 39.0, 31.0, 58.0, 47.0, 46.0, 52.0, 47.0, 54.0, 38.0, 31.0, 40.0, 35.0, 30.0, 32.0, 33.0, 36.0, 31.0, 21.0, 14.0, 17.0, 10.0, 19.0, 10.0, 4.0, 1.0, 0.0, 4.0, 4.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6431443095207214, -0.6232563257217407, -0.6033682823181152, -0.5834802985191345, -0.5635923147201538, -0.5437042713165283, -0.5238162875175476, -0.5039283037185669, -0.4840402901172638, -0.4641522765159607, -0.44426429271698, -0.4243762791156769, -0.4044882655143738, -0.38460028171539307, -0.36471226811408997, -0.34482425451278687, -0.32493627071380615, -0.30504825711250305, -0.28516027331352234, -0.26527225971221924, -0.24538426101207733, -0.22549626231193542, -0.20560824871063232, -0.18572025001049042, -0.1658322513103485, -0.1459442526102066, -0.1260562539100647, -0.1061682403087616, -0.08628024160861969, -0.06639224290847778, -0.04650423675775528, -0.026616230607032776, -0.006728172302246094, 0.013159830123186111, 0.03304783254861832, 0.05293583497405052, 0.07282383739948273, 0.09271183609962463, 0.11259984225034714, 0.13248784840106964, 0.15237584710121155, 0.17226384580135345, 0.19215184450149536, 0.21203985810279846, 0.23192785680294037, 0.2518158555030823, 0.2717038691043854, 0.2915918827056885, 0.3114798665046692, 0.3313678801059723, 0.351255863904953, 0.3711438775062561, 0.3910318613052368, 0.4109198749065399, 0.430807888507843, 0.45069587230682373, 0.47058388590812683, 0.49047189950942993, 0.5103598833084106, 0.5302478671073914, 0.5501359105110168, 0.5700238943099976, 0.5899118781089783, 0.6097999215126038, 0.6296879053115845]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 9.0, 13.0, 19.0, 34.0, 21.0, 44.0, 81.0, 141.0, 222.0, 411.0, 700.0, 1516.0, 3070.0, 7290.0, 17091.0, 42218.0, 111632.0, 305374.0, 342035.0, 132261.0, 49081.0, 19739.0, 8341.0, 3656.0, 1659.0, 815.0, 410.0, 270.0, 141.0, 93.0, 59.0, 32.0, 24.0, 16.0, 15.0, 4.0, 7.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1424560546875, -0.13787269592285156, -0.13328933715820312, -0.1287059783935547, -0.12412261962890625, -0.11953926086425781, -0.11495590209960938, -0.11037254333496094, -0.1057891845703125, -0.10120582580566406, -0.09662246704101562, -0.09203910827636719, -0.08745574951171875, -0.08287239074707031, -0.07828903198242188, -0.07370567321777344, -0.069122314453125, -0.06453895568847656, -0.059955596923828125, -0.05537223815917969, -0.05078887939453125, -0.04620552062988281, -0.041622161865234375, -0.03703880310058594, -0.0324554443359375, -0.027872085571289062, -0.023288726806640625, -0.018705368041992188, -0.01412200927734375, -0.009538650512695312, -0.004955291748046875, -0.0003719329833984375, 0.00421142578125, 0.008794784545898438, 0.013378143310546875, 0.017961502075195312, 0.02254486083984375, 0.027128219604492188, 0.031711578369140625, 0.03629493713378906, 0.0408782958984375, 0.04546165466308594, 0.050045013427734375, 0.05462837219238281, 0.05921173095703125, 0.06379508972167969, 0.06837844848632812, 0.07296180725097656, 0.077545166015625, 0.08212852478027344, 0.08671188354492188, 0.09129524230957031, 0.09587860107421875, 0.10046195983886719, 0.10504531860351562, 0.10962867736816406, 0.1142120361328125, 0.11879539489746094, 0.12337875366210938, 0.1279621124267578, 0.13254547119140625, 0.1371288299560547, 0.14171218872070312, 0.14629554748535156, 0.15087890625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 12.0, 8.0, 10.0, 17.0, 23.0, 26.0, 36.0, 44.0, 65.0, 66.0, 87.0, 76.0, 90.0, 73.0, 75.0, 69.0, 65.0, 43.0, 34.0, 27.0, 22.0, 15.0, 9.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1361083984375, -0.131439208984375, -0.12677001953125, -0.122100830078125, -0.117431640625, -0.112762451171875, -0.10809326171875, -0.103424072265625, -0.0987548828125, -0.094085693359375, -0.08941650390625, -0.084747314453125, -0.080078125, -0.075408935546875, -0.07073974609375, -0.066070556640625, -0.0614013671875, -0.056732177734375, -0.05206298828125, -0.047393798828125, -0.042724609375, -0.038055419921875, -0.03338623046875, -0.028717041015625, -0.0240478515625, -0.019378662109375, -0.01470947265625, -0.010040283203125, -0.00537109375, -0.000701904296875, 0.00396728515625, 0.008636474609375, 0.0133056640625, 0.017974853515625, 0.02264404296875, 0.027313232421875, 0.031982421875, 0.036651611328125, 0.04132080078125, 0.045989990234375, 0.0506591796875, 0.055328369140625, 0.05999755859375, 0.064666748046875, 0.0693359375, 0.074005126953125, 0.07867431640625, 0.083343505859375, 0.0880126953125, 0.092681884765625, 0.09735107421875, 0.102020263671875, 0.106689453125, 0.111358642578125, 0.11602783203125, 0.120697021484375, 0.1253662109375, 0.130035400390625, 0.13470458984375, 0.139373779296875, 0.14404296875, 0.148712158203125, 0.15338134765625, 0.158050537109375, 0.1627197265625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 6.0, 5.0, 5.0, 3.0, 11.0, 12.0, 28.0, 31.0, 43.0, 82.0, 120.0, 232.0, 347.0, 578.0, 1003.0, 2134.0, 4538.0, 10765.0, 26733.0, 75035.0, 242813.0, 432303.0, 163659.0, 53086.0, 19696.0, 7782.0, 3611.0, 1634.0, 893.0, 510.0, 300.0, 182.0, 121.0, 82.0, 55.0, 41.0, 24.0, 18.0, 10.0, 11.0, 8.0, 8.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1546630859375, -0.14900588989257812, -0.14334869384765625, -0.13769149780273438, -0.1320343017578125, -0.12637710571289062, -0.12071990966796875, -0.11506271362304688, -0.109405517578125, -0.10374832153320312, -0.09809112548828125, -0.09243392944335938, -0.0867767333984375, -0.08111953735351562, -0.07546234130859375, -0.06980514526367188, -0.06414794921875, -0.058490753173828125, -0.05283355712890625, -0.047176361083984375, -0.0415191650390625, -0.035861968994140625, -0.03020477294921875, -0.024547576904296875, -0.018890380859375, -0.013233184814453125, -0.00757598876953125, -0.001918792724609375, 0.0037384033203125, 0.009395599365234375, 0.01505279541015625, 0.020709991455078125, 0.0263671875, 0.032024383544921875, 0.03768157958984375, 0.043338775634765625, 0.0489959716796875, 0.054653167724609375, 0.06031036376953125, 0.06596755981445312, 0.071624755859375, 0.07728195190429688, 0.08293914794921875, 0.08859634399414062, 0.0942535400390625, 0.09991073608398438, 0.10556793212890625, 0.11122512817382812, 0.11688232421875, 0.12253952026367188, 0.12819671630859375, 0.13385391235351562, 0.1395111083984375, 0.14516830444335938, 0.15082550048828125, 0.15648269653320312, 0.162139892578125, 0.16779708862304688, 0.17345428466796875, 0.17911148071289062, 0.1847686767578125, 0.19042587280273438, 0.19608306884765625, 0.20174026489257812, 0.2073974609375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 8.0, 4.0, 6.0, 7.0, 7.0, 15.0, 18.0, 19.0, 17.0, 38.0, 31.0, 46.0, 38.0, 38.0, 55.0, 63.0, 57.0, 68.0, 55.0, 46.0, 52.0, 42.0, 47.0, 29.0, 33.0, 34.0, 26.0, 23.0, 19.0, 12.0, 17.0, 10.0, 5.0, 5.0, 4.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26953125, -0.25972747802734375, -0.2499237060546875, -0.24011993408203125, -0.230316162109375, -0.22051239013671875, -0.2107086181640625, -0.20090484619140625, -0.19110107421875, -0.18129730224609375, -0.1714935302734375, -0.16168975830078125, -0.151885986328125, -0.14208221435546875, -0.1322784423828125, -0.12247467041015625, -0.1126708984375, -0.10286712646484375, -0.0930633544921875, -0.08325958251953125, -0.073455810546875, -0.06365203857421875, -0.0538482666015625, -0.04404449462890625, -0.03424072265625, -0.02443695068359375, -0.0146331787109375, -0.00482940673828125, 0.004974365234375, 0.01477813720703125, 0.0245819091796875, 0.03438568115234375, 0.044189453125, 0.05399322509765625, 0.0637969970703125, 0.07360076904296875, 0.083404541015625, 0.09320831298828125, 0.1030120849609375, 0.11281585693359375, 0.12261962890625, 0.13242340087890625, 0.1422271728515625, 0.15203094482421875, 0.161834716796875, 0.17163848876953125, 0.1814422607421875, 0.19124603271484375, 0.2010498046875, 0.21085357666015625, 0.2206573486328125, 0.23046112060546875, 0.240264892578125, 0.25006866455078125, 0.2598724365234375, 0.26967620849609375, 0.27947998046875, 0.28928375244140625, 0.2990875244140625, 0.30889129638671875, 0.318695068359375, 0.32849884033203125, 0.3383026123046875, 0.34810638427734375, 0.35791015625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 3.0, 3.0, 6.0, 8.0, 11.0, 5.0, 9.0, 8.0, 13.0, 38.0, 44.0, 60.0, 108.0, 173.0, 265.0, 498.0, 750.0, 1385.0, 2446.0, 4514.0, 8627.0, 17532.0, 41844.0, 112822.0, 295463.0, 333809.0, 136714.0, 49655.0, 20554.0, 9745.0, 5056.0, 2700.0, 1552.0, 833.0, 508.0, 269.0, 181.0, 118.0, 63.0, 42.0, 29.0, 17.0, 26.0, 15.0, 8.0, 9.0, 10.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.037109375, -0.03583383560180664, -0.03455829620361328, -0.03328275680541992, -0.03200721740722656, -0.030731678009033203, -0.029456138610839844, -0.028180599212646484, -0.026905059814453125, -0.025629520416259766, -0.024353981018066406, -0.023078441619873047, -0.021802902221679688, -0.020527362823486328, -0.01925182342529297, -0.01797628402709961, -0.01670074462890625, -0.01542520523071289, -0.014149665832519531, -0.012874126434326172, -0.011598587036132812, -0.010323047637939453, -0.009047508239746094, -0.007771968841552734, -0.006496429443359375, -0.005220890045166016, -0.003945350646972656, -0.002669811248779297, -0.0013942718505859375, -0.00011873245239257812, 0.0011568069458007812, 0.0024323463439941406, 0.0037078857421875, 0.004983425140380859, 0.006258964538574219, 0.007534503936767578, 0.008810043334960938, 0.010085582733154297, 0.011361122131347656, 0.012636661529541016, 0.013912200927734375, 0.015187740325927734, 0.016463279724121094, 0.017738819122314453, 0.019014358520507812, 0.020289897918701172, 0.02156543731689453, 0.02284097671508789, 0.02411651611328125, 0.02539205551147461, 0.02666759490966797, 0.027943134307861328, 0.029218673706054688, 0.030494213104248047, 0.031769752502441406, 0.033045291900634766, 0.034320831298828125, 0.035596370697021484, 0.036871910095214844, 0.0381474494934082, 0.03942298889160156, 0.04069852828979492, 0.04197406768798828, 0.04324960708618164, 0.044525146484375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 3.0, 3.0, 5.0, 14.0, 5.0, 13.0, 17.0, 14.0, 17.0, 35.0, 54.0, 42.0, 74.0, 85.0, 109.0, 85.0, 80.0, 85.0, 56.0, 52.0, 35.0, 15.0, 23.0, 14.0, 21.0, 7.0, 9.0, 3.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.621246337890625e-05, -1.5748664736747742e-05, -1.5284866094589233e-05, -1.4821067452430725e-05, -1.4357268810272217e-05, -1.3893470168113708e-05, -1.34296715259552e-05, -1.2965872883796692e-05, -1.2502074241638184e-05, -1.2038275599479675e-05, -1.1574476957321167e-05, -1.1110678315162659e-05, -1.064687967300415e-05, -1.0183081030845642e-05, -9.719282388687134e-06, -9.255483746528625e-06, -8.791685104370117e-06, -8.327886462211609e-06, -7.8640878200531e-06, -7.400289177894592e-06, -6.936490535736084e-06, -6.472691893577576e-06, -6.008893251419067e-06, -5.545094609260559e-06, -5.081295967102051e-06, -4.6174973249435425e-06, -4.153698682785034e-06, -3.689900040626526e-06, -3.2261013984680176e-06, -2.7623027563095093e-06, -2.298504114151001e-06, -1.8347054719924927e-06, -1.3709068298339844e-06, -9.071081876754761e-07, -4.4330954551696777e-07, 2.0489096641540527e-08, 4.842877388000488e-07, 9.480863809585571e-07, 1.4118850231170654e-06, 1.8756836652755737e-06, 2.339482307434082e-06, 2.8032809495925903e-06, 3.2670795917510986e-06, 3.730878233909607e-06, 4.194676876068115e-06, 4.6584755182266235e-06, 5.122274160385132e-06, 5.58607280254364e-06, 6.0498714447021484e-06, 6.513670086860657e-06, 6.977468729019165e-06, 7.441267371177673e-06, 7.905066013336182e-06, 8.36886465549469e-06, 8.832663297653198e-06, 9.296461939811707e-06, 9.760260581970215e-06, 1.0224059224128723e-05, 1.0687857866287231e-05, 1.115165650844574e-05, 1.1615455150604248e-05, 1.2079253792762756e-05, 1.2543052434921265e-05, 1.3006851077079773e-05, 1.3470649719238281e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 7.0, 5.0, 9.0, 10.0, 17.0, 18.0, 41.0, 46.0, 64.0, 103.0, 175.0, 300.0, 442.0, 926.0, 1766.0, 3498.0, 7295.0, 17284.0, 47076.0, 147708.0, 379342.0, 292534.0, 94834.0, 31529.0, 12223.0, 5590.0, 2674.0, 1315.0, 675.0, 384.0, 243.0, 138.0, 81.0, 60.0, 36.0, 28.0, 19.0, 13.0, 11.0, 9.0, 8.0, 7.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.050323486328125, -0.04891824722290039, -0.04751300811767578, -0.04610776901245117, -0.04470252990722656, -0.04329729080200195, -0.041892051696777344, -0.040486812591552734, -0.039081573486328125, -0.037676334381103516, -0.036271095275878906, -0.0348658561706543, -0.03346061706542969, -0.03205537796020508, -0.03065013885498047, -0.02924489974975586, -0.02783966064453125, -0.02643442153930664, -0.02502918243408203, -0.023623943328857422, -0.022218704223632812, -0.020813465118408203, -0.019408226013183594, -0.018002986907958984, -0.016597747802734375, -0.015192508697509766, -0.013787269592285156, -0.012382030487060547, -0.010976791381835938, -0.009571552276611328, -0.008166313171386719, -0.006761074066162109, -0.0053558349609375, -0.003950595855712891, -0.0025453567504882812, -0.0011401176452636719, 0.0002651214599609375, 0.0016703605651855469, 0.0030755996704101562, 0.004480838775634766, 0.005886077880859375, 0.007291316986083984, 0.008696556091308594, 0.010101795196533203, 0.011507034301757812, 0.012912273406982422, 0.014317512512207031, 0.01572275161743164, 0.01712799072265625, 0.01853322982788086, 0.01993846893310547, 0.021343708038330078, 0.022748947143554688, 0.024154186248779297, 0.025559425354003906, 0.026964664459228516, 0.028369903564453125, 0.029775142669677734, 0.031180381774902344, 0.03258562088012695, 0.03399085998535156, 0.03539609909057617, 0.03680133819580078, 0.03820657730102539, 0.03961181640625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 7.0, 5.0, 5.0, 6.0, 16.0, 7.0, 20.0, 22.0, 33.0, 24.0, 53.0, 65.0, 63.0, 61.0, 96.0, 98.0, 96.0, 79.0, 68.0, 48.0, 34.0, 25.0, 18.0, 22.0, 6.0, 10.0, 6.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0721435546875, -0.07034158706665039, -0.06853961944580078, -0.06673765182495117, -0.06493568420410156, -0.06313371658325195, -0.061331748962402344, -0.059529781341552734, -0.057727813720703125, -0.055925846099853516, -0.054123878479003906, -0.0523219108581543, -0.05051994323730469, -0.04871797561645508, -0.04691600799560547, -0.04511404037475586, -0.04331207275390625, -0.04151010513305664, -0.03970813751220703, -0.03790616989135742, -0.03610420227050781, -0.0343022346496582, -0.032500267028808594, -0.030698299407958984, -0.028896331787109375, -0.027094364166259766, -0.025292396545410156, -0.023490428924560547, -0.021688461303710938, -0.019886493682861328, -0.01808452606201172, -0.01628255844116211, -0.0144805908203125, -0.01267862319946289, -0.010876655578613281, -0.009074687957763672, -0.0072727203369140625, -0.005470752716064453, -0.0036687850952148438, -0.0018668174743652344, -6.4849853515625e-05, 0.0017371177673339844, 0.0035390853881835938, 0.005341053009033203, 0.0071430206298828125, 0.008944988250732422, 0.010746955871582031, 0.01254892349243164, 0.01435089111328125, 0.01615285873413086, 0.01795482635498047, 0.019756793975830078, 0.021558761596679688, 0.023360729217529297, 0.025162696838378906, 0.026964664459228516, 0.028766632080078125, 0.030568599700927734, 0.032370567321777344, 0.03417253494262695, 0.03597450256347656, 0.03777647018432617, 0.03957843780517578, 0.04138040542602539, 0.043182373046875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 10.0, 6.0, 11.0, 15.0, 26.0, 50.0, 76.0, 107.0, 120.0, 147.0, 122.0, 105.0, 91.0, 44.0, 32.0, 14.0, 10.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0658539533615112, -1.0419737100601196, -1.0180935859680176, -0.994213342666626, -0.9703331589698792, -0.9464529752731323, -0.9225727319717407, -0.8986925482749939, -0.8748123645782471, -0.8509321808815002, -0.8270519971847534, -0.8031717538833618, -0.779291570186615, -0.7554113864898682, -0.7315311431884766, -0.7076509594917297, -0.6837707757949829, -0.6598905920982361, -0.6360104084014893, -0.6121301651000977, -0.5882499814033508, -0.564369797706604, -0.5404895544052124, -0.5166093707084656, -0.49272918701171875, -0.4688490033149719, -0.4449687898159027, -0.4210885763168335, -0.39720839262008667, -0.37332820892333984, -0.34944799542427063, -0.3255677819252014, -0.3016875982284546, -0.27780741453170776, -0.25392720103263855, -0.23004700243473053, -0.2061668038368225, -0.1822866052389145, -0.15840640664100647, -0.13452620804309845, -0.11064600944519043, -0.08676581084728241, -0.06288561224937439, -0.03900541365146637, -0.01512521505355835, 0.00875498354434967, 0.03263518214225769, 0.05651538074016571, 0.08039557933807373, 0.10427577793598175, 0.12815597653388977, 0.1520361751317978, 0.1759163737297058, 0.19979657232761383, 0.22367677092552185, 0.24755696952342987, 0.2714371681213379, 0.2953173518180847, 0.31919756531715393, 0.34307777881622314, 0.36695796251296997, 0.3908381462097168, 0.414718359708786, 0.4385985732078552, 0.46247875690460205]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 5.0, 7.0, 8.0, 3.0, 5.0, 17.0, 13.0, 13.0, 22.0, 17.0, 26.0, 23.0, 44.0, 20.0, 38.0, 34.0, 39.0, 40.0, 34.0, 35.0, 44.0, 43.0, 28.0, 27.0, 46.0, 53.0, 27.0, 41.0, 21.0, 28.0, 25.0, 18.0, 22.0, 17.0, 17.0, 17.0, 16.0, 18.0, 4.0, 11.0, 10.0, 5.0, 10.0, 6.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0], "bins": [-0.6209492683410645, -0.6029306054115295, -0.5849119424819946, -0.5668932795524597, -0.5488746166229248, -0.5308559536933899, -0.512837290763855, -0.49481862783432007, -0.47679996490478516, -0.45878130197525024, -0.44076263904571533, -0.4227439761161804, -0.4047253131866455, -0.3867066502571106, -0.3686879873275757, -0.35066932439804077, -0.33265066146850586, -0.31463199853897095, -0.29661333560943604, -0.2785946726799011, -0.2605760097503662, -0.2425573468208313, -0.2245386838912964, -0.20652002096176147, -0.18850135803222656, -0.17048269510269165, -0.15246403217315674, -0.13444536924362183, -0.11642670631408691, -0.098408043384552, -0.08038938045501709, -0.06237071752548218, -0.04435211420059204, -0.02633345127105713, -0.008314788341522217, 0.009703874588012695, 0.027722537517547607, 0.04574120044708252, 0.06375986337661743, 0.08177852630615234, 0.09979718923568726, 0.11781585216522217, 0.13583451509475708, 0.153853178024292, 0.1718718409538269, 0.18989050388336182, 0.20790916681289673, 0.22592782974243164, 0.24394649267196655, 0.26196515560150146, 0.2799838185310364, 0.2980024814605713, 0.3160211443901062, 0.3340398073196411, 0.352058470249176, 0.37007713317871094, 0.38809579610824585, 0.40611445903778076, 0.4241331219673157, 0.4421517848968506, 0.4601704478263855, 0.4781891107559204, 0.4962077736854553, 0.5142264366149902, 0.5322450995445251]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 9.0, 14.0, 9.0, 14.0, 23.0, 46.0, 50.0, 100.0, 144.0, 296.0, 640.0, 1854.0, 6048.0, 22124.0, 124924.0, 951486.0, 2249684.0, 708187.0, 99157.0, 20230.0, 6195.0, 1972.0, 616.0, 232.0, 87.0, 50.0, 28.0, 25.0, 10.0, 14.0, 10.0, 1.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1561279296875, -0.1514568328857422, -0.14678573608398438, -0.14211463928222656, -0.13744354248046875, -0.13277244567871094, -0.12810134887695312, -0.12343025207519531, -0.1187591552734375, -0.11408805847167969, -0.10941696166992188, -0.10474586486816406, -0.10007476806640625, -0.09540367126464844, -0.09073257446289062, -0.08606147766113281, -0.081390380859375, -0.07671928405761719, -0.07204818725585938, -0.06737709045410156, -0.06270599365234375, -0.05803489685058594, -0.053363800048828125, -0.04869270324707031, -0.0440216064453125, -0.03935050964355469, -0.034679412841796875, -0.030008316040039062, -0.02533721923828125, -0.020666122436523438, -0.015995025634765625, -0.011323928833007812, -0.00665283203125, -0.0019817352294921875, 0.002689361572265625, 0.0073604583740234375, 0.01203155517578125, 0.016702651977539062, 0.021373748779296875, 0.026044845581054688, 0.0307159423828125, 0.03538703918457031, 0.040058135986328125, 0.04472923278808594, 0.04940032958984375, 0.05407142639160156, 0.058742523193359375, 0.06341361999511719, 0.068084716796875, 0.07275581359863281, 0.07742691040039062, 0.08209800720214844, 0.08676910400390625, 0.09144020080566406, 0.09611129760742188, 0.10078239440917969, 0.1054534912109375, 0.11012458801269531, 0.11479568481445312, 0.11946678161621094, 0.12413787841796875, 0.12880897521972656, 0.13348007202148438, 0.1381511688232422, 0.142822265625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 7.0, 9.0, 8.0, 13.0, 19.0, 28.0, 38.0, 53.0, 49.0, 74.0, 83.0, 94.0, 87.0, 94.0, 66.0, 60.0, 63.0, 44.0, 32.0, 22.0, 27.0, 11.0, 8.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.190185546875, -0.18507766723632812, -0.17996978759765625, -0.17486190795898438, -0.1697540283203125, -0.16464614868164062, -0.15953826904296875, -0.15443038940429688, -0.149322509765625, -0.14421463012695312, -0.13910675048828125, -0.13399887084960938, -0.1288909912109375, -0.12378311157226562, -0.11867523193359375, -0.11356735229492188, -0.10845947265625, -0.10335159301757812, -0.09824371337890625, -0.09313583374023438, -0.0880279541015625, -0.08292007446289062, -0.07781219482421875, -0.07270431518554688, -0.067596435546875, -0.062488555908203125, -0.05738067626953125, -0.052272796630859375, -0.0471649169921875, -0.042057037353515625, -0.03694915771484375, -0.031841278076171875, -0.0267333984375, -0.021625518798828125, -0.01651763916015625, -0.011409759521484375, -0.0063018798828125, -0.001194000244140625, 0.00391387939453125, 0.009021759033203125, 0.014129638671875, 0.019237518310546875, 0.02434539794921875, 0.029453277587890625, 0.0345611572265625, 0.039669036865234375, 0.04477691650390625, 0.049884796142578125, 0.05499267578125, 0.060100555419921875, 0.06520843505859375, 0.07031631469726562, 0.0754241943359375, 0.08053207397460938, 0.08563995361328125, 0.09074783325195312, 0.095855712890625, 0.10096359252929688, 0.10607147216796875, 0.11117935180664062, 0.1162872314453125, 0.12139511108398438, 0.12650299072265625, 0.13161087036132812, 0.13671875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 10.0, 15.0, 18.0, 34.0, 72.0, 132.0, 332.0, 722.0, 2388.0, 12404.0, 141418.0, 3213946.0, 775366.0, 39721.0, 5290.0, 1366.0, 534.0, 230.0, 126.0, 64.0, 31.0, 28.0, 12.0, 12.0, 8.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29638671875, -0.28675079345703125, -0.2771148681640625, -0.26747894287109375, -0.257843017578125, -0.24820709228515625, -0.2385711669921875, -0.22893524169921875, -0.21929931640625, -0.20966339111328125, -0.2000274658203125, -0.19039154052734375, -0.180755615234375, -0.17111968994140625, -0.1614837646484375, -0.15184783935546875, -0.1422119140625, -0.13257598876953125, -0.1229400634765625, -0.11330413818359375, -0.103668212890625, -0.09403228759765625, -0.0843963623046875, -0.07476043701171875, -0.06512451171875, -0.05548858642578125, -0.0458526611328125, -0.03621673583984375, -0.026580810546875, -0.01694488525390625, -0.0073089599609375, 0.00232696533203125, 0.011962890625, 0.02159881591796875, 0.0312347412109375, 0.04087066650390625, 0.050506591796875, 0.06014251708984375, 0.0697784423828125, 0.07941436767578125, 0.08905029296875, 0.09868621826171875, 0.1083221435546875, 0.11795806884765625, 0.127593994140625, 0.13722991943359375, 0.1468658447265625, 0.15650177001953125, 0.1661376953125, 0.17577362060546875, 0.1854095458984375, 0.19504547119140625, 0.204681396484375, 0.21431732177734375, 0.2239532470703125, 0.23358917236328125, 0.24322509765625, 0.25286102294921875, 0.2624969482421875, 0.27213287353515625, 0.281768798828125, 0.29140472412109375, 0.3010406494140625, 0.31067657470703125, 0.3203125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 12.0, 14.0, 18.0, 40.0, 70.0, 82.0, 147.0, 263.0, 431.0, 715.0, 871.0, 566.0, 316.0, 181.0, 111.0, 78.0, 58.0, 40.0, 21.0, 11.0, 8.0, 6.0, 3.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1473388671875, -0.1392650604248047, -0.13119125366210938, -0.12311744689941406, -0.11504364013671875, -0.10696983337402344, -0.09889602661132812, -0.09082221984863281, -0.0827484130859375, -0.07467460632324219, -0.06660079956054688, -0.05852699279785156, -0.05045318603515625, -0.04237937927246094, -0.034305572509765625, -0.026231765747070312, -0.018157958984375, -0.010084152221679688, -0.002010345458984375, 0.0060634613037109375, 0.01413726806640625, 0.022211074829101562, 0.030284881591796875, 0.03835868835449219, 0.0464324951171875, 0.05450630187988281, 0.06258010864257812, 0.07065391540527344, 0.07872772216796875, 0.08680152893066406, 0.09487533569335938, 0.10294914245605469, 0.11102294921875, 0.11909675598144531, 0.12717056274414062, 0.13524436950683594, 0.14331817626953125, 0.15139198303222656, 0.15946578979492188, 0.1675395965576172, 0.1756134033203125, 0.1836872100830078, 0.19176101684570312, 0.19983482360839844, 0.20790863037109375, 0.21598243713378906, 0.22405624389648438, 0.2321300506591797, 0.240203857421875, 0.2482776641845703, 0.2563514709472656, 0.26442527770996094, 0.27249908447265625, 0.28057289123535156, 0.2886466979980469, 0.2967205047607422, 0.3047943115234375, 0.3128681182861328, 0.3209419250488281, 0.32901573181152344, 0.33708953857421875, 0.34516334533691406, 0.3532371520996094, 0.3613109588623047, 0.369384765625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 31.0, 70.0, 151.0, 267.0, 223.0, 148.0, 64.0, 24.0, 9.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.538264513015747, -2.477527379989624, -2.416790246963501, -2.356053113937378, -2.295315980911255, -2.234579086303711, -2.173841953277588, -2.113104820251465, -2.052367687225342, -1.9916305541992188, -1.9308934211730957, -1.8701564073562622, -1.8094192743301392, -1.7486821413040161, -1.687945008277893, -1.6272079944610596, -1.5664708614349365, -1.5057337284088135, -1.4449965953826904, -1.384259581565857, -1.3235224485397339, -1.2627853155136108, -1.2020481824874878, -1.1413111686706543, -1.0805739164352417, -1.0198367834091187, -0.9590997099876404, -0.8983625769615173, -0.8376255035400391, -0.776888370513916, -0.716151237487793, -0.6554141640663147, -0.5946770906448364, -0.5339399576187134, -0.4732028841972351, -0.41246575117111206, -0.3517286777496338, -0.29099154472351074, -0.23025444149971008, -0.16951733827590942, -0.10878023505210876, -0.04804312810301781, 0.01269397884607315, 0.0734310895204544, 0.13416819274425507, 0.19490531086921692, 0.2556424140930176, 0.31637951731681824, 0.3771166205406189, 0.43785372376441956, 0.4985908269882202, 0.5593279600143433, 0.6200650334358215, 0.6808021664619446, 0.7415392398834229, 0.8022763729095459, 0.863013505935669, 0.923750638961792, 0.9844877123832703, 1.0452247858047485, 1.1059619188308716, 1.1666990518569946, 1.2274361848831177, 1.2881731986999512, 1.3489103317260742]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 3.0, 9.0, 8.0, 17.0, 17.0, 24.0, 20.0, 22.0, 25.0, 24.0, 23.0, 33.0, 37.0, 38.0, 39.0, 44.0, 43.0, 46.0, 44.0, 40.0, 38.0, 33.0, 37.0, 35.0, 37.0, 42.0, 27.0, 35.0, 25.0, 20.0, 23.0, 19.0, 10.0, 13.0, 11.0, 9.0, 7.0, 4.0, 3.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5009984970092773, -0.48256152868270874, -0.46412453055381775, -0.44568753242492676, -0.42725056409835815, -0.40881359577178955, -0.39037659764289856, -0.37193959951400757, -0.35350263118743896, -0.33506566286087036, -0.31662866473197937, -0.2981916666030884, -0.2797546982765198, -0.26131772994995117, -0.24288073182106018, -0.22444374859333038, -0.20600676536560059, -0.1875697821378708, -0.169132798910141, -0.1506958156824112, -0.1322588324546814, -0.1138218492269516, -0.0953848659992218, -0.076947882771492, -0.05851089954376221, -0.04007391631603241, -0.021636933088302612, -0.003199949860572815, 0.015237033367156982, 0.03367401659488678, 0.05211099982261658, 0.07054798305034637, 0.0889849066734314, 0.1074218899011612, 0.125858873128891, 0.1442958563566208, 0.16273283958435059, 0.18116982281208038, 0.19960680603981018, 0.21804378926753998, 0.23648077249526978, 0.2549177408218384, 0.27335473895072937, 0.29179173707962036, 0.31022870540618896, 0.32866567373275757, 0.34710267186164856, 0.36553966999053955, 0.38397663831710815, 0.40241360664367676, 0.42085060477256775, 0.43928760290145874, 0.45772457122802734, 0.47616153955459595, 0.49459853768348694, 0.5130355358123779, 0.5314725041389465, 0.5499094724655151, 0.5683465003967285, 0.5867834687232971, 0.6052204370498657, 0.6236574053764343, 0.6420943737030029, 0.6605314016342163, 0.6789683699607849]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 5.0, 6.0, 14.0, 18.0, 30.0, 35.0, 44.0, 60.0, 85.0, 137.0, 200.0, 319.0, 518.0, 941.0, 1688.0, 3248.0, 6582.0, 14200.0, 32443.0, 74797.0, 159527.0, 255623.0, 242070.0, 140019.0, 64113.0, 27617.0, 12168.0, 5617.0, 2808.0, 1457.0, 813.0, 467.0, 296.0, 172.0, 137.0, 85.0, 54.0, 35.0, 26.0, 27.0, 17.0, 9.0, 9.0, 4.0, 8.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1119384765625, -0.10863685607910156, -0.10533523559570312, -0.10203361511230469, -0.09873199462890625, -0.09543037414550781, -0.09212875366210938, -0.08882713317871094, -0.0855255126953125, -0.08222389221191406, -0.07892227172851562, -0.07562065124511719, -0.07231903076171875, -0.06901741027832031, -0.06571578979492188, -0.06241416931152344, -0.059112548828125, -0.05581092834472656, -0.052509307861328125, -0.04920768737792969, -0.04590606689453125, -0.04260444641113281, -0.039302825927734375, -0.03600120544433594, -0.0326995849609375, -0.029397964477539062, -0.026096343994140625, -0.022794723510742188, -0.01949310302734375, -0.016191482543945312, -0.012889862060546875, -0.009588241577148438, -0.00628662109375, -0.0029850006103515625, 0.000316619873046875, 0.0036182403564453125, 0.00691986083984375, 0.010221481323242188, 0.013523101806640625, 0.016824722290039062, 0.0201263427734375, 0.023427963256835938, 0.026729583740234375, 0.030031204223632812, 0.03333282470703125, 0.03663444519042969, 0.039936065673828125, 0.04323768615722656, 0.046539306640625, 0.04984092712402344, 0.053142547607421875, 0.05644416809082031, 0.05974578857421875, 0.06304740905761719, 0.06634902954101562, 0.06965065002441406, 0.0729522705078125, 0.07625389099121094, 0.07955551147460938, 0.08285713195800781, 0.08615875244140625, 0.08946037292480469, 0.09276199340820312, 0.09606361389160156, 0.099365234375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 8.0, 7.0, 16.0, 16.0, 39.0, 34.0, 36.0, 48.0, 74.0, 67.0, 77.0, 66.0, 69.0, 83.0, 65.0, 69.0, 45.0, 46.0, 36.0, 28.0, 19.0, 17.0, 11.0, 4.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1470947265625, -0.142730712890625, -0.13836669921875, -0.134002685546875, -0.129638671875, -0.125274658203125, -0.12091064453125, -0.116546630859375, -0.1121826171875, -0.107818603515625, -0.10345458984375, -0.099090576171875, -0.0947265625, -0.090362548828125, -0.08599853515625, -0.081634521484375, -0.0772705078125, -0.072906494140625, -0.06854248046875, -0.064178466796875, -0.059814453125, -0.055450439453125, -0.05108642578125, -0.046722412109375, -0.0423583984375, -0.037994384765625, -0.03363037109375, -0.029266357421875, -0.02490234375, -0.020538330078125, -0.01617431640625, -0.011810302734375, -0.0074462890625, -0.003082275390625, 0.00128173828125, 0.005645751953125, 0.010009765625, 0.014373779296875, 0.01873779296875, 0.023101806640625, 0.0274658203125, 0.031829833984375, 0.03619384765625, 0.040557861328125, 0.044921875, 0.049285888671875, 0.05364990234375, 0.058013916015625, 0.0623779296875, 0.066741943359375, 0.07110595703125, 0.075469970703125, 0.079833984375, 0.084197998046875, 0.08856201171875, 0.092926025390625, 0.0972900390625, 0.101654052734375, 0.10601806640625, 0.110382080078125, 0.11474609375, 0.119110107421875, 0.12347412109375, 0.127838134765625, 0.1322021484375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 11.0, 14.0, 22.0, 18.0, 33.0, 43.0, 82.0, 119.0, 147.0, 253.0, 332.0, 471.0, 777.0, 1321.0, 2254.0, 3831.0, 6669.0, 12862.0, 25112.0, 51413.0, 104261.0, 192190.0, 247554.0, 190379.0, 103771.0, 50614.0, 24991.0, 12758.0, 6624.0, 3789.0, 2170.0, 1299.0, 812.0, 498.0, 343.0, 214.0, 146.0, 107.0, 68.0, 39.0, 48.0, 21.0, 16.0, 17.0, 13.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.10833740234375, -0.1051025390625, -0.10186767578125, -0.0986328125, -0.09539794921875, -0.0921630859375, -0.08892822265625, -0.085693359375, -0.08245849609375, -0.0792236328125, -0.07598876953125, -0.07275390625, -0.06951904296875, -0.0662841796875, -0.06304931640625, -0.059814453125, -0.05657958984375, -0.0533447265625, -0.05010986328125, -0.046875, -0.04364013671875, -0.0404052734375, -0.03717041015625, -0.033935546875, -0.03070068359375, -0.0274658203125, -0.02423095703125, -0.02099609375, -0.01776123046875, -0.0145263671875, -0.01129150390625, -0.008056640625, -0.00482177734375, -0.0015869140625, 0.00164794921875, 0.0048828125, 0.00811767578125, 0.0113525390625, 0.01458740234375, 0.017822265625, 0.02105712890625, 0.0242919921875, 0.02752685546875, 0.03076171875, 0.03399658203125, 0.0372314453125, 0.04046630859375, 0.043701171875, 0.04693603515625, 0.0501708984375, 0.05340576171875, 0.056640625, 0.05987548828125, 0.0631103515625, 0.06634521484375, 0.069580078125, 0.07281494140625, 0.0760498046875, 0.07928466796875, 0.08251953125, 0.08575439453125, 0.0889892578125, 0.09222412109375, 0.095458984375, 0.09869384765625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 8.0, 7.0, 4.0, 9.0, 11.0, 5.0, 19.0, 16.0, 15.0, 19.0, 24.0, 33.0, 25.0, 41.0, 32.0, 38.0, 29.0, 36.0, 47.0, 45.0, 50.0, 51.0, 40.0, 31.0, 46.0, 34.0, 33.0, 27.0, 35.0, 24.0, 24.0, 25.0, 24.0, 15.0, 11.0, 12.0, 12.0, 7.0, 7.0, 3.0, 3.0, 7.0, 7.0, 2.0, 6.0, 3.0, 1.0, 3.0], "bins": [-0.264892578125, -0.2575969696044922, -0.2503013610839844, -0.24300575256347656, -0.23571014404296875, -0.22841453552246094, -0.22111892700195312, -0.2138233184814453, -0.2065277099609375, -0.1992321014404297, -0.19193649291992188, -0.18464088439941406, -0.17734527587890625, -0.17004966735839844, -0.16275405883789062, -0.1554584503173828, -0.148162841796875, -0.1408672332763672, -0.13357162475585938, -0.12627601623535156, -0.11898040771484375, -0.11168479919433594, -0.10438919067382812, -0.09709358215332031, -0.0897979736328125, -0.08250236511230469, -0.07520675659179688, -0.06791114807128906, -0.06061553955078125, -0.05331993103027344, -0.046024322509765625, -0.03872871398925781, -0.03143310546875, -0.024137496948242188, -0.016841888427734375, -0.009546279907226562, -0.00225067138671875, 0.0050449371337890625, 0.012340545654296875, 0.019636154174804688, 0.0269317626953125, 0.03422737121582031, 0.041522979736328125, 0.04881858825683594, 0.05611419677734375, 0.06340980529785156, 0.07070541381835938, 0.07800102233886719, 0.085296630859375, 0.09259223937988281, 0.09988784790039062, 0.10718345642089844, 0.11447906494140625, 0.12177467346191406, 0.12907028198242188, 0.1363658905029297, 0.1436614990234375, 0.1509571075439453, 0.15825271606445312, 0.16554832458496094, 0.17284393310546875, 0.18013954162597656, 0.18743515014648438, 0.1947307586669922, 0.2020263671875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 6.0, 2.0, 11.0, 9.0, 9.0, 26.0, 41.0, 102.0, 204.0, 540.0, 1714.0, 6673.0, 48445.0, 441223.0, 482974.0, 56369.0, 7355.0, 1843.0, 577.0, 217.0, 101.0, 48.0, 26.0, 17.0, 7.0, 7.0, 3.0, 3.0, 4.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1123046875, -0.10890483856201172, -0.10550498962402344, -0.10210514068603516, -0.09870529174804688, -0.0953054428100586, -0.09190559387207031, -0.08850574493408203, -0.08510589599609375, -0.08170604705810547, -0.07830619812011719, -0.0749063491821289, -0.07150650024414062, -0.06810665130615234, -0.06470680236816406, -0.06130695343017578, -0.0579071044921875, -0.05450725555419922, -0.05110740661621094, -0.047707557678222656, -0.044307708740234375, -0.040907859802246094, -0.03750801086425781, -0.03410816192626953, -0.03070831298828125, -0.02730846405029297, -0.023908615112304688, -0.020508766174316406, -0.017108917236328125, -0.013709068298339844, -0.010309219360351562, -0.006909370422363281, -0.003509521484375, -0.00010967254638671875, 0.0032901763916015625, 0.006690025329589844, 0.010089874267578125, 0.013489723205566406, 0.016889572143554688, 0.02028942108154297, 0.02368927001953125, 0.02708911895751953, 0.030488967895507812, 0.033888816833496094, 0.037288665771484375, 0.040688514709472656, 0.04408836364746094, 0.04748821258544922, 0.0508880615234375, 0.05428791046142578, 0.05768775939941406, 0.061087608337402344, 0.06448745727539062, 0.0678873062133789, 0.07128715515136719, 0.07468700408935547, 0.07808685302734375, 0.08148670196533203, 0.08488655090332031, 0.0882863998413086, 0.09168624877929688, 0.09508609771728516, 0.09848594665527344, 0.10188579559326172, 0.10528564453125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 6.0, 5.0, 7.0, 12.0, 12.0, 23.0, 30.0, 42.0, 36.0, 52.0, 81.0, 65.0, 75.0, 86.0, 71.0, 72.0, 65.0, 53.0, 40.0, 43.0, 23.0, 24.0, 18.0, 13.0, 7.0, 10.0, 10.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2576580047607422e-05, -1.2099742889404297e-05, -1.1622905731201172e-05, -1.1146068572998047e-05, -1.0669231414794922e-05, -1.0192394256591797e-05, -9.715557098388672e-06, -9.238719940185547e-06, -8.761882781982422e-06, -8.285045623779297e-06, -7.808208465576172e-06, -7.331371307373047e-06, -6.854534149169922e-06, -6.377696990966797e-06, -5.900859832763672e-06, -5.424022674560547e-06, -4.947185516357422e-06, -4.470348358154297e-06, -3.993511199951172e-06, -3.516674041748047e-06, -3.039836883544922e-06, -2.562999725341797e-06, -2.086162567138672e-06, -1.6093254089355469e-06, -1.1324882507324219e-06, -6.556510925292969e-07, -1.7881393432617188e-07, 2.980232238769531e-07, 7.748603820800781e-07, 1.2516975402832031e-06, 1.7285346984863281e-06, 2.205371856689453e-06, 2.682209014892578e-06, 3.159046173095703e-06, 3.635883331298828e-06, 4.112720489501953e-06, 4.589557647705078e-06, 5.066394805908203e-06, 5.543231964111328e-06, 6.020069122314453e-06, 6.496906280517578e-06, 6.973743438720703e-06, 7.450580596923828e-06, 7.927417755126953e-06, 8.404254913330078e-06, 8.881092071533203e-06, 9.357929229736328e-06, 9.834766387939453e-06, 1.0311603546142578e-05, 1.0788440704345703e-05, 1.1265277862548828e-05, 1.1742115020751953e-05, 1.2218952178955078e-05, 1.2695789337158203e-05, 1.3172626495361328e-05, 1.3649463653564453e-05, 1.4126300811767578e-05, 1.4603137969970703e-05, 1.5079975128173828e-05, 1.5556812286376953e-05, 1.6033649444580078e-05, 1.6510486602783203e-05, 1.6987323760986328e-05, 1.7464160919189453e-05, 1.7940998077392578e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 6.0, 7.0, 13.0, 23.0, 27.0, 37.0, 68.0, 125.0, 178.0, 287.0, 572.0, 1011.0, 1986.0, 4909.0, 15223.0, 63172.0, 244376.0, 430834.0, 211379.0, 53020.0, 13064.0, 4277.0, 1742.0, 936.0, 482.0, 314.0, 202.0, 113.0, 56.0, 36.0, 33.0, 13.0, 13.0, 7.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0577392578125, -0.055708885192871094, -0.05367851257324219, -0.05164813995361328, -0.049617767333984375, -0.04758739471435547, -0.04555702209472656, -0.043526649475097656, -0.04149627685546875, -0.039465904235839844, -0.03743553161621094, -0.03540515899658203, -0.033374786376953125, -0.03134441375732422, -0.029314041137695312, -0.027283668518066406, -0.0252532958984375, -0.023222923278808594, -0.021192550659179688, -0.01916217803955078, -0.017131805419921875, -0.015101432800292969, -0.013071060180664062, -0.011040687561035156, -0.00901031494140625, -0.006979942321777344, -0.0049495697021484375, -0.0029191970825195312, -0.000888824462890625, 0.0011415481567382812, 0.0031719207763671875, 0.005202293395996094, 0.007232666015625, 0.009263038635253906, 0.011293411254882812, 0.013323783874511719, 0.015354156494140625, 0.01738452911376953, 0.019414901733398438, 0.021445274353027344, 0.02347564697265625, 0.025506019592285156, 0.027536392211914062, 0.02956676483154297, 0.031597137451171875, 0.03362751007080078, 0.03565788269042969, 0.037688255310058594, 0.0397186279296875, 0.041749000549316406, 0.04377937316894531, 0.04580974578857422, 0.047840118408203125, 0.04987049102783203, 0.05190086364746094, 0.053931236267089844, 0.05596160888671875, 0.057991981506347656, 0.06002235412597656, 0.06205272674560547, 0.06408309936523438, 0.06611347198486328, 0.06814384460449219, 0.0701742172241211, 0.07220458984375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 4.0, 6.0, 10.0, 9.0, 11.0, 18.0, 28.0, 24.0, 29.0, 47.0, 71.0, 86.0, 74.0, 95.0, 95.0, 67.0, 71.0, 60.0, 38.0, 31.0, 34.0, 26.0, 12.0, 8.0, 12.0, 9.0, 5.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.06298828125, -0.060996055603027344, -0.05900382995605469, -0.05701160430908203, -0.055019378662109375, -0.05302715301513672, -0.05103492736816406, -0.049042701721191406, -0.04705047607421875, -0.045058250427246094, -0.04306602478027344, -0.04107379913330078, -0.039081573486328125, -0.03708934783935547, -0.03509712219238281, -0.033104896545410156, -0.0311126708984375, -0.029120445251464844, -0.027128219604492188, -0.02513599395751953, -0.023143768310546875, -0.02115154266357422, -0.019159317016601562, -0.017167091369628906, -0.01517486572265625, -0.013182640075683594, -0.011190414428710938, -0.009198188781738281, -0.007205963134765625, -0.005213737487792969, -0.0032215118408203125, -0.0012292861938476562, 0.000762939453125, 0.0027551651000976562, 0.0047473907470703125, 0.006739616394042969, 0.008731842041015625, 0.010724067687988281, 0.012716293334960938, 0.014708518981933594, 0.01670074462890625, 0.018692970275878906, 0.020685195922851562, 0.02267742156982422, 0.024669647216796875, 0.02666187286376953, 0.028654098510742188, 0.030646324157714844, 0.0326385498046875, 0.034630775451660156, 0.03662300109863281, 0.03861522674560547, 0.040607452392578125, 0.04259967803955078, 0.04459190368652344, 0.046584129333496094, 0.04857635498046875, 0.050568580627441406, 0.05256080627441406, 0.05455303192138672, 0.056545257568359375, 0.05853748321533203, 0.06052970886230469, 0.06252193450927734, 0.06451416015625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 31.0, 89.0, 220.0, 285.0, 227.0, 82.0, 45.0, 10.0, 8.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5981148481369019, -1.5473631620407104, -1.4966115951538086, -1.4458599090576172, -1.3951083421707153, -1.344356656074524, -1.293605089187622, -1.2428534030914307, -1.1921017169952393, -1.1413500308990479, -1.090598464012146, -1.0398467779159546, -0.9890952110290527, -0.9383435249328613, -0.8875918984413147, -0.8368402719497681, -0.7860887050628662, -0.7353370785713196, -0.684585452079773, -0.6338337659835815, -0.5830821990966797, -0.5323305130004883, -0.48157888650894165, -0.430827260017395, -0.3800756335258484, -0.32932400703430176, -0.2785723805427551, -0.2278207242488861, -0.17706909775733948, -0.12631747126579285, -0.07556581497192383, -0.024814188480377197, 0.025937438011169434, 0.07668907195329666, 0.1274407058954239, 0.1781923472881317, 0.22894397377967834, 0.279695600271225, 0.330447256565094, 0.3811988830566406, 0.43195050954818726, 0.4827021360397339, 0.5334537625312805, 0.5842053890228271, 0.6349570751190186, 0.6857086420059204, 0.7364603281021118, 0.7872119545936584, 0.8379635810852051, 0.8887152075767517, 0.9394668340682983, 0.9902185201644897, 1.0409700870513916, 1.091721773147583, 1.1424734592437744, 1.1932250261306763, 1.2439765930175781, 1.2947282791137695, 1.3454798460006714, 1.3962315320968628, 1.4469830989837646, 1.497734785079956, 1.5484864711761475, 1.5992380380630493, 1.6499897241592407]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 1.0, 4.0, 3.0, 7.0, 10.0, 14.0, 11.0, 13.0, 10.0, 9.0, 19.0, 23.0, 22.0, 34.0, 27.0, 27.0, 26.0, 36.0, 35.0, 30.0, 38.0, 47.0, 40.0, 40.0, 43.0, 31.0, 41.0, 41.0, 42.0, 39.0, 29.0, 33.0, 20.0, 20.0, 22.0, 20.0, 18.0, 26.0, 11.0, 12.0, 2.0, 6.0, 5.0, 4.0, 3.0, 4.0, 2.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6336472630500793, -0.6144030094146729, -0.5951587557792664, -0.5759145021438599, -0.5566703081130981, -0.5374260544776917, -0.5181818008422852, -0.49893754720687866, -0.47969329357147217, -0.4604490399360657, -0.44120481610298157, -0.4219605624675751, -0.4027163088321686, -0.3834720849990845, -0.364227831363678, -0.3449835777282715, -0.3257393538951874, -0.3064951002597809, -0.2872508764266968, -0.2680066227912903, -0.2487623691558838, -0.2295181304216385, -0.2102738916873932, -0.1910296380519867, -0.1717853993177414, -0.1525411605834961, -0.1332969069480896, -0.1140526682138443, -0.0948084220290184, -0.0755641758441925, -0.056319937109947205, -0.03707568347454071, -0.01783144474029541, 0.0014127995818853378, 0.020657043904066086, 0.039901286363601685, 0.05914553254842758, 0.07838977873325348, 0.09763401746749878, 0.11687827110290527, 0.13612250983715057, 0.15536674857139587, 0.17461100220680237, 0.19385524094104767, 0.21309947967529297, 0.23234373331069946, 0.25158798694610596, 0.27083224058151245, 0.29007646441459656, 0.30932071805000305, 0.32856494188308716, 0.34780919551849365, 0.36705344915390015, 0.38629770278930664, 0.40554192662239075, 0.42478618025779724, 0.44403040409088135, 0.46327465772628784, 0.48251888155937195, 0.501763105392456, 0.5210073590278625, 0.540251612663269, 0.5594958662986755, 0.578740119934082, 0.5979843735694885]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 2.0, 6.0, 10.0, 12.0, 20.0, 26.0, 29.0, 44.0, 62.0, 121.0, 290.0, 542.0, 1408.0, 4224.0, 18162.0, 160813.0, 1743116.0, 2013262.0, 218221.0, 25222.0, 5918.0, 1676.0, 581.0, 235.0, 105.0, 66.0, 31.0, 30.0, 15.0, 14.0, 7.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21923828125, -0.2129840850830078, -0.20672988891601562, -0.20047569274902344, -0.19422149658203125, -0.18796730041503906, -0.18171310424804688, -0.1754589080810547, -0.1692047119140625, -0.1629505157470703, -0.15669631958007812, -0.15044212341308594, -0.14418792724609375, -0.13793373107910156, -0.13167953491210938, -0.1254253387451172, -0.119171142578125, -0.11291694641113281, -0.10666275024414062, -0.10040855407714844, -0.09415435791015625, -0.08790016174316406, -0.08164596557617188, -0.07539176940917969, -0.0691375732421875, -0.06288337707519531, -0.056629180908203125, -0.05037498474121094, -0.04412078857421875, -0.03786659240722656, -0.031612396240234375, -0.025358200073242188, -0.01910400390625, -0.012849807739257812, -0.006595611572265625, -0.0003414154052734375, 0.00591278076171875, 0.012166976928710938, 0.018421173095703125, 0.024675369262695312, 0.0309295654296875, 0.03718376159667969, 0.043437957763671875, 0.04969215393066406, 0.05594635009765625, 0.06220054626464844, 0.06845474243164062, 0.07470893859863281, 0.080963134765625, 0.08721733093261719, 0.09347152709960938, 0.09972572326660156, 0.10597991943359375, 0.11223411560058594, 0.11848831176757812, 0.12474250793457031, 0.1309967041015625, 0.1372509002685547, 0.14350509643554688, 0.14975929260253906, 0.15601348876953125, 0.16226768493652344, 0.16852188110351562, 0.1747760772705078, 0.1810302734375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 4.0, 3.0, 8.0, 12.0, 11.0, 29.0, 20.0, 27.0, 32.0, 37.0, 49.0, 59.0, 53.0, 70.0, 66.0, 81.0, 68.0, 54.0, 50.0, 44.0, 42.0, 40.0, 40.0, 31.0, 21.0, 18.0, 14.0, 6.0, 3.0, 6.0, 0.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.18310546875, -0.17854881286621094, -0.17399215698242188, -0.1694355010986328, -0.16487884521484375, -0.1603221893310547, -0.15576553344726562, -0.15120887756347656, -0.1466522216796875, -0.14209556579589844, -0.13753890991210938, -0.1329822540283203, -0.12842559814453125, -0.12386894226074219, -0.11931228637695312, -0.11475563049316406, -0.110198974609375, -0.10564231872558594, -0.10108566284179688, -0.09652900695800781, -0.09197235107421875, -0.08741569519042969, -0.08285903930664062, -0.07830238342285156, -0.0737457275390625, -0.06918907165527344, -0.06463241577148438, -0.06007575988769531, -0.05551910400390625, -0.05096244812011719, -0.046405792236328125, -0.04184913635253906, -0.03729248046875, -0.03273582458496094, -0.028179168701171875, -0.023622512817382812, -0.01906585693359375, -0.014509201049804688, -0.009952545166015625, -0.0053958892822265625, -0.0008392333984375, 0.0037174224853515625, 0.008274078369140625, 0.012830734252929688, 0.01738739013671875, 0.021944046020507812, 0.026500701904296875, 0.031057357788085938, 0.035614013671875, 0.04017066955566406, 0.044727325439453125, 0.04928398132324219, 0.05384063720703125, 0.05839729309082031, 0.06295394897460938, 0.06751060485839844, 0.0720672607421875, 0.07662391662597656, 0.08118057250976562, 0.08573722839355469, 0.09029388427734375, 0.09485054016113281, 0.09940719604492188, 0.10396385192871094, 0.1085205078125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 9.0, 11.0, 17.0, 24.0, 34.0, 52.0, 59.0, 105.0, 189.0, 300.0, 555.0, 1140.0, 2147.0, 5060.0, 13887.0, 48119.0, 234598.0, 2210028.0, 1460923.0, 160617.0, 36667.0, 11197.0, 4289.0, 1988.0, 965.0, 514.0, 270.0, 181.0, 115.0, 60.0, 33.0, 38.0, 24.0, 19.0, 15.0, 7.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1539306640625, -0.14841270446777344, -0.14289474487304688, -0.1373767852783203, -0.13185882568359375, -0.1263408660888672, -0.12082290649414062, -0.11530494689941406, -0.1097869873046875, -0.10426902770996094, -0.09875106811523438, -0.09323310852050781, -0.08771514892578125, -0.08219718933105469, -0.07667922973632812, -0.07116127014160156, -0.065643310546875, -0.06012535095214844, -0.054607391357421875, -0.04908943176269531, -0.04357147216796875, -0.03805351257324219, -0.032535552978515625, -0.027017593383789062, -0.0214996337890625, -0.015981674194335938, -0.010463714599609375, -0.0049457550048828125, 0.00057220458984375, 0.0060901641845703125, 0.011608123779296875, 0.017126083374023438, 0.02264404296875, 0.028162002563476562, 0.033679962158203125, 0.03919792175292969, 0.04471588134765625, 0.05023384094238281, 0.055751800537109375, 0.06126976013183594, 0.0667877197265625, 0.07230567932128906, 0.07782363891601562, 0.08334159851074219, 0.08885955810546875, 0.09437751770019531, 0.09989547729492188, 0.10541343688964844, 0.110931396484375, 0.11644935607910156, 0.12196731567382812, 0.1274852752685547, 0.13300323486328125, 0.1385211944580078, 0.14403915405273438, 0.14955711364746094, 0.1550750732421875, 0.16059303283691406, 0.16611099243164062, 0.1716289520263672, 0.17714691162109375, 0.1826648712158203, 0.18818283081054688, 0.19370079040527344, 0.19921875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 10.0, 7.0, 2.0, 16.0, 20.0, 34.0, 39.0, 55.0, 97.0, 147.0, 235.0, 500.0, 759.0, 733.0, 551.0, 327.0, 178.0, 105.0, 72.0, 49.0, 41.0, 28.0, 16.0, 13.0, 9.0, 5.0, 4.0, 4.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.160888671875, -0.1539459228515625, -0.147003173828125, -0.1400604248046875, -0.13311767578125, -0.1261749267578125, -0.119232177734375, -0.1122894287109375, -0.1053466796875, -0.0984039306640625, -0.091461181640625, -0.0845184326171875, -0.07757568359375, -0.0706329345703125, -0.063690185546875, -0.0567474365234375, -0.0498046875, -0.0428619384765625, -0.035919189453125, -0.0289764404296875, -0.02203369140625, -0.0150909423828125, -0.008148193359375, -0.0012054443359375, 0.0057373046875, 0.0126800537109375, 0.019622802734375, 0.0265655517578125, 0.03350830078125, 0.0404510498046875, 0.047393798828125, 0.0543365478515625, 0.061279296875, 0.0682220458984375, 0.075164794921875, 0.0821075439453125, 0.08905029296875, 0.0959930419921875, 0.102935791015625, 0.1098785400390625, 0.1168212890625, 0.1237640380859375, 0.130706787109375, 0.1376495361328125, 0.14459228515625, 0.1515350341796875, 0.158477783203125, 0.1654205322265625, 0.17236328125, 0.1793060302734375, 0.186248779296875, 0.1931915283203125, 0.20013427734375, 0.2070770263671875, 0.214019775390625, 0.2209625244140625, 0.2279052734375, 0.2348480224609375, 0.241790771484375, 0.2487335205078125, 0.25567626953125, 0.2626190185546875, 0.269561767578125, 0.2765045166015625, 0.283447265625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 10.0, 10.0, 22.0, 60.0, 97.0, 124.0, 160.0, 183.0, 150.0, 78.0, 43.0, 27.0, 18.0, 9.0, 7.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8734561204910278, -0.8367131948471069, -0.7999702095985413, -0.7632272243499756, -0.7264842987060547, -0.6897413730621338, -0.6529983878135681, -0.6162554025650024, -0.5795124769210815, -0.5427695512771606, -0.506026566028595, -0.4692836105823517, -0.4325406551361084, -0.3957976996898651, -0.3590547442436218, -0.32231178879737854, -0.28556883335113525, -0.24882587790489197, -0.21208292245864868, -0.1753399670124054, -0.1385970115661621, -0.10185405611991882, -0.06511110067367554, -0.02836814522743225, 0.008374810218811035, 0.04511776566505432, 0.08186072111129761, 0.1186036765575409, 0.15534663200378418, 0.19208958745002747, 0.22883254289627075, 0.26557549834251404, 0.3023185729980469, 0.33906152844429016, 0.37580448389053345, 0.41254743933677673, 0.44929039478302, 0.4860333502292633, 0.5227763056755066, 0.5595192909240723, 0.5962622165679932, 0.6330051422119141, 0.6697481274604797, 0.7064911127090454, 0.7432340383529663, 0.7799769639968872, 0.8167199492454529, 0.8534629344940186, 0.8902058601379395, 0.9269487857818604, 0.963691771030426, 1.0004347562789917, 1.0371776819229126, 1.0739206075668335, 1.110663652420044, 1.1474065780639648, 1.1841495037078857, 1.2208924293518066, 1.2576353549957275, 1.294378399848938, 1.3311213254928589, 1.3678642511367798, 1.4046072959899902, 1.4413502216339111, 1.478093147277832]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 11.0, 9.0, 10.0, 10.0, 18.0, 24.0, 22.0, 24.0, 25.0, 36.0, 43.0, 45.0, 44.0, 47.0, 54.0, 56.0, 51.0, 43.0, 53.0, 37.0, 41.0, 44.0, 41.0, 32.0, 19.0, 30.0, 24.0, 26.0, 15.0, 15.0, 15.0, 6.0, 12.0, 4.0, 6.0, 3.0, 3.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.574685275554657, -0.5561550855636597, -0.5376248955726624, -0.519094705581665, -0.5005645751953125, -0.4820343554019928, -0.46350419521331787, -0.44497400522232056, -0.42644381523132324, -0.4079136252403259, -0.3893834352493286, -0.3708532750606537, -0.35232308506965637, -0.33379289507865906, -0.31526273488998413, -0.2967325448989868, -0.2782023549079895, -0.2596721649169922, -0.24114198982715607, -0.22261181473731995, -0.20408162474632263, -0.18555143475532532, -0.1670212596654892, -0.14849108457565308, -0.12996089458465576, -0.11143071204423904, -0.09290052950382233, -0.07437034696340561, -0.05584016442298889, -0.037309981882572174, -0.018779799342155457, -0.00024962425231933594, 0.01828056573867798, 0.036810748279094696, 0.055340930819511414, 0.07387111335992813, 0.09240129590034485, 0.11093147844076157, 0.12946166098117828, 0.1479918360710144, 0.16652202606201172, 0.18505221605300903, 0.20358239114284515, 0.22211256623268127, 0.2406427562236786, 0.2591729462146759, 0.27770310640335083, 0.29623329639434814, 0.31476348638534546, 0.3332936763763428, 0.3518238663673401, 0.370354026556015, 0.38888421654701233, 0.40741440653800964, 0.42594456672668457, 0.4444747567176819, 0.4630049467086792, 0.4815351366996765, 0.5000653266906738, 0.5185955166816711, 0.5371257066726685, 0.555655837059021, 0.5741860270500183, 0.5927162170410156, 0.6112464070320129]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 7.0, 0.0, 4.0, 9.0, 6.0, 5.0, 13.0, 17.0, 33.0, 41.0, 83.0, 76.0, 169.0, 249.0, 416.0, 759.0, 1319.0, 2289.0, 4137.0, 7581.0, 13620.0, 25719.0, 46173.0, 84620.0, 148703.0, 215112.0, 203963.0, 131375.0, 73556.0, 39946.0, 21564.0, 12048.0, 6479.0, 3559.0, 1972.0, 1147.0, 701.0, 363.0, 237.0, 157.0, 107.0, 75.0, 49.0, 34.0, 18.0, 14.0, 12.0, 5.0, 8.0, 7.0, 2.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.09765625, -0.09449386596679688, -0.09133148193359375, -0.08816909790039062, -0.0850067138671875, -0.08184432983398438, -0.07868194580078125, -0.07551956176757812, -0.072357177734375, -0.06919479370117188, -0.06603240966796875, -0.06287002563476562, -0.0597076416015625, -0.056545257568359375, -0.05338287353515625, -0.050220489501953125, -0.04705810546875, -0.043895721435546875, -0.04073333740234375, -0.037570953369140625, -0.0344085693359375, -0.031246185302734375, -0.02808380126953125, -0.024921417236328125, -0.021759033203125, -0.018596649169921875, -0.01543426513671875, -0.012271881103515625, -0.0091094970703125, -0.005947113037109375, -0.00278472900390625, 0.000377655029296875, 0.0035400390625, 0.006702423095703125, 0.00986480712890625, 0.013027191162109375, 0.0161895751953125, 0.019351959228515625, 0.02251434326171875, 0.025676727294921875, 0.028839111328125, 0.032001495361328125, 0.03516387939453125, 0.038326263427734375, 0.0414886474609375, 0.044651031494140625, 0.04781341552734375, 0.050975799560546875, 0.05413818359375, 0.057300567626953125, 0.06046295166015625, 0.06362533569335938, 0.0667877197265625, 0.06995010375976562, 0.07311248779296875, 0.07627487182617188, 0.079437255859375, 0.08259963989257812, 0.08576202392578125, 0.08892440795898438, 0.0920867919921875, 0.09524917602539062, 0.09841156005859375, 0.10157394409179688, 0.104736328125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 5.0, 6.0, 12.0, 17.0, 16.0, 29.0, 32.0, 46.0, 27.0, 50.0, 42.0, 51.0, 64.0, 61.0, 74.0, 55.0, 55.0, 43.0, 63.0, 37.0, 32.0, 43.0, 26.0, 31.0, 20.0, 14.0, 13.0, 13.0, 13.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13427734375, -0.13027286529541016, -0.1262683868408203, -0.12226390838623047, -0.11825942993164062, -0.11425495147705078, -0.11025047302246094, -0.1062459945678711, -0.10224151611328125, -0.0982370376586914, -0.09423255920410156, -0.09022808074951172, -0.08622360229492188, -0.08221912384033203, -0.07821464538574219, -0.07421016693115234, -0.0702056884765625, -0.06620121002197266, -0.06219673156738281, -0.05819225311279297, -0.054187774658203125, -0.05018329620361328, -0.04617881774902344, -0.042174339294433594, -0.03816986083984375, -0.034165382385253906, -0.030160903930664062, -0.02615642547607422, -0.022151947021484375, -0.01814746856689453, -0.014142990112304688, -0.010138511657714844, -0.006134033203125, -0.0021295547485351562, 0.0018749237060546875, 0.005879402160644531, 0.009883880615234375, 0.013888359069824219, 0.017892837524414062, 0.021897315979003906, 0.02590179443359375, 0.029906272888183594, 0.03391075134277344, 0.03791522979736328, 0.041919708251953125, 0.04592418670654297, 0.04992866516113281, 0.053933143615722656, 0.0579376220703125, 0.061942100524902344, 0.06594657897949219, 0.06995105743408203, 0.07395553588867188, 0.07796001434326172, 0.08196449279785156, 0.0859689712524414, 0.08997344970703125, 0.0939779281616211, 0.09798240661621094, 0.10198688507080078, 0.10599136352539062, 0.10999584197998047, 0.11400032043457031, 0.11800479888916016, 0.12200927734375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 6.0, 5.0, 5.0, 17.0, 29.0, 39.0, 59.0, 88.0, 146.0, 244.0, 384.0, 732.0, 1405.0, 2720.0, 5930.0, 13425.0, 32293.0, 83611.0, 223462.0, 361574.0, 197447.0, 73537.0, 28907.0, 11877.0, 5220.0, 2438.0, 1290.0, 683.0, 391.0, 223.0, 132.0, 83.0, 57.0, 33.0, 20.0, 10.0, 9.0, 4.0, 8.0, 6.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1455078125, -0.14000320434570312, -0.13449859619140625, -0.12899398803710938, -0.1234893798828125, -0.11798477172851562, -0.11248016357421875, -0.10697555541992188, -0.101470947265625, -0.09596633911132812, -0.09046173095703125, -0.08495712280273438, -0.0794525146484375, -0.07394790649414062, -0.06844329833984375, -0.06293869018554688, -0.05743408203125, -0.051929473876953125, -0.04642486572265625, -0.040920257568359375, -0.0354156494140625, -0.029911041259765625, -0.02440643310546875, -0.018901824951171875, -0.013397216796875, -0.007892608642578125, -0.00238800048828125, 0.003116607666015625, 0.0086212158203125, 0.014125823974609375, 0.01963043212890625, 0.025135040283203125, 0.0306396484375, 0.036144256591796875, 0.04164886474609375, 0.047153472900390625, 0.0526580810546875, 0.058162689208984375, 0.06366729736328125, 0.06917190551757812, 0.074676513671875, 0.08018112182617188, 0.08568572998046875, 0.09119033813476562, 0.0966949462890625, 0.10219955444335938, 0.10770416259765625, 0.11320877075195312, 0.11871337890625, 0.12421798706054688, 0.12972259521484375, 0.13522720336914062, 0.1407318115234375, 0.14623641967773438, 0.15174102783203125, 0.15724563598632812, 0.162750244140625, 0.16825485229492188, 0.17375946044921875, 0.17926406860351562, 0.1847686767578125, 0.19027328491210938, 0.19577789306640625, 0.20128250122070312, 0.206787109375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 2.0, 3.0, 3.0, 6.0, 9.0, 11.0, 10.0, 15.0, 11.0, 15.0, 16.0, 24.0, 22.0, 15.0, 30.0, 40.0, 32.0, 34.0, 44.0, 52.0, 34.0, 34.0, 50.0, 42.0, 31.0, 41.0, 35.0, 48.0, 42.0, 44.0, 23.0, 32.0, 30.0, 19.0, 22.0, 13.0, 9.0, 14.0, 13.0, 13.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 4.0], "bins": [-0.357421875, -0.34824371337890625, -0.3390655517578125, -0.32988739013671875, -0.320709228515625, -0.31153106689453125, -0.3023529052734375, -0.29317474365234375, -0.28399658203125, -0.27481842041015625, -0.2656402587890625, -0.25646209716796875, -0.247283935546875, -0.23810577392578125, -0.2289276123046875, -0.21974945068359375, -0.2105712890625, -0.20139312744140625, -0.1922149658203125, -0.18303680419921875, -0.173858642578125, -0.16468048095703125, -0.1555023193359375, -0.14632415771484375, -0.13714599609375, -0.12796783447265625, -0.1187896728515625, -0.10961151123046875, -0.100433349609375, -0.09125518798828125, -0.0820770263671875, -0.07289886474609375, -0.063720703125, -0.05454254150390625, -0.0453643798828125, -0.03618621826171875, -0.027008056640625, -0.01782989501953125, -0.0086517333984375, 0.00052642822265625, 0.00970458984375, 0.01888275146484375, 0.0280609130859375, 0.03723907470703125, 0.046417236328125, 0.05559539794921875, 0.0647735595703125, 0.07395172119140625, 0.0831298828125, 0.09230804443359375, 0.1014862060546875, 0.11066436767578125, 0.119842529296875, 0.12902069091796875, 0.1381988525390625, 0.14737701416015625, 0.15655517578125, 0.16573333740234375, 0.1749114990234375, 0.18408966064453125, 0.193267822265625, 0.20244598388671875, 0.2116241455078125, 0.22080230712890625, 0.22998046875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 8.0, 20.0, 21.0, 40.0, 59.0, 110.0, 190.0, 393.0, 710.0, 1534.0, 3229.0, 7203.0, 17610.0, 46101.0, 132995.0, 320137.0, 315106.0, 128181.0, 44715.0, 17030.0, 7070.0, 3072.0, 1529.0, 722.0, 334.0, 188.0, 101.0, 59.0, 33.0, 24.0, 13.0, 3.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.057037353515625, -0.05525398254394531, -0.053470611572265625, -0.05168724060058594, -0.04990386962890625, -0.04812049865722656, -0.046337127685546875, -0.04455375671386719, -0.0427703857421875, -0.04098701477050781, -0.039203643798828125, -0.03742027282714844, -0.03563690185546875, -0.03385353088378906, -0.032070159912109375, -0.030286788940429688, -0.02850341796875, -0.026720046997070312, -0.024936676025390625, -0.023153305053710938, -0.02136993408203125, -0.019586563110351562, -0.017803192138671875, -0.016019821166992188, -0.0142364501953125, -0.012453079223632812, -0.010669708251953125, -0.008886337280273438, -0.00710296630859375, -0.0053195953369140625, -0.003536224365234375, -0.0017528533935546875, 3.0517578125e-05, 0.0018138885498046875, 0.003597259521484375, 0.0053806304931640625, 0.00716400146484375, 0.008947372436523438, 0.010730743408203125, 0.012514114379882812, 0.0142974853515625, 0.016080856323242188, 0.017864227294921875, 0.019647598266601562, 0.02143096923828125, 0.023214340209960938, 0.024997711181640625, 0.026781082153320312, 0.028564453125, 0.030347824096679688, 0.032131195068359375, 0.03391456604003906, 0.03569793701171875, 0.03748130798339844, 0.039264678955078125, 0.04104804992675781, 0.0428314208984375, 0.04461479187011719, 0.046398162841796875, 0.04818153381347656, 0.04996490478515625, 0.05174827575683594, 0.053531646728515625, 0.05531501770019531, 0.057098388671875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 1.0, 3.0, 6.0, 6.0, 12.0, 15.0, 14.0, 27.0, 32.0, 41.0, 57.0, 63.0, 82.0, 109.0, 102.0, 113.0, 77.0, 54.0, 49.0, 41.0, 24.0, 23.0, 16.0, 15.0, 8.0, 7.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.181529998779297e-05, -2.1141953766345978e-05, -2.0468607544898987e-05, -1.9795261323451996e-05, -1.9121915102005005e-05, -1.8448568880558014e-05, -1.7775222659111023e-05, -1.7101876437664032e-05, -1.642853021621704e-05, -1.575518399477005e-05, -1.5081837773323059e-05, -1.4408491551876068e-05, -1.3735145330429077e-05, -1.3061799108982086e-05, -1.2388452887535095e-05, -1.1715106666088104e-05, -1.1041760444641113e-05, -1.0368414223194122e-05, -9.695068001747131e-06, -9.02172178030014e-06, -8.34837555885315e-06, -7.675029337406158e-06, -7.0016831159591675e-06, -6.3283368945121765e-06, -5.6549906730651855e-06, -4.981644451618195e-06, -4.308298230171204e-06, -3.6349520087242126e-06, -2.9616057872772217e-06, -2.2882595658302307e-06, -1.6149133443832397e-06, -9.415671229362488e-07, -2.682209014892578e-07, 4.0512531995773315e-07, 1.0784715414047241e-06, 1.751817762851715e-06, 2.425163984298706e-06, 3.098510205745697e-06, 3.771856427192688e-06, 4.445202648639679e-06, 5.11854887008667e-06, 5.791895091533661e-06, 6.465241312980652e-06, 7.138587534427643e-06, 7.811933755874634e-06, 8.485279977321625e-06, 9.158626198768616e-06, 9.831972420215607e-06, 1.0505318641662598e-05, 1.1178664863109589e-05, 1.185201108455658e-05, 1.252535730600357e-05, 1.3198703527450562e-05, 1.3872049748897552e-05, 1.4545395970344543e-05, 1.5218742191791534e-05, 1.5892088413238525e-05, 1.6565434634685516e-05, 1.7238780856132507e-05, 1.7912127077579498e-05, 1.858547329902649e-05, 1.925881952047348e-05, 1.993216574192047e-05, 2.0605511963367462e-05, 2.1278858184814453e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 5.0, 9.0, 12.0, 10.0, 25.0, 39.0, 71.0, 98.0, 147.0, 256.0, 456.0, 958.0, 1733.0, 3661.0, 7735.0, 17970.0, 42579.0, 102089.0, 217242.0, 290618.0, 201113.0, 92788.0, 38613.0, 16354.0, 7306.0, 3298.0, 1533.0, 790.0, 412.0, 259.0, 134.0, 83.0, 46.0, 37.0, 14.0, 20.0, 12.0, 5.0, 4.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040130615234375, -0.03871965408325195, -0.037308692932128906, -0.03589773178100586, -0.03448677062988281, -0.033075809478759766, -0.03166484832763672, -0.030253887176513672, -0.028842926025390625, -0.027431964874267578, -0.02602100372314453, -0.024610042572021484, -0.023199081420898438, -0.02178812026977539, -0.020377159118652344, -0.018966197967529297, -0.01755523681640625, -0.016144275665283203, -0.014733314514160156, -0.01332235336303711, -0.011911392211914062, -0.010500431060791016, -0.009089469909667969, -0.007678508758544922, -0.006267547607421875, -0.004856586456298828, -0.0034456253051757812, -0.0020346641540527344, -0.0006237030029296875, 0.0007872581481933594, 0.0021982192993164062, 0.003609180450439453, 0.0050201416015625, 0.006431102752685547, 0.007842063903808594, 0.00925302505493164, 0.010663986206054688, 0.012074947357177734, 0.013485908508300781, 0.014896869659423828, 0.016307830810546875, 0.017718791961669922, 0.01912975311279297, 0.020540714263916016, 0.021951675415039062, 0.02336263656616211, 0.024773597717285156, 0.026184558868408203, 0.02759552001953125, 0.029006481170654297, 0.030417442321777344, 0.03182840347290039, 0.03323936462402344, 0.034650325775146484, 0.03606128692626953, 0.03747224807739258, 0.038883209228515625, 0.04029417037963867, 0.04170513153076172, 0.043116092681884766, 0.04452705383300781, 0.04593801498413086, 0.047348976135253906, 0.04875993728637695, 0.0501708984375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 5.0, 9.0, 12.0, 8.0, 18.0, 15.0, 26.0, 35.0, 36.0, 32.0, 43.0, 48.0, 62.0, 64.0, 62.0, 75.0, 56.0, 69.0, 59.0, 35.0, 37.0, 42.0, 43.0, 23.0, 19.0, 10.0, 13.0, 5.0, 8.0, 12.0, 5.0, 1.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.061676025390625, -0.0599360466003418, -0.058196067810058594, -0.05645608901977539, -0.05471611022949219, -0.052976131439208984, -0.05123615264892578, -0.04949617385864258, -0.047756195068359375, -0.04601621627807617, -0.04427623748779297, -0.042536258697509766, -0.04079627990722656, -0.03905630111694336, -0.037316322326660156, -0.03557634353637695, -0.03383636474609375, -0.03209638595581055, -0.030356407165527344, -0.02861642837524414, -0.026876449584960938, -0.025136470794677734, -0.02339649200439453, -0.021656513214111328, -0.019916534423828125, -0.018176555633544922, -0.01643657684326172, -0.014696598052978516, -0.012956619262695312, -0.01121664047241211, -0.009476661682128906, -0.007736682891845703, -0.0059967041015625, -0.004256725311279297, -0.0025167465209960938, -0.0007767677307128906, 0.0009632110595703125, 0.0027031898498535156, 0.004443168640136719, 0.006183147430419922, 0.007923126220703125, 0.009663105010986328, 0.011403083801269531, 0.013143062591552734, 0.014883041381835938, 0.01662302017211914, 0.018362998962402344, 0.020102977752685547, 0.02184295654296875, 0.023582935333251953, 0.025322914123535156, 0.02706289291381836, 0.028802871704101562, 0.030542850494384766, 0.03228282928466797, 0.03402280807495117, 0.035762786865234375, 0.03750276565551758, 0.03924274444580078, 0.040982723236083984, 0.04272270202636719, 0.04446268081665039, 0.046202659606933594, 0.0479426383972168, 0.0496826171875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 7.0, 6.0, 24.0, 32.0, 47.0, 83.0, 117.0, 155.0, 161.0, 134.0, 105.0, 53.0, 29.0, 15.0, 11.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1331210136413574, -1.10261070728302, -1.0721004009246826, -1.0415900945663452, -1.0110797882080078, -0.9805694818496704, -0.9500591158866882, -0.9195488095283508, -0.8890385031700134, -0.858528196811676, -0.8280178904533386, -0.7975075840950012, -0.766997218132019, -0.7364869117736816, -0.7059766054153442, -0.6754662990570068, -0.6449559926986694, -0.614445686340332, -0.5839353799819946, -0.5534250736236572, -0.5229147672653198, -0.49240443110466003, -0.46189409494400024, -0.43138378858566284, -0.40087348222732544, -0.37036317586898804, -0.33985286951065063, -0.30934253334999084, -0.27883222699165344, -0.24832192063331604, -0.21781159937381744, -0.18730127811431885, -0.15679091215133667, -0.12628060579299927, -0.09577028453350067, -0.06525997072458267, -0.03474965691566467, -0.0042393505573272705, 0.026270970702171326, 0.05678129196166992, 0.08729159832000732, 0.11780191212892532, 0.14831222593784332, 0.17882254719734192, 0.20933285355567932, 0.23984315991401672, 0.2703534960746765, 0.3008638024330139, 0.3313741087913513, 0.3618844151496887, 0.3923947215080261, 0.4229050576686859, 0.4534153640270233, 0.4839256703853607, 0.5144360065460205, 0.5449463129043579, 0.5754566192626953, 0.6059669256210327, 0.6364772319793701, 0.6669875383377075, 0.6974978446960449, 0.7280081510543823, 0.7585185170173645, 0.7890288233757019, 0.8195391297340393]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 9.0, 8.0, 10.0, 12.0, 14.0, 11.0, 15.0, 19.0, 24.0, 23.0, 30.0, 31.0, 30.0, 34.0, 33.0, 37.0, 41.0, 49.0, 39.0, 40.0, 57.0, 51.0, 41.0, 35.0, 41.0, 40.0, 37.0, 33.0, 24.0, 24.0, 26.0, 13.0, 16.0, 10.0, 11.0, 14.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.628786027431488, -0.6077795624732971, -0.5867730379104614, -0.5657665729522705, -0.5447601079940796, -0.5237536430358887, -0.5027471780776978, -0.48174065351486206, -0.46073418855667114, -0.4397277235984802, -0.4187212288379669, -0.3977147340774536, -0.3767082691192627, -0.3557018041610718, -0.33469530940055847, -0.31368881464004517, -0.29268234968185425, -0.27167588472366333, -0.25066938996315, -0.2296629101037979, -0.2086564302444458, -0.1876499503850937, -0.16664347052574158, -0.14563699066638947, -0.12463051080703735, -0.10362403094768524, -0.08261755108833313, -0.06161107122898102, -0.040604591369628906, -0.019598111510276794, 0.0014083683490753174, 0.02241484820842743, 0.043421387672424316, 0.06442786753177643, 0.08543434739112854, 0.10644082725048065, 0.12744730710983276, 0.14845378696918488, 0.169460266828537, 0.1904667466878891, 0.2114732265472412, 0.23247970640659332, 0.25348618626594543, 0.27449268102645874, 0.29549914598464966, 0.3165056109428406, 0.3375121057033539, 0.3585186004638672, 0.3795250654220581, 0.400531530380249, 0.42153802514076233, 0.44254451990127563, 0.46355098485946655, 0.48455744981765747, 0.5055639743804932, 0.5265704393386841, 0.547576904296875, 0.5685833692550659, 0.5895898342132568, 0.6105963587760925, 0.6316028237342834, 0.6526092886924744, 0.6736158132553101, 0.694622278213501, 0.7156287431716919]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 6.0, 4.0, 12.0, 15.0, 14.0, 18.0, 28.0, 41.0, 71.0, 76.0, 131.0, 220.0, 384.0, 678.0, 1210.0, 2400.0, 5146.0, 11516.0, 28195.0, 75144.0, 213843.0, 572893.0, 1066852.0, 1127928.0, 654324.0, 269392.0, 97104.0, 37877.0, 15733.0, 6372.0, 2969.0, 1647.0, 831.0, 442.0, 293.0, 151.0, 114.0, 68.0, 40.0, 33.0, 19.0, 13.0, 9.0, 4.0, 5.0, 3.0, 4.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.08270263671875, -0.08012771606445312, -0.07755279541015625, -0.07497787475585938, -0.0724029541015625, -0.06982803344726562, -0.06725311279296875, -0.06467819213867188, -0.062103271484375, -0.059528350830078125, -0.05695343017578125, -0.054378509521484375, -0.0518035888671875, -0.049228668212890625, -0.04665374755859375, -0.044078826904296875, -0.04150390625, -0.038928985595703125, -0.03635406494140625, -0.033779144287109375, -0.0312042236328125, -0.028629302978515625, -0.02605438232421875, -0.023479461669921875, -0.020904541015625, -0.018329620361328125, -0.01575469970703125, -0.013179779052734375, -0.0106048583984375, -0.008029937744140625, -0.00545501708984375, -0.002880096435546875, -0.00030517578125, 0.002269744873046875, 0.00484466552734375, 0.007419586181640625, 0.0099945068359375, 0.012569427490234375, 0.01514434814453125, 0.017719268798828125, 0.020294189453125, 0.022869110107421875, 0.02544403076171875, 0.028018951416015625, 0.0305938720703125, 0.033168792724609375, 0.03574371337890625, 0.038318634033203125, 0.0408935546875, 0.043468475341796875, 0.04604339599609375, 0.048618316650390625, 0.0511932373046875, 0.053768157958984375, 0.05634307861328125, 0.058917999267578125, 0.061492919921875, 0.06406784057617188, 0.06664276123046875, 0.06921768188476562, 0.0717926025390625, 0.07436752319335938, 0.07694244384765625, 0.07951736450195312, 0.08209228515625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 6.0, 7.0, 10.0, 18.0, 14.0, 18.0, 33.0, 19.0, 34.0, 45.0, 58.0, 42.0, 67.0, 64.0, 48.0, 71.0, 49.0, 51.0, 60.0, 43.0, 44.0, 39.0, 38.0, 27.0, 32.0, 17.0, 13.0, 9.0, 7.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1456298828125, -0.14133262634277344, -0.13703536987304688, -0.1327381134033203, -0.12844085693359375, -0.12414360046386719, -0.11984634399414062, -0.11554908752441406, -0.1112518310546875, -0.10695457458496094, -0.10265731811523438, -0.09836006164550781, -0.09406280517578125, -0.08976554870605469, -0.08546829223632812, -0.08117103576660156, -0.076873779296875, -0.07257652282714844, -0.06827926635742188, -0.06398200988769531, -0.05968475341796875, -0.05538749694824219, -0.051090240478515625, -0.04679298400878906, -0.0424957275390625, -0.03819847106933594, -0.033901214599609375, -0.029603958129882812, -0.02530670166015625, -0.021009445190429688, -0.016712188720703125, -0.012414932250976562, -0.00811767578125, -0.0038204193115234375, 0.000476837158203125, 0.0047740936279296875, 0.00907135009765625, 0.013368606567382812, 0.017665863037109375, 0.021963119506835938, 0.0262603759765625, 0.030557632446289062, 0.034854888916015625, 0.03915214538574219, 0.04344940185546875, 0.04774665832519531, 0.052043914794921875, 0.05634117126464844, 0.060638427734375, 0.06493568420410156, 0.06923294067382812, 0.07353019714355469, 0.07782745361328125, 0.08212471008300781, 0.08642196655273438, 0.09071922302246094, 0.0950164794921875, 0.09931373596191406, 0.10361099243164062, 0.10790824890136719, 0.11220550537109375, 0.11650276184082031, 0.12080001831054688, 0.12509727478027344, 0.12939453125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 8.0, 10.0, 15.0, 17.0, 19.0, 41.0, 58.0, 84.0, 173.0, 313.0, 632.0, 1758.0, 6026.0, 28346.0, 225764.0, 2960943.0, 881524.0, 71287.0, 12129.0, 3059.0, 1111.0, 468.0, 201.0, 126.0, 62.0, 51.0, 21.0, 13.0, 16.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1622314453125, -0.15440940856933594, -0.14658737182617188, -0.1387653350830078, -0.13094329833984375, -0.12312126159667969, -0.11529922485351562, -0.10747718811035156, -0.0996551513671875, -0.09183311462402344, -0.08401107788085938, -0.07618904113769531, -0.06836700439453125, -0.06054496765136719, -0.052722930908203125, -0.04490089416503906, -0.037078857421875, -0.029256820678710938, -0.021434783935546875, -0.013612747192382812, -0.00579071044921875, 0.0020313262939453125, 0.009853363037109375, 0.017675399780273438, 0.0254974365234375, 0.03331947326660156, 0.041141510009765625, 0.04896354675292969, 0.05678558349609375, 0.06460762023925781, 0.07242965698242188, 0.08025169372558594, 0.08807373046875, 0.09589576721191406, 0.10371780395507812, 0.11153984069824219, 0.11936187744140625, 0.1271839141845703, 0.13500595092773438, 0.14282798767089844, 0.1506500244140625, 0.15847206115722656, 0.16629409790039062, 0.1741161346435547, 0.18193817138671875, 0.1897602081298828, 0.19758224487304688, 0.20540428161621094, 0.213226318359375, 0.22104835510253906, 0.22887039184570312, 0.2366924285888672, 0.24451446533203125, 0.2523365020751953, 0.2601585388183594, 0.26798057556152344, 0.2758026123046875, 0.28362464904785156, 0.2914466857910156, 0.2992687225341797, 0.30709075927734375, 0.3149127960205078, 0.3227348327636719, 0.33055686950683594, 0.33837890625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 0.0, 2.0, 3.0, 10.0, 3.0, 15.0, 18.0, 15.0, 23.0, 40.0, 40.0, 70.0, 120.0, 181.0, 318.0, 498.0, 638.0, 685.0, 514.0, 305.0, 180.0, 124.0, 73.0, 64.0, 48.0, 23.0, 24.0, 17.0, 7.0, 10.0, 3.0, 1.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.160400390625, -0.1537017822265625, -0.147003173828125, -0.1403045654296875, -0.13360595703125, -0.1269073486328125, -0.120208740234375, -0.1135101318359375, -0.1068115234375, -0.1001129150390625, -0.093414306640625, -0.0867156982421875, -0.08001708984375, -0.0733184814453125, -0.066619873046875, -0.0599212646484375, -0.05322265625, -0.0465240478515625, -0.039825439453125, -0.0331268310546875, -0.02642822265625, -0.0197296142578125, -0.013031005859375, -0.0063323974609375, 0.0003662109375, 0.0070648193359375, 0.013763427734375, 0.0204620361328125, 0.02716064453125, 0.0338592529296875, 0.040557861328125, 0.0472564697265625, 0.053955078125, 0.0606536865234375, 0.067352294921875, 0.0740509033203125, 0.08074951171875, 0.0874481201171875, 0.094146728515625, 0.1008453369140625, 0.1075439453125, 0.1142425537109375, 0.120941162109375, 0.1276397705078125, 0.13433837890625, 0.1410369873046875, 0.147735595703125, 0.1544342041015625, 0.1611328125, 0.1678314208984375, 0.174530029296875, 0.1812286376953125, 0.18792724609375, 0.1946258544921875, 0.201324462890625, 0.2080230712890625, 0.2147216796875, 0.2214202880859375, 0.228118896484375, 0.2348175048828125, 0.24151611328125, 0.2482147216796875, 0.254913330078125, 0.2616119384765625, 0.268310546875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 11.0, 24.0, 42.0, 76.0, 152.0, 211.0, 181.0, 132.0, 89.0, 46.0, 18.0, 11.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.6986613273620605, -1.6522955894470215, -1.6059297323226929, -1.5595639944076538, -1.5131982564926147, -1.4668323993682861, -1.420466661453247, -1.374100923538208, -1.327735185623169, -1.2813694477081299, -1.2350035905838013, -1.1886378526687622, -1.1422721147537231, -1.0959062576293945, -1.0495405197143555, -1.0031747817993164, -0.9568089246749878, -0.910443127155304, -0.8640773892402649, -0.817711591720581, -0.771345853805542, -0.7249800562858582, -0.6786142587661743, -0.6322485208511353, -0.5858827233314514, -0.5395169258117676, -0.4931511878967285, -0.4467853903770447, -0.4004196226596832, -0.3540538549423218, -0.30768805742263794, -0.2613222897052765, -0.2149564027786255, -0.16859063506126404, -0.1222248524427414, -0.07585906982421875, -0.0294933021068573, 0.01687246561050415, 0.06323826313018799, 0.10960403084754944, 0.1559697985649109, 0.20233556628227234, 0.24870134890079498, 0.2950671315193176, 0.3414328992366791, 0.3877986669540405, 0.43416446447372437, 0.4805302321910858, 0.5268959999084473, 0.5732617974281311, 0.6196275353431702, 0.665993332862854, 0.7123590707778931, 0.7587248682975769, 0.8050906658172607, 0.8514564037322998, 0.8978222012519836, 0.9441879987716675, 0.9905537366867065, 1.0369195938110352, 1.0832853317260742, 1.1296510696411133, 1.1760168075561523, 1.222382664680481, 1.26874840259552]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 4.0, 1.0, 6.0, 12.0, 9.0, 3.0, 11.0, 7.0, 18.0, 14.0, 12.0, 18.0, 23.0, 22.0, 30.0, 33.0, 30.0, 36.0, 40.0, 41.0, 33.0, 36.0, 28.0, 40.0, 41.0, 43.0, 38.0, 35.0, 42.0, 28.0, 41.0, 25.0, 29.0, 21.0, 24.0, 28.0, 21.0, 13.0, 11.0, 16.0, 10.0, 15.0, 6.0, 2.0, 5.0, 6.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5187353491783142, -0.5014481544494629, -0.4841609001159668, -0.4668736755847931, -0.4495864510536194, -0.43229925632476807, -0.41501203179359436, -0.39772480726242065, -0.38043758273124695, -0.36315035820007324, -0.34586313366889954, -0.32857590913772583, -0.3112887144088745, -0.2940014600753784, -0.2767142653465271, -0.2594270408153534, -0.2421398162841797, -0.22485259175300598, -0.20756536722183228, -0.19027815759181976, -0.17299093306064606, -0.15570370852947235, -0.13841649889945984, -0.12112927436828613, -0.10384204983711243, -0.08655482530593872, -0.06926760822534561, -0.051980387419462204, -0.034693166613578796, -0.01740594208240509, -0.0001187250018119812, 0.017168492078781128, 0.034455716609954834, 0.05174293741583824, 0.06903015822172165, 0.08631737530231476, 0.10360459983348846, 0.12089182436466217, 0.13817903399467468, 0.1554662585258484, 0.1727534830570221, 0.1900407075881958, 0.2073279321193695, 0.22461514174938202, 0.24190236628055573, 0.2591896057128906, 0.27647680044174194, 0.29376402497291565, 0.31105124950408936, 0.32833847403526306, 0.34562569856643677, 0.3629129230976105, 0.3802001476287842, 0.3974873423576355, 0.4147745668888092, 0.4320617914199829, 0.4493490159511566, 0.4666362404823303, 0.48392346501350403, 0.5012106895446777, 0.518497884273529, 0.5357851386070251, 0.5530723333358765, 0.5703595876693726, 0.5876467823982239]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 12.0, 13.0, 20.0, 24.0, 45.0, 52.0, 93.0, 170.0, 332.0, 643.0, 1174.0, 2337.0, 5010.0, 10437.0, 23072.0, 53249.0, 120917.0, 237835.0, 279456.0, 171943.0, 78853.0, 33785.0, 15353.0, 6995.0, 3256.0, 1697.0, 817.0, 404.0, 240.0, 137.0, 69.0, 48.0, 20.0, 20.0, 9.0, 9.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1365966796875, -0.13222312927246094, -0.12784957885742188, -0.12347602844238281, -0.11910247802734375, -0.11472892761230469, -0.11035537719726562, -0.10598182678222656, -0.1016082763671875, -0.09723472595214844, -0.09286117553710938, -0.08848762512207031, -0.08411407470703125, -0.07974052429199219, -0.07536697387695312, -0.07099342346191406, -0.066619873046875, -0.06224632263183594, -0.057872772216796875, -0.05349922180175781, -0.04912567138671875, -0.04475212097167969, -0.040378570556640625, -0.03600502014160156, -0.0316314697265625, -0.027257919311523438, -0.022884368896484375, -0.018510818481445312, -0.01413726806640625, -0.009763717651367188, -0.005390167236328125, -0.0010166168212890625, 0.00335693359375, 0.0077304840087890625, 0.012104034423828125, 0.016477584838867188, 0.02085113525390625, 0.025224685668945312, 0.029598236083984375, 0.03397178649902344, 0.0383453369140625, 0.04271888732910156, 0.047092437744140625, 0.05146598815917969, 0.05583953857421875, 0.06021308898925781, 0.06458663940429688, 0.06896018981933594, 0.073333740234375, 0.07770729064941406, 0.08208084106445312, 0.08645439147949219, 0.09082794189453125, 0.09520149230957031, 0.09957504272460938, 0.10394859313964844, 0.1083221435546875, 0.11269569396972656, 0.11706924438476562, 0.12144279479980469, 0.12581634521484375, 0.1301898956298828, 0.13456344604492188, 0.13893699645996094, 0.143310546875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 2.0, 4.0, 10.0, 8.0, 14.0, 12.0, 20.0, 26.0, 25.0, 49.0, 64.0, 62.0, 59.0, 72.0, 77.0, 65.0, 59.0, 53.0, 66.0, 56.0, 42.0, 36.0, 35.0, 30.0, 17.0, 13.0, 10.0, 6.0, 5.0, 2.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.200439453125, -0.19531631469726562, -0.19019317626953125, -0.18507003784179688, -0.1799468994140625, -0.17482376098632812, -0.16970062255859375, -0.16457748413085938, -0.159454345703125, -0.15433120727539062, -0.14920806884765625, -0.14408493041992188, -0.1389617919921875, -0.13383865356445312, -0.12871551513671875, -0.12359237670898438, -0.11846923828125, -0.11334609985351562, -0.10822296142578125, -0.10309982299804688, -0.0979766845703125, -0.09285354614257812, -0.08773040771484375, -0.08260726928710938, -0.077484130859375, -0.07236099243164062, -0.06723785400390625, -0.062114715576171875, -0.0569915771484375, -0.051868438720703125, -0.04674530029296875, -0.041622161865234375, -0.0364990234375, -0.031375885009765625, -0.02625274658203125, -0.021129608154296875, -0.0160064697265625, -0.010883331298828125, -0.00576019287109375, -0.000637054443359375, 0.004486083984375, 0.009609222412109375, 0.01473236083984375, 0.019855499267578125, 0.0249786376953125, 0.030101776123046875, 0.03522491455078125, 0.040348052978515625, 0.04547119140625, 0.050594329833984375, 0.05571746826171875, 0.060840606689453125, 0.0659637451171875, 0.07108688354492188, 0.07621002197265625, 0.08133316040039062, 0.086456298828125, 0.09157943725585938, 0.09670257568359375, 0.10182571411132812, 0.1069488525390625, 0.11207199096679688, 0.11719512939453125, 0.12231826782226562, 0.12744140625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 8.0, 3.0, 5.0, 12.0, 14.0, 26.0, 42.0, 56.0, 91.0, 135.0, 233.0, 419.0, 701.0, 1449.0, 2977.0, 6295.0, 14235.0, 34164.0, 85071.0, 207739.0, 335792.0, 211332.0, 85987.0, 34848.0, 14396.0, 6383.0, 2878.0, 1513.0, 743.0, 399.0, 208.0, 131.0, 86.0, 51.0, 38.0, 34.0, 18.0, 11.0, 7.0, 10.0, 10.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1717529296875, -0.16630172729492188, -0.16085052490234375, -0.15539932250976562, -0.1499481201171875, -0.14449691772460938, -0.13904571533203125, -0.13359451293945312, -0.128143310546875, -0.12269210815429688, -0.11724090576171875, -0.11178970336914062, -0.1063385009765625, -0.10088729858398438, -0.09543609619140625, -0.08998489379882812, -0.08453369140625, -0.07908248901367188, -0.07363128662109375, -0.06818008422851562, -0.0627288818359375, -0.057277679443359375, -0.05182647705078125, -0.046375274658203125, -0.040924072265625, -0.035472869873046875, -0.03002166748046875, -0.024570465087890625, -0.0191192626953125, -0.013668060302734375, -0.00821685791015625, -0.002765655517578125, 0.002685546875, 0.008136749267578125, 0.01358795166015625, 0.019039154052734375, 0.0244903564453125, 0.029941558837890625, 0.03539276123046875, 0.040843963623046875, 0.046295166015625, 0.051746368408203125, 0.05719757080078125, 0.06264877319335938, 0.0680999755859375, 0.07355117797851562, 0.07900238037109375, 0.08445358276367188, 0.08990478515625, 0.09535598754882812, 0.10080718994140625, 0.10625839233398438, 0.1117095947265625, 0.11716079711914062, 0.12261199951171875, 0.12806320190429688, 0.133514404296875, 0.13896560668945312, 0.14441680908203125, 0.14986801147460938, 0.1553192138671875, 0.16077041625976562, 0.16622161865234375, 0.17167282104492188, 0.1771240234375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 5.0, 1.0, 1.0, 2.0, 5.0, 12.0, 9.0, 5.0, 15.0, 18.0, 15.0, 20.0, 26.0, 27.0, 25.0, 31.0, 32.0, 30.0, 42.0, 37.0, 47.0, 47.0, 39.0, 38.0, 45.0, 47.0, 41.0, 38.0, 42.0, 36.0, 30.0, 28.0, 20.0, 29.0, 18.0, 10.0, 18.0, 15.0, 21.0, 4.0, 10.0, 5.0, 2.0, 7.0, 5.0, 1.0, 0.0, 6.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.299072265625, -0.2895011901855469, -0.27993011474609375, -0.2703590393066406, -0.2607879638671875, -0.2512168884277344, -0.24164581298828125, -0.23207473754882812, -0.222503662109375, -0.21293258666992188, -0.20336151123046875, -0.19379043579101562, -0.1842193603515625, -0.17464828491210938, -0.16507720947265625, -0.15550613403320312, -0.14593505859375, -0.13636398315429688, -0.12679290771484375, -0.11722183227539062, -0.1076507568359375, -0.09807968139648438, -0.08850860595703125, -0.07893753051757812, -0.069366455078125, -0.059795379638671875, -0.05022430419921875, -0.040653228759765625, -0.0310821533203125, -0.021511077880859375, -0.01194000244140625, -0.002368927001953125, 0.0072021484375, 0.016773223876953125, 0.02634429931640625, 0.035915374755859375, 0.0454864501953125, 0.055057525634765625, 0.06462860107421875, 0.07419967651367188, 0.083770751953125, 0.09334182739257812, 0.10291290283203125, 0.11248397827148438, 0.1220550537109375, 0.13162612915039062, 0.14119720458984375, 0.15076828002929688, 0.16033935546875, 0.16991043090820312, 0.17948150634765625, 0.18905258178710938, 0.1986236572265625, 0.20819473266601562, 0.21776580810546875, 0.22733688354492188, 0.236907958984375, 0.24647903442382812, 0.25605010986328125, 0.2656211853027344, 0.2751922607421875, 0.2847633361816406, 0.29433441162109375, 0.3039054870605469, 0.3134765625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 5.0, 5.0, 9.0, 7.0, 12.0, 35.0, 29.0, 49.0, 87.0, 151.0, 277.0, 461.0, 865.0, 1644.0, 3280.0, 6625.0, 13827.0, 28980.0, 63935.0, 145446.0, 271422.0, 262246.0, 135731.0, 60124.0, 27396.0, 12851.0, 6293.0, 3287.0, 1605.0, 813.0, 443.0, 243.0, 150.0, 85.0, 52.0, 23.0, 22.0, 11.0, 12.0, 7.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04669189453125, -0.045230865478515625, -0.04376983642578125, -0.042308807373046875, -0.0408477783203125, -0.039386749267578125, -0.03792572021484375, -0.036464691162109375, -0.035003662109375, -0.033542633056640625, -0.03208160400390625, -0.030620574951171875, -0.0291595458984375, -0.027698516845703125, -0.02623748779296875, -0.024776458740234375, -0.0233154296875, -0.021854400634765625, -0.02039337158203125, -0.018932342529296875, -0.0174713134765625, -0.016010284423828125, -0.01454925537109375, -0.013088226318359375, -0.011627197265625, -0.010166168212890625, -0.00870513916015625, -0.007244110107421875, -0.0057830810546875, -0.004322052001953125, -0.00286102294921875, -0.001399993896484375, 6.103515625e-05, 0.001522064208984375, 0.00298309326171875, 0.004444122314453125, 0.0059051513671875, 0.007366180419921875, 0.00882720947265625, 0.010288238525390625, 0.011749267578125, 0.013210296630859375, 0.01467132568359375, 0.016132354736328125, 0.0175933837890625, 0.019054412841796875, 0.02051544189453125, 0.021976470947265625, 0.0234375, 0.024898529052734375, 0.02635955810546875, 0.027820587158203125, 0.0292816162109375, 0.030742645263671875, 0.03220367431640625, 0.033664703369140625, 0.035125732421875, 0.036586761474609375, 0.03804779052734375, 0.039508819580078125, 0.0409698486328125, 0.042430877685546875, 0.04389190673828125, 0.045352935791015625, 0.04681396484375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 6.0, 10.0, 11.0, 12.0, 11.0, 17.0, 16.0, 21.0, 39.0, 43.0, 50.0, 71.0, 54.0, 76.0, 76.0, 78.0, 78.0, 68.0, 42.0, 40.0, 32.0, 22.0, 31.0, 17.0, 14.0, 10.0, 11.0, 5.0, 6.0, 7.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7404556274414062e-05, -1.6884878277778625e-05, -1.636520028114319e-05, -1.584552228450775e-05, -1.5325844287872314e-05, -1.4806166291236877e-05, -1.428648829460144e-05, -1.3766810297966003e-05, -1.3247132301330566e-05, -1.272745430469513e-05, -1.2207776308059692e-05, -1.1688098311424255e-05, -1.1168420314788818e-05, -1.0648742318153381e-05, -1.0129064321517944e-05, -9.609386324882507e-06, -9.08970832824707e-06, -8.570030331611633e-06, -8.050352334976196e-06, -7.530674338340759e-06, -7.010996341705322e-06, -6.491318345069885e-06, -5.971640348434448e-06, -5.451962351799011e-06, -4.932284355163574e-06, -4.412606358528137e-06, -3.8929283618927e-06, -3.373250365257263e-06, -2.853572368621826e-06, -2.333894371986389e-06, -1.8142163753509521e-06, -1.2945383787155151e-06, -7.748603820800781e-07, -2.551823854446411e-07, 2.644956111907959e-07, 7.841736078262329e-07, 1.30385160446167e-06, 1.823529601097107e-06, 2.343207597732544e-06, 2.862885594367981e-06, 3.382563591003418e-06, 3.902241587638855e-06, 4.421919584274292e-06, 4.941597580909729e-06, 5.461275577545166e-06, 5.980953574180603e-06, 6.50063157081604e-06, 7.020309567451477e-06, 7.539987564086914e-06, 8.059665560722351e-06, 8.579343557357788e-06, 9.099021553993225e-06, 9.618699550628662e-06, 1.0138377547264099e-05, 1.0658055543899536e-05, 1.1177733540534973e-05, 1.169741153717041e-05, 1.2217089533805847e-05, 1.2736767530441284e-05, 1.3256445527076721e-05, 1.3776123523712158e-05, 1.4295801520347595e-05, 1.4815479516983032e-05, 1.533515751361847e-05, 1.5854835510253906e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 2.0, 6.0, 12.0, 7.0, 13.0, 22.0, 22.0, 34.0, 68.0, 82.0, 130.0, 170.0, 310.0, 574.0, 1060.0, 1976.0, 4014.0, 8143.0, 16585.0, 35271.0, 73955.0, 150133.0, 244731.0, 237650.0, 141357.0, 68493.0, 32542.0, 15625.0, 7596.0, 3699.0, 1907.0, 963.0, 525.0, 319.0, 171.0, 118.0, 79.0, 52.0, 34.0, 34.0, 23.0, 16.0, 10.0, 4.0, 9.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04095458984375, -0.0396728515625, -0.03839111328125, -0.037109375, -0.03582763671875, -0.0345458984375, -0.03326416015625, -0.031982421875, -0.03070068359375, -0.0294189453125, -0.02813720703125, -0.02685546875, -0.02557373046875, -0.0242919921875, -0.02301025390625, -0.021728515625, -0.02044677734375, -0.0191650390625, -0.01788330078125, -0.0166015625, -0.01531982421875, -0.0140380859375, -0.01275634765625, -0.011474609375, -0.01019287109375, -0.0089111328125, -0.00762939453125, -0.00634765625, -0.00506591796875, -0.0037841796875, -0.00250244140625, -0.001220703125, 6.103515625e-05, 0.0013427734375, 0.00262451171875, 0.00390625, 0.00518798828125, 0.0064697265625, 0.00775146484375, 0.009033203125, 0.01031494140625, 0.0115966796875, 0.01287841796875, 0.01416015625, 0.01544189453125, 0.0167236328125, 0.01800537109375, 0.019287109375, 0.02056884765625, 0.0218505859375, 0.02313232421875, 0.0244140625, 0.02569580078125, 0.0269775390625, 0.02825927734375, 0.029541015625, 0.03082275390625, 0.0321044921875, 0.03338623046875, 0.03466796875, 0.03594970703125, 0.0372314453125, 0.03851318359375, 0.039794921875, 0.04107666015625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 5.0, 4.0, 4.0, 4.0, 6.0, 5.0, 6.0, 14.0, 14.0, 18.0, 14.0, 29.0, 40.0, 36.0, 39.0, 56.0, 57.0, 61.0, 75.0, 72.0, 59.0, 47.0, 61.0, 36.0, 37.0, 38.0, 31.0, 26.0, 28.0, 15.0, 10.0, 12.0, 14.0, 9.0, 6.0, 2.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.050384521484375, -0.04865837097167969, -0.046932220458984375, -0.04520606994628906, -0.04347991943359375, -0.04175376892089844, -0.040027618408203125, -0.03830146789550781, -0.0365753173828125, -0.03484916687011719, -0.033123016357421875, -0.03139686584472656, -0.02967071533203125, -0.027944564819335938, -0.026218414306640625, -0.024492263793945312, -0.02276611328125, -0.021039962768554688, -0.019313812255859375, -0.017587661743164062, -0.01586151123046875, -0.014135360717773438, -0.012409210205078125, -0.010683059692382812, -0.0089569091796875, -0.0072307586669921875, -0.005504608154296875, -0.0037784576416015625, -0.00205230712890625, -0.0003261566162109375, 0.001399993896484375, 0.0031261444091796875, 0.004852294921875, 0.0065784454345703125, 0.008304595947265625, 0.010030746459960938, 0.01175689697265625, 0.013483047485351562, 0.015209197998046875, 0.016935348510742188, 0.0186614990234375, 0.020387649536132812, 0.022113800048828125, 0.023839950561523438, 0.02556610107421875, 0.027292251586914062, 0.029018402099609375, 0.030744552612304688, 0.032470703125, 0.03419685363769531, 0.035923004150390625, 0.03764915466308594, 0.03937530517578125, 0.04110145568847656, 0.042827606201171875, 0.04455375671386719, 0.0462799072265625, 0.04800605773925781, 0.049732208251953125, 0.05145835876464844, 0.05318450927734375, 0.05491065979003906, 0.056636810302734375, 0.05836296081542969, 0.060089111328125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 1.0, 2.0, 5.0, 10.0, 15.0, 66.0, 165.0, 234.0, 263.0, 146.0, 60.0, 21.0, 8.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.471949338912964, -2.413187026977539, -2.3544247150421143, -2.2956624031066895, -2.2369000911712646, -2.17813777923584, -2.119375467300415, -2.0606131553649902, -2.0018506050109863, -1.9430882930755615, -1.8843259811401367, -1.825563669204712, -1.766801357269287, -1.7080390453338623, -1.649276614189148, -1.5905143022537231, -1.531752109527588, -1.472989797592163, -1.4142274856567383, -1.3554651737213135, -1.2967028617858887, -1.2379405498504639, -1.1791781187057495, -1.1204158067703247, -1.0616534948349, -1.002891182899475, -0.9441288709640503, -0.8853664994239807, -0.8266041874885559, -0.7678418755531311, -0.7090795040130615, -0.6503171920776367, -0.5915548801422119, -0.5327925682067871, -0.4740302264690399, -0.4152678847312927, -0.3565055727958679, -0.2977432608604431, -0.23898091912269592, -0.18021857738494873, -0.12145626544952393, -0.06269393861293793, -0.003931611776351929, 0.05483071506023407, 0.11359304189682007, 0.17235535383224487, 0.23111769556999207, 0.28988003730773926, 0.34864234924316406, 0.40740466117858887, 0.46616700291633606, 0.5249293446540833, 0.5836916565895081, 0.6424539685249329, 0.7012163400650024, 0.7599786520004272, 0.818740963935852, 0.8775032758712769, 0.9362655878067017, 0.9950279593467712, 1.0537903308868408, 1.1125526428222656, 1.1713149547576904, 1.2300772666931152, 1.28883957862854]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 3.0, 6.0, 12.0, 16.0, 16.0, 12.0, 20.0, 21.0, 29.0, 32.0, 24.0, 26.0, 27.0, 44.0, 49.0, 35.0, 43.0, 50.0, 42.0, 46.0, 44.0, 50.0, 36.0, 42.0, 29.0, 43.0, 24.0, 33.0, 21.0, 23.0, 19.0, 15.0, 16.0, 13.0, 11.0, 7.0, 9.0, 5.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.8290795087814331, -0.8060147762298584, -0.7829501032829285, -0.7598853707313538, -0.7368206977844238, -0.7137559652328491, -0.6906912326812744, -0.6676265001296997, -0.6445618271827698, -0.6214970946311951, -0.5984324216842651, -0.5753676891326904, -0.5523029565811157, -0.5292382836341858, -0.5061735510826111, -0.48310884833335876, -0.46004414558410645, -0.4369794428348541, -0.4139147400856018, -0.3908500075340271, -0.3677853047847748, -0.34472060203552246, -0.32165586948394775, -0.29859116673469543, -0.2755264639854431, -0.2524617612361908, -0.22939704358577728, -0.20633232593536377, -0.18326762318611145, -0.16020292043685913, -0.13713820278644562, -0.1140734851360321, -0.09100878238677979, -0.06794407218694687, -0.04487936198711395, -0.021814651787281036, 0.0012500584125518799, 0.024314768612384796, 0.04737947881221771, 0.07044419646263123, 0.09350889921188354, 0.11657360941171646, 0.13963831961154938, 0.1627030372619629, 0.1857677400112152, 0.20883244276046753, 0.23189716041088104, 0.25496187806129456, 0.2780265808105469, 0.3010912835597992, 0.3241559863090515, 0.3472207188606262, 0.37028542160987854, 0.39335012435913086, 0.41641485691070557, 0.4394795596599579, 0.4625442624092102, 0.4856089651584625, 0.5086736679077148, 0.5317384004592896, 0.5548031330108643, 0.5778678059577942, 0.6009325385093689, 0.6239972114562988, 0.6470619440078735]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 6.0, 7.0, 6.0, 19.0, 14.0, 17.0, 39.0, 50.0, 52.0, 97.0, 132.0, 181.0, 317.0, 544.0, 843.0, 1461.0, 2745.0, 5350.0, 11111.0, 23822.0, 58587.0, 143069.0, 318802.0, 604479.0, 887077.0, 891145.0, 628336.0, 342811.0, 152984.0, 62632.0, 28702.0, 14042.0, 6935.0, 3515.0, 1782.0, 977.0, 607.0, 330.0, 221.0, 155.0, 87.0, 55.0, 41.0, 24.0, 24.0, 19.0, 5.0, 12.0, 3.0, 6.0, 5.0, 1.0, 2.0, 3.0, 3.0, 1.0], "bins": [-0.072998046875, -0.07078933715820312, -0.06858062744140625, -0.06637191772460938, -0.0641632080078125, -0.061954498291015625, -0.05974578857421875, -0.057537078857421875, -0.055328369140625, -0.053119659423828125, -0.05091094970703125, -0.048702239990234375, -0.0464935302734375, -0.044284820556640625, -0.04207611083984375, -0.039867401123046875, -0.03765869140625, -0.035449981689453125, -0.03324127197265625, -0.031032562255859375, -0.0288238525390625, -0.026615142822265625, -0.02440643310546875, -0.022197723388671875, -0.019989013671875, -0.017780303955078125, -0.01557159423828125, -0.013362884521484375, -0.0111541748046875, -0.008945465087890625, -0.00673675537109375, -0.004528045654296875, -0.0023193359375, -0.000110626220703125, 0.00209808349609375, 0.004306793212890625, 0.0065155029296875, 0.008724212646484375, 0.01093292236328125, 0.013141632080078125, 0.015350341796875, 0.017559051513671875, 0.01976776123046875, 0.021976470947265625, 0.0241851806640625, 0.026393890380859375, 0.02860260009765625, 0.030811309814453125, 0.03302001953125, 0.035228729248046875, 0.03743743896484375, 0.039646148681640625, 0.0418548583984375, 0.044063568115234375, 0.04627227783203125, 0.048480987548828125, 0.050689697265625, 0.052898406982421875, 0.05510711669921875, 0.057315826416015625, 0.0595245361328125, 0.061733245849609375, 0.06394195556640625, 0.06615066528320312, 0.068359375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 7.0, 7.0, 11.0, 12.0, 15.0, 15.0, 22.0, 31.0, 32.0, 33.0, 37.0, 47.0, 43.0, 42.0, 52.0, 46.0, 49.0, 61.0, 56.0, 46.0, 50.0, 41.0, 44.0, 39.0, 29.0, 29.0, 19.0, 14.0, 17.0, 16.0, 12.0, 14.0, 9.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1307373046875, -0.1268625259399414, -0.12298774719238281, -0.11911296844482422, -0.11523818969726562, -0.11136341094970703, -0.10748863220214844, -0.10361385345458984, -0.09973907470703125, -0.09586429595947266, -0.09198951721191406, -0.08811473846435547, -0.08423995971679688, -0.08036518096923828, -0.07649040222167969, -0.0726156234741211, -0.0687408447265625, -0.0648660659790039, -0.06099128723144531, -0.05711650848388672, -0.053241729736328125, -0.04936695098876953, -0.04549217224121094, -0.041617393493652344, -0.03774261474609375, -0.033867835998535156, -0.029993057250976562, -0.02611827850341797, -0.022243499755859375, -0.01836872100830078, -0.014493942260742188, -0.010619163513183594, -0.006744384765625, -0.0028696060180664062, 0.0010051727294921875, 0.004879951477050781, 0.008754730224609375, 0.012629508972167969, 0.016504287719726562, 0.020379066467285156, 0.02425384521484375, 0.028128623962402344, 0.03200340270996094, 0.03587818145751953, 0.039752960205078125, 0.04362773895263672, 0.04750251770019531, 0.051377296447753906, 0.0552520751953125, 0.059126853942871094, 0.06300163269042969, 0.06687641143798828, 0.07075119018554688, 0.07462596893310547, 0.07850074768066406, 0.08237552642822266, 0.08625030517578125, 0.09012508392333984, 0.09399986267089844, 0.09787464141845703, 0.10174942016601562, 0.10562419891357422, 0.10949897766113281, 0.1133737564086914, 0.11724853515625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 11.0, 15.0, 15.0, 23.0, 21.0, 26.0, 34.0, 60.0, 81.0, 111.0, 205.0, 577.0, 3341.0, 103187.0, 3944033.0, 137384.0, 3934.0, 567.0, 222.0, 117.0, 83.0, 68.0, 58.0, 38.0, 15.0, 20.0, 11.0, 8.0, 4.0, 6.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3798828125, -0.3630218505859375, -0.346160888671875, -0.3292999267578125, -0.31243896484375, -0.2955780029296875, -0.278717041015625, -0.2618560791015625, -0.2449951171875, -0.2281341552734375, -0.211273193359375, -0.1944122314453125, -0.17755126953125, -0.1606903076171875, -0.143829345703125, -0.1269683837890625, -0.110107421875, -0.0932464599609375, -0.076385498046875, -0.0595245361328125, -0.04266357421875, -0.0258026123046875, -0.008941650390625, 0.0079193115234375, 0.0247802734375, 0.0416412353515625, 0.058502197265625, 0.0753631591796875, 0.09222412109375, 0.1090850830078125, 0.125946044921875, 0.1428070068359375, 0.15966796875, 0.1765289306640625, 0.193389892578125, 0.2102508544921875, 0.22711181640625, 0.2439727783203125, 0.260833740234375, 0.2776947021484375, 0.2945556640625, 0.3114166259765625, 0.328277587890625, 0.3451385498046875, 0.36199951171875, 0.3788604736328125, 0.395721435546875, 0.4125823974609375, 0.429443359375, 0.4463043212890625, 0.463165283203125, 0.4800262451171875, 0.49688720703125, 0.5137481689453125, 0.530609130859375, 0.5474700927734375, 0.5643310546875, 0.5811920166015625, 0.598052978515625, 0.6149139404296875, 0.63177490234375, 0.6486358642578125, 0.665496826171875, 0.6823577880859375, 0.69921875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 9.0, 15.0, 54.0, 89.0, 220.0, 643.0, 1454.0, 1010.0, 379.0, 124.0, 48.0, 22.0, 9.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.343017578125, -0.3272209167480469, -0.31142425537109375, -0.2956275939941406, -0.2798309326171875, -0.2640342712402344, -0.24823760986328125, -0.23244094848632812, -0.216644287109375, -0.20084762573242188, -0.18505096435546875, -0.16925430297851562, -0.1534576416015625, -0.13766098022460938, -0.12186431884765625, -0.10606765747070312, -0.09027099609375, -0.07447433471679688, -0.05867767333984375, -0.042881011962890625, -0.0270843505859375, -0.011287689208984375, 0.00450897216796875, 0.020305633544921875, 0.036102294921875, 0.051898956298828125, 0.06769561767578125, 0.08349227905273438, 0.0992889404296875, 0.11508560180664062, 0.13088226318359375, 0.14667892456054688, 0.1624755859375, 0.17827224731445312, 0.19406890869140625, 0.20986557006835938, 0.2256622314453125, 0.24145889282226562, 0.25725555419921875, 0.2730522155761719, 0.288848876953125, 0.3046455383300781, 0.32044219970703125, 0.3362388610839844, 0.3520355224609375, 0.3678321838378906, 0.38362884521484375, 0.3994255065917969, 0.41522216796875, 0.4310188293457031, 0.44681549072265625, 0.4626121520996094, 0.4784088134765625, 0.4942054748535156, 0.5100021362304688, 0.5257987976074219, 0.541595458984375, 0.5573921203613281, 0.5731887817382812, 0.5889854431152344, 0.6047821044921875, 0.6205787658691406, 0.6363754272460938, 0.6521720886230469, 0.66796875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 16.0, 43.0, 128.0, 259.0, 260.0, 179.0, 67.0, 30.0, 13.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8495746850967407, -1.7760834693908691, -1.7025922536849976, -1.629101037979126, -1.5556098222732544, -1.4821186065673828, -1.4086273908615112, -1.3351361751556396, -1.261644959449768, -1.1881537437438965, -1.114662528038025, -1.0411713123321533, -0.9676800966262817, -0.8941888809204102, -0.8206976652145386, -0.747206449508667, -0.6737152338027954, -0.6002240180969238, -0.5267328023910522, -0.45324158668518066, -0.3797503709793091, -0.3062591552734375, -0.23276793956756592, -0.15927672386169434, -0.08578550815582275, -0.012294292449951172, 0.06119692325592041, 0.134688138961792, 0.20817935466766357, 0.28167057037353516, 0.35516178607940674, 0.4286530017852783, 0.5021443367004395, 0.575635552406311, 0.6491267681121826, 0.7226179838180542, 0.7961091995239258, 0.8696004152297974, 0.943091630935669, 1.0165828466415405, 1.090074062347412, 1.1635652780532837, 1.2370564937591553, 1.3105477094650269, 1.3840389251708984, 1.45753014087677, 1.5310213565826416, 1.6045125722885132, 1.6780037879943848, 1.7514950037002563, 1.824986219406128, 1.8984774351119995, 1.971968650817871, 2.045459747314453, 2.1189510822296143, 2.1924424171447754, 2.2659335136413574, 2.3394246101379395, 2.4129159450531006, 2.4864072799682617, 2.5598983764648438, 2.633389472961426, 2.706880807876587, 2.780372142791748, 2.85386323928833]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 3.0, 11.0, 5.0, 15.0, 3.0, 7.0, 14.0, 19.0, 15.0, 21.0, 32.0, 26.0, 30.0, 35.0, 31.0, 32.0, 44.0, 34.0, 37.0, 41.0, 34.0, 50.0, 33.0, 28.0, 33.0, 40.0, 32.0, 27.0, 28.0, 32.0, 22.0, 25.0, 19.0, 21.0, 19.0, 18.0, 16.0, 8.0, 11.0, 6.0, 8.0, 10.0, 8.0, 3.0, 4.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.5667837858200073, -0.5489415526390076, -0.5310993194580078, -0.5132570266723633, -0.4954147934913635, -0.47757256031036377, -0.4597302973270416, -0.4418880343437195, -0.4240458011627197, -0.40620356798171997, -0.3883613049983978, -0.3705190420150757, -0.3526768088340759, -0.33483457565307617, -0.31699231266975403, -0.2991500496864319, -0.28130781650543213, -0.2634655833244324, -0.24562332034111023, -0.22778107225894928, -0.20993882417678833, -0.19209657609462738, -0.17425432801246643, -0.15641207993030548, -0.13856983184814453, -0.12072758376598358, -0.10288533568382263, -0.08504308760166168, -0.06720083951950073, -0.04935859143733978, -0.03151634335517883, -0.013674095273017883, 0.004168152809143066, 0.022010400891304016, 0.039852648973464966, 0.057694897055625916, 0.07553714513778687, 0.09337939321994781, 0.11122164130210876, 0.12906388938426971, 0.14690613746643066, 0.1647483855485916, 0.18259063363075256, 0.2004328817129135, 0.21827512979507446, 0.2361173778772354, 0.25395962595939636, 0.2718018889427185, 0.28964412212371826, 0.307486355304718, 0.32532861828804016, 0.3431708812713623, 0.36101311445236206, 0.3788553476333618, 0.39669761061668396, 0.4145398736000061, 0.43238210678100586, 0.4502243399620056, 0.46806660294532776, 0.4859088659286499, 0.5037510991096497, 0.5215933322906494, 0.539435625076294, 0.5572778582572937, 0.5751200914382935]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 6.0, 9.0, 12.0, 19.0, 20.0, 61.0, 75.0, 72.0, 122.0, 165.0, 253.0, 383.0, 494.0, 792.0, 1105.0, 1672.0, 2553.0, 4063.0, 6480.0, 10584.0, 18253.0, 32560.0, 60379.0, 113400.0, 186220.0, 220275.0, 168455.0, 97741.0, 52039.0, 28138.0, 15923.0, 9582.0, 5876.0, 3611.0, 2375.0, 1581.0, 982.0, 672.0, 487.0, 323.0, 192.0, 153.0, 92.0, 92.0, 44.0, 46.0, 38.0, 31.0, 26.0, 8.0, 9.0, 5.0, 1.0, 3.0, 2.0, 3.0, 0.0, 4.0], "bins": [-0.09576416015625, -0.09271240234375, -0.08966064453125, -0.08660888671875, -0.08355712890625, -0.08050537109375, -0.07745361328125, -0.07440185546875, -0.07135009765625, -0.06829833984375, -0.06524658203125, -0.06219482421875, -0.05914306640625, -0.05609130859375, -0.05303955078125, -0.04998779296875, -0.04693603515625, -0.04388427734375, -0.04083251953125, -0.03778076171875, -0.03472900390625, -0.03167724609375, -0.02862548828125, -0.02557373046875, -0.02252197265625, -0.01947021484375, -0.01641845703125, -0.01336669921875, -0.01031494140625, -0.00726318359375, -0.00421142578125, -0.00115966796875, 0.00189208984375, 0.00494384765625, 0.00799560546875, 0.01104736328125, 0.01409912109375, 0.01715087890625, 0.02020263671875, 0.02325439453125, 0.02630615234375, 0.02935791015625, 0.03240966796875, 0.03546142578125, 0.03851318359375, 0.04156494140625, 0.04461669921875, 0.04766845703125, 0.05072021484375, 0.05377197265625, 0.05682373046875, 0.05987548828125, 0.06292724609375, 0.06597900390625, 0.06903076171875, 0.07208251953125, 0.07513427734375, 0.07818603515625, 0.08123779296875, 0.08428955078125, 0.08734130859375, 0.09039306640625, 0.09344482421875, 0.09649658203125, 0.09954833984375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 6.0, 10.0, 3.0, 13.0, 21.0, 11.0, 25.0, 33.0, 31.0, 31.0, 31.0, 54.0, 38.0, 45.0, 42.0, 56.0, 53.0, 59.0, 59.0, 53.0, 39.0, 40.0, 34.0, 40.0, 31.0, 26.0, 21.0, 21.0, 15.0, 18.0, 11.0, 12.0, 6.0, 2.0, 9.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1549072265625, -0.15042877197265625, -0.1459503173828125, -0.14147186279296875, -0.136993408203125, -0.13251495361328125, -0.1280364990234375, -0.12355804443359375, -0.11907958984375, -0.11460113525390625, -0.1101226806640625, -0.10564422607421875, -0.101165771484375, -0.09668731689453125, -0.0922088623046875, -0.08773040771484375, -0.083251953125, -0.07877349853515625, -0.0742950439453125, -0.06981658935546875, -0.065338134765625, -0.06085968017578125, -0.0563812255859375, -0.05190277099609375, -0.04742431640625, -0.04294586181640625, -0.0384674072265625, -0.03398895263671875, -0.029510498046875, -0.02503204345703125, -0.0205535888671875, -0.01607513427734375, -0.0115966796875, -0.00711822509765625, -0.0026397705078125, 0.00183868408203125, 0.006317138671875, 0.01079559326171875, 0.0152740478515625, 0.01975250244140625, 0.02423095703125, 0.02870941162109375, 0.0331878662109375, 0.03766632080078125, 0.042144775390625, 0.04662322998046875, 0.0511016845703125, 0.05558013916015625, 0.06005859375, 0.06453704833984375, 0.0690155029296875, 0.07349395751953125, 0.077972412109375, 0.08245086669921875, 0.0869293212890625, 0.09140777587890625, 0.09588623046875, 0.10036468505859375, 0.1048431396484375, 0.10932159423828125, 0.113800048828125, 0.11827850341796875, 0.1227569580078125, 0.12723541259765625, 0.1317138671875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 9.0, 7.0, 12.0, 12.0, 19.0, 28.0, 43.0, 67.0, 110.0, 201.0, 374.0, 675.0, 1298.0, 2496.0, 5169.0, 11111.0, 26089.0, 70813.0, 211663.0, 390146.0, 210106.0, 70168.0, 26161.0, 11188.0, 5239.0, 2507.0, 1235.0, 668.0, 339.0, 209.0, 126.0, 80.0, 56.0, 40.0, 25.0, 16.0, 10.0, 5.0, 7.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.197998046875, -0.19208717346191406, -0.18617630004882812, -0.1802654266357422, -0.17435455322265625, -0.1684436798095703, -0.16253280639648438, -0.15662193298339844, -0.1507110595703125, -0.14480018615722656, -0.13888931274414062, -0.1329784393310547, -0.12706756591796875, -0.12115669250488281, -0.11524581909179688, -0.10933494567871094, -0.103424072265625, -0.09751319885253906, -0.09160232543945312, -0.08569145202636719, -0.07978057861328125, -0.07386970520019531, -0.06795883178710938, -0.06204795837402344, -0.0561370849609375, -0.05022621154785156, -0.044315338134765625, -0.03840446472167969, -0.03249359130859375, -0.026582717895507812, -0.020671844482421875, -0.014760971069335938, -0.00885009765625, -0.0029392242431640625, 0.002971649169921875, 0.008882522583007812, 0.01479339599609375, 0.020704269409179688, 0.026615142822265625, 0.03252601623535156, 0.0384368896484375, 0.04434776306152344, 0.050258636474609375, 0.05616950988769531, 0.06208038330078125, 0.06799125671386719, 0.07390213012695312, 0.07981300354003906, 0.085723876953125, 0.09163475036621094, 0.09754562377929688, 0.10345649719238281, 0.10936737060546875, 0.11527824401855469, 0.12118911743164062, 0.12709999084472656, 0.1330108642578125, 0.13892173767089844, 0.14483261108398438, 0.1507434844970703, 0.15665435791015625, 0.1625652313232422, 0.16847610473632812, 0.17438697814941406, 0.1802978515625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 3.0, 8.0, 9.0, 5.0, 6.0, 7.0, 16.0, 12.0, 16.0, 22.0, 14.0, 28.0, 26.0, 24.0, 31.0, 35.0, 35.0, 34.0, 36.0, 33.0, 42.0, 39.0, 53.0, 32.0, 50.0, 27.0, 35.0, 37.0, 31.0, 33.0, 38.0, 24.0, 22.0, 16.0, 17.0, 11.0, 18.0, 9.0, 14.0, 8.0, 6.0, 5.0, 4.0, 7.0, 8.0, 3.0, 2.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0], "bins": [-0.276123046875, -0.2671852111816406, -0.25824737548828125, -0.24930953979492188, -0.2403717041015625, -0.23143386840820312, -0.22249603271484375, -0.21355819702148438, -0.204620361328125, -0.19568252563476562, -0.18674468994140625, -0.17780685424804688, -0.1688690185546875, -0.15993118286132812, -0.15099334716796875, -0.14205551147460938, -0.13311767578125, -0.12417984008789062, -0.11524200439453125, -0.10630416870117188, -0.0973663330078125, -0.08842849731445312, -0.07949066162109375, -0.07055282592773438, -0.061614990234375, -0.052677154541015625, -0.04373931884765625, -0.034801483154296875, -0.0258636474609375, -0.016925811767578125, -0.00798797607421875, 0.000949859619140625, 0.0098876953125, 0.018825531005859375, 0.02776336669921875, 0.036701202392578125, 0.0456390380859375, 0.054576873779296875, 0.06351470947265625, 0.07245254516601562, 0.081390380859375, 0.09032821655273438, 0.09926605224609375, 0.10820388793945312, 0.1171417236328125, 0.12607955932617188, 0.13501739501953125, 0.14395523071289062, 0.15289306640625, 0.16183090209960938, 0.17076873779296875, 0.17970657348632812, 0.1886444091796875, 0.19758224487304688, 0.20652008056640625, 0.21545791625976562, 0.224395751953125, 0.23333358764648438, 0.24227142333984375, 0.2512092590332031, 0.2601470947265625, 0.2690849304199219, 0.27802276611328125, 0.2869606018066406, 0.2958984375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 7.0, 8.0, 9.0, 14.0, 24.0, 28.0, 53.0, 68.0, 127.0, 208.0, 321.0, 540.0, 921.0, 1468.0, 2629.0, 4873.0, 9356.0, 19070.0, 41821.0, 93097.0, 198083.0, 283882.0, 207104.0, 99076.0, 44027.0, 20027.0, 10035.0, 5149.0, 2720.0, 1506.0, 868.0, 555.0, 327.0, 205.0, 115.0, 72.0, 51.0, 28.0, 17.0, 21.0, 20.0, 6.0, 6.0, 5.0, 8.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.037994384765625, -0.036861419677734375, -0.03572845458984375, -0.034595489501953125, -0.0334625244140625, -0.032329559326171875, -0.03119659423828125, -0.030063629150390625, -0.0289306640625, -0.027797698974609375, -0.02666473388671875, -0.025531768798828125, -0.0243988037109375, -0.023265838623046875, -0.02213287353515625, -0.020999908447265625, -0.019866943359375, -0.018733978271484375, -0.01760101318359375, -0.016468048095703125, -0.0153350830078125, -0.014202117919921875, -0.01306915283203125, -0.011936187744140625, -0.01080322265625, -0.009670257568359375, -0.00853729248046875, -0.007404327392578125, -0.0062713623046875, -0.005138397216796875, -0.00400543212890625, -0.002872467041015625, -0.001739501953125, -0.000606536865234375, 0.00052642822265625, 0.001659393310546875, 0.0027923583984375, 0.003925323486328125, 0.00505828857421875, 0.006191253662109375, 0.00732421875, 0.008457183837890625, 0.00959014892578125, 0.010723114013671875, 0.0118560791015625, 0.012989044189453125, 0.01412200927734375, 0.015254974365234375, 0.016387939453125, 0.017520904541015625, 0.01865386962890625, 0.019786834716796875, 0.0209197998046875, 0.022052764892578125, 0.02318572998046875, 0.024318695068359375, 0.02545166015625, 0.026584625244140625, 0.02771759033203125, 0.028850555419921875, 0.0299835205078125, 0.031116485595703125, 0.03224945068359375, 0.033382415771484375, 0.034515380859375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 3.0, 8.0, 9.0, 10.0, 15.0, 15.0, 33.0, 47.0, 48.0, 81.0, 90.0, 106.0, 108.0, 87.0, 89.0, 60.0, 43.0, 38.0, 34.0, 14.0, 12.0, 17.0, 6.0, 8.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.6464462280273438e-05, -2.577155828475952e-05, -2.5078654289245605e-05, -2.438575029373169e-05, -2.3692846298217773e-05, -2.2999942302703857e-05, -2.230703830718994e-05, -2.1614134311676025e-05, -2.092123031616211e-05, -2.0228326320648193e-05, -1.9535422325134277e-05, -1.884251832962036e-05, -1.8149614334106445e-05, -1.745671033859253e-05, -1.6763806343078613e-05, -1.6070902347564697e-05, -1.537799835205078e-05, -1.4685094356536865e-05, -1.399219036102295e-05, -1.3299286365509033e-05, -1.2606382369995117e-05, -1.1913478374481201e-05, -1.1220574378967285e-05, -1.0527670383453369e-05, -9.834766387939453e-06, -9.141862392425537e-06, -8.448958396911621e-06, -7.756054401397705e-06, -7.063150405883789e-06, -6.370246410369873e-06, -5.677342414855957e-06, -4.984438419342041e-06, -4.291534423828125e-06, -3.598630428314209e-06, -2.905726432800293e-06, -2.212822437286377e-06, -1.519918441772461e-06, -8.270144462585449e-07, -1.341104507446289e-07, 5.587935447692871e-07, 1.2516975402832031e-06, 1.944601535797119e-06, 2.637505531311035e-06, 3.330409526824951e-06, 4.023313522338867e-06, 4.716217517852783e-06, 5.409121513366699e-06, 6.102025508880615e-06, 6.794929504394531e-06, 7.487833499908447e-06, 8.180737495422363e-06, 8.87364149093628e-06, 9.566545486450195e-06, 1.0259449481964111e-05, 1.0952353477478027e-05, 1.1645257472991943e-05, 1.233816146850586e-05, 1.3031065464019775e-05, 1.3723969459533691e-05, 1.4416873455047607e-05, 1.5109777450561523e-05, 1.580268144607544e-05, 1.6495585441589355e-05, 1.718848943710327e-05, 1.7881393432617188e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 9.0, 7.0, 15.0, 29.0, 40.0, 83.0, 140.0, 214.0, 510.0, 1085.0, 2476.0, 6122.0, 15959.0, 47484.0, 143147.0, 325894.0, 309572.0, 128977.0, 42445.0, 14510.0, 5595.0, 2297.0, 953.0, 460.0, 237.0, 123.0, 60.0, 44.0, 24.0, 20.0, 6.0, 4.0, 4.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034820556640625, -0.03336668014526367, -0.031912803649902344, -0.030458927154541016, -0.029005050659179688, -0.02755117416381836, -0.02609729766845703, -0.024643421173095703, -0.023189544677734375, -0.021735668182373047, -0.02028179168701172, -0.01882791519165039, -0.017374038696289062, -0.015920162200927734, -0.014466285705566406, -0.013012409210205078, -0.01155853271484375, -0.010104656219482422, -0.008650779724121094, -0.007196903228759766, -0.0057430267333984375, -0.004289150238037109, -0.0028352737426757812, -0.0013813972473144531, 7.2479248046875e-05, 0.0015263557434082031, 0.0029802322387695312, 0.004434108734130859, 0.0058879852294921875, 0.007341861724853516, 0.008795738220214844, 0.010249614715576172, 0.0117034912109375, 0.013157367706298828, 0.014611244201660156, 0.016065120697021484, 0.017518997192382812, 0.01897287368774414, 0.02042675018310547, 0.021880626678466797, 0.023334503173828125, 0.024788379669189453, 0.02624225616455078, 0.02769613265991211, 0.029150009155273438, 0.030603885650634766, 0.032057762145996094, 0.03351163864135742, 0.03496551513671875, 0.03641939163208008, 0.037873268127441406, 0.039327144622802734, 0.04078102111816406, 0.04223489761352539, 0.04368877410888672, 0.04514265060424805, 0.046596527099609375, 0.0480504035949707, 0.04950428009033203, 0.05095815658569336, 0.05241203308105469, 0.053865909576416016, 0.055319786071777344, 0.05677366256713867, 0.0582275390625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 3.0, 9.0, 4.0, 6.0, 13.0, 12.0, 15.0, 18.0, 15.0, 23.0, 28.0, 35.0, 27.0, 46.0, 49.0, 78.0, 64.0, 50.0, 55.0, 60.0, 35.0, 42.0, 43.0, 57.0, 20.0, 30.0, 30.0, 23.0, 16.0, 22.0, 16.0, 9.0, 13.0, 7.0, 6.0, 2.0, 6.0, 3.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.040924072265625, -0.039659976959228516, -0.03839588165283203, -0.03713178634643555, -0.03586769104003906, -0.03460359573364258, -0.033339500427246094, -0.03207540512084961, -0.030811309814453125, -0.02954721450805664, -0.028283119201660156, -0.027019023895263672, -0.025754928588867188, -0.024490833282470703, -0.02322673797607422, -0.021962642669677734, -0.02069854736328125, -0.019434452056884766, -0.01817035675048828, -0.016906261444091797, -0.015642166137695312, -0.014378070831298828, -0.013113975524902344, -0.01184988021850586, -0.010585784912109375, -0.00932168960571289, -0.008057594299316406, -0.006793498992919922, -0.0055294036865234375, -0.004265308380126953, -0.0030012130737304688, -0.0017371177673339844, -0.0004730224609375, 0.0007910728454589844, 0.0020551681518554688, 0.003319263458251953, 0.0045833587646484375, 0.005847454071044922, 0.007111549377441406, 0.00837564468383789, 0.009639739990234375, 0.01090383529663086, 0.012167930603027344, 0.013432025909423828, 0.014696121215820312, 0.015960216522216797, 0.01722431182861328, 0.018488407135009766, 0.01975250244140625, 0.021016597747802734, 0.02228069305419922, 0.023544788360595703, 0.024808883666992188, 0.026072978973388672, 0.027337074279785156, 0.02860116958618164, 0.029865264892578125, 0.03112936019897461, 0.032393455505371094, 0.03365755081176758, 0.03492164611816406, 0.03618574142456055, 0.03744983673095703, 0.038713932037353516, 0.03997802734375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 10.0, 19.0, 28.0, 39.0, 93.0, 117.0, 170.0, 167.0, 117.0, 93.0, 65.0, 30.0, 25.0, 9.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.4524821043014526, -1.4172271490097046, -1.381972074508667, -1.346717119216919, -1.311462163925171, -1.2762070894241333, -1.2409521341323853, -1.2056970596313477, -1.1704421043395996, -1.1351871490478516, -1.099932074546814, -1.064677119255066, -1.0294220447540283, -0.9941670894622803, -0.9589121341705322, -0.9236571192741394, -0.8884021043777466, -0.8531470894813538, -0.8178920745849609, -0.7826371192932129, -0.7473821043968201, -0.7121270895004272, -0.6768721342086792, -0.6416171193122864, -0.6063621044158936, -0.5711070895195007, -0.5358520746231079, -0.5005971193313599, -0.46534210443496704, -0.4300870895385742, -0.3948321044445038, -0.35957711935043335, -0.3243222236633301, -0.28906720876693726, -0.2538122236728668, -0.2185572236776352, -0.18330222368240356, -0.14804722368717194, -0.11279222369194031, -0.07753722369670868, -0.04228222370147705, -0.007027223706245422, 0.028227776288986206, 0.06348277628421783, 0.09873777627944946, 0.1339927762746811, 0.16924777626991272, 0.20450277626514435, 0.23975777626037598, 0.2750127911567688, 0.31026777625083923, 0.34552276134490967, 0.3807777762413025, 0.4160327911376953, 0.45128777623176575, 0.4865427613258362, 0.521797776222229, 0.5570527911186218, 0.5923078060150146, 0.6275627613067627, 0.6628177762031555, 0.6980727910995483, 0.7333277463912964, 0.7685827612876892, 0.803837776184082]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 6.0, 4.0, 9.0, 5.0, 11.0, 14.0, 10.0, 12.0, 8.0, 13.0, 15.0, 18.0, 21.0, 19.0, 35.0, 24.0, 30.0, 34.0, 24.0, 47.0, 38.0, 44.0, 46.0, 33.0, 43.0, 32.0, 33.0, 30.0, 40.0, 33.0, 37.0, 35.0, 25.0, 24.0, 19.0, 21.0, 12.0, 18.0, 15.0, 8.0, 12.0, 15.0, 8.0, 7.0, 6.0, 6.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.6836521029472351, -0.663291335105896, -0.6429305672645569, -0.6225697994232178, -0.6022090315818787, -0.5818482637405396, -0.5614874958992004, -0.5411267280578613, -0.520766019821167, -0.5004052519798279, -0.48004448413848877, -0.45968371629714966, -0.43932294845581055, -0.41896218061447144, -0.3986014425754547, -0.3782406747341156, -0.3578798770904541, -0.337519109249115, -0.3171583414077759, -0.29679757356643677, -0.27643680572509766, -0.25607603788375854, -0.23571529984474182, -0.2153545320034027, -0.1949937641620636, -0.1746329963207245, -0.15427222847938538, -0.13391147553920746, -0.11355070769786835, -0.09318993985652924, -0.07282917946577072, -0.05246841907501221, -0.03210759162902832, -0.011746827512979507, 0.008613936603069305, 0.02897470071911812, 0.04933546483516693, 0.06969623267650604, 0.09005699306726456, 0.11041775345802307, 0.13077852129936218, 0.1511392891407013, 0.1715000569820404, 0.19186080992221832, 0.21222157776355743, 0.23258234560489655, 0.25294309854507446, 0.2733038663864136, 0.2936646342277527, 0.3140254020690918, 0.3343861699104309, 0.35474693775177, 0.37510770559310913, 0.39546847343444824, 0.41582921147346497, 0.4361899793148041, 0.4565507471561432, 0.4769115149974823, 0.4972722828388214, 0.5176330208778381, 0.5379937887191772, 0.5583545565605164, 0.5787153244018555, 0.5990760922431946, 0.6194368600845337]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 17.0, 17.0, 36.0, 66.0, 90.0, 134.0, 184.0, 361.0, 575.0, 1147.0, 2256.0, 5338.0, 14870.0, 56749.0, 246405.0, 811752.0, 1477164.0, 1068094.0, 375299.0, 92595.0, 24855.0, 8505.0, 3968.0, 1751.0, 874.0, 469.0, 259.0, 150.0, 111.0, 68.0, 44.0, 29.0, 15.0, 12.0, 9.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1463623046875, -0.14247703552246094, -0.13859176635742188, -0.1347064971923828, -0.13082122802734375, -0.1269359588623047, -0.12305068969726562, -0.11916542053222656, -0.1152801513671875, -0.11139488220214844, -0.10750961303710938, -0.10362434387207031, -0.09973907470703125, -0.09585380554199219, -0.09196853637695312, -0.08808326721191406, -0.084197998046875, -0.08031272888183594, -0.07642745971679688, -0.07254219055175781, -0.06865692138671875, -0.06477165222167969, -0.060886383056640625, -0.05700111389160156, -0.0531158447265625, -0.04923057556152344, -0.045345306396484375, -0.04146003723144531, -0.03757476806640625, -0.03368949890136719, -0.029804229736328125, -0.025918960571289062, -0.02203369140625, -0.018148422241210938, -0.014263153076171875, -0.010377883911132812, -0.00649261474609375, -0.0026073455810546875, 0.001277923583984375, 0.0051631927490234375, 0.0090484619140625, 0.012933731079101562, 0.016819000244140625, 0.020704269409179688, 0.02458953857421875, 0.028474807739257812, 0.032360076904296875, 0.03624534606933594, 0.040130615234375, 0.04401588439941406, 0.047901153564453125, 0.05178642272949219, 0.05567169189453125, 0.05955696105957031, 0.06344223022460938, 0.06732749938964844, 0.0712127685546875, 0.07509803771972656, 0.07898330688476562, 0.08286857604980469, 0.08675384521484375, 0.09063911437988281, 0.09452438354492188, 0.09840965270996094, 0.102294921875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 5.0, 9.0, 14.0, 16.0, 21.0, 20.0, 26.0, 25.0, 36.0, 43.0, 43.0, 53.0, 58.0, 52.0, 62.0, 77.0, 50.0, 57.0, 44.0, 55.0, 42.0, 36.0, 26.0, 29.0, 26.0, 18.0, 12.0, 14.0, 9.0, 10.0, 6.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.176513671875, -0.172210693359375, -0.16790771484375, -0.163604736328125, -0.1593017578125, -0.154998779296875, -0.15069580078125, -0.146392822265625, -0.14208984375, -0.137786865234375, -0.13348388671875, -0.129180908203125, -0.1248779296875, -0.120574951171875, -0.11627197265625, -0.111968994140625, -0.107666015625, -0.103363037109375, -0.09906005859375, -0.094757080078125, -0.0904541015625, -0.086151123046875, -0.08184814453125, -0.077545166015625, -0.0732421875, -0.068939208984375, -0.06463623046875, -0.060333251953125, -0.0560302734375, -0.051727294921875, -0.04742431640625, -0.043121337890625, -0.038818359375, -0.034515380859375, -0.03021240234375, -0.025909423828125, -0.0216064453125, -0.017303466796875, -0.01300048828125, -0.008697509765625, -0.00439453125, -9.1552734375e-05, 0.00421142578125, 0.008514404296875, 0.0128173828125, 0.017120361328125, 0.02142333984375, 0.025726318359375, 0.030029296875, 0.034332275390625, 0.03863525390625, 0.042938232421875, 0.0472412109375, 0.051544189453125, 0.05584716796875, 0.060150146484375, 0.064453125, 0.068756103515625, 0.07305908203125, 0.077362060546875, 0.0816650390625, 0.085968017578125, 0.09027099609375, 0.094573974609375, 0.098876953125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 4.0, 7.0, 17.0, 23.0, 23.0, 29.0, 30.0, 48.0, 60.0, 65.0, 95.0, 157.0, 337.0, 813.0, 2410.0, 9110.0, 51963.0, 677002.0, 3181824.0, 235063.0, 26614.0, 5661.0, 1610.0, 591.0, 260.0, 150.0, 80.0, 60.0, 45.0, 32.0, 22.0, 18.0, 12.0, 11.0, 9.0, 7.0, 7.0, 1.0, 2.0, 1.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2078857421875, -0.1993389129638672, -0.19079208374023438, -0.18224525451660156, -0.17369842529296875, -0.16515159606933594, -0.15660476684570312, -0.1480579376220703, -0.1395111083984375, -0.1309642791748047, -0.12241744995117188, -0.11387062072753906, -0.10532379150390625, -0.09677696228027344, -0.08823013305664062, -0.07968330383300781, -0.071136474609375, -0.06258964538574219, -0.054042816162109375, -0.04549598693847656, -0.03694915771484375, -0.028402328491210938, -0.019855499267578125, -0.011308670043945312, -0.0027618408203125, 0.0057849884033203125, 0.014331817626953125, 0.022878646850585938, 0.03142547607421875, 0.03997230529785156, 0.048519134521484375, 0.05706596374511719, 0.06561279296875, 0.07415962219238281, 0.08270645141601562, 0.09125328063964844, 0.09980010986328125, 0.10834693908691406, 0.11689376831054688, 0.1254405975341797, 0.1339874267578125, 0.1425342559814453, 0.15108108520507812, 0.15962791442871094, 0.16817474365234375, 0.17672157287597656, 0.18526840209960938, 0.1938152313232422, 0.202362060546875, 0.2109088897705078, 0.21945571899414062, 0.22800254821777344, 0.23654937744140625, 0.24509620666503906, 0.2536430358886719, 0.2621898651123047, 0.2707366943359375, 0.2792835235595703, 0.2878303527832031, 0.29637718200683594, 0.30492401123046875, 0.31347084045410156, 0.3220176696777344, 0.3305644989013672, 0.339111328125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 8.0, 17.0, 18.0, 21.0, 40.0, 45.0, 74.0, 123.0, 207.0, 268.0, 458.0, 610.0, 658.0, 521.0, 317.0, 225.0, 148.0, 105.0, 70.0, 47.0, 27.0, 18.0, 9.0, 11.0, 9.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.135986328125, -0.12893295288085938, -0.12187957763671875, -0.11482620239257812, -0.1077728271484375, -0.10071945190429688, -0.09366607666015625, -0.08661270141601562, -0.079559326171875, -0.07250595092773438, -0.06545257568359375, -0.058399200439453125, -0.0513458251953125, -0.044292449951171875, -0.03723907470703125, -0.030185699462890625, -0.02313232421875, -0.016078948974609375, -0.00902557373046875, -0.001972198486328125, 0.0050811767578125, 0.012134552001953125, 0.01918792724609375, 0.026241302490234375, 0.033294677734375, 0.040348052978515625, 0.04740142822265625, 0.054454803466796875, 0.0615081787109375, 0.06856155395507812, 0.07561492919921875, 0.08266830444335938, 0.0897216796875, 0.09677505493164062, 0.10382843017578125, 0.11088180541992188, 0.1179351806640625, 0.12498855590820312, 0.13204193115234375, 0.13909530639648438, 0.146148681640625, 0.15320205688476562, 0.16025543212890625, 0.16730880737304688, 0.1743621826171875, 0.18141555786132812, 0.18846893310546875, 0.19552230834960938, 0.20257568359375, 0.20962905883789062, 0.21668243408203125, 0.22373580932617188, 0.2307891845703125, 0.23784255981445312, 0.24489593505859375, 0.2519493103027344, 0.259002685546875, 0.2660560607910156, 0.27310943603515625, 0.2801628112792969, 0.2872161865234375, 0.2942695617675781, 0.30132293701171875, 0.3083763122558594, 0.3154296875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 10.0, 17.0, 61.0, 168.0, 274.0, 243.0, 143.0, 52.0, 15.0, 7.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7956990003585815, -1.7135035991668701, -1.6313081979751587, -1.5491127967834473, -1.4669173955917358, -1.3847219944000244, -1.3025267124176025, -1.2203311920166016, -1.1381359100341797, -1.0559405088424683, -0.9737451076507568, -0.8915497064590454, -0.809354305267334, -0.7271589040756226, -0.6449635624885559, -0.5627681612968445, -0.4805727005004883, -0.39837729930877686, -0.31618189811706543, -0.2339865267276764, -0.15179112553596497, -0.06959572434425354, 0.012599647045135498, 0.09479504823684692, 0.17699044942855835, 0.2591858506202698, 0.3413812518119812, 0.42357662320137024, 0.5057719945907593, 0.5879673957824707, 0.6701627969741821, 0.7523581981658936, 0.8345537185668945, 0.916749119758606, 0.9989445209503174, 1.0811399221420288, 1.1633353233337402, 1.2455307245254517, 1.327726125717163, 1.409921407699585, 1.492116928100586, 1.5743123292922974, 1.6565077304840088, 1.7387031316757202, 1.8208985328674316, 1.903093934059143, 1.9852893352508545, 2.0674846172332764, 2.1496801376342773, 2.231875419616699, 2.3140709400177, 2.396266222000122, 2.478461742401123, 2.560657024383545, 2.642852544784546, 2.7250478267669678, 2.8072431087493896, 2.8894383907318115, 2.9716339111328125, 3.0538291931152344, 3.1360247135162354, 3.2182199954986572, 3.300415515899658, 3.38261079788208, 3.464806318283081]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 5.0, 5.0, 8.0, 3.0, 9.0, 7.0, 17.0, 18.0, 25.0, 28.0, 29.0, 31.0, 35.0, 45.0, 53.0, 52.0, 43.0, 61.0, 46.0, 56.0, 47.0, 49.0, 49.0, 35.0, 36.0, 27.0, 23.0, 24.0, 29.0, 19.0, 31.0, 8.0, 9.0, 11.0, 7.0, 9.0, 6.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.7776639461517334, -0.7558853030204773, -0.7341066598892212, -0.7123280763626099, -0.6905494332313538, -0.6687707901000977, -0.6469922065734863, -0.6252135634422302, -0.6034349203109741, -0.581656277179718, -0.5598776340484619, -0.5380990505218506, -0.5163204073905945, -0.4945417642593384, -0.47276315093040466, -0.45098453760147095, -0.42920589447021484, -0.40742725133895874, -0.385648638010025, -0.3638700246810913, -0.3420913815498352, -0.3203127384185791, -0.2985341250896454, -0.27675551176071167, -0.25497686862945557, -0.23319824039936066, -0.21141961216926575, -0.18964098393917084, -0.16786235570907593, -0.14608372747898102, -0.12430509924888611, -0.1025264710187912, -0.08074784278869629, -0.05896921455860138, -0.03719058632850647, -0.01541195809841156, 0.00636667013168335, 0.02814529836177826, 0.04992392659187317, 0.07170255482196808, 0.09348118305206299, 0.1152598112821579, 0.1370384395122528, 0.15881706774234772, 0.18059569597244263, 0.20237432420253754, 0.22415295243263245, 0.24593158066272736, 0.26771020889282227, 0.28948885202407837, 0.3112674653530121, 0.3330460786819458, 0.3548247218132019, 0.376603364944458, 0.3983819782733917, 0.42016059160232544, 0.44193923473358154, 0.46371787786483765, 0.48549649119377136, 0.5072751045227051, 0.5290537476539612, 0.5508323907852173, 0.5726109743118286, 0.5943896174430847, 0.6161682605743408]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 7.0, 9.0, 18.0, 21.0, 33.0, 64.0, 115.0, 256.0, 503.0, 1295.0, 3241.0, 9463.0, 27802.0, 82257.0, 215214.0, 343209.0, 229162.0, 89442.0, 29969.0, 10296.0, 3626.0, 1454.0, 577.0, 245.0, 115.0, 73.0, 28.0, 23.0, 15.0, 8.0, 9.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1492919921875, -0.14440345764160156, -0.13951492309570312, -0.1346263885498047, -0.12973785400390625, -0.12484931945800781, -0.11996078491210938, -0.11507225036621094, -0.1101837158203125, -0.10529518127441406, -0.10040664672851562, -0.09551811218261719, -0.09062957763671875, -0.08574104309082031, -0.08085250854492188, -0.07596397399902344, -0.071075439453125, -0.06618690490722656, -0.061298370361328125, -0.05640983581542969, -0.05152130126953125, -0.04663276672363281, -0.041744232177734375, -0.03685569763183594, -0.0319671630859375, -0.027078628540039062, -0.022190093994140625, -0.017301559448242188, -0.01241302490234375, -0.0075244903564453125, -0.002635955810546875, 0.0022525787353515625, 0.00714111328125, 0.012029647827148438, 0.016918182373046875, 0.021806716918945312, 0.02669525146484375, 0.03158378601074219, 0.036472320556640625, 0.04136085510253906, 0.0462493896484375, 0.05113792419433594, 0.056026458740234375, 0.06091499328613281, 0.06580352783203125, 0.07069206237792969, 0.07558059692382812, 0.08046913146972656, 0.085357666015625, 0.09024620056152344, 0.09513473510742188, 0.10002326965332031, 0.10491180419921875, 0.10980033874511719, 0.11468887329101562, 0.11957740783691406, 0.1244659423828125, 0.12935447692871094, 0.13424301147460938, 0.1391315460205078, 0.14402008056640625, 0.1489086151123047, 0.15379714965820312, 0.15868568420410156, 0.16357421875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 1.0, 9.0, 13.0, 12.0, 20.0, 25.0, 28.0, 36.0, 30.0, 40.0, 48.0, 52.0, 53.0, 45.0, 53.0, 61.0, 51.0, 71.0, 59.0, 45.0, 45.0, 22.0, 42.0, 23.0, 22.0, 15.0, 21.0, 15.0, 10.0, 14.0, 5.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.17333984375, -0.1688375473022461, -0.1643352508544922, -0.15983295440673828, -0.15533065795898438, -0.15082836151123047, -0.14632606506347656, -0.14182376861572266, -0.13732147216796875, -0.13281917572021484, -0.12831687927246094, -0.12381458282470703, -0.11931228637695312, -0.11480998992919922, -0.11030769348144531, -0.1058053970336914, -0.1013031005859375, -0.0968008041381836, -0.09229850769042969, -0.08779621124267578, -0.08329391479492188, -0.07879161834716797, -0.07428932189941406, -0.06978702545166016, -0.06528472900390625, -0.060782432556152344, -0.05628013610839844, -0.05177783966064453, -0.047275543212890625, -0.04277324676513672, -0.03827095031738281, -0.033768653869628906, -0.029266357421875, -0.024764060974121094, -0.020261764526367188, -0.01575946807861328, -0.011257171630859375, -0.006754875183105469, -0.0022525787353515625, 0.0022497177124023438, 0.00675201416015625, 0.011254310607910156, 0.015756607055664062, 0.02025890350341797, 0.024761199951171875, 0.02926349639892578, 0.03376579284667969, 0.038268089294433594, 0.0427703857421875, 0.047272682189941406, 0.05177497863769531, 0.05627727508544922, 0.060779571533203125, 0.06528186798095703, 0.06978416442871094, 0.07428646087646484, 0.07878875732421875, 0.08329105377197266, 0.08779335021972656, 0.09229564666748047, 0.09679794311523438, 0.10130023956298828, 0.10580253601074219, 0.1103048324584961, 0.11480712890625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 15.0, 9.0, 14.0, 24.0, 34.0, 31.0, 66.0, 99.0, 175.0, 312.0, 502.0, 924.0, 1772.0, 3628.0, 7538.0, 16306.0, 36957.0, 84124.0, 180439.0, 306150.0, 216540.0, 106484.0, 46917.0, 20739.0, 9415.0, 4521.0, 2185.0, 1073.0, 603.0, 391.0, 217.0, 122.0, 83.0, 48.0, 33.0, 22.0, 11.0, 12.0, 10.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.13623046875, -0.13229846954345703, -0.12836647033691406, -0.1244344711303711, -0.12050247192382812, -0.11657047271728516, -0.11263847351074219, -0.10870647430419922, -0.10477447509765625, -0.10084247589111328, -0.09691047668457031, -0.09297847747802734, -0.08904647827148438, -0.0851144790649414, -0.08118247985839844, -0.07725048065185547, -0.0733184814453125, -0.06938648223876953, -0.06545448303222656, -0.061522483825683594, -0.057590484619140625, -0.053658485412597656, -0.04972648620605469, -0.04579448699951172, -0.04186248779296875, -0.03793048858642578, -0.03399848937988281, -0.030066490173339844, -0.026134490966796875, -0.022202491760253906, -0.018270492553710938, -0.014338493347167969, -0.010406494140625, -0.006474494934082031, -0.0025424957275390625, 0.0013895034790039062, 0.005321502685546875, 0.009253501892089844, 0.013185501098632812, 0.01711750030517578, 0.02104949951171875, 0.02498149871826172, 0.028913497924804688, 0.032845497131347656, 0.036777496337890625, 0.040709495544433594, 0.04464149475097656, 0.04857349395751953, 0.0525054931640625, 0.05643749237060547, 0.06036949157714844, 0.0643014907836914, 0.06823348999023438, 0.07216548919677734, 0.07609748840332031, 0.08002948760986328, 0.08396148681640625, 0.08789348602294922, 0.09182548522949219, 0.09575748443603516, 0.09968948364257812, 0.1036214828491211, 0.10755348205566406, 0.11148548126220703, 0.11541748046875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 2.0, 4.0, 2.0, 6.0, 5.0, 5.0, 14.0, 8.0, 16.0, 12.0, 19.0, 25.0, 24.0, 25.0, 30.0, 31.0, 29.0, 37.0, 33.0, 41.0, 45.0, 37.0, 27.0, 42.0, 31.0, 46.0, 32.0, 36.0, 43.0, 30.0, 40.0, 22.0, 31.0, 22.0, 15.0, 27.0, 24.0, 18.0, 11.0, 12.0, 8.0, 8.0, 10.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.259033203125, -0.25058746337890625, -0.2421417236328125, -0.23369598388671875, -0.225250244140625, -0.21680450439453125, -0.2083587646484375, -0.19991302490234375, -0.19146728515625, -0.18302154541015625, -0.1745758056640625, -0.16613006591796875, -0.157684326171875, -0.14923858642578125, -0.1407928466796875, -0.13234710693359375, -0.1239013671875, -0.11545562744140625, -0.1070098876953125, -0.09856414794921875, -0.090118408203125, -0.08167266845703125, -0.0732269287109375, -0.06478118896484375, -0.05633544921875, -0.04788970947265625, -0.0394439697265625, -0.03099822998046875, -0.022552490234375, -0.01410675048828125, -0.0056610107421875, 0.00278472900390625, 0.01123046875, 0.01967620849609375, 0.0281219482421875, 0.03656768798828125, 0.045013427734375, 0.05345916748046875, 0.0619049072265625, 0.07035064697265625, 0.07879638671875, 0.08724212646484375, 0.0956878662109375, 0.10413360595703125, 0.112579345703125, 0.12102508544921875, 0.1294708251953125, 0.13791656494140625, 0.1463623046875, 0.15480804443359375, 0.1632537841796875, 0.17169952392578125, 0.180145263671875, 0.18859100341796875, 0.1970367431640625, 0.20548248291015625, 0.21392822265625, 0.22237396240234375, 0.2308197021484375, 0.23926544189453125, 0.247711181640625, 0.25615692138671875, 0.2646026611328125, 0.27304840087890625, 0.281494140625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 8.0, 6.0, 14.0, 18.0, 31.0, 54.0, 75.0, 144.0, 238.0, 409.0, 669.0, 1183.0, 2232.0, 4011.0, 7917.0, 16372.0, 34932.0, 75357.0, 152711.0, 277722.0, 230967.0, 126879.0, 60589.0, 28441.0, 13270.0, 6656.0, 3328.0, 1872.0, 1059.0, 560.0, 324.0, 196.0, 119.0, 70.0, 50.0, 25.0, 19.0, 12.0, 11.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0237274169921875, -0.02284407615661621, -0.021960735321044922, -0.021077394485473633, -0.020194053649902344, -0.019310712814331055, -0.018427371978759766, -0.017544031143188477, -0.016660690307617188, -0.0157773494720459, -0.01489400863647461, -0.01401066780090332, -0.013127326965332031, -0.012243986129760742, -0.011360645294189453, -0.010477304458618164, -0.009593963623046875, -0.008710622787475586, -0.007827281951904297, -0.006943941116333008, -0.006060600280761719, -0.00517725944519043, -0.004293918609619141, -0.0034105777740478516, -0.0025272369384765625, -0.0016438961029052734, -0.0007605552673339844, 0.0001227855682373047, 0.0010061264038085938, 0.0018894672393798828, 0.002772808074951172, 0.003656148910522461, 0.00453948974609375, 0.005422830581665039, 0.006306171417236328, 0.007189512252807617, 0.008072853088378906, 0.008956193923950195, 0.009839534759521484, 0.010722875595092773, 0.011606216430664062, 0.012489557266235352, 0.01337289810180664, 0.01425623893737793, 0.015139579772949219, 0.016022920608520508, 0.016906261444091797, 0.017789602279663086, 0.018672943115234375, 0.019556283950805664, 0.020439624786376953, 0.021322965621948242, 0.02220630645751953, 0.02308964729309082, 0.02397298812866211, 0.0248563289642334, 0.025739669799804688, 0.026623010635375977, 0.027506351470947266, 0.028389692306518555, 0.029273033142089844, 0.030156373977661133, 0.031039714813232422, 0.03192305564880371, 0.032806396484375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 8.0, 14.0, 11.0, 14.0, 16.0, 15.0, 24.0, 43.0, 57.0, 59.0, 67.0, 69.0, 98.0, 88.0, 71.0, 60.0, 75.0, 46.0, 40.0, 26.0, 28.0, 12.0, 15.0, 10.0, 15.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7762184143066406e-05, -1.7255544662475586e-05, -1.6748905181884766e-05, -1.6242265701293945e-05, -1.5735626220703125e-05, -1.5228986740112305e-05, -1.4722347259521484e-05, -1.4215707778930664e-05, -1.3709068298339844e-05, -1.3202428817749023e-05, -1.2695789337158203e-05, -1.2189149856567383e-05, -1.1682510375976562e-05, -1.1175870895385742e-05, -1.0669231414794922e-05, -1.0162591934204102e-05, -9.655952453613281e-06, -9.149312973022461e-06, -8.64267349243164e-06, -8.13603401184082e-06, -7.62939453125e-06, -7.12275505065918e-06, -6.616115570068359e-06, -6.109476089477539e-06, -5.602836608886719e-06, -5.0961971282958984e-06, -4.589557647705078e-06, -4.082918167114258e-06, -3.5762786865234375e-06, -3.069639205932617e-06, -2.562999725341797e-06, -2.0563602447509766e-06, -1.5497207641601562e-06, -1.043081283569336e-06, -5.364418029785156e-07, -2.9802322387695312e-08, 4.76837158203125e-07, 9.834766387939453e-07, 1.4901161193847656e-06, 1.996755599975586e-06, 2.5033950805664062e-06, 3.0100345611572266e-06, 3.516674041748047e-06, 4.023313522338867e-06, 4.5299530029296875e-06, 5.036592483520508e-06, 5.543231964111328e-06, 6.0498714447021484e-06, 6.556510925292969e-06, 7.063150405883789e-06, 7.569789886474609e-06, 8.07642936706543e-06, 8.58306884765625e-06, 9.08970832824707e-06, 9.59634780883789e-06, 1.0102987289428711e-05, 1.0609626770019531e-05, 1.1116266250610352e-05, 1.1622905731201172e-05, 1.2129545211791992e-05, 1.2636184692382812e-05, 1.3142824172973633e-05, 1.3649463653564453e-05, 1.4156103134155273e-05, 1.4662742614746094e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 8.0, 11.0, 27.0, 44.0, 72.0, 125.0, 286.0, 598.0, 1297.0, 3191.0, 7608.0, 19804.0, 52978.0, 135777.0, 287799.0, 307340.0, 142090.0, 55019.0, 20676.0, 7889.0, 3289.0, 1350.0, 626.0, 329.0, 147.0, 77.0, 40.0, 21.0, 15.0, 6.0, 5.0, 9.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0302886962890625, -0.02924513816833496, -0.028201580047607422, -0.027158021926879883, -0.026114463806152344, -0.025070905685424805, -0.024027347564697266, -0.022983789443969727, -0.021940231323242188, -0.02089667320251465, -0.01985311508178711, -0.01880955696105957, -0.01776599884033203, -0.016722440719604492, -0.015678882598876953, -0.014635324478149414, -0.013591766357421875, -0.012548208236694336, -0.011504650115966797, -0.010461091995239258, -0.009417533874511719, -0.00837397575378418, -0.007330417633056641, -0.0062868595123291016, -0.0052433013916015625, -0.0041997432708740234, -0.0031561851501464844, -0.0021126270294189453, -0.0010690689086914062, -2.5510787963867188e-05, 0.0010180473327636719, 0.002061605453491211, 0.00310516357421875, 0.004148721694946289, 0.005192279815673828, 0.006235837936401367, 0.007279396057128906, 0.008322954177856445, 0.009366512298583984, 0.010410070419311523, 0.011453628540039062, 0.012497186660766602, 0.01354074478149414, 0.01458430290222168, 0.01562786102294922, 0.016671419143676758, 0.017714977264404297, 0.018758535385131836, 0.019802093505859375, 0.020845651626586914, 0.021889209747314453, 0.022932767868041992, 0.02397632598876953, 0.02501988410949707, 0.02606344223022461, 0.02710700035095215, 0.028150558471679688, 0.029194116592407227, 0.030237674713134766, 0.031281232833862305, 0.032324790954589844, 0.03336834907531738, 0.03441190719604492, 0.03545546531677246, 0.0364990234375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 7.0, 10.0, 7.0, 7.0, 10.0, 18.0, 20.0, 19.0, 25.0, 30.0, 22.0, 33.0, 43.0, 29.0, 35.0, 52.0, 35.0, 41.0, 44.0, 36.0, 42.0, 44.0, 32.0, 47.0, 40.0, 46.0, 28.0, 41.0, 30.0, 24.0, 23.0, 13.0, 17.0, 9.0, 14.0, 9.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0283203125, -0.027355194091796875, -0.02639007568359375, -0.025424957275390625, -0.0244598388671875, -0.023494720458984375, -0.02252960205078125, -0.021564483642578125, -0.020599365234375, -0.019634246826171875, -0.01866912841796875, -0.017704010009765625, -0.0167388916015625, -0.015773773193359375, -0.01480865478515625, -0.013843536376953125, -0.01287841796875, -0.011913299560546875, -0.01094818115234375, -0.009983062744140625, -0.0090179443359375, -0.008052825927734375, -0.00708770751953125, -0.006122589111328125, -0.005157470703125, -0.004192352294921875, -0.00322723388671875, -0.002262115478515625, -0.0012969970703125, -0.000331878662109375, 0.00063323974609375, 0.001598358154296875, 0.0025634765625, 0.003528594970703125, 0.00449371337890625, 0.005458831787109375, 0.0064239501953125, 0.007389068603515625, 0.00835418701171875, 0.009319305419921875, 0.010284423828125, 0.011249542236328125, 0.01221466064453125, 0.013179779052734375, 0.0141448974609375, 0.015110015869140625, 0.01607513427734375, 0.017040252685546875, 0.01800537109375, 0.018970489501953125, 0.01993560791015625, 0.020900726318359375, 0.0218658447265625, 0.022830963134765625, 0.02379608154296875, 0.024761199951171875, 0.025726318359375, 0.026691436767578125, 0.02765655517578125, 0.028621673583984375, 0.0295867919921875, 0.030551910400390625, 0.03151702880859375, 0.032482147216796875, 0.033447265625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 8.0, 11.0, 14.0, 25.0, 51.0, 72.0, 105.0, 137.0, 175.0, 149.0, 110.0, 69.0, 32.0, 22.0, 7.0, 8.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.304499864578247, -1.272280216217041, -1.2400604486465454, -1.2078408002853394, -1.1756211519241333, -1.1434015035629272, -1.1111817359924316, -1.0789620876312256, -1.0467424392700195, -1.0145227909088135, -0.9823030829429626, -0.9500833749771118, -0.9178637266159058, -0.8856440186500549, -0.8534243106842041, -0.821204662322998, -0.7889849543571472, -0.7567652463912964, -0.7245455980300903, -0.6923258900642395, -0.6601062417030334, -0.6278865337371826, -0.5956668853759766, -0.5634471774101257, -0.5312274694442749, -0.49900779128074646, -0.466788113117218, -0.4345684051513672, -0.40234875679016113, -0.3701290488243103, -0.33790937066078186, -0.3056896924972534, -0.2734699845314026, -0.24125030636787415, -0.2090306282043457, -0.17681093513965607, -0.14459125697612762, -0.11237157881259918, -0.08015188574790955, -0.047932207584381104, -0.01571252942085266, 0.01650715246796608, 0.04872683435678482, 0.08094651997089386, 0.1131661981344223, 0.14538587629795074, 0.17760556936264038, 0.20982524752616882, 0.24204492568969727, 0.2742646038532257, 0.30648428201675415, 0.338703989982605, 0.37092363834381104, 0.40314334630966187, 0.4353630244731903, 0.46758270263671875, 0.4998023808002472, 0.5320220589637756, 0.5642417669296265, 0.5964614152908325, 0.6286811232566833, 0.6609007716178894, 0.6931204795837402, 0.7253401279449463, 0.7575598359107971]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 10.0, 5.0, 5.0, 7.0, 13.0, 10.0, 10.0, 16.0, 23.0, 28.0, 27.0, 28.0, 33.0, 41.0, 42.0, 39.0, 42.0, 38.0, 42.0, 54.0, 49.0, 33.0, 44.0, 49.0, 38.0, 25.0, 32.0, 24.0, 27.0, 27.0, 22.0, 21.0, 14.0, 12.0, 12.0, 13.0, 8.0, 9.0, 8.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.6679368019104004, -0.6468158960342407, -0.6256949305534363, -0.6045740246772766, -0.5834530591964722, -0.5623321533203125, -0.5412112474441528, -0.5200903415679932, -0.4989693760871887, -0.47784844040870667, -0.4567275047302246, -0.43560659885406494, -0.4144856631755829, -0.39336472749710083, -0.37224382162094116, -0.3511228859424591, -0.33000195026397705, -0.308881014585495, -0.28776007890701294, -0.26663917303085327, -0.24551823735237122, -0.22439730167388916, -0.2032763808965683, -0.18215546011924744, -0.16103452444076538, -0.13991358876228333, -0.11879266798496246, -0.097671739757061, -0.07655081152915955, -0.05542988330125809, -0.03430895507335663, -0.013188034296035767, 0.007932960987091064, 0.029053889214992523, 0.05017481744289398, 0.07129574567079544, 0.0924166738986969, 0.11353760212659836, 0.13465853035449982, 0.15577945113182068, 0.17690038681030273, 0.1980213224887848, 0.21914224326610565, 0.2402631640434265, 0.26138409972190857, 0.2825050354003906, 0.3036259412765503, 0.32474687695503235, 0.3458678126335144, 0.36698874831199646, 0.3881096839904785, 0.4092305898666382, 0.43035152554512024, 0.4514724612236023, 0.47259336709976196, 0.493714302778244, 0.5148352384567261, 0.5359561443328857, 0.5570771098136902, 0.5781980156898499, 0.5993189811706543, 0.620439887046814, 0.6415607929229736, 0.6626816987991333, 0.6838026642799377]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 9.0, 14.0, 17.0, 21.0, 39.0, 73.0, 83.0, 117.0, 202.0, 319.0, 668.0, 2412.0, 42566.0, 2019285.0, 2074408.0, 49182.0, 3308.0, 650.0, 288.0, 199.0, 110.0, 98.0, 68.0, 39.0, 35.0, 22.0, 18.0, 12.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4189453125, -0.4062538146972656, -0.39356231689453125, -0.3808708190917969, -0.3681793212890625, -0.3554878234863281, -0.34279632568359375, -0.3301048278808594, -0.317413330078125, -0.3047218322753906, -0.29203033447265625, -0.2793388366699219, -0.2666473388671875, -0.2539558410644531, -0.24126434326171875, -0.22857284545898438, -0.21588134765625, -0.20318984985351562, -0.19049835205078125, -0.17780685424804688, -0.1651153564453125, -0.15242385864257812, -0.13973236083984375, -0.12704086303710938, -0.114349365234375, -0.10165786743164062, -0.08896636962890625, -0.07627487182617188, -0.0635833740234375, -0.050891876220703125, -0.03820037841796875, -0.025508880615234375, -0.0128173828125, -0.000125885009765625, 0.01256561279296875, 0.025257110595703125, 0.0379486083984375, 0.050640106201171875, 0.06333160400390625, 0.07602310180664062, 0.088714599609375, 0.10140609741210938, 0.11409759521484375, 0.12678909301757812, 0.1394805908203125, 0.15217208862304688, 0.16486358642578125, 0.17755508422851562, 0.19024658203125, 0.20293807983398438, 0.21562957763671875, 0.22832107543945312, 0.2410125732421875, 0.2537040710449219, 0.26639556884765625, 0.2790870666503906, 0.291778564453125, 0.3044700622558594, 0.31716156005859375, 0.3298530578613281, 0.3425445556640625, 0.3552360534667969, 0.36792755126953125, 0.3806190490722656, 0.393310546875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 6.0, 12.0, 28.0, 22.0, 27.0, 28.0, 42.0, 39.0, 50.0, 61.0, 73.0, 50.0, 56.0, 64.0, 68.0, 51.0, 46.0, 52.0, 39.0, 54.0, 28.0, 21.0, 17.0, 16.0, 14.0, 11.0, 7.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17578125, -0.17123985290527344, -0.16669845581054688, -0.1621570587158203, -0.15761566162109375, -0.1530742645263672, -0.14853286743164062, -0.14399147033691406, -0.1394500732421875, -0.13490867614746094, -0.13036727905273438, -0.1258258819580078, -0.12128448486328125, -0.11674308776855469, -0.11220169067382812, -0.10766029357910156, -0.103118896484375, -0.09857749938964844, -0.09403610229492188, -0.08949470520019531, -0.08495330810546875, -0.08041191101074219, -0.07587051391601562, -0.07132911682128906, -0.0667877197265625, -0.06224632263183594, -0.057704925537109375, -0.05316352844238281, -0.04862213134765625, -0.04408073425292969, -0.039539337158203125, -0.03499794006347656, -0.03045654296875, -0.025915145874023438, -0.021373748779296875, -0.016832351684570312, -0.01229095458984375, -0.0077495574951171875, -0.003208160400390625, 0.0013332366943359375, 0.0058746337890625, 0.010416030883789062, 0.014957427978515625, 0.019498825073242188, 0.02404022216796875, 0.028581619262695312, 0.033123016357421875, 0.03766441345214844, 0.042205810546875, 0.04674720764160156, 0.051288604736328125, 0.05583000183105469, 0.06037139892578125, 0.06491279602050781, 0.06945419311523438, 0.07399559020996094, 0.0785369873046875, 0.08307838439941406, 0.08761978149414062, 0.09216117858886719, 0.09670257568359375, 0.10124397277832031, 0.10578536987304688, 0.11032676696777344, 0.1148681640625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 1.0, 3.0, 4.0, 12.0, 19.0, 22.0, 35.0, 56.0, 66.0, 114.0, 181.0, 303.0, 654.0, 1631.0, 5501.0, 35472.0, 828336.0, 3195311.0, 110401.0, 11383.0, 2754.0, 997.0, 434.0, 209.0, 129.0, 82.0, 61.0, 45.0, 24.0, 18.0, 8.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36962890625, -0.35882568359375, -0.3480224609375, -0.33721923828125, -0.326416015625, -0.31561279296875, -0.3048095703125, -0.29400634765625, -0.283203125, -0.27239990234375, -0.2615966796875, -0.25079345703125, -0.239990234375, -0.22918701171875, -0.2183837890625, -0.20758056640625, -0.19677734375, -0.18597412109375, -0.1751708984375, -0.16436767578125, -0.153564453125, -0.14276123046875, -0.1319580078125, -0.12115478515625, -0.1103515625, -0.09954833984375, -0.0887451171875, -0.07794189453125, -0.067138671875, -0.05633544921875, -0.0455322265625, -0.03472900390625, -0.02392578125, -0.01312255859375, -0.0023193359375, 0.00848388671875, 0.019287109375, 0.03009033203125, 0.0408935546875, 0.05169677734375, 0.0625, 0.07330322265625, 0.0841064453125, 0.09490966796875, 0.105712890625, 0.11651611328125, 0.1273193359375, 0.13812255859375, 0.14892578125, 0.15972900390625, 0.1705322265625, 0.18133544921875, 0.192138671875, 0.20294189453125, 0.2137451171875, 0.22454833984375, 0.2353515625, 0.24615478515625, 0.2569580078125, 0.26776123046875, 0.278564453125, 0.28936767578125, 0.3001708984375, 0.31097412109375, 0.32177734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 7.0, 6.0, 14.0, 20.0, 27.0, 27.0, 50.0, 86.0, 137.0, 204.0, 281.0, 365.0, 473.0, 586.0, 513.0, 397.0, 281.0, 200.0, 145.0, 72.0, 67.0, 35.0, 19.0, 17.0, 16.0, 14.0, 5.0, 6.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.189208984375, -0.18048858642578125, -0.1717681884765625, -0.16304779052734375, -0.154327392578125, -0.14560699462890625, -0.1368865966796875, -0.12816619873046875, -0.11944580078125, -0.11072540283203125, -0.1020050048828125, -0.09328460693359375, -0.084564208984375, -0.07584381103515625, -0.0671234130859375, -0.05840301513671875, -0.0496826171875, -0.04096221923828125, -0.0322418212890625, -0.02352142333984375, -0.014801025390625, -0.00608062744140625, 0.0026397705078125, 0.01136016845703125, 0.02008056640625, 0.02880096435546875, 0.0375213623046875, 0.04624176025390625, 0.054962158203125, 0.06368255615234375, 0.0724029541015625, 0.08112335205078125, 0.08984375, 0.09856414794921875, 0.1072845458984375, 0.11600494384765625, 0.124725341796875, 0.13344573974609375, 0.1421661376953125, 0.15088653564453125, 0.15960693359375, 0.16832733154296875, 0.1770477294921875, 0.18576812744140625, 0.194488525390625, 0.20320892333984375, 0.2119293212890625, 0.22064971923828125, 0.2293701171875, 0.23809051513671875, 0.2468109130859375, 0.25553131103515625, 0.264251708984375, 0.27297210693359375, 0.2816925048828125, 0.29041290283203125, 0.29913330078125, 0.30785369873046875, 0.3165740966796875, 0.32529449462890625, 0.334014892578125, 0.34273529052734375, 0.3514556884765625, 0.36017608642578125, 0.368896484375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 12.0, 36.0, 61.0, 127.0, 235.0, 220.0, 157.0, 71.0, 40.0, 14.0, 14.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.567248821258545, -2.4327948093414307, -2.2983407974243164, -2.163886785507202, -2.029432773590088, -1.8949787616729736, -1.7605247497558594, -1.6260707378387451, -1.4916167259216309, -1.3571627140045166, -1.2227087020874023, -1.088254690170288, -0.9538006782531738, -0.8193466663360596, -0.6848926544189453, -0.550438642501831, -0.4159846305847168, -0.28153061866760254, -0.14707660675048828, -0.012622594833374023, 0.12183141708374023, 0.2562854290008545, 0.39073944091796875, 0.525193452835083, 0.6596474647521973, 0.7941014766693115, 0.9285554885864258, 1.06300950050354, 1.1974635124206543, 1.3319175243377686, 1.4663715362548828, 1.600825548171997, 1.7352790832519531, 1.8697330951690674, 2.0041871070861816, 2.138641119003296, 2.27309513092041, 2.4075491428375244, 2.5420031547546387, 2.676457166671753, 2.810911178588867, 2.9453651905059814, 3.0798192024230957, 3.21427321434021, 3.348727226257324, 3.4831812381744385, 3.6176352500915527, 3.752089262008667, 3.8865432739257812, 4.020997047424316, 4.15545129776001, 4.289905548095703, 4.424359321594238, 4.558813095092773, 4.693267345428467, 4.82772159576416, 4.962175369262695, 5.0966291427612305, 5.231083393096924, 5.365537643432617, 5.499991416931152, 5.6344451904296875, 5.768899440765381, 5.903353691101074, 6.037807464599609]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 4.0, 7.0, 6.0, 14.0, 11.0, 15.0, 20.0, 29.0, 34.0, 34.0, 42.0, 39.0, 47.0, 59.0, 68.0, 53.0, 58.0, 47.0, 56.0, 62.0, 58.0, 40.0, 41.0, 35.0, 28.0, 24.0, 20.0, 11.0, 6.0, 14.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.34394371509552, -1.3013237714767456, -1.2587037086486816, -1.2160837650299072, -1.1734638214111328, -1.1308438777923584, -1.0882238149642944, -1.04560387134552, -1.002983808517456, -0.9603638052940369, -0.9177438616752625, -0.8751238584518433, -0.8325039148330688, -0.7898839116096497, -0.7472639083862305, -0.704643964767456, -0.6620240211486816, -0.6194040179252625, -0.576784074306488, -0.5341640710830688, -0.49154409766197205, -0.44892412424087524, -0.40630412101745605, -0.36368414759635925, -0.32106417417526245, -0.27844420075416565, -0.23582421243190765, -0.19320422410964966, -0.15058425068855286, -0.10796427726745605, -0.06534427404403687, -0.022724300622940063, 0.01989579200744629, 0.06251577287912369, 0.10513575375080109, 0.14775574207305908, 0.19037571549415588, 0.23299568891525269, 0.2756156921386719, 0.3182356655597687, 0.3608556389808655, 0.4034756124019623, 0.4460955858230591, 0.48871558904647827, 0.5313355922698975, 0.5739555358886719, 0.6165755391120911, 0.6591955423355103, 0.7018154859542847, 0.7444354891777039, 0.7870554327964783, 0.8296754360198975, 0.8722953796386719, 0.9149153828620911, 0.9575353860855103, 1.0001553297042847, 1.0427753925323486, 1.085395336151123, 1.128015398979187, 1.1706353425979614, 1.2132552862167358, 1.2558753490447998, 1.2984952926635742, 1.3411152362823486, 1.383735179901123]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 8.0, 10.0, 11.0, 23.0, 19.0, 28.0, 30.0, 51.0, 59.0, 93.0, 131.0, 208.0, 282.0, 489.0, 785.0, 1563.0, 3675.0, 12070.0, 75499.0, 696926.0, 222480.0, 23532.0, 5623.0, 2205.0, 1106.0, 570.0, 339.0, 203.0, 144.0, 126.0, 79.0, 55.0, 40.0, 22.0, 22.0, 14.0, 7.0, 11.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.354248046875, -0.34485435485839844, -0.3354606628417969, -0.3260669708251953, -0.31667327880859375, -0.3072795867919922, -0.2978858947753906, -0.28849220275878906, -0.2790985107421875, -0.26970481872558594, -0.2603111267089844, -0.2509174346923828, -0.24152374267578125, -0.2321300506591797, -0.22273635864257812, -0.21334266662597656, -0.203948974609375, -0.19455528259277344, -0.18516159057617188, -0.1757678985595703, -0.16637420654296875, -0.1569805145263672, -0.14758682250976562, -0.13819313049316406, -0.1287994384765625, -0.11940574645996094, -0.11001205444335938, -0.10061836242675781, -0.09122467041015625, -0.08183097839355469, -0.07243728637695312, -0.06304359436035156, -0.05364990234375, -0.04425621032714844, -0.034862518310546875, -0.025468826293945312, -0.01607513427734375, -0.0066814422607421875, 0.002712249755859375, 0.012105941772460938, 0.0214996337890625, 0.030893325805664062, 0.040287017822265625, 0.04968070983886719, 0.05907440185546875, 0.06846809387207031, 0.07786178588867188, 0.08725547790527344, 0.096649169921875, 0.10604286193847656, 0.11543655395507812, 0.12483024597167969, 0.13422393798828125, 0.1436176300048828, 0.15301132202148438, 0.16240501403808594, 0.1717987060546875, 0.18119239807128906, 0.19058609008789062, 0.1999797821044922, 0.20937347412109375, 0.2187671661376953, 0.22816085815429688, 0.23755455017089844, 0.2469482421875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 8.0, 1.0, 9.0, 7.0, 4.0, 12.0, 12.0, 16.0, 18.0, 19.0, 26.0, 33.0, 41.0, 55.0, 50.0, 55.0, 54.0, 65.0, 68.0, 51.0, 64.0, 52.0, 39.0, 46.0, 37.0, 30.0, 22.0, 20.0, 26.0, 14.0, 9.0, 15.0, 8.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.2135009765625, -0.2079029083251953, -0.20230484008789062, -0.19670677185058594, -0.19110870361328125, -0.18551063537597656, -0.17991256713867188, -0.1743144989013672, -0.1687164306640625, -0.1631183624267578, -0.15752029418945312, -0.15192222595214844, -0.14632415771484375, -0.14072608947753906, -0.13512802124023438, -0.1295299530029297, -0.123931884765625, -0.11833381652832031, -0.11273574829101562, -0.10713768005371094, -0.10153961181640625, -0.09594154357910156, -0.09034347534179688, -0.08474540710449219, -0.0791473388671875, -0.07354927062988281, -0.06795120239257812, -0.06235313415527344, -0.05675506591796875, -0.05115699768066406, -0.045558929443359375, -0.03996086120605469, -0.03436279296875, -0.028764724731445312, -0.023166656494140625, -0.017568588256835938, -0.01197052001953125, -0.0063724517822265625, -0.000774383544921875, 0.0048236846923828125, 0.0104217529296875, 0.016019821166992188, 0.021617889404296875, 0.027215957641601562, 0.03281402587890625, 0.03841209411621094, 0.044010162353515625, 0.04960823059082031, 0.055206298828125, 0.06080436706542969, 0.06640243530273438, 0.07200050354003906, 0.07759857177734375, 0.08319664001464844, 0.08879470825195312, 0.09439277648925781, 0.0999908447265625, 0.10558891296386719, 0.11118698120117188, 0.11678504943847656, 0.12238311767578125, 0.12798118591308594, 0.13357925415039062, 0.1391773223876953, 0.144775390625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 2.0, 7.0, 9.0, 10.0, 20.0, 19.0, 19.0, 39.0, 48.0, 46.0, 87.0, 101.0, 181.0, 371.0, 1131.0, 7023.0, 181966.0, 833693.0, 20402.0, 2099.0, 523.0, 256.0, 140.0, 114.0, 62.0, 47.0, 28.0, 22.0, 25.0, 18.0, 9.0, 11.0, 6.0, 4.0, 4.0, 6.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3798828125, -0.3693885803222656, -0.35889434814453125, -0.3484001159667969, -0.3379058837890625, -0.3274116516113281, -0.31691741943359375, -0.3064231872558594, -0.295928955078125, -0.2854347229003906, -0.27494049072265625, -0.2644462585449219, -0.2539520263671875, -0.24345779418945312, -0.23296356201171875, -0.22246932983398438, -0.21197509765625, -0.20148086547851562, -0.19098663330078125, -0.18049240112304688, -0.1699981689453125, -0.15950393676757812, -0.14900970458984375, -0.13851547241210938, -0.128021240234375, -0.11752700805664062, -0.10703277587890625, -0.09653854370117188, -0.0860443115234375, -0.07555007934570312, -0.06505584716796875, -0.054561614990234375, -0.0440673828125, -0.033573150634765625, -0.02307891845703125, -0.012584686279296875, -0.0020904541015625, 0.008403778076171875, 0.01889801025390625, 0.029392242431640625, 0.039886474609375, 0.050380706787109375, 0.06087493896484375, 0.07136917114257812, 0.0818634033203125, 0.09235763549804688, 0.10285186767578125, 0.11334609985351562, 0.12384033203125, 0.13433456420898438, 0.14482879638671875, 0.15532302856445312, 0.1658172607421875, 0.17631149291992188, 0.18680572509765625, 0.19729995727539062, 0.207794189453125, 0.21828842163085938, 0.22878265380859375, 0.23927688598632812, 0.2497711181640625, 0.2602653503417969, 0.27075958251953125, 0.2812538146972656, 0.291748046875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 9.0, 7.0, 5.0, 9.0, 11.0, 16.0, 20.0, 23.0, 20.0, 43.0, 24.0, 51.0, 46.0, 53.0, 54.0, 48.0, 68.0, 62.0, 69.0, 50.0, 42.0, 31.0, 52.0, 38.0, 33.0, 29.0, 23.0, 14.0, 11.0, 10.0, 6.0, 6.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34375, -0.3329429626464844, -0.32213592529296875, -0.3113288879394531, -0.3005218505859375, -0.2897148132324219, -0.27890777587890625, -0.2681007385253906, -0.257293701171875, -0.24648666381835938, -0.23567962646484375, -0.22487258911132812, -0.2140655517578125, -0.20325851440429688, -0.19245147705078125, -0.18164443969726562, -0.17083740234375, -0.16003036499023438, -0.14922332763671875, -0.13841629028320312, -0.1276092529296875, -0.11680221557617188, -0.10599517822265625, -0.09518814086914062, -0.084381103515625, -0.07357406616210938, -0.06276702880859375, -0.051959991455078125, -0.0411529541015625, -0.030345916748046875, -0.01953887939453125, -0.008731842041015625, 0.0020751953125, 0.012882232666015625, 0.02368927001953125, 0.034496307373046875, 0.0453033447265625, 0.056110382080078125, 0.06691741943359375, 0.07772445678710938, 0.088531494140625, 0.09933853149414062, 0.11014556884765625, 0.12095260620117188, 0.1317596435546875, 0.14256668090820312, 0.15337371826171875, 0.16418075561523438, 0.17498779296875, 0.18579483032226562, 0.19660186767578125, 0.20740890502929688, 0.2182159423828125, 0.22902297973632812, 0.23983001708984375, 0.2506370544433594, 0.261444091796875, 0.2722511291503906, 0.28305816650390625, 0.2938652038574219, 0.3046722412109375, 0.3154792785644531, 0.32628631591796875, 0.3370933532714844, 0.347900390625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 6.0, 6.0, 9.0, 16.0, 21.0, 21.0, 27.0, 37.0, 77.0, 140.0, 161.0, 348.0, 841.0, 3320.0, 24686.0, 469083.0, 518274.0, 26236.0, 3397.0, 899.0, 391.0, 183.0, 122.0, 49.0, 49.0, 41.0, 22.0, 17.0, 14.0, 10.0, 9.0, 6.0, 4.0, 3.0, 1.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.059906005859375, -0.058034420013427734, -0.05616283416748047, -0.0542912483215332, -0.05241966247558594, -0.05054807662963867, -0.048676490783691406, -0.04680490493774414, -0.044933319091796875, -0.04306173324584961, -0.041190147399902344, -0.03931856155395508, -0.03744697570800781, -0.03557538986206055, -0.03370380401611328, -0.031832218170166016, -0.02996063232421875, -0.028089046478271484, -0.02621746063232422, -0.024345874786376953, -0.022474288940429688, -0.020602703094482422, -0.018731117248535156, -0.01685953140258789, -0.014987945556640625, -0.01311635971069336, -0.011244773864746094, -0.009373188018798828, -0.0075016021728515625, -0.005630016326904297, -0.0037584304809570312, -0.0018868446350097656, -1.52587890625e-05, 0.0018563270568847656, 0.0037279129028320312, 0.005599498748779297, 0.0074710845947265625, 0.009342670440673828, 0.011214256286621094, 0.01308584213256836, 0.014957427978515625, 0.01682901382446289, 0.018700599670410156, 0.020572185516357422, 0.022443771362304688, 0.024315357208251953, 0.02618694305419922, 0.028058528900146484, 0.02993011474609375, 0.031801700592041016, 0.03367328643798828, 0.03554487228393555, 0.03741645812988281, 0.03928804397583008, 0.041159629821777344, 0.04303121566772461, 0.044902801513671875, 0.04677438735961914, 0.048645973205566406, 0.05051755905151367, 0.05238914489746094, 0.0542607307434082, 0.05613231658935547, 0.058003902435302734, 0.05987548828125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 7.0, 3.0, 2.0, 5.0, 5.0, 16.0, 11.0, 24.0, 14.0, 16.0, 46.0, 31.0, 29.0, 53.0, 55.0, 56.0, 60.0, 79.0, 64.0, 56.0, 60.0, 52.0, 37.0, 30.0, 37.0, 31.0, 23.0, 11.0, 12.0, 16.0, 7.0, 12.0, 11.0, 7.0, 5.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.298324584960938e-06, -8.987262845039368e-06, -8.676201105117798e-06, -8.365139365196228e-06, -8.054077625274658e-06, -7.743015885353088e-06, -7.4319541454315186e-06, -7.120892405509949e-06, -6.809830665588379e-06, -6.498768925666809e-06, -6.187707185745239e-06, -5.8766454458236694e-06, -5.5655837059021e-06, -5.25452196598053e-06, -4.94346022605896e-06, -4.63239848613739e-06, -4.32133674621582e-06, -4.0102750062942505e-06, -3.6992132663726807e-06, -3.388151526451111e-06, -3.077089786529541e-06, -2.766028046607971e-06, -2.4549663066864014e-06, -2.1439045667648315e-06, -1.8328428268432617e-06, -1.521781086921692e-06, -1.210719347000122e-06, -8.996576070785522e-07, -5.885958671569824e-07, -2.775341272354126e-07, 3.3527612686157227e-08, 3.4458935260772705e-07, 6.556510925292969e-07, 9.667128324508667e-07, 1.2777745723724365e-06, 1.5888363122940063e-06, 1.8998980522155762e-06, 2.210959792137146e-06, 2.522021532058716e-06, 2.8330832719802856e-06, 3.1441450119018555e-06, 3.4552067518234253e-06, 3.766268491744995e-06, 4.077330231666565e-06, 4.388391971588135e-06, 4.699453711509705e-06, 5.010515451431274e-06, 5.321577191352844e-06, 5.632638931274414e-06, 5.943700671195984e-06, 6.254762411117554e-06, 6.5658241510391235e-06, 6.876885890960693e-06, 7.187947630882263e-06, 7.499009370803833e-06, 7.810071110725403e-06, 8.121132850646973e-06, 8.432194590568542e-06, 8.743256330490112e-06, 9.054318070411682e-06, 9.365379810333252e-06, 9.676441550254822e-06, 9.987503290176392e-06, 1.0298565030097961e-05, 1.0609626770019531e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 5.0, 8.0, 12.0, 17.0, 40.0, 70.0, 105.0, 176.0, 455.0, 2020.0, 25185.0, 881372.0, 132616.0, 5135.0, 837.0, 244.0, 115.0, 54.0, 35.0, 27.0, 12.0, 6.0, 6.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.114501953125, -0.11154460906982422, -0.10858726501464844, -0.10562992095947266, -0.10267257690429688, -0.0997152328491211, -0.09675788879394531, -0.09380054473876953, -0.09084320068359375, -0.08788585662841797, -0.08492851257324219, -0.0819711685180664, -0.07901382446289062, -0.07605648040771484, -0.07309913635253906, -0.07014179229736328, -0.0671844482421875, -0.06422710418701172, -0.06126976013183594, -0.058312416076660156, -0.055355072021484375, -0.052397727966308594, -0.04944038391113281, -0.04648303985595703, -0.04352569580078125, -0.04056835174560547, -0.03761100769042969, -0.034653663635253906, -0.031696319580078125, -0.028738975524902344, -0.025781631469726562, -0.02282428741455078, -0.019866943359375, -0.01690959930419922, -0.013952255249023438, -0.010994911193847656, -0.008037567138671875, -0.005080223083496094, -0.0021228790283203125, 0.0008344650268554688, 0.00379180908203125, 0.006749153137207031, 0.009706497192382812, 0.012663841247558594, 0.015621185302734375, 0.018578529357910156, 0.021535873413085938, 0.02449321746826172, 0.0274505615234375, 0.03040790557861328, 0.03336524963378906, 0.036322593688964844, 0.039279937744140625, 0.042237281799316406, 0.04519462585449219, 0.04815196990966797, 0.05110931396484375, 0.05406665802001953, 0.05702400207519531, 0.059981346130371094, 0.06293869018554688, 0.06589603424072266, 0.06885337829589844, 0.07181072235107422, 0.07476806640625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 14.0, 22.0, 22.0, 39.0, 37.0, 56.0, 74.0, 62.0, 82.0, 80.0, 80.0, 94.0, 68.0, 64.0, 50.0, 47.0, 35.0, 13.0, 24.0, 11.0, 6.0, 5.0, 7.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.062347412109375, -0.06067609786987305, -0.059004783630371094, -0.05733346939086914, -0.05566215515136719, -0.053990840911865234, -0.05231952667236328, -0.05064821243286133, -0.048976898193359375, -0.04730558395385742, -0.04563426971435547, -0.043962955474853516, -0.04229164123535156, -0.04062032699584961, -0.038949012756347656, -0.0372776985168457, -0.03560638427734375, -0.0339350700378418, -0.032263755798339844, -0.03059244155883789, -0.028921127319335938, -0.027249813079833984, -0.02557849884033203, -0.023907184600830078, -0.022235870361328125, -0.020564556121826172, -0.01889324188232422, -0.017221927642822266, -0.015550613403320312, -0.01387929916381836, -0.012207984924316406, -0.010536670684814453, -0.0088653564453125, -0.007194042205810547, -0.005522727966308594, -0.0038514137268066406, -0.0021800994873046875, -0.0005087852478027344, 0.0011625289916992188, 0.002833843231201172, 0.004505157470703125, 0.006176471710205078, 0.007847785949707031, 0.009519100189208984, 0.011190414428710938, 0.01286172866821289, 0.014533042907714844, 0.016204357147216797, 0.01787567138671875, 0.019546985626220703, 0.021218299865722656, 0.02288961410522461, 0.024560928344726562, 0.026232242584228516, 0.02790355682373047, 0.029574871063232422, 0.031246185302734375, 0.03291749954223633, 0.03458881378173828, 0.036260128021240234, 0.03793144226074219, 0.03960275650024414, 0.041274070739746094, 0.04294538497924805, 0.04461669921875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 9.0, 10.0, 33.0, 93.0, 220.0, 325.0, 175.0, 86.0, 31.0, 15.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.654874324798584, -2.5964503288269043, -2.5380263328552246, -2.479602336883545, -2.4211783409118652, -2.3627543449401855, -2.304330348968506, -2.245906352996826, -2.1874823570251465, -2.129058361053467, -2.070634365081787, -2.0122103691101074, -1.9537863731384277, -1.895362377166748, -1.8369383811950684, -1.7785143852233887, -1.7200902700424194, -1.6616662740707397, -1.60324227809906, -1.5448182821273804, -1.4863942861557007, -1.427970290184021, -1.3695461750030518, -1.311122179031372, -1.2526981830596924, -1.1942741870880127, -1.135850191116333, -1.0774261951446533, -1.0190021991729736, -0.960578203201294, -0.9021541476249695, -0.8437301516532898, -0.7853060960769653, -0.7268821001052856, -0.668458104133606, -0.6100341081619263, -0.5516101121902466, -0.4931860864162445, -0.43476206064224243, -0.37633806467056274, -0.31791406869888306, -0.25949007272720337, -0.2010660618543625, -0.1426420509815216, -0.08421805500984192, -0.02579405903816223, 0.032629966735839844, 0.09105396270751953, 0.14947795867919922, 0.2079019546508789, 0.2663259506225586, 0.32474997639656067, 0.38317397236824036, 0.44159796833992004, 0.5000219941139221, 0.5584459900856018, 0.6168699860572815, 0.6752939820289612, 0.7337179780006409, 0.7921420335769653, 0.850566029548645, 0.9089900255203247, 0.9674140214920044, 1.025838017463684, 1.0842620134353638]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 5.0, 8.0, 17.0, 21.0, 20.0, 24.0, 42.0, 52.0, 73.0, 52.0, 70.0, 78.0, 127.0, 69.0, 81.0, 71.0, 51.0, 27.0, 29.0, 17.0, 18.0, 16.0, 9.0, 6.0, 9.0, 4.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3044617176055908, -1.2703602313995361, -1.236258625984192, -1.2021571397781372, -1.1680556535720825, -1.1339540481567383, -1.0998525619506836, -1.065751075744629, -1.0316495895385742, -0.9975480437278748, -0.9634465575218201, -0.9293450117111206, -0.8952435255050659, -0.8611419796943665, -0.827040433883667, -0.7929389476776123, -0.7588373422622681, -0.7247357964515686, -0.6906343102455139, -0.6565327644348145, -0.6224312782287598, -0.5883297324180603, -0.5542281866073608, -0.5201267004013062, -0.4860251545906067, -0.4519236385822296, -0.41782212257385254, -0.3837205767631531, -0.349619060754776, -0.3155175447463989, -0.28141599893569946, -0.2473144829273224, -0.21321290731430054, -0.17911139130592346, -0.1450098603963852, -0.11090833693742752, -0.07680681347846985, -0.04270529747009277, -0.008603766560554504, 0.025497764348983765, 0.05959928035736084, 0.09370080381631851, 0.12780232727527618, 0.16190385818481445, 0.19600537419319153, 0.2301068902015686, 0.26420843601226807, 0.29830995202064514, 0.3324114680290222, 0.3665129840373993, 0.40061450004577637, 0.43471604585647583, 0.4688175618648529, 0.50291907787323, 0.5370206236839294, 0.5711221694946289, 0.6052236557006836, 0.6393252015113831, 0.6734266877174377, 0.7075282335281372, 0.7416297197341919, 0.7757312655448914, 0.8098328113555908, 0.8439342975616455, 0.878035843372345]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 7.0, 14.0, 16.0, 32.0, 33.0, 56.0, 107.0, 441.0, 112.0, 58.0, 39.0, 32.0, 24.0, 10.0, 8.0, 6.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60791015625, -0.5951061248779297, -0.5823020935058594, -0.5694980621337891, -0.5566940307617188, -0.5438899993896484, -0.5310859680175781, -0.5182819366455078, -0.5054779052734375, -0.4926738739013672, -0.4798698425292969, -0.46706581115722656, -0.45426177978515625, -0.44145774841308594, -0.4286537170410156, -0.4158496856689453, -0.403045654296875, -0.3902416229248047, -0.3774375915527344, -0.36463356018066406, -0.35182952880859375, -0.33902549743652344, -0.3262214660644531, -0.3134174346923828, -0.3006134033203125, -0.2878093719482422, -0.2750053405761719, -0.26220130920410156, -0.24939727783203125, -0.23659324645996094, -0.22378921508789062, -0.2109851837158203, -0.19818115234375, -0.1853771209716797, -0.17257308959960938, -0.15976905822753906, -0.14696502685546875, -0.13416099548339844, -0.12135696411132812, -0.10855293273925781, -0.0957489013671875, -0.08294486999511719, -0.07014083862304688, -0.05733680725097656, -0.04453277587890625, -0.03172874450683594, -0.018924713134765625, -0.0061206817626953125, 0.006683349609375, 0.019487380981445312, 0.032291412353515625, 0.04509544372558594, 0.05789947509765625, 0.07070350646972656, 0.08350753784179688, 0.09631156921386719, 0.1091156005859375, 0.12191963195800781, 0.13472366333007812, 0.14752769470214844, 0.16033172607421875, 0.17313575744628906, 0.18593978881835938, 0.1987438201904297, 0.2115478515625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 5.0, 6.0, 8.0, 11.0, 11.0, 20.0, 29.0, 47.0, 85.0, 108.0, 252.0, 540.0, 1537.0, 6758.0, 230041.0, 8137553.0, 8660.0, 1742.0, 593.0, 245.0, 116.0, 87.0, 43.0, 24.0, 21.0, 16.0, 8.0, 11.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8624014258384705, -0.8384891748428345, -0.8145768642425537, -0.7906646132469177, -0.7667523622512817, -0.7428401112556458, -0.718927800655365, -0.695015549659729, -0.671103298664093, -0.647191047668457, -0.6232787370681763, -0.5993664860725403, -0.5754542350769043, -0.5515419840812683, -0.5276296734809875, -0.5037174224853516, -0.4798051416873932, -0.4558928608894348, -0.43198060989379883, -0.40806832909584045, -0.38415607810020447, -0.3602437973022461, -0.3363315463066101, -0.31241926550865173, -0.28850698471069336, -0.264594703912735, -0.240682452917099, -0.21677017211914062, -0.19285792112350464, -0.16894564032554626, -0.14503337442874908, -0.1211211085319519, -0.09720885753631592, -0.07329659163951874, -0.04938432201743126, -0.02547205239534378, -0.0015597864985466003, 0.02235247939825058, 0.04626475274562836, 0.07017701864242554, 0.09408928453922272, 0.1180015504360199, 0.14191381633281708, 0.16582608222961426, 0.18973836302757263, 0.21365061402320862, 0.237562894821167, 0.261475145816803, 0.28538742661476135, 0.3092997074127197, 0.3332119584083557, 0.3571242392063141, 0.3810364902019501, 0.40494877099990845, 0.42886102199554443, 0.4527733027935028, 0.4766855835914612, 0.5005978345870972, 0.5245101451873779, 0.5484223961830139, 0.5723346471786499, 0.5962468981742859, 0.6201592087745667, 0.6440714597702026, 0.6679837107658386]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 0.0, 3.0, 1.0, 4.0, 5.0, 3.0, 10.0, 4.0, 6.0, 5.0, 8.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2566770613193512, -0.244013249874115, -0.23134943842887878, -0.21868561208248138, -0.20602180063724518, -0.19335798919200897, -0.18069416284561157, -0.16803035140037537, -0.15536653995513916, -0.14270272850990295, -0.13003891706466675, -0.11737509071826935, -0.10471127927303314, -0.09204746782779694, -0.07938364893198013, -0.06671983003616333, -0.054056018590927124, -0.04139220342040062, -0.028728388249874115, -0.01606457307934761, -0.003400757908821106, 0.0092630535364151, 0.021926872432231903, 0.034590691328048706, 0.04725450277328491, 0.05991831794381142, 0.07258213311433792, 0.08524595201015472, 0.09790976345539093, 0.11057357490062714, 0.12323739379644394, 0.13590121269226074, 0.14856499433517456, 0.16122880578041077, 0.17389261722564697, 0.18655644357204437, 0.19922025501728058, 0.21188406646251678, 0.22454789280891418, 0.2372117042541504, 0.2498755156993866, 0.2625393271446228, 0.275203138589859, 0.2878669500350952, 0.3005307912826538, 0.3131945729255676, 0.3258584141731262, 0.3385222256183624, 0.35118603706359863, 0.36384984850883484, 0.37651365995407104, 0.38917747139930725, 0.40184128284454346, 0.41450512409210205, 0.42716893553733826, 0.43983274698257446, 0.45249655842781067, 0.4651603698730469, 0.4778241813182831, 0.4904879927635193, 0.5031518340110779, 0.5158156156539917, 0.5284794569015503, 0.5411432981491089, 0.5538070797920227]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 4.0, 8.0, 7.0, 12.0, 9.0, 11.0, 12.0, 19.0, 15.0, 17.0, 26.0, 42.0, 36.0, 37.0, 42.0, 38.0, 56.0, 51.0, 50.0, 50.0, 58.0, 56.0, 45.0, 33.0, 41.0, 24.0, 37.0, 23.0, 23.0, 19.0, 9.0, 18.0, 12.0, 10.0, 5.0, 9.0, 8.0, 10.0, 4.0, 8.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10198974609375, -0.09874343872070312, -0.09549713134765625, -0.09225082397460938, -0.0890045166015625, -0.08575820922851562, -0.08251190185546875, -0.07926559448242188, -0.076019287109375, -0.07277297973632812, -0.06952667236328125, -0.06628036499023438, -0.0630340576171875, -0.059787750244140625, -0.05654144287109375, -0.053295135498046875, -0.050048828125, -0.046802520751953125, -0.04355621337890625, -0.040309906005859375, -0.0370635986328125, -0.033817291259765625, -0.03057098388671875, -0.027324676513671875, -0.024078369140625, -0.020832061767578125, -0.01758575439453125, -0.014339447021484375, -0.0110931396484375, -0.007846832275390625, -0.00460052490234375, -0.001354217529296875, 0.00189208984375, 0.005138397216796875, 0.00838470458984375, 0.011631011962890625, 0.0148773193359375, 0.018123626708984375, 0.02136993408203125, 0.024616241455078125, 0.027862548828125, 0.031108856201171875, 0.03435516357421875, 0.037601470947265625, 0.0408477783203125, 0.044094085693359375, 0.04734039306640625, 0.050586700439453125, 0.0538330078125, 0.057079315185546875, 0.06032562255859375, 0.06357192993164062, 0.0668182373046875, 0.07006454467773438, 0.07331085205078125, 0.07655715942382812, 0.079803466796875, 0.08304977416992188, 0.08629608154296875, 0.08954238891601562, 0.0927886962890625, 0.09603500366210938, 0.09928131103515625, 0.10252761840820312, 0.10577392578125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 11.0, 12.0, 15.0, 25.0, 42.0, 68.0, 83.0, 139.0, 221.0, 372.0, 646.0, 1188.0, 2460.0, 5682.0, 17010.0, 65772.0, 281853.0, 111086.0, 23733.0, 7530.0, 3006.0, 1464.0, 739.0, 421.0, 247.0, 171.0, 94.0, 59.0, 41.0, 25.0, 20.0, 12.0, 6.0, 6.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6796875, -1.6230316162109375, -1.566375732421875, -1.5097198486328125, -1.45306396484375, -1.3964080810546875, -1.339752197265625, -1.2830963134765625, -1.2264404296875, -1.1697845458984375, -1.113128662109375, -1.0564727783203125, -0.99981689453125, -0.9431610107421875, -0.886505126953125, -0.8298492431640625, -0.773193359375, -0.7165374755859375, -0.659881591796875, -0.6032257080078125, -0.54656982421875, -0.4899139404296875, -0.433258056640625, -0.3766021728515625, -0.3199462890625, -0.2632904052734375, -0.206634521484375, -0.1499786376953125, -0.09332275390625, -0.0366668701171875, 0.019989013671875, 0.0766448974609375, 0.13330078125, 0.1899566650390625, 0.246612548828125, 0.3032684326171875, 0.35992431640625, 0.4165802001953125, 0.473236083984375, 0.5298919677734375, 0.5865478515625, 0.6432037353515625, 0.699859619140625, 0.7565155029296875, 0.81317138671875, 0.8698272705078125, 0.926483154296875, 0.9831390380859375, 1.039794921875, 1.0964508056640625, 1.153106689453125, 1.2097625732421875, 1.26641845703125, 1.3230743408203125, 1.379730224609375, 1.4363861083984375, 1.4930419921875, 1.5496978759765625, 1.606353759765625, 1.6630096435546875, 1.71966552734375, 1.7763214111328125, 1.832977294921875, 1.8896331787109375, 1.9462890625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 6.0, 8.0, 4.0, 3.0, 7.0, 18.0, 20.0, 21.0, 20.0, 28.0, 33.0, 35.0, 55.0, 53.0, 52.0, 57.0, 68.0, 70.0, 59.0, 49.0, 51.0, 41.0, 47.0, 30.0, 39.0, 29.0, 17.0, 12.0, 14.0, 13.0, 12.0, 9.0, 7.0, 5.0, 5.0, 3.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1092529296875, -0.10498809814453125, -0.1007232666015625, -0.09645843505859375, -0.092193603515625, -0.08792877197265625, -0.0836639404296875, -0.07939910888671875, -0.07513427734375, -0.07086944580078125, -0.0666046142578125, -0.06233978271484375, -0.058074951171875, -0.05381011962890625, -0.0495452880859375, -0.04528045654296875, -0.041015625, -0.03675079345703125, -0.0324859619140625, -0.02822113037109375, -0.023956298828125, -0.01969146728515625, -0.0154266357421875, -0.01116180419921875, -0.00689697265625, -0.00263214111328125, 0.0016326904296875, 0.00589752197265625, 0.010162353515625, 0.01442718505859375, 0.0186920166015625, 0.02295684814453125, 0.0272216796875, 0.03148651123046875, 0.0357513427734375, 0.04001617431640625, 0.044281005859375, 0.04854583740234375, 0.0528106689453125, 0.05707550048828125, 0.06134033203125, 0.06560516357421875, 0.0698699951171875, 0.07413482666015625, 0.078399658203125, 0.08266448974609375, 0.0869293212890625, 0.09119415283203125, 0.095458984375, 0.09972381591796875, 0.1039886474609375, 0.10825347900390625, 0.112518310546875, 0.11678314208984375, 0.1210479736328125, 0.12531280517578125, 0.12957763671875, 0.13384246826171875, 0.1381072998046875, 0.14237213134765625, 0.146636962890625, 0.15090179443359375, 0.1551666259765625, 0.15943145751953125, 0.1636962890625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 7.0, 4.0, 1.0, 2.0, 4.0, 7.0, 4.0, 10.0, 16.0, 17.0, 20.0, 28.0, 38.0, 45.0, 47.0, 42.0, 45.0, 36.0, 30.0, 19.0, 10.0, 11.0, 7.0, 7.0, 6.0, 6.0, 6.0, 3.0, 0.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24130772054195404, -0.23242919147014618, -0.22355066239833832, -0.21467213332653046, -0.2057936191558838, -0.19691509008407593, -0.18803656101226807, -0.1791580319404602, -0.17027950286865234, -0.16140097379684448, -0.15252244472503662, -0.14364391565322876, -0.1347653865814209, -0.12588685750961304, -0.11700834333896637, -0.10812981426715851, -0.09925128519535065, -0.09037275612354279, -0.08149422705173492, -0.07261570543050766, -0.0637371763586998, -0.05485864728689194, -0.045980121940374374, -0.03710159659385681, -0.02822306752204895, -0.019344540312886238, -0.010466013103723526, -0.001587485894560814, 0.007291041314601898, 0.01616957038640976, 0.025048095732927322, 0.033926621079444885, 0.04280516505241394, 0.0516836941242218, 0.060562219470739365, 0.06944074481725693, 0.07831927388906479, 0.08719780296087265, 0.09607632458209991, 0.10495485365390778, 0.11383338272571564, 0.1227119117975235, 0.13159044086933136, 0.14046896994113922, 0.1493474841117859, 0.15822601318359375, 0.1671045422554016, 0.17598307132720947, 0.18486160039901733, 0.1937401294708252, 0.20261865854263306, 0.21149718761444092, 0.22037571668624878, 0.22925424575805664, 0.2381327599287033, 0.24701128900051117, 0.2558898329734802, 0.2647683620452881, 0.27364689111709595, 0.2825254201889038, 0.29140394926071167, 0.30028247833251953, 0.3091610074043274, 0.31803953647613525, 0.3269180357456207]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 3.0, 5.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 6.0, 5.0, 5.0, 6.0, 9.0, 7.0, 7.0, 15.0, 16.0, 69.0, 110.0, 70.0, 32.0, 18.0, 13.0, 9.0, 8.0, 6.0, 6.0, 8.0, 11.0, 1.0, 3.0, 8.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3911067843437195, -0.37814080715179443, -0.365174800157547, -0.35220882296562195, -0.3392428457736969, -0.32627683877944946, -0.3133108615875244, -0.30034488439559937, -0.2873789072036743, -0.27441293001174927, -0.26144692301750183, -0.24848094582557678, -0.23551496863365173, -0.2225489765405655, -0.20958298444747925, -0.1966170072555542, -0.18365101516246796, -0.1706850230693817, -0.15771904587745667, -0.14475305378437042, -0.13178707659244537, -0.11882108449935913, -0.10585509985685349, -0.09288911521434784, -0.0799231305718422, -0.06695714592933655, -0.0539911612868309, -0.04102517291903496, -0.028059188276529312, -0.015093199908733368, -0.002127215266227722, 0.010838769376277924, 0.02380475401878357, 0.036770738661289215, 0.04973672330379486, 0.0627027153968811, 0.07566869258880615, 0.0886346846818924, 0.10160066932439804, 0.11456665396690369, 0.12753263115882874, 0.14049862325191498, 0.15346460044384003, 0.16643059253692627, 0.17939656972885132, 0.19236256182193756, 0.2053285539150238, 0.21829453110694885, 0.2312605232000351, 0.24422651529312134, 0.2571924924850464, 0.27015846967697144, 0.28312447667121887, 0.2960904538631439, 0.30905643105506897, 0.3220224380493164, 0.33498841524124146, 0.3479543924331665, 0.36092039942741394, 0.373886376619339, 0.38685235381126404, 0.3998183608055115, 0.4127843379974365, 0.4257503151893616, 0.4387162923812866]}, "eval/loss": 4.923842430114746, "eval/bleu": 0.0, "eval/runtime": 2550.431, "eval/samples_per_second": 5.787, "eval/steps_per_second": 0.723} \ No newline at end of file