diff --git "a/wandb/run-20220310_212039-1nikmzrh/files/wandb-summary.json" "b/wandb/run-20220310_212039-1nikmzrh/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220310_212039-1nikmzrh/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 5.9849, "train/learning_rate": 2.9109263657957245e-05, "train/epoch": 1.68, "train/global_step": 1500, "_runtime": 8584, "_timestamp": 1646955823, "_step": 1500, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 5.0, 6.0, 3.0, 9.0, 8.0, 7.0, 7.0, 14.0, 15.0, 8.0, 15.0, 26.0, 28.0, 23.0, 39.0, 22.0, 36.0, 37.0, 44.0, 43.0, 32.0, 34.0, 39.0, 46.0, 37.0, 41.0, 34.0, 38.0, 30.0, 32.0, 32.0, 32.0, 24.0, 18.0, 23.0, 21.0, 28.0, 13.0, 7.0, 4.0, 12.0, 5.0, 6.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-65.9377670288086, -64.06999969482422, -62.20222854614258, -60.33445739746094, -58.46669006347656, -56.59891891479492, -54.73114776611328, -52.863380432128906, -50.99561309814453, -49.12784194946289, -47.260074615478516, -45.392303466796875, -43.5245361328125, -41.65676498413086, -39.78899383544922, -37.921226501464844, -36.0534553527832, -34.18568420410156, -32.31791687011719, -30.450145721435547, -28.582378387451172, -26.71460723876953, -24.846837997436523, -22.979068756103516, -21.111299514770508, -19.2435302734375, -17.375761032104492, -15.507990837097168, -13.64022159576416, -11.772452354431152, -9.904682159423828, -8.03691291809082, -6.169139862060547, -4.301370620727539, -2.433600902557373, -0.565831184387207, 1.3019380569458008, 3.1697072982788086, 5.037477493286133, 6.905246734619141, 8.773015975952148, 10.640785217285156, 12.508554458618164, 14.376324653625488, 16.244094848632812, 18.111862182617188, 19.979633331298828, 21.847402572631836, 23.715171813964844, 25.58294105529785, 27.45071029663086, 29.3184814453125, 31.186248779296875, 33.054019927978516, 34.921791076660156, 36.78955841064453, 38.657325744628906, 40.52509689331055, 42.39286422729492, 44.26063537597656, 46.12840270996094, 47.99617385864258, 49.86394500732422, 51.731712341308594, 53.599483489990234]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 7.0, 3.0, 5.0, 7.0, 13.0, 8.0, 8.0, 15.0, 25.0, 25.0, 22.0, 30.0, 30.0, 32.0, 25.0, 33.0, 29.0, 39.0, 42.0, 39.0, 38.0, 42.0, 43.0, 44.0, 41.0, 42.0, 34.0, 36.0, 33.0, 26.0, 31.0, 19.0, 23.0, 16.0, 20.0, 10.0, 16.0, 9.0, 7.0, 6.0, 15.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.35487365722656, -66.1024398803711, -63.850006103515625, -61.597572326660156, -59.34513854980469, -57.09270477294922, -54.840274810791016, -52.58784103393555, -50.33540725708008, -48.08297348022461, -45.83053970336914, -43.57810592651367, -41.32567596435547, -39.0732421875, -36.82080841064453, -34.56837463378906, -32.315940856933594, -30.063507080078125, -27.811073303222656, -25.55864143371582, -23.30620765686035, -21.053773880004883, -18.801342010498047, -16.548908233642578, -14.29647445678711, -12.04404067993164, -9.791607856750488, -7.539174556732178, -5.286741256713867, -3.0343074798583984, -0.7818746566772461, 1.4705581665039062, 3.7229843139648438, 5.975417613983154, 8.227850914001465, 10.480283737182617, 12.732717514038086, 14.985151290893555, 17.23758316040039, 19.49001693725586, 21.742450714111328, 23.994884490966797, 26.247318267822266, 28.4997501373291, 30.75218391418457, 33.004615783691406, 35.257049560546875, 37.509483337402344, 39.76191711425781, 42.01435089111328, 44.26678466796875, 46.51921844482422, 48.77165222167969, 51.024085998535156, 53.27651596069336, 55.52894973754883, 57.7813835144043, 60.033817291259766, 62.286251068115234, 64.53868103027344, 66.7911148071289, 69.04354858398438, 71.29598236083984, 73.54841613769531, 75.80084991455078]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [4.0, 5.0, 6.0, 14.0, 14.0, 32.0, 60.0, 73.0, 104.0, 172.0, 248.0, 362.0, 594.0, 837.0, 1243.0, 1901.0, 3029.0, 4748.0, 7530.0, 12575.0, 20610.0, 35733.0, 64203.0, 117699.0, 231027.0, 488927.0, 909407.0, 1019484.0, 634392.0, 301915.0, 149140.0, 79121.0, 44161.0, 25198.0, 15204.0, 9088.0, 5683.0, 3442.0, 2206.0, 1412.0, 952.0, 545.0, 409.0, 276.0, 184.0, 119.0, 82.0, 45.0, 32.0, 20.0, 14.0, 4.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-59.65625, -57.46142578125, -55.2666015625, -53.07177734375, -50.876953125, -48.68212890625, -46.4873046875, -44.29248046875, -42.09765625, -39.90283203125, -37.7080078125, -35.51318359375, -33.318359375, -31.12353515625, -28.9287109375, -26.73388671875, -24.5390625, -22.34423828125, -20.1494140625, -17.95458984375, -15.759765625, -13.56494140625, -11.3701171875, -9.17529296875, -6.98046875, -4.78564453125, -2.5908203125, -0.39599609375, 1.798828125, 3.99365234375, 6.1884765625, 8.38330078125, 10.578125, 12.77294921875, 14.9677734375, 17.16259765625, 19.357421875, 21.55224609375, 23.7470703125, 25.94189453125, 28.13671875, 30.33154296875, 32.5263671875, 34.72119140625, 36.916015625, 39.11083984375, 41.3056640625, 43.50048828125, 45.6953125, 47.89013671875, 50.0849609375, 52.27978515625, 54.474609375, 56.66943359375, 58.8642578125, 61.05908203125, 63.25390625, 65.44873046875, 67.6435546875, 69.83837890625, 72.033203125, 74.22802734375, 76.4228515625, 78.61767578125, 80.8125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 4.0, 0.0, 1.0, 5.0, 4.0, 3.0, 3.0, 7.0, 11.0, 7.0, 7.0, 15.0, 21.0, 20.0, 28.0, 25.0, 31.0, 32.0, 23.0, 36.0, 34.0, 31.0, 35.0, 33.0, 54.0, 46.0, 40.0, 35.0, 42.0, 42.0, 30.0, 51.0, 21.0, 30.0, 20.0, 37.0, 22.0, 20.0, 18.0, 19.0, 14.0, 8.0, 12.0, 5.0, 4.0, 8.0, 8.0, 3.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.71875, -40.31494140625, -38.9111328125, -37.50732421875, -36.103515625, -34.69970703125, -33.2958984375, -31.89208984375, -30.48828125, -29.08447265625, -27.6806640625, -26.27685546875, -24.873046875, -23.46923828125, -22.0654296875, -20.66162109375, -19.2578125, -17.85400390625, -16.4501953125, -15.04638671875, -13.642578125, -12.23876953125, -10.8349609375, -9.43115234375, -8.02734375, -6.62353515625, -5.2197265625, -3.81591796875, -2.412109375, -1.00830078125, 0.3955078125, 1.79931640625, 3.203125, 4.60693359375, 6.0107421875, 7.41455078125, 8.818359375, 10.22216796875, 11.6259765625, 13.02978515625, 14.43359375, 15.83740234375, 17.2412109375, 18.64501953125, 20.048828125, 21.45263671875, 22.8564453125, 24.26025390625, 25.6640625, 27.06787109375, 28.4716796875, 29.87548828125, 31.279296875, 32.68310546875, 34.0869140625, 35.49072265625, 36.89453125, 38.29833984375, 39.7021484375, 41.10595703125, 42.509765625, 43.91357421875, 45.3173828125, 46.72119140625, 48.125]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 7.0, 13.0, 25.0, 50.0, 72.0, 114.0, 149.0, 236.0, 393.0, 558.0, 859.0, 1301.0, 2129.0, 3196.0, 5248.0, 8107.0, 12885.0, 21164.0, 33911.0, 54848.0, 88861.0, 144419.0, 231943.0, 359659.0, 532868.0, 681986.0, 656366.0, 487812.0, 323904.0, 205893.0, 127733.0, 78846.0, 48198.0, 30026.0, 18776.0, 11693.0, 7306.0, 4570.0, 2975.0, 1838.0, 1229.0, 718.0, 516.0, 329.0, 203.0, 121.0, 99.0, 63.0, 33.0, 20.0, 12.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-47.59375, -46.1005859375, -44.607421875, -43.1142578125, -41.62109375, -40.1279296875, -38.634765625, -37.1416015625, -35.6484375, -34.1552734375, -32.662109375, -31.1689453125, -29.67578125, -28.1826171875, -26.689453125, -25.1962890625, -23.703125, -22.2099609375, -20.716796875, -19.2236328125, -17.73046875, -16.2373046875, -14.744140625, -13.2509765625, -11.7578125, -10.2646484375, -8.771484375, -7.2783203125, -5.78515625, -4.2919921875, -2.798828125, -1.3056640625, 0.1875, 1.6806640625, 3.173828125, 4.6669921875, 6.16015625, 7.6533203125, 9.146484375, 10.6396484375, 12.1328125, 13.6259765625, 15.119140625, 16.6123046875, 18.10546875, 19.5986328125, 21.091796875, 22.5849609375, 24.078125, 25.5712890625, 27.064453125, 28.5576171875, 30.05078125, 31.5439453125, 33.037109375, 34.5302734375, 36.0234375, 37.5166015625, 39.009765625, 40.5029296875, 41.99609375, 43.4892578125, 44.982421875, 46.4755859375, 47.96875]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 7.0, 4.0, 6.0, 8.0, 9.0, 11.0, 21.0, 20.0, 29.0, 25.0, 24.0, 45.0, 45.0, 70.0, 90.0, 76.0, 107.0, 126.0, 135.0, 184.0, 219.0, 252.0, 263.0, 319.0, 285.0, 291.0, 268.0, 205.0, 201.0, 158.0, 141.0, 97.0, 97.0, 59.0, 42.0, 34.0, 16.0, 24.0, 16.0, 16.0, 4.0, 9.0, 6.0, 10.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-26.890625, -26.123046875, -25.35546875, -24.587890625, -23.8203125, -23.052734375, -22.28515625, -21.517578125, -20.75, -19.982421875, -19.21484375, -18.447265625, -17.6796875, -16.912109375, -16.14453125, -15.376953125, -14.609375, -13.841796875, -13.07421875, -12.306640625, -11.5390625, -10.771484375, -10.00390625, -9.236328125, -8.46875, -7.701171875, -6.93359375, -6.166015625, -5.3984375, -4.630859375, -3.86328125, -3.095703125, -2.328125, -1.560546875, -0.79296875, -0.025390625, 0.7421875, 1.509765625, 2.27734375, 3.044921875, 3.8125, 4.580078125, 5.34765625, 6.115234375, 6.8828125, 7.650390625, 8.41796875, 9.185546875, 9.953125, 10.720703125, 11.48828125, 12.255859375, 13.0234375, 13.791015625, 14.55859375, 15.326171875, 16.09375, 16.861328125, 17.62890625, 18.396484375, 19.1640625, 19.931640625, 20.69921875, 21.466796875, 22.234375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 6.0, 4.0, 5.0, 9.0, 9.0, 5.0, 8.0, 13.0, 20.0, 27.0, 22.0, 27.0, 19.0, 36.0, 43.0, 37.0, 39.0, 47.0, 48.0, 43.0, 46.0, 44.0, 51.0, 45.0, 47.0, 40.0, 37.0, 28.0, 29.0, 28.0, 18.0, 15.0, 22.0, 15.0, 11.0, 11.0, 6.0, 8.0, 8.0, 7.0, 3.0, 4.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.84572982788086, -47.34406661987305, -45.8424072265625, -44.34074401855469, -42.839080810546875, -41.33742141723633, -39.835758209228516, -38.33409881591797, -36.832435607910156, -35.330772399902344, -33.8291130065918, -32.327449798583984, -30.825788497924805, -29.324127197265625, -27.822463989257812, -26.320802688598633, -24.819141387939453, -23.317480087280273, -21.815818786621094, -20.31415557861328, -18.8124942779541, -17.310832977294922, -15.809170722961426, -14.30750846862793, -12.80584716796875, -11.30418586730957, -9.802523612976074, -8.300861358642578, -6.799200057983398, -5.2975382804870605, -3.7958765029907227, -2.2942142486572266, -0.7925491333007812, 0.7091126441955566, 2.2107744216918945, 3.7124361991882324, 5.21409797668457, 6.715759754180908, 8.217421531677246, 9.719083786010742, 11.220745086669922, 12.722406387329102, 14.224068641662598, 15.725730895996094, 17.227392196655273, 18.729053497314453, 20.230716705322266, 21.732378005981445, 23.234039306640625, 24.735700607299805, 26.237361907958984, 27.739025115966797, 29.240686416625977, 30.742347717285156, 32.24401092529297, 33.74567413330078, 35.24733352661133, 36.74899673461914, 38.25065612792969, 39.7523193359375, 41.25398254394531, 42.75564193725586, 44.25730514526367, 45.75896453857422, 47.26062774658203]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 2.0, 8.0, 9.0, 6.0, 9.0, 7.0, 9.0, 16.0, 13.0, 30.0, 21.0, 14.0, 26.0, 23.0, 35.0, 28.0, 34.0, 40.0, 24.0, 48.0, 44.0, 38.0, 33.0, 42.0, 42.0, 41.0, 37.0, 27.0, 31.0, 29.0, 26.0, 33.0, 32.0, 18.0, 17.0, 15.0, 13.0, 15.0, 6.0, 14.0, 7.0, 11.0, 8.0, 5.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-50.810020446777344, -49.19010543823242, -47.5701904296875, -45.950279235839844, -44.33036422729492, -42.71044921875, -41.09053421020508, -39.470619201660156, -37.8507080078125, -36.23079299926758, -34.610877990722656, -32.990966796875, -31.371051788330078, -29.751136779785156, -28.131221771240234, -26.511306762695312, -24.89139175415039, -23.27147674560547, -21.65156364440918, -20.031648635864258, -18.41173553466797, -16.791820526123047, -15.171905517578125, -13.55199146270752, -11.932077407836914, -10.312163352966309, -8.692249298095703, -7.072334289550781, -5.452420234680176, -3.8325061798095703, -2.2125911712646484, -0.592677116394043, 1.0272369384765625, 2.647151231765747, 4.267065525054932, 5.886980056762695, 7.506894111633301, 9.126808166503906, 10.746723175048828, 12.366637229919434, 13.986551284790039, 15.606465339660645, 17.22637939453125, 18.846294403076172, 20.466209411621094, 22.086122512817383, 23.706037521362305, 25.325950622558594, 26.945865631103516, 28.565780639648438, 30.185693740844727, 31.80560874938965, 33.42552185058594, 35.04543685913086, 36.66535186767578, 38.2852668762207, 39.905181884765625, 41.52509689331055, 43.14501190185547, 44.764923095703125, 46.38483810424805, 48.00475311279297, 49.62466812133789, 51.24458312988281, 52.86449432373047]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 7.0, 14.0, 16.0, 36.0, 39.0, 46.0, 80.0, 82.0, 107.0, 153.0, 232.0, 336.0, 452.0, 708.0, 976.0, 1456.0, 2180.0, 3211.0, 5063.0, 8379.0, 14954.0, 31229.0, 82281.0, 368234.0, 375224.0, 83085.0, 31362.0, 14888.0, 8390.0, 5178.0, 3163.0, 2141.0, 1519.0, 964.0, 671.0, 478.0, 341.0, 241.0, 174.0, 133.0, 98.0, 63.0, 50.0, 32.0, 27.0, 22.0, 18.0, 8.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-39.53125, -38.33349609375, -37.1357421875, -35.93798828125, -34.740234375, -33.54248046875, -32.3447265625, -31.14697265625, -29.94921875, -28.75146484375, -27.5537109375, -26.35595703125, -25.158203125, -23.96044921875, -22.7626953125, -21.56494140625, -20.3671875, -19.16943359375, -17.9716796875, -16.77392578125, -15.576171875, -14.37841796875, -13.1806640625, -11.98291015625, -10.78515625, -9.58740234375, -8.3896484375, -7.19189453125, -5.994140625, -4.79638671875, -3.5986328125, -2.40087890625, -1.203125, -0.00537109375, 1.1923828125, 2.39013671875, 3.587890625, 4.78564453125, 5.9833984375, 7.18115234375, 8.37890625, 9.57666015625, 10.7744140625, 11.97216796875, 13.169921875, 14.36767578125, 15.5654296875, 16.76318359375, 17.9609375, 19.15869140625, 20.3564453125, 21.55419921875, 22.751953125, 23.94970703125, 25.1474609375, 26.34521484375, 27.54296875, 28.74072265625, 29.9384765625, 31.13623046875, 32.333984375, 33.53173828125, 34.7294921875, 35.92724609375, 37.125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 2.0, 6.0, 9.0, 5.0, 10.0, 8.0, 6.0, 18.0, 12.0, 30.0, 22.0, 13.0, 25.0, 25.0, 35.0, 32.0, 26.0, 38.0, 28.0, 42.0, 48.0, 37.0, 31.0, 47.0, 40.0, 44.0, 37.0, 25.0, 28.0, 33.0, 23.0, 35.0, 33.0, 17.0, 22.0, 12.0, 16.0, 12.0, 10.0, 12.0, 6.0, 14.0, 6.0, 5.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-49.71875, -48.14208984375, -46.5654296875, -44.98876953125, -43.412109375, -41.83544921875, -40.2587890625, -38.68212890625, -37.10546875, -35.52880859375, -33.9521484375, -32.37548828125, -30.798828125, -29.22216796875, -27.6455078125, -26.06884765625, -24.4921875, -22.91552734375, -21.3388671875, -19.76220703125, -18.185546875, -16.60888671875, -15.0322265625, -13.45556640625, -11.87890625, -10.30224609375, -8.7255859375, -7.14892578125, -5.572265625, -3.99560546875, -2.4189453125, -0.84228515625, 0.734375, 2.31103515625, 3.8876953125, 5.46435546875, 7.041015625, 8.61767578125, 10.1943359375, 11.77099609375, 13.34765625, 14.92431640625, 16.5009765625, 18.07763671875, 19.654296875, 21.23095703125, 22.8076171875, 24.38427734375, 25.9609375, 27.53759765625, 29.1142578125, 30.69091796875, 32.267578125, 33.84423828125, 35.4208984375, 36.99755859375, 38.57421875, 40.15087890625, 41.7275390625, 43.30419921875, 44.880859375, 46.45751953125, 48.0341796875, 49.61083984375, 51.1875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 5.0, 4.0, 8.0, 10.0, 9.0, 16.0, 30.0, 26.0, 30.0, 45.0, 77.0, 88.0, 125.0, 198.0, 250.0, 328.0, 538.0, 770.0, 1193.0, 1900.0, 3255.0, 6094.0, 13527.0, 41558.0, 245923.0, 607643.0, 83728.0, 21223.0, 8611.0, 4409.0, 2473.0, 1512.0, 913.0, 619.0, 404.0, 271.0, 205.0, 133.0, 106.0, 79.0, 52.0, 42.0, 37.0, 19.0, 14.0, 15.0, 10.0, 6.0, 10.0, 8.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.734375, -30.648681640625, -29.56298828125, -28.477294921875, -27.3916015625, -26.305908203125, -25.22021484375, -24.134521484375, -23.048828125, -21.963134765625, -20.87744140625, -19.791748046875, -18.7060546875, -17.620361328125, -16.53466796875, -15.448974609375, -14.36328125, -13.277587890625, -12.19189453125, -11.106201171875, -10.0205078125, -8.934814453125, -7.84912109375, -6.763427734375, -5.677734375, -4.592041015625, -3.50634765625, -2.420654296875, -1.3349609375, -0.249267578125, 0.83642578125, 1.922119140625, 3.0078125, 4.093505859375, 5.17919921875, 6.264892578125, 7.3505859375, 8.436279296875, 9.52197265625, 10.607666015625, 11.693359375, 12.779052734375, 13.86474609375, 14.950439453125, 16.0361328125, 17.121826171875, 18.20751953125, 19.293212890625, 20.37890625, 21.464599609375, 22.55029296875, 23.635986328125, 24.7216796875, 25.807373046875, 26.89306640625, 27.978759765625, 29.064453125, 30.150146484375, 31.23583984375, 32.321533203125, 33.4072265625, 34.492919921875, 35.57861328125, 36.664306640625, 37.75]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 9.0, 6.0, 4.0, 13.0, 12.0, 10.0, 14.0, 17.0, 19.0, 17.0, 31.0, 21.0, 27.0, 34.0, 30.0, 22.0, 30.0, 34.0, 42.0, 29.0, 41.0, 37.0, 39.0, 38.0, 46.0, 33.0, 47.0, 34.0, 34.0, 26.0, 24.0, 34.0, 26.0, 21.0, 16.0, 13.0, 8.0, 11.0, 16.0, 10.0, 6.0, 7.0, 4.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0], "bins": [-43.5, -42.28564453125, -41.0712890625, -39.85693359375, -38.642578125, -37.42822265625, -36.2138671875, -34.99951171875, -33.78515625, -32.57080078125, -31.3564453125, -30.14208984375, -28.927734375, -27.71337890625, -26.4990234375, -25.28466796875, -24.0703125, -22.85595703125, -21.6416015625, -20.42724609375, -19.212890625, -17.99853515625, -16.7841796875, -15.56982421875, -14.35546875, -13.14111328125, -11.9267578125, -10.71240234375, -9.498046875, -8.28369140625, -7.0693359375, -5.85498046875, -4.640625, -3.42626953125, -2.2119140625, -0.99755859375, 0.216796875, 1.43115234375, 2.6455078125, 3.85986328125, 5.07421875, 6.28857421875, 7.5029296875, 8.71728515625, 9.931640625, 11.14599609375, 12.3603515625, 13.57470703125, 14.7890625, 16.00341796875, 17.2177734375, 18.43212890625, 19.646484375, 20.86083984375, 22.0751953125, 23.28955078125, 24.50390625, 25.71826171875, 26.9326171875, 28.14697265625, 29.361328125, 30.57568359375, 31.7900390625, 33.00439453125, 34.21875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 5.0, 9.0, 9.0, 18.0, 13.0, 12.0, 20.0, 29.0, 23.0, 44.0, 64.0, 78.0, 135.0, 132.0, 200.0, 267.0, 431.0, 564.0, 814.0, 1224.0, 1920.0, 2881.0, 4486.0, 7717.0, 13363.0, 25387.0, 58164.0, 287450.0, 503884.0, 71261.0, 29707.0, 14963.0, 8614.0, 5025.0, 3131.0, 2019.0, 1367.0, 914.0, 637.0, 439.0, 311.0, 232.0, 159.0, 112.0, 77.0, 52.0, 48.0, 40.0, 24.0, 29.0, 20.0, 13.0, 6.0, 4.0, 6.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-9.5859375, -9.2674560546875, -8.948974609375, -8.6304931640625, -8.31201171875, -7.9935302734375, -7.675048828125, -7.3565673828125, -7.0380859375, -6.7196044921875, -6.401123046875, -6.0826416015625, -5.76416015625, -5.4456787109375, -5.127197265625, -4.8087158203125, -4.490234375, -4.1717529296875, -3.853271484375, -3.5347900390625, -3.21630859375, -2.8978271484375, -2.579345703125, -2.2608642578125, -1.9423828125, -1.6239013671875, -1.305419921875, -0.9869384765625, -0.66845703125, -0.3499755859375, -0.031494140625, 0.2869873046875, 0.60546875, 0.9239501953125, 1.242431640625, 1.5609130859375, 1.87939453125, 2.1978759765625, 2.516357421875, 2.8348388671875, 3.1533203125, 3.4718017578125, 3.790283203125, 4.1087646484375, 4.42724609375, 4.7457275390625, 5.064208984375, 5.3826904296875, 5.701171875, 6.0196533203125, 6.338134765625, 6.6566162109375, 6.97509765625, 7.2935791015625, 7.612060546875, 7.9305419921875, 8.2490234375, 8.5675048828125, 8.885986328125, 9.2044677734375, 9.52294921875, 9.8414306640625, 10.159912109375, 10.4783935546875, 10.796875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 1.0, 2.0, 8.0, 4.0, 3.0, 11.0, 9.0, 15.0, 16.0, 18.0, 30.0, 35.0, 54.0, 71.0, 98.0, 154.0, 110.0, 91.0, 78.0, 43.0, 32.0, 25.0, 21.0, 10.0, 10.0, 10.0, 4.0, 10.0, 5.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0014400482177734375, -0.0013997256755828857, -0.001359403133392334, -0.0013190805912017822, -0.0012787580490112305, -0.0012384355068206787, -0.001198112964630127, -0.0011577904224395752, -0.0011174678802490234, -0.0010771453380584717, -0.00103682279586792, -0.0009965002536773682, -0.0009561777114868164, -0.0009158551692962646, -0.0008755326271057129, -0.0008352100849151611, -0.0007948875427246094, -0.0007545650005340576, -0.0007142424583435059, -0.0006739199161529541, -0.0006335973739624023, -0.0005932748317718506, -0.0005529522895812988, -0.0005126297473907471, -0.0004723072052001953, -0.00043198466300964355, -0.0003916621208190918, -0.00035133957862854004, -0.0003110170364379883, -0.0002706944942474365, -0.00023037195205688477, -0.000190049409866333, -0.00014972686767578125, -0.00010940432548522949, -6.908178329467773e-05, -2.8759241104125977e-05, 1.1563301086425781e-05, 5.188584327697754e-05, 9.22083854675293e-05, 0.00013253092765808105, 0.0001728534698486328, 0.00021317601203918457, 0.00025349855422973633, 0.0002938210964202881, 0.00033414363861083984, 0.0003744661808013916, 0.00041478872299194336, 0.0004551112651824951, 0.0004954338073730469, 0.0005357563495635986, 0.0005760788917541504, 0.0006164014339447021, 0.0006567239761352539, 0.0006970465183258057, 0.0007373690605163574, 0.0007776916027069092, 0.0008180141448974609, 0.0008583366870880127, 0.0008986592292785645, 0.0009389817714691162, 0.000979304313659668, 0.0010196268558502197, 0.0010599493980407715, 0.0011002719402313232, 0.001140594482421875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 9.0, 2.0, 7.0, 14.0, 18.0, 23.0, 48.0, 56.0, 91.0, 126.0, 212.0, 290.0, 395.0, 553.0, 908.0, 1128.0, 1725.0, 2424.0, 3544.0, 5177.0, 7383.0, 11042.0, 15992.0, 23388.0, 36125.0, 61095.0, 119672.0, 257322.0, 230421.0, 108269.0, 56461.0, 34077.0, 22202.0, 15080.0, 10354.0, 7044.0, 4757.0, 3388.0, 2376.0, 1674.0, 1125.0, 834.0, 537.0, 390.0, 237.0, 187.0, 135.0, 72.0, 60.0, 40.0, 24.0, 26.0, 9.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-5.421875, -5.24658203125, -5.0712890625, -4.89599609375, -4.720703125, -4.54541015625, -4.3701171875, -4.19482421875, -4.01953125, -3.84423828125, -3.6689453125, -3.49365234375, -3.318359375, -3.14306640625, -2.9677734375, -2.79248046875, -2.6171875, -2.44189453125, -2.2666015625, -2.09130859375, -1.916015625, -1.74072265625, -1.5654296875, -1.39013671875, -1.21484375, -1.03955078125, -0.8642578125, -0.68896484375, -0.513671875, -0.33837890625, -0.1630859375, 0.01220703125, 0.1875, 0.36279296875, 0.5380859375, 0.71337890625, 0.888671875, 1.06396484375, 1.2392578125, 1.41455078125, 1.58984375, 1.76513671875, 1.9404296875, 2.11572265625, 2.291015625, 2.46630859375, 2.6416015625, 2.81689453125, 2.9921875, 3.16748046875, 3.3427734375, 3.51806640625, 3.693359375, 3.86865234375, 4.0439453125, 4.21923828125, 4.39453125, 4.56982421875, 4.7451171875, 4.92041015625, 5.095703125, 5.27099609375, 5.4462890625, 5.62158203125, 5.796875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 3.0, 5.0, 4.0, 6.0, 9.0, 7.0, 7.0, 10.0, 15.0, 17.0, 9.0, 19.0, 21.0, 16.0, 19.0, 17.0, 15.0, 26.0, 34.0, 39.0, 46.0, 94.0, 92.0, 92.0, 55.0, 43.0, 35.0, 29.0, 29.0, 17.0, 17.0, 15.0, 21.0, 24.0, 19.0, 17.0, 12.0, 15.0, 9.0, 5.0, 7.0, 2.0, 3.0, 6.0, 2.0, 3.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.05859375, -1.98187255859375, -1.9051513671875, -1.82843017578125, -1.751708984375, -1.67498779296875, -1.5982666015625, -1.52154541015625, -1.44482421875, -1.36810302734375, -1.2913818359375, -1.21466064453125, -1.137939453125, -1.06121826171875, -0.9844970703125, -0.90777587890625, -0.8310546875, -0.75433349609375, -0.6776123046875, -0.60089111328125, -0.524169921875, -0.44744873046875, -0.3707275390625, -0.29400634765625, -0.21728515625, -0.14056396484375, -0.0638427734375, 0.01287841796875, 0.089599609375, 0.16632080078125, 0.2430419921875, 0.31976318359375, 0.396484375, 0.47320556640625, 0.5499267578125, 0.62664794921875, 0.703369140625, 0.78009033203125, 0.8568115234375, 0.93353271484375, 1.01025390625, 1.08697509765625, 1.1636962890625, 1.24041748046875, 1.317138671875, 1.39385986328125, 1.4705810546875, 1.54730224609375, 1.6240234375, 1.70074462890625, 1.7774658203125, 1.85418701171875, 1.930908203125, 2.00762939453125, 2.0843505859375, 2.16107177734375, 2.23779296875, 2.31451416015625, 2.3912353515625, 2.46795654296875, 2.544677734375, 2.62139892578125, 2.6981201171875, 2.77484130859375, 2.8515625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 1.0, 7.0, 7.0, 4.0, 5.0, 14.0, 6.0, 11.0, 20.0, 17.0, 20.0, 27.0, 34.0, 28.0, 32.0, 42.0, 35.0, 47.0, 44.0, 34.0, 44.0, 39.0, 46.0, 47.0, 43.0, 43.0, 33.0, 38.0, 32.0, 24.0, 22.0, 27.0, 17.0, 14.0, 11.0, 22.0, 8.0, 9.0, 8.0, 10.0, 6.0, 4.0, 4.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-47.906925201416016, -46.50751495361328, -45.10810089111328, -43.70869064331055, -42.30928039550781, -40.90986633300781, -39.51045608520508, -38.111045837402344, -36.711631774902344, -35.31222152709961, -33.91280746459961, -32.513397216796875, -31.113985061645508, -29.71457290649414, -28.315162658691406, -26.91575050354004, -25.516338348388672, -24.116926193237305, -22.717514038085938, -21.318103790283203, -19.918691635131836, -18.51927947998047, -17.119869232177734, -15.720457077026367, -14.321044921875, -12.921632766723633, -11.522221565246582, -10.122810363769531, -8.723398208618164, -7.323986530303955, -5.924574851989746, -4.525163650512695, -3.125751495361328, -1.7263398170471191, -0.32692813873291016, 1.0724835395812988, 2.471895217895508, 3.871306896209717, 5.270718574523926, 6.670129776000977, 8.069541931152344, 9.468954086303711, 10.868365287780762, 12.267776489257812, 13.66718864440918, 15.066600799560547, 16.46601104736328, 17.86542320251465, 19.264835357666016, 20.664247512817383, 22.06365966796875, 23.463069915771484, 24.86248207092285, 26.26189422607422, 27.661304473876953, 29.06071662902832, 30.460128784179688, 31.859540939331055, 33.25895309448242, 34.658363342285156, 36.057777404785156, 37.45718765258789, 38.856597900390625, 40.256011962890625, 41.65542221069336]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 6.0, 2.0, 3.0, 5.0, 11.0, 5.0, 8.0, 7.0, 12.0, 17.0, 14.0, 20.0, 26.0, 20.0, 22.0, 27.0, 25.0, 35.0, 32.0, 34.0, 33.0, 33.0, 47.0, 38.0, 40.0, 36.0, 37.0, 37.0, 47.0, 27.0, 25.0, 38.0, 23.0, 32.0, 30.0, 24.0, 18.0, 15.0, 12.0, 11.0, 12.0, 10.0, 12.0, 9.0, 10.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-49.556034088134766, -47.986114501953125, -46.41619110107422, -44.84627151489258, -43.27635192871094, -41.70642852783203, -40.13650894165039, -38.56658935546875, -36.996665954589844, -35.4267463684082, -33.8568229675293, -32.286903381347656, -30.716983795166016, -29.147062301635742, -27.57714080810547, -26.007221221923828, -24.437301635742188, -22.867380142211914, -21.297460556030273, -19.7275390625, -18.15761947631836, -16.587697982788086, -15.017776489257812, -13.447855949401855, -11.877935409545898, -10.308014869689941, -8.738094329833984, -7.168172836303711, -5.598252296447754, -4.028331756591797, -2.4584102630615234, -0.8884897232055664, 0.6814346313476562, 2.2513554096221924, 3.8212761878967285, 5.391197204589844, 6.961117744445801, 8.531038284301758, 10.100959777832031, 11.670880317687988, 13.240800857543945, 14.810721397399902, 16.38064193725586, 17.950563430786133, 19.520484924316406, 21.090404510498047, 22.66032600402832, 24.230247497558594, 25.800167083740234, 27.370088577270508, 28.94000816345215, 30.509929656982422, 32.07984924316406, 33.64977264404297, 35.21969223022461, 36.78961181640625, 38.359535217285156, 39.9294548034668, 41.4993782043457, 43.069297790527344, 44.639217376708984, 46.209136962890625, 47.77906036376953, 49.34897994995117, 50.91889953613281]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 5.0, 8.0, 9.0, 26.0, 45.0, 58.0, 89.0, 118.0, 203.0, 266.0, 358.0, 573.0, 781.0, 1078.0, 1775.0, 2458.0, 3925.0, 5755.0, 8767.0, 13649.0, 21822.0, 33906.0, 53748.0, 81400.0, 116021.0, 145870.0, 151190.0, 130230.0, 95215.0, 64366.0, 40989.0, 25828.0, 16854.0, 10538.0, 6985.0, 4335.0, 2960.0, 2046.0, 1327.0, 946.0, 636.0, 456.0, 310.0, 204.0, 162.0, 84.0, 51.0, 59.0, 32.0, 19.0, 13.0, 6.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.0, -43.51025390625, -42.0205078125, -40.53076171875, -39.041015625, -37.55126953125, -36.0615234375, -34.57177734375, -33.08203125, -31.59228515625, -30.1025390625, -28.61279296875, -27.123046875, -25.63330078125, -24.1435546875, -22.65380859375, -21.1640625, -19.67431640625, -18.1845703125, -16.69482421875, -15.205078125, -13.71533203125, -12.2255859375, -10.73583984375, -9.24609375, -7.75634765625, -6.2666015625, -4.77685546875, -3.287109375, -1.79736328125, -0.3076171875, 1.18212890625, 2.671875, 4.16162109375, 5.6513671875, 7.14111328125, 8.630859375, 10.12060546875, 11.6103515625, 13.10009765625, 14.58984375, 16.07958984375, 17.5693359375, 19.05908203125, 20.548828125, 22.03857421875, 23.5283203125, 25.01806640625, 26.5078125, 27.99755859375, 29.4873046875, 30.97705078125, 32.466796875, 33.95654296875, 35.4462890625, 36.93603515625, 38.42578125, 39.91552734375, 41.4052734375, 42.89501953125, 44.384765625, 45.87451171875, 47.3642578125, 48.85400390625, 50.34375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 2.0, 4.0, 3.0, 12.0, 5.0, 7.0, 10.0, 11.0, 16.0, 15.0, 20.0, 24.0, 20.0, 22.0, 28.0, 27.0, 31.0, 33.0, 39.0, 28.0, 29.0, 49.0, 39.0, 38.0, 36.0, 40.0, 40.0, 46.0, 30.0, 23.0, 32.0, 28.0, 30.0, 28.0, 27.0, 15.0, 15.0, 14.0, 11.0, 11.0, 14.0, 10.0, 8.0, 10.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-45.78125, -44.33251953125, -42.8837890625, -41.43505859375, -39.986328125, -38.53759765625, -37.0888671875, -35.64013671875, -34.19140625, -32.74267578125, -31.2939453125, -29.84521484375, -28.396484375, -26.94775390625, -25.4990234375, -24.05029296875, -22.6015625, -21.15283203125, -19.7041015625, -18.25537109375, -16.806640625, -15.35791015625, -13.9091796875, -12.46044921875, -11.01171875, -9.56298828125, -8.1142578125, -6.66552734375, -5.216796875, -3.76806640625, -2.3193359375, -0.87060546875, 0.578125, 2.02685546875, 3.4755859375, 4.92431640625, 6.373046875, 7.82177734375, 9.2705078125, 10.71923828125, 12.16796875, 13.61669921875, 15.0654296875, 16.51416015625, 17.962890625, 19.41162109375, 20.8603515625, 22.30908203125, 23.7578125, 25.20654296875, 26.6552734375, 28.10400390625, 29.552734375, 31.00146484375, 32.4501953125, 33.89892578125, 35.34765625, 36.79638671875, 38.2451171875, 39.69384765625, 41.142578125, 42.59130859375, 44.0400390625, 45.48876953125, 46.9375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 10.0, 6.0, 16.0, 33.0, 37.0, 59.0, 75.0, 132.0, 154.0, 278.0, 367.0, 503.0, 776.0, 1111.0, 1569.0, 2445.0, 3621.0, 5223.0, 8052.0, 12203.0, 18435.0, 28881.0, 44080.0, 66910.0, 96797.0, 126424.0, 144622.0, 137305.0, 111159.0, 80309.0, 54053.0, 35493.0, 22934.0, 14844.0, 9764.0, 6354.0, 4328.0, 2985.0, 1943.0, 1346.0, 911.0, 623.0, 422.0, 308.0, 227.0, 160.0, 98.0, 64.0, 38.0, 23.0, 20.0, 13.0, 6.0, 8.0, 3.0, 2.0, 1.0, 1.0], "bins": [-51.25, -49.6845703125, -48.119140625, -46.5537109375, -44.98828125, -43.4228515625, -41.857421875, -40.2919921875, -38.7265625, -37.1611328125, -35.595703125, -34.0302734375, -32.46484375, -30.8994140625, -29.333984375, -27.7685546875, -26.203125, -24.6376953125, -23.072265625, -21.5068359375, -19.94140625, -18.3759765625, -16.810546875, -15.2451171875, -13.6796875, -12.1142578125, -10.548828125, -8.9833984375, -7.41796875, -5.8525390625, -4.287109375, -2.7216796875, -1.15625, 0.4091796875, 1.974609375, 3.5400390625, 5.10546875, 6.6708984375, 8.236328125, 9.8017578125, 11.3671875, 12.9326171875, 14.498046875, 16.0634765625, 17.62890625, 19.1943359375, 20.759765625, 22.3251953125, 23.890625, 25.4560546875, 27.021484375, 28.5869140625, 30.15234375, 31.7177734375, 33.283203125, 34.8486328125, 36.4140625, 37.9794921875, 39.544921875, 41.1103515625, 42.67578125, 44.2412109375, 45.806640625, 47.3720703125, 48.9375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 4.0, 9.0, 5.0, 3.0, 10.0, 7.0, 11.0, 8.0, 18.0, 13.0, 20.0, 17.0, 30.0, 30.0, 32.0, 27.0, 27.0, 45.0, 31.0, 40.0, 36.0, 38.0, 42.0, 41.0, 35.0, 40.0, 39.0, 37.0, 39.0, 39.0, 34.0, 34.0, 25.0, 23.0, 17.0, 19.0, 17.0, 15.0, 7.0, 10.0, 6.0, 5.0, 4.0, 6.0, 1.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.65625, -33.54736328125, -32.4384765625, -31.32958984375, -30.220703125, -29.11181640625, -28.0029296875, -26.89404296875, -25.78515625, -24.67626953125, -23.5673828125, -22.45849609375, -21.349609375, -20.24072265625, -19.1318359375, -18.02294921875, -16.9140625, -15.80517578125, -14.6962890625, -13.58740234375, -12.478515625, -11.36962890625, -10.2607421875, -9.15185546875, -8.04296875, -6.93408203125, -5.8251953125, -4.71630859375, -3.607421875, -2.49853515625, -1.3896484375, -0.28076171875, 0.828125, 1.93701171875, 3.0458984375, 4.15478515625, 5.263671875, 6.37255859375, 7.4814453125, 8.59033203125, 9.69921875, 10.80810546875, 11.9169921875, 13.02587890625, 14.134765625, 15.24365234375, 16.3525390625, 17.46142578125, 18.5703125, 19.67919921875, 20.7880859375, 21.89697265625, 23.005859375, 24.11474609375, 25.2236328125, 26.33251953125, 27.44140625, 28.55029296875, 29.6591796875, 30.76806640625, 31.876953125, 32.98583984375, 34.0947265625, 35.20361328125, 36.3125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 6.0, 6.0, 11.0, 6.0, 6.0, 18.0, 28.0, 42.0, 69.0, 95.0, 143.0, 188.0, 318.0, 458.0, 694.0, 1152.0, 2004.0, 3289.0, 5417.0, 9523.0, 16525.0, 28948.0, 49716.0, 81690.0, 122408.0, 160105.0, 169084.0, 142891.0, 101076.0, 63070.0, 37552.0, 21599.0, 12341.0, 7224.0, 4179.0, 2501.0, 1509.0, 948.0, 610.0, 354.0, 246.0, 146.0, 108.0, 82.0, 53.0, 34.0, 29.0, 19.0, 20.0, 9.0, 6.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.8125, -9.4769287109375, -9.141357421875, -8.8057861328125, -8.47021484375, -8.1346435546875, -7.799072265625, -7.4635009765625, -7.1279296875, -6.7923583984375, -6.456787109375, -6.1212158203125, -5.78564453125, -5.4500732421875, -5.114501953125, -4.7789306640625, -4.443359375, -4.1077880859375, -3.772216796875, -3.4366455078125, -3.10107421875, -2.7655029296875, -2.429931640625, -2.0943603515625, -1.7587890625, -1.4232177734375, -1.087646484375, -0.7520751953125, -0.41650390625, -0.0809326171875, 0.254638671875, 0.5902099609375, 0.92578125, 1.2613525390625, 1.596923828125, 1.9324951171875, 2.26806640625, 2.6036376953125, 2.939208984375, 3.2747802734375, 3.6103515625, 3.9459228515625, 4.281494140625, 4.6170654296875, 4.95263671875, 5.2882080078125, 5.623779296875, 5.9593505859375, 6.294921875, 6.6304931640625, 6.966064453125, 7.3016357421875, 7.63720703125, 7.9727783203125, 8.308349609375, 8.6439208984375, 8.9794921875, 9.3150634765625, 9.650634765625, 9.9862060546875, 10.32177734375, 10.6573486328125, 10.992919921875, 11.3284912109375, 11.6640625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 0.0, 4.0, 5.0, 5.0, 11.0, 7.0, 13.0, 17.0, 23.0, 19.0, 28.0, 25.0, 30.0, 41.0, 33.0, 40.0, 41.0, 54.0, 59.0, 60.0, 53.0, 54.0, 33.0, 48.0, 39.0, 33.0, 30.0, 27.0, 28.0, 22.0, 27.0, 20.0, 12.0, 12.0, 8.0, 11.0, 7.0, 9.0, 2.0, 5.0, 3.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0009236335754394531, -0.0008952617645263672, -0.0008668899536132812, -0.0008385181427001953, -0.0008101463317871094, -0.0007817745208740234, -0.0007534027099609375, -0.0007250308990478516, -0.0006966590881347656, -0.0006682872772216797, -0.0006399154663085938, -0.0006115436553955078, -0.0005831718444824219, -0.0005548000335693359, -0.00052642822265625, -0.0004980564117431641, -0.0004696846008300781, -0.0004413127899169922, -0.00041294097900390625, -0.0003845691680908203, -0.0003561973571777344, -0.00032782554626464844, -0.0002994537353515625, -0.00027108192443847656, -0.00024271011352539062, -0.0002143383026123047, -0.00018596649169921875, -0.0001575946807861328, -0.00012922286987304688, -0.00010085105895996094, -7.2479248046875e-05, -4.410743713378906e-05, -1.5735626220703125e-05, 1.2636184692382812e-05, 4.100799560546875e-05, 6.937980651855469e-05, 9.775161743164062e-05, 0.00012612342834472656, 0.0001544952392578125, 0.00018286705017089844, 0.00021123886108398438, 0.0002396106719970703, 0.00026798248291015625, 0.0002963542938232422, 0.0003247261047363281, 0.00035309791564941406, 0.0003814697265625, 0.00040984153747558594, 0.0004382133483886719, 0.0004665851593017578, 0.0004949569702148438, 0.0005233287811279297, 0.0005517005920410156, 0.0005800724029541016, 0.0006084442138671875, 0.0006368160247802734, 0.0006651878356933594, 0.0006935596466064453, 0.0007219314575195312, 0.0007503032684326172, 0.0007786750793457031, 0.0008070468902587891, 0.000835418701171875, 0.0008637905120849609, 0.0008921623229980469]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 8.0, 8.0, 18.0, 18.0, 29.0, 56.0, 89.0, 120.0, 188.0, 333.0, 540.0, 823.0, 1284.0, 2042.0, 3298.0, 5301.0, 8558.0, 13891.0, 22584.0, 35972.0, 56876.0, 83699.0, 114765.0, 139282.0, 144941.0, 127811.0, 98614.0, 68226.0, 44632.0, 28312.0, 17594.0, 10828.0, 6604.0, 4162.0, 2572.0, 1629.0, 1029.0, 656.0, 402.0, 268.0, 183.0, 102.0, 70.0, 49.0, 37.0, 19.0, 11.0, 6.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0], "bins": [-9.8046875, -9.518310546875, -9.23193359375, -8.945556640625, -8.6591796875, -8.372802734375, -8.08642578125, -7.800048828125, -7.513671875, -7.227294921875, -6.94091796875, -6.654541015625, -6.3681640625, -6.081787109375, -5.79541015625, -5.509033203125, -5.22265625, -4.936279296875, -4.64990234375, -4.363525390625, -4.0771484375, -3.790771484375, -3.50439453125, -3.218017578125, -2.931640625, -2.645263671875, -2.35888671875, -2.072509765625, -1.7861328125, -1.499755859375, -1.21337890625, -0.927001953125, -0.640625, -0.354248046875, -0.06787109375, 0.218505859375, 0.5048828125, 0.791259765625, 1.07763671875, 1.364013671875, 1.650390625, 1.936767578125, 2.22314453125, 2.509521484375, 2.7958984375, 3.082275390625, 3.36865234375, 3.655029296875, 3.94140625, 4.227783203125, 4.51416015625, 4.800537109375, 5.0869140625, 5.373291015625, 5.65966796875, 5.946044921875, 6.232421875, 6.518798828125, 6.80517578125, 7.091552734375, 7.3779296875, 7.664306640625, 7.95068359375, 8.237060546875, 8.5234375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 9.0, 4.0, 10.0, 9.0, 12.0, 10.0, 18.0, 17.0, 18.0, 22.0, 31.0, 44.0, 37.0, 41.0, 47.0, 51.0, 61.0, 61.0, 62.0, 47.0, 48.0, 38.0, 42.0, 42.0, 32.0, 29.0, 28.0, 21.0, 17.0, 24.0, 12.0, 10.0, 8.0, 6.0, 10.0, 6.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0], "bins": [-5.01953125, -4.89532470703125, -4.7711181640625, -4.64691162109375, -4.522705078125, -4.39849853515625, -4.2742919921875, -4.15008544921875, -4.02587890625, -3.90167236328125, -3.7774658203125, -3.65325927734375, -3.529052734375, -3.40484619140625, -3.2806396484375, -3.15643310546875, -3.0322265625, -2.90802001953125, -2.7838134765625, -2.65960693359375, -2.535400390625, -2.41119384765625, -2.2869873046875, -2.16278076171875, -2.03857421875, -1.91436767578125, -1.7901611328125, -1.66595458984375, -1.541748046875, -1.41754150390625, -1.2933349609375, -1.16912841796875, -1.044921875, -0.92071533203125, -0.7965087890625, -0.67230224609375, -0.548095703125, -0.42388916015625, -0.2996826171875, -0.17547607421875, -0.05126953125, 0.07293701171875, 0.1971435546875, 0.32135009765625, 0.445556640625, 0.56976318359375, 0.6939697265625, 0.81817626953125, 0.9423828125, 1.06658935546875, 1.1907958984375, 1.31500244140625, 1.439208984375, 1.56341552734375, 1.6876220703125, 1.81182861328125, 1.93603515625, 2.06024169921875, 2.1844482421875, 2.30865478515625, 2.432861328125, 2.55706787109375, 2.6812744140625, 2.80548095703125, 2.9296875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 9.0, 2.0, 5.0, 6.0, 7.0, 12.0, 12.0, 13.0, 19.0, 22.0, 25.0, 20.0, 28.0, 25.0, 40.0, 28.0, 36.0, 32.0, 34.0, 56.0, 35.0, 42.0, 46.0, 41.0, 51.0, 46.0, 37.0, 33.0, 32.0, 31.0, 24.0, 16.0, 26.0, 17.0, 10.0, 13.0, 17.0, 13.0, 11.0, 4.0, 5.0, 6.0, 5.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-38.26207733154297, -36.91667938232422, -35.5712776184082, -34.22587966918945, -32.88047790527344, -31.535078048706055, -30.189678192138672, -28.844280242919922, -27.498878479003906, -26.153478622436523, -24.80807876586914, -23.462678909301758, -22.117279052734375, -20.771879196166992, -19.42647933959961, -18.08108139038086, -16.735681533813477, -15.390281677246094, -14.044881820678711, -12.699481964111328, -11.354082107543945, -10.008682250976562, -8.663283348083496, -7.317883491516113, -5.9724836349487305, -4.627083778381348, -3.281684160232544, -1.9362845420837402, -0.5908846855163574, 0.7545151710510254, 2.09991455078125, 3.445314407348633, 4.790714263916016, 6.136114120483398, 7.481513977050781, 8.826913833618164, 10.172313690185547, 11.51771354675293, 12.863112449645996, 14.208512306213379, 15.553912162780762, 16.899311065673828, 18.24471092224121, 19.590110778808594, 20.935510635375977, 22.28091049194336, 23.626310348510742, 24.971710205078125, 26.317110061645508, 27.66250991821289, 29.007909774780273, 30.353309631347656, 31.69870948791504, 33.04410934448242, 34.38950729370117, 35.73490905761719, 37.08030700683594, 38.42570495605469, 39.7711067199707, 41.11650466918945, 42.46190643310547, 43.80730438232422, 45.152706146240234, 46.498104095458984, 47.843505859375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 4.0, 6.0, 8.0, 6.0, 9.0, 2.0, 11.0, 10.0, 16.0, 14.0, 23.0, 21.0, 23.0, 25.0, 28.0, 32.0, 42.0, 35.0, 29.0, 26.0, 34.0, 35.0, 36.0, 28.0, 41.0, 41.0, 39.0, 53.0, 35.0, 31.0, 35.0, 23.0, 22.0, 22.0, 24.0, 22.0, 17.0, 15.0, 16.0, 8.0, 15.0, 10.0, 3.0, 9.0, 5.0, 4.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0], "bins": [-58.07903289794922, -56.39326095581055, -54.70748519897461, -53.02171325683594, -51.3359375, -49.65016555786133, -47.96438980102539, -46.27861785888672, -44.59284210205078, -42.90707015991211, -41.22129440307617, -39.5355224609375, -37.84974670410156, -36.16397476196289, -34.47819900512695, -32.79242706298828, -31.106653213500977, -29.420879364013672, -27.735105514526367, -26.049331665039062, -24.363557815551758, -22.677783966064453, -20.99201202392578, -19.306236267089844, -17.620464324951172, -15.934690475463867, -14.248916625976562, -12.563142776489258, -10.877368927001953, -9.191596031188965, -7.50582218170166, -5.8200483322143555, -4.134273529052734, -2.4484996795654297, -0.7627260684967041, 0.9230475425720215, 2.608821392059326, 4.294594764709473, 5.980368614196777, 7.666142463684082, 9.351916313171387, 11.037690162658691, 12.723464012145996, 14.409236907958984, 16.09501075744629, 17.780784606933594, 19.4665584564209, 21.152332305908203, 22.838106155395508, 24.523880004882812, 26.209653854370117, 27.895427703857422, 29.581201553344727, 31.26697540283203, 32.9527473449707, 34.63852310180664, 36.32429504394531, 38.010066986083984, 39.69584274291992, 41.381614685058594, 43.06739044189453, 44.7531623840332, 46.43893814086914, 48.12471008300781, 49.81048583984375]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 6.0, 10.0, 21.0, 26.0, 50.0, 76.0, 87.0, 160.0, 235.0, 348.0, 531.0, 748.0, 1171.0, 1656.0, 2610.0, 3851.0, 6015.0, 8970.0, 13805.0, 22110.0, 35048.0, 56912.0, 93475.0, 153627.0, 252116.0, 399726.0, 572415.0, 677579.0, 630316.0, 468925.0, 305259.0, 187008.0, 114029.0, 69338.0, 42660.0, 26581.0, 16507.0, 10389.0, 6814.0, 4475.0, 2876.0, 1939.0, 1282.0, 810.0, 563.0, 374.0, 246.0, 160.0, 113.0, 86.0, 50.0, 38.0, 26.0, 17.0, 11.0, 5.0, 7.0, 1.0, 1.0, 3.0, 2.0], "bins": [-38.96875, -37.69921875, -36.4296875, -35.16015625, -33.890625, -32.62109375, -31.3515625, -30.08203125, -28.8125, -27.54296875, -26.2734375, -25.00390625, -23.734375, -22.46484375, -21.1953125, -19.92578125, -18.65625, -17.38671875, -16.1171875, -14.84765625, -13.578125, -12.30859375, -11.0390625, -9.76953125, -8.5, -7.23046875, -5.9609375, -4.69140625, -3.421875, -2.15234375, -0.8828125, 0.38671875, 1.65625, 2.92578125, 4.1953125, 5.46484375, 6.734375, 8.00390625, 9.2734375, 10.54296875, 11.8125, 13.08203125, 14.3515625, 15.62109375, 16.890625, 18.16015625, 19.4296875, 20.69921875, 21.96875, 23.23828125, 24.5078125, 25.77734375, 27.046875, 28.31640625, 29.5859375, 30.85546875, 32.125, 33.39453125, 34.6640625, 35.93359375, 37.203125, 38.47265625, 39.7421875, 41.01171875, 42.28125]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 5.0, 5.0, 6.0, 5.0, 6.0, 10.0, 4.0, 12.0, 9.0, 19.0, 18.0, 23.0, 21.0, 19.0, 30.0, 28.0, 33.0, 39.0, 33.0, 26.0, 30.0, 28.0, 35.0, 34.0, 36.0, 35.0, 44.0, 31.0, 48.0, 47.0, 30.0, 33.0, 21.0, 24.0, 23.0, 19.0, 22.0, 23.0, 11.0, 18.0, 6.0, 14.0, 9.0, 5.0, 11.0, 4.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-40.78125, -39.58740234375, -38.3935546875, -37.19970703125, -36.005859375, -34.81201171875, -33.6181640625, -32.42431640625, -31.23046875, -30.03662109375, -28.8427734375, -27.64892578125, -26.455078125, -25.26123046875, -24.0673828125, -22.87353515625, -21.6796875, -20.48583984375, -19.2919921875, -18.09814453125, -16.904296875, -15.71044921875, -14.5166015625, -13.32275390625, -12.12890625, -10.93505859375, -9.7412109375, -8.54736328125, -7.353515625, -6.15966796875, -4.9658203125, -3.77197265625, -2.578125, -1.38427734375, -0.1904296875, 1.00341796875, 2.197265625, 3.39111328125, 4.5849609375, 5.77880859375, 6.97265625, 8.16650390625, 9.3603515625, 10.55419921875, 11.748046875, 12.94189453125, 14.1357421875, 15.32958984375, 16.5234375, 17.71728515625, 18.9111328125, 20.10498046875, 21.298828125, 22.49267578125, 23.6865234375, 24.88037109375, 26.07421875, 27.26806640625, 28.4619140625, 29.65576171875, 30.849609375, 32.04345703125, 33.2373046875, 34.43115234375, 35.625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 2.0, 8.0, 11.0, 18.0, 37.0, 54.0, 83.0, 105.0, 189.0, 282.0, 480.0, 677.0, 1193.0, 1886.0, 3018.0, 4920.0, 7846.0, 13116.0, 22166.0, 36569.0, 60024.0, 98592.0, 156064.0, 239457.0, 344780.0, 462088.0, 547027.0, 561046.0, 496861.0, 386250.0, 272521.0, 181565.0, 114991.0, 71062.0, 43200.0, 25995.0, 15529.0, 9501.0, 5698.0, 3589.0, 2073.0, 1334.0, 865.0, 559.0, 353.0, 212.0, 138.0, 96.0, 58.0, 42.0, 17.0, 25.0, 5.0, 7.0, 4.0, 2.0, 1.0], "bins": [-37.1875, -36.09912109375, -35.0107421875, -33.92236328125, -32.833984375, -31.74560546875, -30.6572265625, -29.56884765625, -28.48046875, -27.39208984375, -26.3037109375, -25.21533203125, -24.126953125, -23.03857421875, -21.9501953125, -20.86181640625, -19.7734375, -18.68505859375, -17.5966796875, -16.50830078125, -15.419921875, -14.33154296875, -13.2431640625, -12.15478515625, -11.06640625, -9.97802734375, -8.8896484375, -7.80126953125, -6.712890625, -5.62451171875, -4.5361328125, -3.44775390625, -2.359375, -1.27099609375, -0.1826171875, 0.90576171875, 1.994140625, 3.08251953125, 4.1708984375, 5.25927734375, 6.34765625, 7.43603515625, 8.5244140625, 9.61279296875, 10.701171875, 11.78955078125, 12.8779296875, 13.96630859375, 15.0546875, 16.14306640625, 17.2314453125, 18.31982421875, 19.408203125, 20.49658203125, 21.5849609375, 22.67333984375, 23.76171875, 24.85009765625, 25.9384765625, 27.02685546875, 28.115234375, 29.20361328125, 30.2919921875, 31.38037109375, 32.46875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 0.0, 3.0, 1.0, 3.0, 3.0, 10.0, 6.0, 5.0, 14.0, 9.0, 18.0, 21.0, 34.0, 29.0, 36.0, 44.0, 34.0, 65.0, 88.0, 104.0, 101.0, 107.0, 159.0, 129.0, 157.0, 200.0, 217.0, 213.0, 214.0, 224.0, 221.0, 194.0, 190.0, 181.0, 163.0, 140.0, 132.0, 107.0, 96.0, 82.0, 64.0, 48.0, 40.0, 45.0, 31.0, 18.0, 23.0, 19.0, 12.0, 13.0, 8.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0], "bins": [-20.9375, -20.3699951171875, -19.802490234375, -19.2349853515625, -18.66748046875, -18.0999755859375, -17.532470703125, -16.9649658203125, -16.3974609375, -15.8299560546875, -15.262451171875, -14.6949462890625, -14.12744140625, -13.5599365234375, -12.992431640625, -12.4249267578125, -11.857421875, -11.2899169921875, -10.722412109375, -10.1549072265625, -9.58740234375, -9.0198974609375, -8.452392578125, -7.8848876953125, -7.3173828125, -6.7498779296875, -6.182373046875, -5.6148681640625, -5.04736328125, -4.4798583984375, -3.912353515625, -3.3448486328125, -2.77734375, -2.2098388671875, -1.642333984375, -1.0748291015625, -0.50732421875, 0.0601806640625, 0.627685546875, 1.1951904296875, 1.7626953125, 2.3302001953125, 2.897705078125, 3.4652099609375, 4.03271484375, 4.6002197265625, 5.167724609375, 5.7352294921875, 6.302734375, 6.8702392578125, 7.437744140625, 8.0052490234375, 8.57275390625, 9.1402587890625, 9.707763671875, 10.2752685546875, 10.8427734375, 11.4102783203125, 11.977783203125, 12.5452880859375, 13.11279296875, 13.6802978515625, 14.247802734375, 14.8153076171875, 15.3828125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 5.0, 6.0, 4.0, 12.0, 15.0, 9.0, 9.0, 11.0, 19.0, 21.0, 28.0, 17.0, 23.0, 30.0, 22.0, 36.0, 39.0, 45.0, 52.0, 53.0, 45.0, 39.0, 53.0, 45.0, 46.0, 46.0, 40.0, 39.0, 24.0, 21.0, 20.0, 23.0, 16.0, 24.0, 12.0, 12.0, 8.0, 7.0, 5.0, 6.0, 2.0, 1.0, 6.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.264259338378906, -38.05012512207031, -36.83599090576172, -35.621856689453125, -34.40772247314453, -33.19358825683594, -31.979454040527344, -30.76531982421875, -29.551185607910156, -28.337051391601562, -27.12291717529297, -25.908782958984375, -24.69464874267578, -23.480514526367188, -22.266380310058594, -21.05224609375, -19.838111877441406, -18.623977661132812, -17.40984344482422, -16.195709228515625, -14.981575012207031, -13.767440795898438, -12.553306579589844, -11.33917236328125, -10.125038146972656, -8.910903930664062, -7.696769714355469, -6.482635498046875, -5.268501281738281, -4.0543670654296875, -2.8402328491210938, -1.6260986328125, -0.41196441650390625, 0.8021697998046875, 2.0163040161132812, 3.230438232421875, 4.444572448730469, 5.6587066650390625, 6.872840881347656, 8.08697509765625, 9.301109313964844, 10.515243530273438, 11.729377746582031, 12.943511962890625, 14.157646179199219, 15.371780395507812, 16.585914611816406, 17.800048828125, 19.014183044433594, 20.228317260742188, 21.44245147705078, 22.656585693359375, 23.87071990966797, 25.084854125976562, 26.298988342285156, 27.51312255859375, 28.727256774902344, 29.941390991210938, 31.15552520751953, 32.369659423828125, 33.58379364013672, 34.79792785644531, 36.012062072753906, 37.2261962890625, 38.440330505371094]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 4.0, 1.0, 2.0, 5.0, 3.0, 4.0, 5.0, 6.0, 15.0, 8.0, 8.0, 17.0, 7.0, 16.0, 15.0, 31.0, 26.0, 22.0, 36.0, 31.0, 34.0, 34.0, 31.0, 30.0, 28.0, 27.0, 24.0, 37.0, 41.0, 42.0, 42.0, 29.0, 30.0, 33.0, 37.0, 29.0, 27.0, 34.0, 17.0, 21.0, 17.0, 15.0, 17.0, 14.0, 12.0, 8.0, 9.0, 7.0, 3.0, 10.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-42.67929458618164, -41.26819610595703, -39.85709762573242, -38.44599914550781, -37.0349006652832, -35.623802185058594, -34.212703704833984, -32.801605224609375, -31.390506744384766, -29.979408264160156, -28.568309783935547, -27.157211303710938, -25.746112823486328, -24.33501434326172, -22.92391586303711, -21.5128173828125, -20.10171890258789, -18.69062042236328, -17.279521942138672, -15.868423461914062, -14.457324981689453, -13.046226501464844, -11.635128021240234, -10.224029541015625, -8.812931060791016, -7.401832580566406, -5.990734100341797, -4.5796356201171875, -3.168537139892578, -1.7574386596679688, -0.3463401794433594, 1.06475830078125, 2.475860595703125, 3.8869590759277344, 5.298057556152344, 6.709156036376953, 8.120254516601562, 9.531352996826172, 10.942451477050781, 12.35354995727539, 13.7646484375, 15.17574691772461, 16.58684539794922, 17.997943878173828, 19.409042358398438, 20.820140838623047, 22.231239318847656, 23.642337799072266, 25.053436279296875, 26.464534759521484, 27.875633239746094, 29.286731719970703, 30.697830200195312, 32.10892868041992, 33.52002716064453, 34.93112564086914, 36.34222412109375, 37.75332260131836, 39.16442108154297, 40.57551956176758, 41.98661804199219, 43.3977165222168, 44.808815002441406, 46.219913482666016, 47.631011962890625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 9.0, 7.0, 15.0, 17.0, 19.0, 41.0, 54.0, 56.0, 114.0, 145.0, 208.0, 266.0, 411.0, 564.0, 925.0, 1232.0, 1993.0, 3232.0, 4976.0, 8447.0, 14524.0, 26600.0, 48818.0, 98242.0, 221427.0, 315587.0, 146334.0, 69441.0, 35912.0, 19595.0, 11116.0, 6604.0, 4053.0, 2526.0, 1621.0, 1033.0, 760.0, 483.0, 329.0, 229.0, 186.0, 112.0, 96.0, 47.0, 42.0, 33.0, 26.0, 20.0, 12.0, 5.0, 3.0, 6.0, 2.0, 5.0, 1.0, 1.0, 1.0], "bins": [-10.7890625, -10.45458984375, -10.1201171875, -9.78564453125, -9.451171875, -9.11669921875, -8.7822265625, -8.44775390625, -8.11328125, -7.77880859375, -7.4443359375, -7.10986328125, -6.775390625, -6.44091796875, -6.1064453125, -5.77197265625, -5.4375, -5.10302734375, -4.7685546875, -4.43408203125, -4.099609375, -3.76513671875, -3.4306640625, -3.09619140625, -2.76171875, -2.42724609375, -2.0927734375, -1.75830078125, -1.423828125, -1.08935546875, -0.7548828125, -0.42041015625, -0.0859375, 0.24853515625, 0.5830078125, 0.91748046875, 1.251953125, 1.58642578125, 1.9208984375, 2.25537109375, 2.58984375, 2.92431640625, 3.2587890625, 3.59326171875, 3.927734375, 4.26220703125, 4.5966796875, 4.93115234375, 5.265625, 5.60009765625, 5.9345703125, 6.26904296875, 6.603515625, 6.93798828125, 7.2724609375, 7.60693359375, 7.94140625, 8.27587890625, 8.6103515625, 8.94482421875, 9.279296875, 9.61376953125, 9.9482421875, 10.28271484375, 10.6171875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 2.0, 7.0, 6.0, 14.0, 9.0, 8.0, 16.0, 13.0, 10.0, 14.0, 31.0, 30.0, 20.0, 41.0, 27.0, 34.0, 34.0, 38.0, 24.0, 26.0, 29.0, 26.0, 33.0, 39.0, 46.0, 42.0, 32.0, 29.0, 30.0, 39.0, 28.0, 27.0, 37.0, 13.0, 20.0, 17.0, 15.0, 18.0, 15.0, 10.0, 10.0, 8.0, 4.0, 4.0, 10.0, 2.0, 2.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-42.4375, -41.0380859375, -39.638671875, -38.2392578125, -36.83984375, -35.4404296875, -34.041015625, -32.6416015625, -31.2421875, -29.8427734375, -28.443359375, -27.0439453125, -25.64453125, -24.2451171875, -22.845703125, -21.4462890625, -20.046875, -18.6474609375, -17.248046875, -15.8486328125, -14.44921875, -13.0498046875, -11.650390625, -10.2509765625, -8.8515625, -7.4521484375, -6.052734375, -4.6533203125, -3.25390625, -1.8544921875, -0.455078125, 0.9443359375, 2.34375, 3.7431640625, 5.142578125, 6.5419921875, 7.94140625, 9.3408203125, 10.740234375, 12.1396484375, 13.5390625, 14.9384765625, 16.337890625, 17.7373046875, 19.13671875, 20.5361328125, 21.935546875, 23.3349609375, 24.734375, 26.1337890625, 27.533203125, 28.9326171875, 30.33203125, 31.7314453125, 33.130859375, 34.5302734375, 35.9296875, 37.3291015625, 38.728515625, 40.1279296875, 41.52734375, 42.9267578125, 44.326171875, 45.7255859375, 47.125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 8.0, 10.0, 19.0, 15.0, 27.0, 35.0, 44.0, 60.0, 99.0, 153.0, 174.0, 310.0, 487.0, 760.0, 1260.0, 2081.0, 3513.0, 6589.0, 12502.0, 25990.0, 57381.0, 141813.0, 362290.0, 257042.0, 94672.0, 40332.0, 18983.0, 9394.0, 5242.0, 2807.0, 1687.0, 893.0, 644.0, 410.0, 261.0, 194.0, 112.0, 81.0, 50.0, 37.0, 29.0, 17.0, 16.0, 9.0, 3.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-9.890625, -9.6063232421875, -9.322021484375, -9.0377197265625, -8.75341796875, -8.4691162109375, -8.184814453125, -7.9005126953125, -7.6162109375, -7.3319091796875, -7.047607421875, -6.7633056640625, -6.47900390625, -6.1947021484375, -5.910400390625, -5.6260986328125, -5.341796875, -5.0574951171875, -4.773193359375, -4.4888916015625, -4.20458984375, -3.9202880859375, -3.635986328125, -3.3516845703125, -3.0673828125, -2.7830810546875, -2.498779296875, -2.2144775390625, -1.93017578125, -1.6458740234375, -1.361572265625, -1.0772705078125, -0.79296875, -0.5086669921875, -0.224365234375, 0.0599365234375, 0.34423828125, 0.6285400390625, 0.912841796875, 1.1971435546875, 1.4814453125, 1.7657470703125, 2.050048828125, 2.3343505859375, 2.61865234375, 2.9029541015625, 3.187255859375, 3.4715576171875, 3.755859375, 4.0401611328125, 4.324462890625, 4.6087646484375, 4.89306640625, 5.1773681640625, 5.461669921875, 5.7459716796875, 6.0302734375, 6.3145751953125, 6.598876953125, 6.8831787109375, 7.16748046875, 7.4517822265625, 7.736083984375, 8.0203857421875, 8.3046875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 10.0, 7.0, 18.0, 11.0, 6.0, 15.0, 17.0, 18.0, 14.0, 19.0, 20.0, 32.0, 29.0, 34.0, 27.0, 32.0, 45.0, 31.0, 30.0, 42.0, 33.0, 32.0, 40.0, 46.0, 37.0, 42.0, 48.0, 36.0, 28.0, 25.0, 39.0, 17.0, 20.0, 17.0, 19.0, 14.0, 13.0, 7.0, 6.0, 6.0, 7.0, 2.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.0625, -31.94677734375, -30.8310546875, -29.71533203125, -28.599609375, -27.48388671875, -26.3681640625, -25.25244140625, -24.13671875, -23.02099609375, -21.9052734375, -20.78955078125, -19.673828125, -18.55810546875, -17.4423828125, -16.32666015625, -15.2109375, -14.09521484375, -12.9794921875, -11.86376953125, -10.748046875, -9.63232421875, -8.5166015625, -7.40087890625, -6.28515625, -5.16943359375, -4.0537109375, -2.93798828125, -1.822265625, -0.70654296875, 0.4091796875, 1.52490234375, 2.640625, 3.75634765625, 4.8720703125, 5.98779296875, 7.103515625, 8.21923828125, 9.3349609375, 10.45068359375, 11.56640625, 12.68212890625, 13.7978515625, 14.91357421875, 16.029296875, 17.14501953125, 18.2607421875, 19.37646484375, 20.4921875, 21.60791015625, 22.7236328125, 23.83935546875, 24.955078125, 26.07080078125, 27.1865234375, 28.30224609375, 29.41796875, 30.53369140625, 31.6494140625, 32.76513671875, 33.880859375, 34.99658203125, 36.1123046875, 37.22802734375, 38.34375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 3.0, 16.0, 23.0, 11.0, 33.0, 41.0, 57.0, 95.0, 113.0, 180.0, 240.0, 371.0, 557.0, 844.0, 1379.0, 2133.0, 3664.0, 6510.0, 12246.0, 26388.0, 76646.0, 581653.0, 246026.0, 47639.0, 19210.0, 9328.0, 5055.0, 3040.0, 1782.0, 1088.0, 690.0, 464.0, 312.0, 203.0, 152.0, 117.0, 78.0, 50.0, 31.0, 32.0, 17.0, 16.0, 5.0, 8.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-6.46875, -6.2880859375, -6.107421875, -5.9267578125, -5.74609375, -5.5654296875, -5.384765625, -5.2041015625, -5.0234375, -4.8427734375, -4.662109375, -4.4814453125, -4.30078125, -4.1201171875, -3.939453125, -3.7587890625, -3.578125, -3.3974609375, -3.216796875, -3.0361328125, -2.85546875, -2.6748046875, -2.494140625, -2.3134765625, -2.1328125, -1.9521484375, -1.771484375, -1.5908203125, -1.41015625, -1.2294921875, -1.048828125, -0.8681640625, -0.6875, -0.5068359375, -0.326171875, -0.1455078125, 0.03515625, 0.2158203125, 0.396484375, 0.5771484375, 0.7578125, 0.9384765625, 1.119140625, 1.2998046875, 1.48046875, 1.6611328125, 1.841796875, 2.0224609375, 2.203125, 2.3837890625, 2.564453125, 2.7451171875, 2.92578125, 3.1064453125, 3.287109375, 3.4677734375, 3.6484375, 3.8291015625, 4.009765625, 4.1904296875, 4.37109375, 4.5517578125, 4.732421875, 4.9130859375, 5.09375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 0.0, 5.0, 5.0, 7.0, 4.0, 9.0, 13.0, 13.0, 16.0, 17.0, 24.0, 30.0, 44.0, 57.0, 92.0, 134.0, 108.0, 101.0, 93.0, 54.0, 42.0, 22.0, 25.0, 16.0, 21.0, 11.0, 12.0, 11.0, 5.0, 6.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005655288696289062, -0.0005468353629112244, -0.0005281418561935425, -0.0005094483494758606, -0.0004907548427581787, -0.0004720613360404968, -0.00045336782932281494, -0.00043467432260513306, -0.00041598081588745117, -0.0003972873091697693, -0.0003785938024520874, -0.0003599002957344055, -0.00034120678901672363, -0.00032251328229904175, -0.00030381977558135986, -0.000285126268863678, -0.0002664327621459961, -0.0002477392554283142, -0.00022904574871063232, -0.00021035224199295044, -0.00019165873527526855, -0.00017296522855758667, -0.00015427172183990479, -0.0001355782151222229, -0.00011688470840454102, -9.819120168685913e-05, -7.949769496917725e-05, -6.080418825149536e-05, -4.2110681533813477e-05, -2.3417174816131592e-05, -4.723668098449707e-06, 1.3969838619232178e-05, 3.266334533691406e-05, 5.135685205459595e-05, 7.005035877227783e-05, 8.874386548995972e-05, 0.0001074373722076416, 0.00012613087892532349, 0.00014482438564300537, 0.00016351789236068726, 0.00018221139907836914, 0.00020090490579605103, 0.0002195984125137329, 0.0002382919192314148, 0.0002569854259490967, 0.00027567893266677856, 0.00029437243938446045, 0.00031306594610214233, 0.0003317594528198242, 0.0003504529595375061, 0.000369146466255188, 0.0003878399729728699, 0.00040653347969055176, 0.00042522698640823364, 0.00044392049312591553, 0.0004626139998435974, 0.0004813075065612793, 0.0005000010132789612, 0.0005186945199966431, 0.000537388026714325, 0.0005560815334320068, 0.0005747750401496887, 0.0005934685468673706, 0.0006121620535850525, 0.0006308555603027344]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 9.0, 7.0, 10.0, 19.0, 19.0, 34.0, 43.0, 77.0, 83.0, 117.0, 132.0, 205.0, 296.0, 377.0, 534.0, 787.0, 1089.0, 1584.0, 2287.0, 3302.0, 5077.0, 7918.0, 12704.0, 20331.0, 33724.0, 58300.0, 106071.0, 215222.0, 268578.0, 132066.0, 70580.0, 40521.0, 24142.0, 14731.0, 9121.0, 5829.0, 3967.0, 2573.0, 1770.0, 1288.0, 847.0, 602.0, 459.0, 301.0, 238.0, 187.0, 92.0, 85.0, 68.0, 46.0, 42.0, 20.0, 14.0, 14.0, 9.0, 4.0, 7.0, 5.0, 1.0, 2.0], "bins": [-3.767578125, -3.65045166015625, -3.5333251953125, -3.41619873046875, -3.299072265625, -3.18194580078125, -3.0648193359375, -2.94769287109375, -2.83056640625, -2.71343994140625, -2.5963134765625, -2.47918701171875, -2.362060546875, -2.24493408203125, -2.1278076171875, -2.01068115234375, -1.8935546875, -1.77642822265625, -1.6593017578125, -1.54217529296875, -1.425048828125, -1.30792236328125, -1.1907958984375, -1.07366943359375, -0.95654296875, -0.83941650390625, -0.7222900390625, -0.60516357421875, -0.488037109375, -0.37091064453125, -0.2537841796875, -0.13665771484375, -0.01953125, 0.09759521484375, 0.2147216796875, 0.33184814453125, 0.448974609375, 0.56610107421875, 0.6832275390625, 0.80035400390625, 0.91748046875, 1.03460693359375, 1.1517333984375, 1.26885986328125, 1.385986328125, 1.50311279296875, 1.6202392578125, 1.73736572265625, 1.8544921875, 1.97161865234375, 2.0887451171875, 2.20587158203125, 2.322998046875, 2.44012451171875, 2.5572509765625, 2.67437744140625, 2.79150390625, 2.90863037109375, 3.0257568359375, 3.14288330078125, 3.260009765625, 3.37713623046875, 3.4942626953125, 3.61138916015625, 3.728515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 1.0, 6.0, 4.0, 5.0, 14.0, 13.0, 17.0, 16.0, 24.0, 30.0, 35.0, 49.0, 45.0, 49.0, 48.0, 46.0, 36.0, 56.0, 50.0, 42.0, 48.0, 39.0, 39.0, 43.0, 49.0, 46.0, 38.0, 20.0, 25.0, 16.0, 13.0, 8.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.177734375, -2.110198974609375, -2.04266357421875, -1.975128173828125, -1.9075927734375, -1.840057373046875, -1.77252197265625, -1.704986572265625, -1.637451171875, -1.569915771484375, -1.50238037109375, -1.434844970703125, -1.3673095703125, -1.299774169921875, -1.23223876953125, -1.164703369140625, -1.09716796875, -1.029632568359375, -0.96209716796875, -0.894561767578125, -0.8270263671875, -0.759490966796875, -0.69195556640625, -0.624420166015625, -0.556884765625, -0.489349365234375, -0.42181396484375, -0.354278564453125, -0.2867431640625, -0.219207763671875, -0.15167236328125, -0.084136962890625, -0.0166015625, 0.050933837890625, 0.11846923828125, 0.186004638671875, 0.2535400390625, 0.321075439453125, 0.38861083984375, 0.456146240234375, 0.523681640625, 0.591217041015625, 0.65875244140625, 0.726287841796875, 0.7938232421875, 0.861358642578125, 0.92889404296875, 0.996429443359375, 1.06396484375, 1.131500244140625, 1.19903564453125, 1.266571044921875, 1.3341064453125, 1.401641845703125, 1.46917724609375, 1.536712646484375, 1.604248046875, 1.671783447265625, 1.73931884765625, 1.806854248046875, 1.8743896484375, 1.941925048828125, 2.00946044921875, 2.076995849609375, 2.14453125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 4.0, 2.0, 7.0, 5.0, 8.0, 16.0, 12.0, 9.0, 10.0, 21.0, 22.0, 23.0, 27.0, 24.0, 22.0, 37.0, 36.0, 38.0, 46.0, 49.0, 46.0, 51.0, 49.0, 51.0, 46.0, 47.0, 34.0, 45.0, 33.0, 19.0, 25.0, 26.0, 18.0, 15.0, 20.0, 16.0, 7.0, 8.0, 7.0, 5.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.72322463989258, -38.50471878051758, -37.28621292114258, -36.06770706176758, -34.84919738769531, -33.63069152832031, -32.41218566894531, -31.193679809570312, -29.975173950195312, -28.756668090820312, -27.538162231445312, -26.31965446472168, -25.10114860534668, -23.88264274597168, -22.664134979248047, -21.445629119873047, -20.227123260498047, -19.008617401123047, -17.790111541748047, -16.571603775024414, -15.353097915649414, -14.134592056274414, -12.916085243225098, -11.697578430175781, -10.479072570800781, -9.260566711425781, -8.042059898376465, -6.823553562164307, -5.605047225952148, -4.38654088973999, -3.168034553527832, -1.9495277404785156, -0.7310218811035156, 0.4874844551086426, 1.7059907913208008, 2.924497127532959, 4.143003463745117, 5.361509799957275, 6.580016136169434, 7.79852294921875, 9.01702880859375, 10.23553466796875, 11.454041481018066, 12.672548294067383, 13.891054153442383, 15.109560012817383, 16.328067779541016, 17.546573638916016, 18.765079498291016, 19.983585357666016, 21.202091217041016, 22.42059898376465, 23.63910484313965, 24.85761070251465, 26.07611846923828, 27.29462432861328, 28.51313018798828, 29.73163604736328, 30.95014190673828, 32.16864776611328, 33.38715362548828, 34.60566329956055, 35.82416915893555, 37.04267501831055, 38.26118087768555]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 10.0, 10.0, 9.0, 9.0, 12.0, 12.0, 16.0, 19.0, 26.0, 27.0, 25.0, 28.0, 34.0, 24.0, 37.0, 39.0, 27.0, 25.0, 34.0, 25.0, 31.0, 42.0, 40.0, 47.0, 34.0, 22.0, 32.0, 38.0, 32.0, 21.0, 30.0, 27.0, 14.0, 16.0, 23.0, 13.0, 13.0, 16.0, 9.0, 6.0, 7.0, 5.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-43.7476921081543, -42.35765838623047, -40.967628479003906, -39.57759475708008, -38.18756103515625, -36.79752731323242, -35.407493591308594, -34.01746368408203, -32.6274299621582, -31.237396240234375, -29.84736442565918, -28.457332611083984, -27.067298889160156, -25.677265167236328, -24.287233352661133, -22.897201538085938, -21.50716781616211, -20.11713409423828, -18.727102279663086, -17.33707046508789, -15.947036743164062, -14.55700397491455, -13.166971206665039, -11.776938438415527, -10.386905670166016, -8.996872901916504, -7.606840133666992, -6.2168073654174805, -4.826774597167969, -3.436741828918457, -2.0467090606689453, -0.6566762924194336, 0.7333602905273438, 2.1233930587768555, 3.513425827026367, 4.903458595275879, 6.293491363525391, 7.683524131774902, 9.073556900024414, 10.463589668273926, 11.853622436523438, 13.24365520477295, 14.633687973022461, 16.023719787597656, 17.413753509521484, 18.803787231445312, 20.193819046020508, 21.583850860595703, 22.97388458251953, 24.36391830444336, 25.753950119018555, 27.14398193359375, 28.534015655517578, 29.924049377441406, 31.3140811920166, 32.7041130065918, 34.094146728515625, 35.48418045043945, 36.87421417236328, 38.264244079589844, 39.65427780151367, 41.0443115234375, 42.43434143066406, 43.82437515258789, 45.21440887451172]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 7.0, 7.0, 17.0, 19.0, 34.0, 38.0, 73.0, 81.0, 143.0, 201.0, 289.0, 424.0, 576.0, 877.0, 1216.0, 1683.0, 2544.0, 3642.0, 5384.0, 7899.0, 11098.0, 16150.0, 22959.0, 32472.0, 44648.0, 60521.0, 77969.0, 95067.0, 107248.0, 110222.0, 102774.0, 87935.0, 69937.0, 53435.0, 38859.0, 27981.0, 19691.0, 13751.0, 9443.0, 6589.0, 4497.0, 3054.0, 2119.0, 1495.0, 1042.0, 767.0, 524.0, 344.0, 248.0, 171.0, 122.0, 96.0, 56.0, 45.0, 27.0, 18.0, 21.0, 10.0, 5.0, 5.0, 1.0, 2.0], "bins": [-28.84375, -27.921630859375, -26.99951171875, -26.077392578125, -25.1552734375, -24.233154296875, -23.31103515625, -22.388916015625, -21.466796875, -20.544677734375, -19.62255859375, -18.700439453125, -17.7783203125, -16.856201171875, -15.93408203125, -15.011962890625, -14.08984375, -13.167724609375, -12.24560546875, -11.323486328125, -10.4013671875, -9.479248046875, -8.55712890625, -7.635009765625, -6.712890625, -5.790771484375, -4.86865234375, -3.946533203125, -3.0244140625, -2.102294921875, -1.18017578125, -0.258056640625, 0.6640625, 1.586181640625, 2.50830078125, 3.430419921875, 4.3525390625, 5.274658203125, 6.19677734375, 7.118896484375, 8.041015625, 8.963134765625, 9.88525390625, 10.807373046875, 11.7294921875, 12.651611328125, 13.57373046875, 14.495849609375, 15.41796875, 16.340087890625, 17.26220703125, 18.184326171875, 19.1064453125, 20.028564453125, 20.95068359375, 21.872802734375, 22.794921875, 23.717041015625, 24.63916015625, 25.561279296875, 26.4833984375, 27.405517578125, 28.32763671875, 29.249755859375, 30.171875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 11.0, 9.0, 11.0, 7.0, 13.0, 11.0, 16.0, 20.0, 27.0, 28.0, 25.0, 26.0, 33.0, 27.0, 34.0, 40.0, 27.0, 29.0, 32.0, 22.0, 34.0, 44.0, 41.0, 41.0, 33.0, 26.0, 30.0, 44.0, 29.0, 17.0, 33.0, 22.0, 17.0, 15.0, 23.0, 11.0, 15.0, 15.0, 11.0, 6.0, 6.0, 5.0, 8.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-41.28125, -39.966796875, -38.65234375, -37.337890625, -36.0234375, -34.708984375, -33.39453125, -32.080078125, -30.765625, -29.451171875, -28.13671875, -26.822265625, -25.5078125, -24.193359375, -22.87890625, -21.564453125, -20.25, -18.935546875, -17.62109375, -16.306640625, -14.9921875, -13.677734375, -12.36328125, -11.048828125, -9.734375, -8.419921875, -7.10546875, -5.791015625, -4.4765625, -3.162109375, -1.84765625, -0.533203125, 0.78125, 2.095703125, 3.41015625, 4.724609375, 6.0390625, 7.353515625, 8.66796875, 9.982421875, 11.296875, 12.611328125, 13.92578125, 15.240234375, 16.5546875, 17.869140625, 19.18359375, 20.498046875, 21.8125, 23.126953125, 24.44140625, 25.755859375, 27.0703125, 28.384765625, 29.69921875, 31.013671875, 32.328125, 33.642578125, 34.95703125, 36.271484375, 37.5859375, 38.900390625, 40.21484375, 41.529296875, 42.84375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 7.0, 13.0, 21.0, 25.0, 43.0, 47.0, 84.0, 128.0, 190.0, 274.0, 394.0, 635.0, 1013.0, 1435.0, 2331.0, 3608.0, 5735.0, 8870.0, 14386.0, 23036.0, 36557.0, 56494.0, 84959.0, 117799.0, 143470.0, 147335.0, 126719.0, 94600.0, 64522.0, 41758.0, 26525.0, 16753.0, 10546.0, 6339.0, 4026.0, 2743.0, 1766.0, 1168.0, 757.0, 504.0, 312.0, 208.0, 143.0, 91.0, 58.0, 49.0, 25.0, 22.0, 10.0, 9.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-39.125, -37.869140625, -36.61328125, -35.357421875, -34.1015625, -32.845703125, -31.58984375, -30.333984375, -29.078125, -27.822265625, -26.56640625, -25.310546875, -24.0546875, -22.798828125, -21.54296875, -20.287109375, -19.03125, -17.775390625, -16.51953125, -15.263671875, -14.0078125, -12.751953125, -11.49609375, -10.240234375, -8.984375, -7.728515625, -6.47265625, -5.216796875, -3.9609375, -2.705078125, -1.44921875, -0.193359375, 1.0625, 2.318359375, 3.57421875, 4.830078125, 6.0859375, 7.341796875, 8.59765625, 9.853515625, 11.109375, 12.365234375, 13.62109375, 14.876953125, 16.1328125, 17.388671875, 18.64453125, 19.900390625, 21.15625, 22.412109375, 23.66796875, 24.923828125, 26.1796875, 27.435546875, 28.69140625, 29.947265625, 31.203125, 32.458984375, 33.71484375, 34.970703125, 36.2265625, 37.482421875, 38.73828125, 39.994140625, 41.25]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 5.0, 8.0, 12.0, 12.0, 13.0, 18.0, 23.0, 16.0, 24.0, 33.0, 28.0, 30.0, 33.0, 42.0, 45.0, 37.0, 58.0, 37.0, 39.0, 60.0, 40.0, 38.0, 47.0, 35.0, 26.0, 35.0, 29.0, 23.0, 29.0, 22.0, 14.0, 21.0, 10.0, 13.0, 9.0, 10.0, 3.0, 3.0, 4.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.3125, -30.29736328125, -29.2822265625, -28.26708984375, -27.251953125, -26.23681640625, -25.2216796875, -24.20654296875, -23.19140625, -22.17626953125, -21.1611328125, -20.14599609375, -19.130859375, -18.11572265625, -17.1005859375, -16.08544921875, -15.0703125, -14.05517578125, -13.0400390625, -12.02490234375, -11.009765625, -9.99462890625, -8.9794921875, -7.96435546875, -6.94921875, -5.93408203125, -4.9189453125, -3.90380859375, -2.888671875, -1.87353515625, -0.8583984375, 0.15673828125, 1.171875, 2.18701171875, 3.2021484375, 4.21728515625, 5.232421875, 6.24755859375, 7.2626953125, 8.27783203125, 9.29296875, 10.30810546875, 11.3232421875, 12.33837890625, 13.353515625, 14.36865234375, 15.3837890625, 16.39892578125, 17.4140625, 18.42919921875, 19.4443359375, 20.45947265625, 21.474609375, 22.48974609375, 23.5048828125, 24.52001953125, 25.53515625, 26.55029296875, 27.5654296875, 28.58056640625, 29.595703125, 30.61083984375, 31.6259765625, 32.64111328125, 33.65625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 3.0, 9.0, 19.0, 21.0, 31.0, 36.0, 79.0, 116.0, 176.0, 265.0, 395.0, 641.0, 1006.0, 1530.0, 2400.0, 4126.0, 6663.0, 12079.0, 22064.0, 41593.0, 76532.0, 130048.0, 181600.0, 194487.0, 154515.0, 97599.0, 54617.0, 28843.0, 15371.0, 8454.0, 4929.0, 2987.0, 1854.0, 1218.0, 780.0, 523.0, 316.0, 236.0, 128.0, 103.0, 46.0, 34.0, 30.0, 14.0, 7.0, 11.0, 7.0, 2.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0], "bins": [-13.046875, -12.654052734375, -12.26123046875, -11.868408203125, -11.4755859375, -11.082763671875, -10.68994140625, -10.297119140625, -9.904296875, -9.511474609375, -9.11865234375, -8.725830078125, -8.3330078125, -7.940185546875, -7.54736328125, -7.154541015625, -6.76171875, -6.368896484375, -5.97607421875, -5.583251953125, -5.1904296875, -4.797607421875, -4.40478515625, -4.011962890625, -3.619140625, -3.226318359375, -2.83349609375, -2.440673828125, -2.0478515625, -1.655029296875, -1.26220703125, -0.869384765625, -0.4765625, -0.083740234375, 0.30908203125, 0.701904296875, 1.0947265625, 1.487548828125, 1.88037109375, 2.273193359375, 2.666015625, 3.058837890625, 3.45166015625, 3.844482421875, 4.2373046875, 4.630126953125, 5.02294921875, 5.415771484375, 5.80859375, 6.201416015625, 6.59423828125, 6.987060546875, 7.3798828125, 7.772705078125, 8.16552734375, 8.558349609375, 8.951171875, 9.343994140625, 9.73681640625, 10.129638671875, 10.5224609375, 10.915283203125, 11.30810546875, 11.700927734375, 12.09375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 8.0, 6.0, 9.0, 15.0, 11.0, 16.0, 25.0, 36.0, 27.0, 41.0, 46.0, 31.0, 48.0, 46.0, 58.0, 58.0, 73.0, 63.0, 56.0, 61.0, 41.0, 35.0, 37.0, 31.0, 19.0, 15.0, 15.0, 15.0, 20.0, 4.0, 8.0, 11.0, 5.0, 2.0, 4.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0], "bins": [-0.0011663436889648438, -0.0011362731456756592, -0.0011062026023864746, -0.00107613205909729, -0.0010460615158081055, -0.001015990972518921, -0.0009859204292297363, -0.0009558498859405518, -0.0009257793426513672, -0.0008957087993621826, -0.000865638256072998, -0.0008355677127838135, -0.0008054971694946289, -0.0007754266262054443, -0.0007453560829162598, -0.0007152855396270752, -0.0006852149963378906, -0.0006551444530487061, -0.0006250739097595215, -0.0005950033664703369, -0.0005649328231811523, -0.0005348622798919678, -0.0005047917366027832, -0.00047472119331359863, -0.00044465065002441406, -0.0004145801067352295, -0.0003845095634460449, -0.00035443902015686035, -0.0003243684768676758, -0.0002942979335784912, -0.00026422739028930664, -0.00023415684700012207, -0.0002040863037109375, -0.00017401576042175293, -0.00014394521713256836, -0.00011387467384338379, -8.380413055419922e-05, -5.373358726501465e-05, -2.3663043975830078e-05, 6.407499313354492e-06, 3.647804260253906e-05, 6.654858589172363e-05, 9.66191291809082e-05, 0.00012668967247009277, 0.00015676021575927734, 0.00018683075904846191, 0.00021690130233764648, 0.00024697184562683105, 0.0002770423889160156, 0.0003071129322052002, 0.00033718347549438477, 0.00036725401878356934, 0.0003973245620727539, 0.0004273951053619385, 0.00045746564865112305, 0.0004875361919403076, 0.0005176067352294922, 0.0005476772785186768, 0.0005777478218078613, 0.0006078183650970459, 0.0006378889083862305, 0.000667959451675415, 0.0006980299949645996, 0.0007281005382537842, 0.0007581710815429688]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 9.0, 13.0, 16.0, 22.0, 24.0, 40.0, 52.0, 67.0, 108.0, 159.0, 257.0, 348.0, 527.0, 805.0, 1250.0, 2213.0, 3914.0, 7143.0, 13720.0, 27862.0, 54751.0, 102465.0, 167671.0, 208484.0, 187777.0, 125545.0, 69555.0, 35135.0, 18006.0, 8893.0, 4729.0, 2652.0, 1518.0, 977.0, 592.0, 376.0, 287.0, 158.0, 130.0, 83.0, 56.0, 43.0, 37.0, 27.0, 22.0, 7.0, 6.0, 15.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.8671875, -13.429443359375, -12.99169921875, -12.553955078125, -12.1162109375, -11.678466796875, -11.24072265625, -10.802978515625, -10.365234375, -9.927490234375, -9.48974609375, -9.052001953125, -8.6142578125, -8.176513671875, -7.73876953125, -7.301025390625, -6.86328125, -6.425537109375, -5.98779296875, -5.550048828125, -5.1123046875, -4.674560546875, -4.23681640625, -3.799072265625, -3.361328125, -2.923583984375, -2.48583984375, -2.048095703125, -1.6103515625, -1.172607421875, -0.73486328125, -0.297119140625, 0.140625, 0.578369140625, 1.01611328125, 1.453857421875, 1.8916015625, 2.329345703125, 2.76708984375, 3.204833984375, 3.642578125, 4.080322265625, 4.51806640625, 4.955810546875, 5.3935546875, 5.831298828125, 6.26904296875, 6.706787109375, 7.14453125, 7.582275390625, 8.02001953125, 8.457763671875, 8.8955078125, 9.333251953125, 9.77099609375, 10.208740234375, 10.646484375, 11.084228515625, 11.52197265625, 11.959716796875, 12.3974609375, 12.835205078125, 13.27294921875, 13.710693359375, 14.1484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 6.0, 4.0, 7.0, 8.0, 8.0, 14.0, 18.0, 29.0, 36.0, 34.0, 34.0, 49.0, 49.0, 57.0, 84.0, 69.0, 63.0, 73.0, 62.0, 48.0, 51.0, 34.0, 37.0, 26.0, 23.0, 18.0, 10.0, 7.0, 11.0, 10.0, 6.0, 4.0, 1.0, 3.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-6.76171875, -6.5616455078125, -6.361572265625, -6.1614990234375, -5.96142578125, -5.7613525390625, -5.561279296875, -5.3612060546875, -5.1611328125, -4.9610595703125, -4.760986328125, -4.5609130859375, -4.36083984375, -4.1607666015625, -3.960693359375, -3.7606201171875, -3.560546875, -3.3604736328125, -3.160400390625, -2.9603271484375, -2.76025390625, -2.5601806640625, -2.360107421875, -2.1600341796875, -1.9599609375, -1.7598876953125, -1.559814453125, -1.3597412109375, -1.15966796875, -0.9595947265625, -0.759521484375, -0.5594482421875, -0.359375, -0.1593017578125, 0.040771484375, 0.2408447265625, 0.44091796875, 0.6409912109375, 0.841064453125, 1.0411376953125, 1.2412109375, 1.4412841796875, 1.641357421875, 1.8414306640625, 2.04150390625, 2.2415771484375, 2.441650390625, 2.6417236328125, 2.841796875, 3.0418701171875, 3.241943359375, 3.4420166015625, 3.64208984375, 3.8421630859375, 4.042236328125, 4.2423095703125, 4.4423828125, 4.6424560546875, 4.842529296875, 5.0426025390625, 5.24267578125, 5.4427490234375, 5.642822265625, 5.8428955078125, 6.04296875]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 7.0, 2.0, 6.0, 7.0, 10.0, 16.0, 15.0, 13.0, 18.0, 32.0, 26.0, 32.0, 26.0, 34.0, 34.0, 42.0, 52.0, 49.0, 39.0, 60.0, 49.0, 53.0, 39.0, 52.0, 43.0, 46.0, 33.0, 30.0, 21.0, 22.0, 17.0, 14.0, 9.0, 15.0, 6.0, 9.0, 4.0, 6.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.401031494140625, -42.12834930419922, -40.85567092895508, -39.58299255371094, -38.31031036376953, -37.037628173828125, -35.764949798583984, -34.492271423339844, -33.21958923339844, -31.946908950805664, -30.67422866821289, -29.401548385620117, -28.128868103027344, -26.85618782043457, -25.583507537841797, -24.310827255249023, -23.03814697265625, -21.765466690063477, -20.492786407470703, -19.22010612487793, -17.947425842285156, -16.674745559692383, -15.40206527709961, -14.129384994506836, -12.856704711914062, -11.584024429321289, -10.311344146728516, -9.038663864135742, -7.765983581542969, -6.493303298950195, -5.220623016357422, -3.9479427337646484, -2.6752662658691406, -1.4025859832763672, -0.12990570068359375, 1.1427745819091797, 2.415454864501953, 3.6881351470947266, 4.9608154296875, 6.233495712280273, 7.506175994873047, 8.77885627746582, 10.051536560058594, 11.324216842651367, 12.59689712524414, 13.869577407836914, 15.142257690429688, 16.41493797302246, 17.687618255615234, 18.960298538208008, 20.23297882080078, 21.505659103393555, 22.778339385986328, 24.0510196685791, 25.323699951171875, 26.59638023376465, 27.869060516357422, 29.141740798950195, 30.41442108154297, 31.687101364135742, 32.959781646728516, 34.232460021972656, 35.50514221191406, 36.77782440185547, 38.05050277709961]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 7.0, 7.0, 10.0, 12.0, 13.0, 12.0, 14.0, 13.0, 21.0, 25.0, 24.0, 31.0, 39.0, 33.0, 36.0, 31.0, 31.0, 37.0, 49.0, 38.0, 33.0, 37.0, 38.0, 47.0, 47.0, 29.0, 40.0, 39.0, 28.0, 26.0, 25.0, 17.0, 20.0, 21.0, 23.0, 5.0, 12.0, 6.0, 6.0, 3.0, 2.0, 3.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-56.451107025146484, -54.79768753051758, -53.14426803588867, -51.490848541259766, -49.837425231933594, -48.18400573730469, -46.53058624267578, -44.877166748046875, -43.22374725341797, -41.57032775878906, -39.916908264160156, -38.26348876953125, -36.610069274902344, -34.95664978027344, -33.303226470947266, -31.64980697631836, -29.996387481689453, -28.342967987060547, -26.68954849243164, -25.0361270904541, -23.382707595825195, -21.72928810119629, -20.07586669921875, -18.422447204589844, -16.769027709960938, -15.115608215332031, -13.462187767028809, -11.808767318725586, -10.15534782409668, -8.501928329467773, -6.848507881164551, -5.195087432861328, -3.5416641235351562, -1.8882441520690918, -0.23482418060302734, 1.418595790863037, 3.0720157623291016, 4.725435256958008, 6.3788557052612305, 8.032276153564453, 9.68569564819336, 11.339115142822266, 12.992535591125488, 14.645956039428711, 16.299375534057617, 17.952795028686523, 19.606216430664062, 21.25963592529297, 22.913055419921875, 24.56647491455078, 26.219894409179688, 27.873315811157227, 29.526735305786133, 31.18015480041504, 32.83357620239258, 34.486995697021484, 36.14041519165039, 37.7938346862793, 39.4472541809082, 41.10067367553711, 42.75409698486328, 44.40751647949219, 46.060935974121094, 47.71435546875, 49.367774963378906]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 12.0, 13.0, 18.0, 42.0, 59.0, 100.0, 176.0, 269.0, 447.0, 719.0, 1146.0, 1836.0, 3044.0, 4844.0, 8028.0, 13253.0, 22095.0, 37330.0, 63458.0, 107354.0, 183554.0, 306834.0, 479712.0, 646490.0, 696038.0, 588926.0, 409264.0, 253891.0, 150331.0, 88112.0, 51406.0, 30568.0, 17965.0, 10747.0, 6351.0, 3901.0, 2306.0, 1400.0, 850.0, 522.0, 344.0, 191.0, 133.0, 82.0, 44.0, 33.0, 20.0, 16.0, 3.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0], "bins": [-39.0625, -37.8896484375, -36.716796875, -35.5439453125, -34.37109375, -33.1982421875, -32.025390625, -30.8525390625, -29.6796875, -28.5068359375, -27.333984375, -26.1611328125, -24.98828125, -23.8154296875, -22.642578125, -21.4697265625, -20.296875, -19.1240234375, -17.951171875, -16.7783203125, -15.60546875, -14.4326171875, -13.259765625, -12.0869140625, -10.9140625, -9.7412109375, -8.568359375, -7.3955078125, -6.22265625, -5.0498046875, -3.876953125, -2.7041015625, -1.53125, -0.3583984375, 0.814453125, 1.9873046875, 3.16015625, 4.3330078125, 5.505859375, 6.6787109375, 7.8515625, 9.0244140625, 10.197265625, 11.3701171875, 12.54296875, 13.7158203125, 14.888671875, 16.0615234375, 17.234375, 18.4072265625, 19.580078125, 20.7529296875, 21.92578125, 23.0986328125, 24.271484375, 25.4443359375, 26.6171875, 27.7900390625, 28.962890625, 30.1357421875, 31.30859375, 32.4814453125, 33.654296875, 34.8271484375, 36.0]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 3.0, 5.0, 4.0, 10.0, 15.0, 12.0, 15.0, 14.0, 9.0, 18.0, 28.0, 21.0, 37.0, 32.0, 39.0, 34.0, 31.0, 30.0, 36.0, 47.0, 46.0, 27.0, 41.0, 35.0, 40.0, 49.0, 35.0, 40.0, 37.0, 32.0, 28.0, 24.0, 13.0, 27.0, 17.0, 19.0, 10.0, 10.0, 7.0, 5.0, 3.0, 4.0, 4.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-42.6875, -41.44091796875, -40.1943359375, -38.94775390625, -37.701171875, -36.45458984375, -35.2080078125, -33.96142578125, -32.71484375, -31.46826171875, -30.2216796875, -28.97509765625, -27.728515625, -26.48193359375, -25.2353515625, -23.98876953125, -22.7421875, -21.49560546875, -20.2490234375, -19.00244140625, -17.755859375, -16.50927734375, -15.2626953125, -14.01611328125, -12.76953125, -11.52294921875, -10.2763671875, -9.02978515625, -7.783203125, -6.53662109375, -5.2900390625, -4.04345703125, -2.796875, -1.55029296875, -0.3037109375, 0.94287109375, 2.189453125, 3.43603515625, 4.6826171875, 5.92919921875, 7.17578125, 8.42236328125, 9.6689453125, 10.91552734375, 12.162109375, 13.40869140625, 14.6552734375, 15.90185546875, 17.1484375, 18.39501953125, 19.6416015625, 20.88818359375, 22.134765625, 23.38134765625, 24.6279296875, 25.87451171875, 27.12109375, 28.36767578125, 29.6142578125, 30.86083984375, 32.107421875, 33.35400390625, 34.6005859375, 35.84716796875, 37.09375]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 5.0, 2.0, 8.0, 18.0, 20.0, 30.0, 56.0, 84.0, 101.0, 214.0, 343.0, 501.0, 835.0, 1284.0, 2128.0, 3433.0, 5827.0, 9961.0, 16877.0, 28401.0, 47548.0, 78115.0, 124532.0, 193147.0, 282461.0, 386621.0, 480060.0, 531491.0, 520102.0, 448494.0, 348573.0, 248001.0, 165685.0, 105636.0, 65525.0, 39521.0, 23657.0, 14242.0, 8231.0, 4836.0, 2976.0, 1836.0, 1105.0, 683.0, 391.0, 238.0, 162.0, 98.0, 76.0, 48.0, 27.0, 13.0, 18.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.15625, -27.24267578125, -26.3291015625, -25.41552734375, -24.501953125, -23.58837890625, -22.6748046875, -21.76123046875, -20.84765625, -19.93408203125, -19.0205078125, -18.10693359375, -17.193359375, -16.27978515625, -15.3662109375, -14.45263671875, -13.5390625, -12.62548828125, -11.7119140625, -10.79833984375, -9.884765625, -8.97119140625, -8.0576171875, -7.14404296875, -6.23046875, -5.31689453125, -4.4033203125, -3.48974609375, -2.576171875, -1.66259765625, -0.7490234375, 0.16455078125, 1.078125, 1.99169921875, 2.9052734375, 3.81884765625, 4.732421875, 5.64599609375, 6.5595703125, 7.47314453125, 8.38671875, 9.30029296875, 10.2138671875, 11.12744140625, 12.041015625, 12.95458984375, 13.8681640625, 14.78173828125, 15.6953125, 16.60888671875, 17.5224609375, 18.43603515625, 19.349609375, 20.26318359375, 21.1767578125, 22.09033203125, 23.00390625, 23.91748046875, 24.8310546875, 25.74462890625, 26.658203125, 27.57177734375, 28.4853515625, 29.39892578125, 30.3125]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 4.0, 4.0, 11.0, 13.0, 17.0, 23.0, 23.0, 34.0, 39.0, 51.0, 57.0, 69.0, 92.0, 104.0, 127.0, 135.0, 163.0, 182.0, 225.0, 228.0, 235.0, 234.0, 233.0, 243.0, 234.0, 189.0, 175.0, 143.0, 127.0, 119.0, 100.0, 70.0, 73.0, 72.0, 46.0, 42.0, 28.0, 37.0, 21.0, 13.0, 13.0, 4.0, 3.0, 7.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-18.40625, -17.842529296875, -17.27880859375, -16.715087890625, -16.1513671875, -15.587646484375, -15.02392578125, -14.460205078125, -13.896484375, -13.332763671875, -12.76904296875, -12.205322265625, -11.6416015625, -11.077880859375, -10.51416015625, -9.950439453125, -9.38671875, -8.822998046875, -8.25927734375, -7.695556640625, -7.1318359375, -6.568115234375, -6.00439453125, -5.440673828125, -4.876953125, -4.313232421875, -3.74951171875, -3.185791015625, -2.6220703125, -2.058349609375, -1.49462890625, -0.930908203125, -0.3671875, 0.196533203125, 0.76025390625, 1.323974609375, 1.8876953125, 2.451416015625, 3.01513671875, 3.578857421875, 4.142578125, 4.706298828125, 5.27001953125, 5.833740234375, 6.3974609375, 6.961181640625, 7.52490234375, 8.088623046875, 8.65234375, 9.216064453125, 9.77978515625, 10.343505859375, 10.9072265625, 11.470947265625, 12.03466796875, 12.598388671875, 13.162109375, 13.725830078125, 14.28955078125, 14.853271484375, 15.4169921875, 15.980712890625, 16.54443359375, 17.108154296875, 17.671875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 1.0, 7.0, 10.0, 7.0, 16.0, 16.0, 17.0, 24.0, 24.0, 31.0, 34.0, 34.0, 45.0, 33.0, 38.0, 59.0, 44.0, 66.0, 44.0, 47.0, 52.0, 50.0, 44.0, 38.0, 37.0, 33.0, 23.0, 23.0, 23.0, 13.0, 20.0, 11.0, 7.0, 9.0, 6.0, 8.0, 2.0, 7.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-44.770992279052734, -43.57698440551758, -42.38297653198242, -41.188968658447266, -39.99496078491211, -38.80095291137695, -37.6069450378418, -36.412933349609375, -35.21892547607422, -34.02491760253906, -32.830909729003906, -31.63690185546875, -30.442893981933594, -29.248886108398438, -28.05487632751465, -26.860868453979492, -25.66686248779297, -24.472854614257812, -23.278846740722656, -22.0848388671875, -20.890830993652344, -19.696823120117188, -18.5028133392334, -17.308805465698242, -16.114797592163086, -14.92078971862793, -13.726781845092773, -12.5327730178833, -11.338765144348145, -10.144757270812988, -8.950748443603516, -7.756740570068359, -6.56273078918457, -5.368722915649414, -4.1747145652771, -2.9807064533233643, -1.786698341369629, -0.5926904678344727, 0.6013178825378418, 1.7953262329101562, 2.9893341064453125, 4.183341979980469, 5.377350330352783, 6.571358680725098, 7.765366554260254, 8.95937442779541, 10.153383255004883, 11.347391128540039, 12.541399002075195, 13.735406875610352, 14.929414749145508, 16.123422622680664, 17.317432403564453, 18.51144027709961, 19.705448150634766, 20.899456024169922, 22.093463897705078, 23.287471771240234, 24.48147964477539, 25.675487518310547, 26.869495391845703, 28.06350326538086, 29.25751304626465, 30.451520919799805, 31.64552879333496]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 6.0, 6.0, 5.0, 6.0, 5.0, 7.0, 17.0, 14.0, 19.0, 17.0, 20.0, 31.0, 25.0, 35.0, 42.0, 52.0, 42.0, 47.0, 47.0, 43.0, 42.0, 38.0, 30.0, 33.0, 41.0, 40.0, 46.0, 33.0, 28.0, 31.0, 27.0, 23.0, 22.0, 12.0, 16.0, 11.0, 11.0, 7.0, 9.0, 8.0, 3.0, 6.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.03507614135742, -46.5241813659668, -45.01329040527344, -43.50239562988281, -41.99150085449219, -40.48060607910156, -38.9697151184082, -37.45882034301758, -35.94792938232422, -34.437034606933594, -32.926143646240234, -31.41524887084961, -29.904354095458984, -28.393461227416992, -26.882568359375, -25.371673583984375, -23.86077880859375, -22.349885940551758, -20.838991165161133, -19.32809829711914, -17.817203521728516, -16.306310653686523, -14.795417785644531, -13.284523963928223, -11.773630142211914, -10.262736320495605, -8.751842498779297, -7.240949630737305, -5.730055809020996, -4.2191619873046875, -2.7082691192626953, -1.1973752975463867, 0.3135223388671875, 1.824415922164917, 3.3353095054626465, 4.846202850341797, 6.3570966720581055, 7.867990493774414, 9.378883361816406, 10.889777183532715, 12.400671005249023, 13.911564826965332, 15.42245864868164, 16.933351516723633, 18.444244384765625, 19.95513916015625, 21.466032028198242, 22.976924896240234, 24.48781967163086, 25.99871253967285, 27.509607315063477, 29.02050018310547, 30.531394958496094, 32.04228973388672, 33.55318069458008, 35.0640754699707, 36.57496643066406, 38.08586120605469, 39.59675216674805, 41.10764694213867, 42.6185417175293, 44.129432678222656, 45.64032745361328, 47.151222229003906, 48.66211700439453]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 7.0, 9.0, 13.0, 12.0, 13.0, 26.0, 39.0, 47.0, 79.0, 95.0, 139.0, 174.0, 261.0, 345.0, 511.0, 794.0, 1173.0, 1847.0, 2825.0, 4701.0, 7790.0, 13188.0, 23329.0, 44264.0, 90218.0, 205275.0, 332584.0, 160692.0, 72790.0, 36308.0, 19665.0, 11259.0, 6424.0, 4019.0, 2500.0, 1660.0, 1047.0, 754.0, 497.0, 342.0, 226.0, 163.0, 128.0, 98.0, 69.0, 45.0, 28.0, 17.0, 27.0, 12.0, 7.0, 8.0, 7.0, 1.0, 2.0, 3.0, 4.0, 2.0], "bins": [-8.875, -8.6007080078125, -8.326416015625, -8.0521240234375, -7.77783203125, -7.5035400390625, -7.229248046875, -6.9549560546875, -6.6806640625, -6.4063720703125, -6.132080078125, -5.8577880859375, -5.58349609375, -5.3092041015625, -5.034912109375, -4.7606201171875, -4.486328125, -4.2120361328125, -3.937744140625, -3.6634521484375, -3.38916015625, -3.1148681640625, -2.840576171875, -2.5662841796875, -2.2919921875, -2.0177001953125, -1.743408203125, -1.4691162109375, -1.19482421875, -0.9205322265625, -0.646240234375, -0.3719482421875, -0.09765625, 0.1766357421875, 0.450927734375, 0.7252197265625, 0.99951171875, 1.2738037109375, 1.548095703125, 1.8223876953125, 2.0966796875, 2.3709716796875, 2.645263671875, 2.9195556640625, 3.19384765625, 3.4681396484375, 3.742431640625, 4.0167236328125, 4.291015625, 4.5653076171875, 4.839599609375, 5.1138916015625, 5.38818359375, 5.6624755859375, 5.936767578125, 6.2110595703125, 6.4853515625, 6.7596435546875, 7.033935546875, 7.3082275390625, 7.58251953125, 7.8568115234375, 8.131103515625, 8.4053955078125, 8.6796875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 6.0, 6.0, 5.0, 6.0, 5.0, 8.0, 17.0, 14.0, 17.0, 20.0, 16.0, 31.0, 26.0, 31.0, 42.0, 54.0, 46.0, 45.0, 52.0, 39.0, 41.0, 37.0, 32.0, 32.0, 40.0, 46.0, 40.0, 33.0, 27.0, 33.0, 25.0, 26.0, 21.0, 15.0, 13.0, 11.0, 11.0, 8.0, 9.0, 8.0, 3.0, 6.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.625, -46.12841796875, -44.6318359375, -43.13525390625, -41.638671875, -40.14208984375, -38.6455078125, -37.14892578125, -35.65234375, -34.15576171875, -32.6591796875, -31.16259765625, -29.666015625, -28.16943359375, -26.6728515625, -25.17626953125, -23.6796875, -22.18310546875, -20.6865234375, -19.18994140625, -17.693359375, -16.19677734375, -14.7001953125, -13.20361328125, -11.70703125, -10.21044921875, -8.7138671875, -7.21728515625, -5.720703125, -4.22412109375, -2.7275390625, -1.23095703125, 0.265625, 1.76220703125, 3.2587890625, 4.75537109375, 6.251953125, 7.74853515625, 9.2451171875, 10.74169921875, 12.23828125, 13.73486328125, 15.2314453125, 16.72802734375, 18.224609375, 19.72119140625, 21.2177734375, 22.71435546875, 24.2109375, 25.70751953125, 27.2041015625, 28.70068359375, 30.197265625, 31.69384765625, 33.1904296875, 34.68701171875, 36.18359375, 37.68017578125, 39.1767578125, 40.67333984375, 42.169921875, 43.66650390625, 45.1630859375, 46.65966796875, 48.15625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 5.0, 7.0, 9.0, 14.0, 12.0, 20.0, 28.0, 51.0, 85.0, 111.0, 179.0, 297.0, 401.0, 584.0, 1039.0, 1766.0, 3073.0, 6057.0, 11462.0, 23405.0, 51759.0, 132193.0, 376509.0, 269507.0, 93186.0, 38848.0, 17836.0, 8696.0, 4685.0, 2629.0, 1579.0, 910.0, 589.0, 333.0, 226.0, 137.0, 99.0, 72.0, 53.0, 32.0, 22.0, 23.0, 11.0, 8.0, 4.0, 3.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.6171875, -7.3529052734375, -7.088623046875, -6.8243408203125, -6.56005859375, -6.2957763671875, -6.031494140625, -5.7672119140625, -5.5029296875, -5.2386474609375, -4.974365234375, -4.7100830078125, -4.44580078125, -4.1815185546875, -3.917236328125, -3.6529541015625, -3.388671875, -3.1243896484375, -2.860107421875, -2.5958251953125, -2.33154296875, -2.0672607421875, -1.802978515625, -1.5386962890625, -1.2744140625, -1.0101318359375, -0.745849609375, -0.4815673828125, -0.21728515625, 0.0469970703125, 0.311279296875, 0.5755615234375, 0.83984375, 1.1041259765625, 1.368408203125, 1.6326904296875, 1.89697265625, 2.1612548828125, 2.425537109375, 2.6898193359375, 2.9541015625, 3.2183837890625, 3.482666015625, 3.7469482421875, 4.01123046875, 4.2755126953125, 4.539794921875, 4.8040771484375, 5.068359375, 5.3326416015625, 5.596923828125, 5.8612060546875, 6.12548828125, 6.3897705078125, 6.654052734375, 6.9183349609375, 7.1826171875, 7.4468994140625, 7.711181640625, 7.9754638671875, 8.23974609375, 8.5040283203125, 8.768310546875, 9.0325927734375, 9.296875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 3.0, 3.0, 6.0, 8.0, 9.0, 16.0, 10.0, 14.0, 22.0, 23.0, 35.0, 25.0, 42.0, 26.0, 30.0, 41.0, 37.0, 46.0, 38.0, 39.0, 32.0, 34.0, 54.0, 35.0, 44.0, 24.0, 35.0, 43.0, 34.0, 25.0, 29.0, 29.0, 14.0, 16.0, 25.0, 11.0, 5.0, 10.0, 7.0, 6.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.859375, -30.820556640625, -29.78173828125, -28.742919921875, -27.7041015625, -26.665283203125, -25.62646484375, -24.587646484375, -23.548828125, -22.510009765625, -21.47119140625, -20.432373046875, -19.3935546875, -18.354736328125, -17.31591796875, -16.277099609375, -15.23828125, -14.199462890625, -13.16064453125, -12.121826171875, -11.0830078125, -10.044189453125, -9.00537109375, -7.966552734375, -6.927734375, -5.888916015625, -4.85009765625, -3.811279296875, -2.7724609375, -1.733642578125, -0.69482421875, 0.343994140625, 1.3828125, 2.421630859375, 3.46044921875, 4.499267578125, 5.5380859375, 6.576904296875, 7.61572265625, 8.654541015625, 9.693359375, 10.732177734375, 11.77099609375, 12.809814453125, 13.8486328125, 14.887451171875, 15.92626953125, 16.965087890625, 18.00390625, 19.042724609375, 20.08154296875, 21.120361328125, 22.1591796875, 23.197998046875, 24.23681640625, 25.275634765625, 26.314453125, 27.353271484375, 28.39208984375, 29.430908203125, 30.4697265625, 31.508544921875, 32.54736328125, 33.586181640625, 34.625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 4.0, 6.0, 6.0, 27.0, 15.0, 24.0, 37.0, 44.0, 63.0, 117.0, 138.0, 211.0, 310.0, 530.0, 726.0, 1250.0, 2112.0, 3619.0, 7030.0, 14720.0, 37078.0, 135240.0, 528713.0, 223754.0, 53740.0, 19274.0, 8679.0, 4468.0, 2501.0, 1393.0, 890.0, 601.0, 364.0, 243.0, 182.0, 121.0, 92.0, 61.0, 45.0, 34.0, 22.0, 25.0, 14.0, 5.0, 11.0, 5.0, 6.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-2.23828125, -2.171783447265625, -2.10528564453125, -2.038787841796875, -1.9722900390625, -1.905792236328125, -1.83929443359375, -1.772796630859375, -1.706298828125, -1.639801025390625, -1.57330322265625, -1.506805419921875, -1.4403076171875, -1.373809814453125, -1.30731201171875, -1.240814208984375, -1.17431640625, -1.107818603515625, -1.04132080078125, -0.974822998046875, -0.9083251953125, -0.841827392578125, -0.77532958984375, -0.708831787109375, -0.642333984375, -0.575836181640625, -0.50933837890625, -0.442840576171875, -0.3763427734375, -0.309844970703125, -0.24334716796875, -0.176849365234375, -0.1103515625, -0.043853759765625, 0.02264404296875, 0.089141845703125, 0.1556396484375, 0.222137451171875, 0.28863525390625, 0.355133056640625, 0.421630859375, 0.488128662109375, 0.55462646484375, 0.621124267578125, 0.6876220703125, 0.754119873046875, 0.82061767578125, 0.887115478515625, 0.95361328125, 1.020111083984375, 1.08660888671875, 1.153106689453125, 1.2196044921875, 1.286102294921875, 1.35260009765625, 1.419097900390625, 1.485595703125, 1.552093505859375, 1.61859130859375, 1.685089111328125, 1.7515869140625, 1.818084716796875, 1.88458251953125, 1.951080322265625, 2.017578125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 7.0, 5.0, 6.0, 8.0, 11.0, 12.0, 17.0, 17.0, 22.0, 27.0, 40.0, 39.0, 46.0, 54.0, 76.0, 82.0, 100.0, 79.0, 62.0, 62.0, 40.0, 35.0, 25.0, 25.0, 22.0, 15.0, 11.0, 8.0, 9.0, 10.0, 5.0, 5.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020837783813476562, -0.00020126625895500183, -0.00019415467977523804, -0.00018704310059547424, -0.00017993152141571045, -0.00017281994223594666, -0.00016570836305618286, -0.00015859678387641907, -0.00015148520469665527, -0.00014437362551689148, -0.00013726204633712769, -0.0001301504671573639, -0.0001230388879776001, -0.0001159273087978363, -0.00010881572961807251, -0.00010170415043830872, -9.459257125854492e-05, -8.748099207878113e-05, -8.036941289901733e-05, -7.325783371925354e-05, -6.614625453948975e-05, -5.903467535972595e-05, -5.192309617996216e-05, -4.4811517000198364e-05, -3.769993782043457e-05, -3.0588358640670776e-05, -2.3476779460906982e-05, -1.636520028114319e-05, -9.253621101379395e-06, -2.1420419216156006e-06, 4.969537258148193e-06, 1.2081116437911987e-05, 1.919269561767578e-05, 2.6304274797439575e-05, 3.341585397720337e-05, 4.052743315696716e-05, 4.763901233673096e-05, 5.475059151649475e-05, 6.186217069625854e-05, 6.897374987602234e-05, 7.608532905578613e-05, 8.319690823554993e-05, 9.030848741531372e-05, 9.742006659507751e-05, 0.00010453164577484131, 0.0001116432249546051, 0.0001187548041343689, 0.0001258663833141327, 0.00013297796249389648, 0.00014008954167366028, 0.00014720112085342407, 0.00015431270003318787, 0.00016142427921295166, 0.00016853585839271545, 0.00017564743757247925, 0.00018275901675224304, 0.00018987059593200684, 0.00019698217511177063, 0.00020409375429153442, 0.00021120533347129822, 0.000218316912651062, 0.0002254284918308258, 0.0002325400710105896, 0.0002396516501903534, 0.0002467632293701172]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 11.0, 13.0, 26.0, 32.0, 65.0, 83.0, 119.0, 183.0, 284.0, 448.0, 725.0, 1079.0, 1776.0, 2940.0, 4745.0, 7490.0, 12133.0, 19151.0, 31423.0, 51226.0, 84859.0, 140570.0, 239225.0, 178189.0, 105870.0, 63949.0, 38970.0, 23865.0, 14792.0, 9098.0, 5717.0, 3445.0, 2254.0, 1385.0, 877.0, 543.0, 369.0, 202.0, 149.0, 106.0, 65.0, 37.0, 24.0, 16.0, 8.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.01171875, -1.94622802734375, -1.8807373046875, -1.81524658203125, -1.749755859375, -1.68426513671875, -1.6187744140625, -1.55328369140625, -1.48779296875, -1.42230224609375, -1.3568115234375, -1.29132080078125, -1.225830078125, -1.16033935546875, -1.0948486328125, -1.02935791015625, -0.9638671875, -0.89837646484375, -0.8328857421875, -0.76739501953125, -0.701904296875, -0.63641357421875, -0.5709228515625, -0.50543212890625, -0.43994140625, -0.37445068359375, -0.3089599609375, -0.24346923828125, -0.177978515625, -0.11248779296875, -0.0469970703125, 0.01849365234375, 0.083984375, 0.14947509765625, 0.2149658203125, 0.28045654296875, 0.345947265625, 0.41143798828125, 0.4769287109375, 0.54241943359375, 0.60791015625, 0.67340087890625, 0.7388916015625, 0.80438232421875, 0.869873046875, 0.93536376953125, 1.0008544921875, 1.06634521484375, 1.1318359375, 1.19732666015625, 1.2628173828125, 1.32830810546875, 1.393798828125, 1.45928955078125, 1.5247802734375, 1.59027099609375, 1.65576171875, 1.72125244140625, 1.7867431640625, 1.85223388671875, 1.917724609375, 1.98321533203125, 2.0487060546875, 2.11419677734375, 2.1796875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 12.0, 6.0, 15.0, 11.0, 22.0, 17.0, 15.0, 24.0, 22.0, 34.0, 33.0, 42.0, 39.0, 33.0, 33.0, 31.0, 39.0, 23.0, 37.0, 28.0, 33.0, 35.0, 39.0, 45.0, 59.0, 38.0, 41.0, 33.0, 35.0, 26.0, 21.0, 10.0, 12.0, 12.0, 14.0, 6.0, 8.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.306640625, -1.2676849365234375, -1.228729248046875, -1.1897735595703125, -1.15081787109375, -1.1118621826171875, -1.072906494140625, -1.0339508056640625, -0.9949951171875, -0.9560394287109375, -0.917083740234375, -0.8781280517578125, -0.83917236328125, -0.8002166748046875, -0.761260986328125, -0.7223052978515625, -0.683349609375, -0.6443939208984375, -0.605438232421875, -0.5664825439453125, -0.52752685546875, -0.4885711669921875, -0.449615478515625, -0.4106597900390625, -0.3717041015625, -0.3327484130859375, -0.293792724609375, -0.2548370361328125, -0.21588134765625, -0.1769256591796875, -0.137969970703125, -0.0990142822265625, -0.06005859375, -0.0211029052734375, 0.017852783203125, 0.0568084716796875, 0.09576416015625, 0.1347198486328125, 0.173675537109375, 0.2126312255859375, 0.2515869140625, 0.2905426025390625, 0.329498291015625, 0.3684539794921875, 0.40740966796875, 0.4463653564453125, 0.485321044921875, 0.5242767333984375, 0.563232421875, 0.6021881103515625, 0.641143798828125, 0.6800994873046875, 0.71905517578125, 0.7580108642578125, 0.796966552734375, 0.8359222412109375, 0.8748779296875, 0.9138336181640625, 0.952789306640625, 0.9917449951171875, 1.03070068359375, 1.0696563720703125, 1.108612060546875, 1.1475677490234375, 1.1865234375]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 6.0, 10.0, 4.0, 16.0, 21.0, 21.0, 20.0, 24.0, 22.0, 36.0, 35.0, 40.0, 41.0, 33.0, 54.0, 54.0, 61.0, 33.0, 53.0, 49.0, 49.0, 39.0, 45.0, 36.0, 32.0, 30.0, 20.0, 25.0, 16.0, 16.0, 12.0, 10.0, 7.0, 7.0, 7.0, 7.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-41.65922927856445, -40.516937255859375, -39.37464141845703, -38.23234939575195, -37.090057373046875, -35.9477653503418, -34.80547332763672, -33.663177490234375, -32.5208854675293, -31.37859344482422, -30.236299514770508, -29.094005584716797, -27.95171356201172, -26.80942153930664, -25.66712760925293, -24.52483367919922, -23.38254165649414, -22.240249633789062, -21.09795570373535, -19.95566177368164, -18.813369750976562, -17.671077728271484, -16.528783798217773, -15.386490821838379, -14.244197845458984, -13.10190486907959, -11.959611892700195, -10.8173189163208, -9.675025939941406, -8.532732963562012, -7.390439987182617, -6.248147010803223, -5.105855941772461, -3.9635629653930664, -2.821269989013672, -1.6789770126342773, -0.5366840362548828, 0.6056089401245117, 1.7479019165039062, 2.890194892883301, 4.032487869262695, 5.17478084564209, 6.317073822021484, 7.459366798400879, 8.601659774780273, 9.743952751159668, 10.886245727539062, 12.028538703918457, 13.170831680297852, 14.313124656677246, 15.45541763305664, 16.59770965576172, 17.74000358581543, 18.88229751586914, 20.02458953857422, 21.166881561279297, 22.309175491333008, 23.45146942138672, 24.593761444091797, 25.736053466796875, 26.878347396850586, 28.020641326904297, 29.162933349609375, 30.305225372314453, 31.447519302368164]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 4.0, 6.0, 6.0, 6.0, 7.0, 6.0, 16.0, 9.0, 21.0, 20.0, 20.0, 22.0, 30.0, 32.0, 35.0, 52.0, 46.0, 41.0, 46.0, 51.0, 32.0, 49.0, 27.0, 30.0, 43.0, 45.0, 39.0, 34.0, 30.0, 24.0, 28.0, 29.0, 17.0, 24.0, 9.0, 12.0, 15.0, 8.0, 8.0, 8.0, 5.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.94432830810547, -45.48052978515625, -44.01673126220703, -42.55293273925781, -41.089134216308594, -39.625335693359375, -38.161537170410156, -36.69773864746094, -35.23394012451172, -33.7701416015625, -32.30634307861328, -30.842544555664062, -29.378746032714844, -27.914947509765625, -26.451148986816406, -24.987350463867188, -23.523550033569336, -22.059751510620117, -20.5959529876709, -19.13215446472168, -17.66835594177246, -16.204557418823242, -14.740757942199707, -13.276959419250488, -11.81316089630127, -10.34936237335205, -8.885563850402832, -7.421764850616455, -5.957966327667236, -4.494167804718018, -3.0303688049316406, -1.5665702819824219, -0.10277175903320312, 1.3610268831253052, 2.8248255252838135, 4.288624286651611, 5.75242280960083, 7.216221332550049, 8.680020332336426, 10.143818855285645, 11.607617378234863, 13.071415901184082, 14.5352144241333, 15.999013900756836, 17.462812423706055, 18.926610946655273, 20.390409469604492, 21.85420799255371, 23.31800651550293, 24.78180503845215, 26.245603561401367, 27.709402084350586, 29.173200607299805, 30.636999130249023, 32.100799560546875, 33.564598083496094, 35.02839660644531, 36.49219512939453, 37.95599365234375, 39.41979217529297, 40.88359069824219, 42.347389221191406, 43.811187744140625, 45.274986267089844, 46.73878479003906]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 2.0, 7.0, 12.0, 27.0, 36.0, 54.0, 82.0, 126.0, 200.0, 267.0, 351.0, 595.0, 861.0, 1296.0, 1987.0, 2869.0, 4180.0, 6420.0, 9845.0, 14844.0, 22613.0, 34085.0, 50833.0, 73641.0, 99023.0, 121512.0, 131539.0, 124756.0, 104153.0, 78192.0, 54422.0, 37017.0, 24702.0, 16288.0, 10783.0, 6836.0, 4647.0, 3111.0, 2064.0, 1383.0, 929.0, 685.0, 397.0, 302.0, 206.0, 119.0, 78.0, 74.0, 39.0, 20.0, 16.0, 15.0, 11.0, 4.0, 3.0, 2.0, 2.0], "bins": [-31.203125, -30.2744140625, -29.345703125, -28.4169921875, -27.48828125, -26.5595703125, -25.630859375, -24.7021484375, -23.7734375, -22.8447265625, -21.916015625, -20.9873046875, -20.05859375, -19.1298828125, -18.201171875, -17.2724609375, -16.34375, -15.4150390625, -14.486328125, -13.5576171875, -12.62890625, -11.7001953125, -10.771484375, -9.8427734375, -8.9140625, -7.9853515625, -7.056640625, -6.1279296875, -5.19921875, -4.2705078125, -3.341796875, -2.4130859375, -1.484375, -0.5556640625, 0.373046875, 1.3017578125, 2.23046875, 3.1591796875, 4.087890625, 5.0166015625, 5.9453125, 6.8740234375, 7.802734375, 8.7314453125, 9.66015625, 10.5888671875, 11.517578125, 12.4462890625, 13.375, 14.3037109375, 15.232421875, 16.1611328125, 17.08984375, 18.0185546875, 18.947265625, 19.8759765625, 20.8046875, 21.7333984375, 22.662109375, 23.5908203125, 24.51953125, 25.4482421875, 26.376953125, 27.3056640625, 28.234375]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 4.0, 6.0, 6.0, 6.0, 7.0, 7.0, 14.0, 7.0, 27.0, 16.0, 21.0, 23.0, 31.0, 31.0, 36.0, 47.0, 49.0, 43.0, 43.0, 50.0, 37.0, 46.0, 29.0, 27.0, 41.0, 49.0, 39.0, 33.0, 29.0, 26.0, 26.0, 32.0, 14.0, 23.0, 12.0, 11.0, 14.0, 9.0, 8.0, 8.0, 5.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.0, -43.59765625, -42.1953125, -40.79296875, -39.390625, -37.98828125, -36.5859375, -35.18359375, -33.78125, -32.37890625, -30.9765625, -29.57421875, -28.171875, -26.76953125, -25.3671875, -23.96484375, -22.5625, -21.16015625, -19.7578125, -18.35546875, -16.953125, -15.55078125, -14.1484375, -12.74609375, -11.34375, -9.94140625, -8.5390625, -7.13671875, -5.734375, -4.33203125, -2.9296875, -1.52734375, -0.125, 1.27734375, 2.6796875, 4.08203125, 5.484375, 6.88671875, 8.2890625, 9.69140625, 11.09375, 12.49609375, 13.8984375, 15.30078125, 16.703125, 18.10546875, 19.5078125, 20.91015625, 22.3125, 23.71484375, 25.1171875, 26.51953125, 27.921875, 29.32421875, 30.7265625, 32.12890625, 33.53125, 34.93359375, 36.3359375, 37.73828125, 39.140625, 40.54296875, 41.9453125, 43.34765625, 44.75]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 8.0, 9.0, 14.0, 39.0, 52.0, 61.0, 96.0, 157.0, 234.0, 384.0, 604.0, 896.0, 1317.0, 2035.0, 3026.0, 4669.0, 7198.0, 11439.0, 18129.0, 28538.0, 44519.0, 66826.0, 94518.0, 122295.0, 138841.0, 134902.0, 114107.0, 85872.0, 59580.0, 39063.0, 24859.0, 15874.0, 10095.0, 6507.0, 4192.0, 2661.0, 1655.0, 1110.0, 743.0, 483.0, 316.0, 207.0, 142.0, 94.0, 56.0, 41.0, 27.0, 17.0, 13.0, 13.0, 7.0, 6.0, 1.0, 3.0, 0.0, 3.0, 1.0], "bins": [-31.40625, -30.420166015625, -29.43408203125, -28.447998046875, -27.4619140625, -26.475830078125, -25.48974609375, -24.503662109375, -23.517578125, -22.531494140625, -21.54541015625, -20.559326171875, -19.5732421875, -18.587158203125, -17.60107421875, -16.614990234375, -15.62890625, -14.642822265625, -13.65673828125, -12.670654296875, -11.6845703125, -10.698486328125, -9.71240234375, -8.726318359375, -7.740234375, -6.754150390625, -5.76806640625, -4.781982421875, -3.7958984375, -2.809814453125, -1.82373046875, -0.837646484375, 0.1484375, 1.134521484375, 2.12060546875, 3.106689453125, 4.0927734375, 5.078857421875, 6.06494140625, 7.051025390625, 8.037109375, 9.023193359375, 10.00927734375, 10.995361328125, 11.9814453125, 12.967529296875, 13.95361328125, 14.939697265625, 15.92578125, 16.911865234375, 17.89794921875, 18.884033203125, 19.8701171875, 20.856201171875, 21.84228515625, 22.828369140625, 23.814453125, 24.800537109375, 25.78662109375, 26.772705078125, 27.7587890625, 28.744873046875, 29.73095703125, 30.717041015625, 31.703125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 5.0, 5.0, 7.0, 5.0, 14.0, 11.0, 13.0, 16.0, 19.0, 24.0, 26.0, 25.0, 29.0, 26.0, 35.0, 42.0, 30.0, 28.0, 38.0, 32.0, 35.0, 46.0, 43.0, 34.0, 37.0, 49.0, 25.0, 28.0, 24.0, 32.0, 25.0, 31.0, 22.0, 14.0, 20.0, 14.0, 10.0, 19.0, 13.0, 7.0, 12.0, 11.0, 8.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-28.296875, -27.489990234375, -26.68310546875, -25.876220703125, -25.0693359375, -24.262451171875, -23.45556640625, -22.648681640625, -21.841796875, -21.034912109375, -20.22802734375, -19.421142578125, -18.6142578125, -17.807373046875, -17.00048828125, -16.193603515625, -15.38671875, -14.579833984375, -13.77294921875, -12.966064453125, -12.1591796875, -11.352294921875, -10.54541015625, -9.738525390625, -8.931640625, -8.124755859375, -7.31787109375, -6.510986328125, -5.7041015625, -4.897216796875, -4.09033203125, -3.283447265625, -2.4765625, -1.669677734375, -0.86279296875, -0.055908203125, 0.7509765625, 1.557861328125, 2.36474609375, 3.171630859375, 3.978515625, 4.785400390625, 5.59228515625, 6.399169921875, 7.2060546875, 8.012939453125, 8.81982421875, 9.626708984375, 10.43359375, 11.240478515625, 12.04736328125, 12.854248046875, 13.6611328125, 14.468017578125, 15.27490234375, 16.081787109375, 16.888671875, 17.695556640625, 18.50244140625, 19.309326171875, 20.1162109375, 20.923095703125, 21.72998046875, 22.536865234375, 23.34375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 7.0, 9.0, 9.0, 15.0, 26.0, 37.0, 41.0, 53.0, 88.0, 124.0, 191.0, 328.0, 450.0, 920.0, 1940.0, 5008.0, 13981.0, 43051.0, 129093.0, 285287.0, 315351.0, 164941.0, 57648.0, 18413.0, 6402.0, 2471.0, 1078.0, 581.0, 324.0, 209.0, 149.0, 89.0, 82.0, 60.0, 26.0, 20.0, 16.0, 17.0, 7.0, 7.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.921875, -19.3017578125, -18.681640625, -18.0615234375, -17.44140625, -16.8212890625, -16.201171875, -15.5810546875, -14.9609375, -14.3408203125, -13.720703125, -13.1005859375, -12.48046875, -11.8603515625, -11.240234375, -10.6201171875, -10.0, -9.3798828125, -8.759765625, -8.1396484375, -7.51953125, -6.8994140625, -6.279296875, -5.6591796875, -5.0390625, -4.4189453125, -3.798828125, -3.1787109375, -2.55859375, -1.9384765625, -1.318359375, -0.6982421875, -0.078125, 0.5419921875, 1.162109375, 1.7822265625, 2.40234375, 3.0224609375, 3.642578125, 4.2626953125, 4.8828125, 5.5029296875, 6.123046875, 6.7431640625, 7.36328125, 7.9833984375, 8.603515625, 9.2236328125, 9.84375, 10.4638671875, 11.083984375, 11.7041015625, 12.32421875, 12.9443359375, 13.564453125, 14.1845703125, 14.8046875, 15.4248046875, 16.044921875, 16.6650390625, 17.28515625, 17.9052734375, 18.525390625, 19.1455078125, 19.765625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 5.0, 10.0, 10.0, 7.0, 14.0, 13.0, 27.0, 30.0, 41.0, 40.0, 51.0, 40.0, 55.0, 52.0, 41.0, 60.0, 49.0, 64.0, 53.0, 54.0, 35.0, 43.0, 34.0, 35.0, 24.0, 24.0, 20.0, 16.0, 15.0, 11.0, 11.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007615089416503906, -0.0007349997758865356, -0.0007084906101226807, -0.0006819814443588257, -0.0006554722785949707, -0.0006289631128311157, -0.0006024539470672607, -0.0005759447813034058, -0.0005494356155395508, -0.0005229264497756958, -0.0004964172840118408, -0.00046990811824798584, -0.00044339895248413086, -0.0004168897867202759, -0.0003903806209564209, -0.0003638714551925659, -0.00033736228942871094, -0.00031085312366485596, -0.000284343957901001, -0.000257834792137146, -0.00023132562637329102, -0.00020481646060943604, -0.00017830729484558105, -0.00015179812908172607, -0.0001252889633178711, -9.877979755401611e-05, -7.227063179016113e-05, -4.576146602630615e-05, -1.9252300262451172e-05, 7.256865501403809e-06, 3.376603126525879e-05, 6.027519702911377e-05, 8.678436279296875e-05, 0.00011329352855682373, 0.0001398026943206787, 0.0001663118600845337, 0.00019282102584838867, 0.00021933019161224365, 0.00024583935737609863, 0.0002723485231399536, 0.0002988576889038086, 0.0003253668546676636, 0.00035187602043151855, 0.00037838518619537354, 0.0004048943519592285, 0.0004314035177230835, 0.0004579126834869385, 0.00048442184925079346, 0.0005109310150146484, 0.0005374401807785034, 0.0005639493465423584, 0.0005904585123062134, 0.0006169676780700684, 0.0006434768438339233, 0.0006699860095977783, 0.0006964951753616333, 0.0007230043411254883, 0.0007495135068893433, 0.0007760226726531982, 0.0008025318384170532, 0.0008290410041809082, 0.0008555501699447632, 0.0008820593357086182, 0.0009085685014724731, 0.0009350776672363281]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 9.0, 6.0, 12.0, 15.0, 25.0, 28.0, 42.0, 76.0, 84.0, 106.0, 158.0, 253.0, 396.0, 666.0, 1220.0, 2099.0, 4380.0, 10042.0, 25639.0, 69200.0, 172129.0, 295246.0, 259086.0, 126453.0, 47887.0, 18207.0, 7485.0, 3335.0, 1700.0, 934.0, 579.0, 354.0, 221.0, 163.0, 106.0, 63.0, 43.0, 25.0, 30.0, 16.0, 14.0, 9.0, 7.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.234375, -20.62451171875, -20.0146484375, -19.40478515625, -18.794921875, -18.18505859375, -17.5751953125, -16.96533203125, -16.35546875, -15.74560546875, -15.1357421875, -14.52587890625, -13.916015625, -13.30615234375, -12.6962890625, -12.08642578125, -11.4765625, -10.86669921875, -10.2568359375, -9.64697265625, -9.037109375, -8.42724609375, -7.8173828125, -7.20751953125, -6.59765625, -5.98779296875, -5.3779296875, -4.76806640625, -4.158203125, -3.54833984375, -2.9384765625, -2.32861328125, -1.71875, -1.10888671875, -0.4990234375, 0.11083984375, 0.720703125, 1.33056640625, 1.9404296875, 2.55029296875, 3.16015625, 3.77001953125, 4.3798828125, 4.98974609375, 5.599609375, 6.20947265625, 6.8193359375, 7.42919921875, 8.0390625, 8.64892578125, 9.2587890625, 9.86865234375, 10.478515625, 11.08837890625, 11.6982421875, 12.30810546875, 12.91796875, 13.52783203125, 14.1376953125, 14.74755859375, 15.357421875, 15.96728515625, 16.5771484375, 17.18701171875, 17.796875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 5.0, 12.0, 12.0, 14.0, 16.0, 23.0, 56.0, 61.0, 71.0, 96.0, 105.0, 116.0, 101.0, 98.0, 56.0, 46.0, 22.0, 24.0, 23.0, 13.0, 7.0, 8.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.890625, -8.614501953125, -8.33837890625, -8.062255859375, -7.7861328125, -7.510009765625, -7.23388671875, -6.957763671875, -6.681640625, -6.405517578125, -6.12939453125, -5.853271484375, -5.5771484375, -5.301025390625, -5.02490234375, -4.748779296875, -4.47265625, -4.196533203125, -3.92041015625, -3.644287109375, -3.3681640625, -3.092041015625, -2.81591796875, -2.539794921875, -2.263671875, -1.987548828125, -1.71142578125, -1.435302734375, -1.1591796875, -0.883056640625, -0.60693359375, -0.330810546875, -0.0546875, 0.221435546875, 0.49755859375, 0.773681640625, 1.0498046875, 1.325927734375, 1.60205078125, 1.878173828125, 2.154296875, 2.430419921875, 2.70654296875, 2.982666015625, 3.2587890625, 3.534912109375, 3.81103515625, 4.087158203125, 4.36328125, 4.639404296875, 4.91552734375, 5.191650390625, 5.4677734375, 5.743896484375, 6.02001953125, 6.296142578125, 6.572265625, 6.848388671875, 7.12451171875, 7.400634765625, 7.6767578125, 7.952880859375, 8.22900390625, 8.505126953125, 8.78125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 4.0, 6.0, 7.0, 12.0, 11.0, 8.0, 16.0, 13.0, 17.0, 22.0, 27.0, 32.0, 35.0, 39.0, 27.0, 44.0, 52.0, 46.0, 57.0, 60.0, 45.0, 44.0, 47.0, 43.0, 29.0, 30.0, 33.0, 37.0, 23.0, 17.0, 20.0, 10.0, 19.0, 16.0, 12.0, 10.0, 12.0, 7.0, 9.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-30.079736709594727, -28.989492416381836, -27.899246215820312, -26.809001922607422, -25.7187557220459, -24.628511428833008, -23.538265228271484, -22.448020935058594, -21.357776641845703, -20.267532348632812, -19.17728614807129, -18.0870418548584, -16.996795654296875, -15.906551361083984, -14.816306114196777, -13.72606086730957, -12.635814666748047, -11.54556941986084, -10.455324172973633, -9.365079879760742, -8.274833679199219, -7.18458890914917, -6.094344139099121, -5.004098892211914, -3.913853645324707, -2.8236083984375, -1.733363389968872, -0.6431183815002441, 0.4471268653869629, 1.53737211227417, 2.6276168823242188, 3.717862129211426, 4.808109283447266, 5.898354530334473, 6.98859977722168, 8.07884407043457, 9.169090270996094, 10.259334564208984, 11.349579811096191, 12.439825057983398, 13.530070304870605, 14.620315551757812, 15.71056079864502, 16.800806045532227, 17.891050338745117, 18.98129653930664, 20.07154083251953, 21.161785125732422, 22.252031326293945, 23.342275619506836, 24.43252182006836, 25.52276611328125, 26.613012313842773, 27.703256607055664, 28.793502807617188, 29.883747100830078, 30.97399139404297, 32.06423568725586, 33.15447998046875, 34.244728088378906, 35.3349723815918, 36.42521667480469, 37.51546096801758, 38.60570526123047, 39.695953369140625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 8.0, 11.0, 4.0, 11.0, 13.0, 9.0, 10.0, 17.0, 24.0, 22.0, 25.0, 35.0, 33.0, 23.0, 45.0, 46.0, 44.0, 48.0, 47.0, 39.0, 42.0, 52.0, 36.0, 41.0, 43.0, 39.0, 45.0, 25.0, 27.0, 30.0, 16.0, 16.0, 11.0, 18.0, 13.0, 8.0, 6.0, 4.0, 8.0, 4.0, 3.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-51.89802551269531, -50.3142204284668, -48.73041534423828, -47.146610260009766, -45.56280517578125, -43.979000091552734, -42.39519500732422, -40.81139373779297, -39.22758483886719, -37.64377975463867, -36.059974670410156, -34.47616958618164, -32.892364501953125, -31.30855941772461, -29.724756240844727, -28.14095115661621, -26.557147979736328, -24.973342895507812, -23.389537811279297, -21.80573272705078, -20.221927642822266, -18.63812255859375, -17.054319381713867, -15.470514297485352, -13.886709213256836, -12.30290412902832, -10.719099044799805, -9.135294914245605, -7.55148983001709, -5.967684745788574, -4.383880615234375, -2.8000755310058594, -1.2162704467773438, 0.3675343990325928, 1.9513392448425293, 3.5351438522338867, 5.118948936462402, 6.702754020690918, 8.286558151245117, 9.870363235473633, 11.454168319702148, 13.037973403930664, 14.62177848815918, 16.205581665039062, 17.789386749267578, 19.373191833496094, 20.95699691772461, 22.540802001953125, 24.12460708618164, 25.708412170410156, 27.292217254638672, 28.876022338867188, 30.459827423095703, 32.04363250732422, 33.62743377685547, 35.21124267578125, 36.7950439453125, 38.378849029541016, 39.96265411376953, 41.54645919799805, 43.13026428222656, 44.71406936645508, 46.297874450683594, 47.881675720214844, 49.465484619140625]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 1.0, 2.0, 6.0, 4.0, 12.0, 21.0, 28.0, 45.0, 96.0, 107.0, 160.0, 256.0, 390.0, 684.0, 1103.0, 1707.0, 2902.0, 4651.0, 7731.0, 12973.0, 22096.0, 38285.0, 65599.0, 113041.0, 192168.0, 314066.0, 472706.0, 622045.0, 669238.0, 578798.0, 416565.0, 267358.0, 160403.0, 94415.0, 55380.0, 32043.0, 18730.0, 11249.0, 6660.0, 4014.0, 2413.0, 1541.0, 900.0, 668.0, 371.0, 227.0, 155.0, 100.0, 57.0, 43.0, 33.0, 18.0, 11.0, 6.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-32.34375, -31.3115234375, -30.279296875, -29.2470703125, -28.21484375, -27.1826171875, -26.150390625, -25.1181640625, -24.0859375, -23.0537109375, -22.021484375, -20.9892578125, -19.95703125, -18.9248046875, -17.892578125, -16.8603515625, -15.828125, -14.7958984375, -13.763671875, -12.7314453125, -11.69921875, -10.6669921875, -9.634765625, -8.6025390625, -7.5703125, -6.5380859375, -5.505859375, -4.4736328125, -3.44140625, -2.4091796875, -1.376953125, -0.3447265625, 0.6875, 1.7197265625, 2.751953125, 3.7841796875, 4.81640625, 5.8486328125, 6.880859375, 7.9130859375, 8.9453125, 9.9775390625, 11.009765625, 12.0419921875, 13.07421875, 14.1064453125, 15.138671875, 16.1708984375, 17.203125, 18.2353515625, 19.267578125, 20.2998046875, 21.33203125, 22.3642578125, 23.396484375, 24.4287109375, 25.4609375, 26.4931640625, 27.525390625, 28.5576171875, 29.58984375, 30.6220703125, 31.654296875, 32.6865234375, 33.71875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 10.0, 6.0, 5.0, 15.0, 8.0, 13.0, 9.0, 18.0, 20.0, 27.0, 22.0, 33.0, 33.0, 29.0, 34.0, 55.0, 41.0, 50.0, 41.0, 46.0, 38.0, 47.0, 46.0, 39.0, 41.0, 37.0, 43.0, 31.0, 27.0, 30.0, 17.0, 12.0, 17.0, 13.0, 14.0, 9.0, 6.0, 3.0, 8.0, 4.0, 4.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.5, -38.29443359375, -37.0888671875, -35.88330078125, -34.677734375, -33.47216796875, -32.2666015625, -31.06103515625, -29.85546875, -28.64990234375, -27.4443359375, -26.23876953125, -25.033203125, -23.82763671875, -22.6220703125, -21.41650390625, -20.2109375, -19.00537109375, -17.7998046875, -16.59423828125, -15.388671875, -14.18310546875, -12.9775390625, -11.77197265625, -10.56640625, -9.36083984375, -8.1552734375, -6.94970703125, -5.744140625, -4.53857421875, -3.3330078125, -2.12744140625, -0.921875, 0.28369140625, 1.4892578125, 2.69482421875, 3.900390625, 5.10595703125, 6.3115234375, 7.51708984375, 8.72265625, 9.92822265625, 11.1337890625, 12.33935546875, 13.544921875, 14.75048828125, 15.9560546875, 17.16162109375, 18.3671875, 19.57275390625, 20.7783203125, 21.98388671875, 23.189453125, 24.39501953125, 25.6005859375, 26.80615234375, 28.01171875, 29.21728515625, 30.4228515625, 31.62841796875, 32.833984375, 34.03955078125, 35.2451171875, 36.45068359375, 37.65625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 4.0, 14.0, 15.0, 35.0, 55.0, 84.0, 143.0, 257.0, 341.0, 644.0, 1100.0, 1908.0, 3243.0, 5519.0, 9427.0, 16446.0, 27667.0, 47138.0, 77622.0, 124126.0, 192099.0, 279119.0, 378458.0, 467542.0, 519048.0, 513234.0, 451249.0, 357147.0, 259584.0, 175235.0, 113327.0, 70477.0, 42094.0, 24849.0, 14570.0, 8420.0, 5050.0, 2868.0, 1679.0, 992.0, 554.0, 356.0, 243.0, 127.0, 92.0, 37.0, 27.0, 11.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.203125, -25.381591796875, -24.56005859375, -23.738525390625, -22.9169921875, -22.095458984375, -21.27392578125, -20.452392578125, -19.630859375, -18.809326171875, -17.98779296875, -17.166259765625, -16.3447265625, -15.523193359375, -14.70166015625, -13.880126953125, -13.05859375, -12.237060546875, -11.41552734375, -10.593994140625, -9.7724609375, -8.950927734375, -8.12939453125, -7.307861328125, -6.486328125, -5.664794921875, -4.84326171875, -4.021728515625, -3.2001953125, -2.378662109375, -1.55712890625, -0.735595703125, 0.0859375, 0.907470703125, 1.72900390625, 2.550537109375, 3.3720703125, 4.193603515625, 5.01513671875, 5.836669921875, 6.658203125, 7.479736328125, 8.30126953125, 9.122802734375, 9.9443359375, 10.765869140625, 11.58740234375, 12.408935546875, 13.23046875, 14.052001953125, 14.87353515625, 15.695068359375, 16.5166015625, 17.338134765625, 18.15966796875, 18.981201171875, 19.802734375, 20.624267578125, 21.44580078125, 22.267333984375, 23.0888671875, 23.910400390625, 24.73193359375, 25.553466796875, 26.375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 8.0, 4.0, 4.0, 6.0, 12.0, 17.0, 27.0, 23.0, 33.0, 30.0, 49.0, 58.0, 76.0, 90.0, 87.0, 141.0, 122.0, 150.0, 174.0, 194.0, 200.0, 198.0, 204.0, 229.0, 232.0, 209.0, 221.0, 188.0, 151.0, 154.0, 131.0, 115.0, 113.0, 71.0, 66.0, 64.0, 45.0, 39.0, 38.0, 28.0, 19.0, 16.0, 8.0, 9.0, 10.0, 8.0, 5.0, 3.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-16.5625, -16.06005859375, -15.5576171875, -15.05517578125, -14.552734375, -14.05029296875, -13.5478515625, -13.04541015625, -12.54296875, -12.04052734375, -11.5380859375, -11.03564453125, -10.533203125, -10.03076171875, -9.5283203125, -9.02587890625, -8.5234375, -8.02099609375, -7.5185546875, -7.01611328125, -6.513671875, -6.01123046875, -5.5087890625, -5.00634765625, -4.50390625, -4.00146484375, -3.4990234375, -2.99658203125, -2.494140625, -1.99169921875, -1.4892578125, -0.98681640625, -0.484375, 0.01806640625, 0.5205078125, 1.02294921875, 1.525390625, 2.02783203125, 2.5302734375, 3.03271484375, 3.53515625, 4.03759765625, 4.5400390625, 5.04248046875, 5.544921875, 6.04736328125, 6.5498046875, 7.05224609375, 7.5546875, 8.05712890625, 8.5595703125, 9.06201171875, 9.564453125, 10.06689453125, 10.5693359375, 11.07177734375, 11.57421875, 12.07666015625, 12.5791015625, 13.08154296875, 13.583984375, 14.08642578125, 14.5888671875, 15.09130859375, 15.59375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 3.0, 6.0, 14.0, 17.0, 14.0, 11.0, 22.0, 32.0, 29.0, 37.0, 47.0, 46.0, 48.0, 63.0, 63.0, 68.0, 65.0, 45.0, 52.0, 56.0, 36.0, 43.0, 27.0, 27.0, 28.0, 16.0, 12.0, 15.0, 12.0, 9.0, 9.0, 7.0, 5.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.52817726135254, -30.364402770996094, -29.200626373291016, -28.03685188293457, -26.873075485229492, -25.709300994873047, -24.54552459716797, -23.381750106811523, -22.217975616455078, -21.054201126098633, -19.890424728393555, -18.72665023803711, -17.56287384033203, -16.399099349975586, -15.235323905944824, -14.071548461914062, -12.907772064208984, -11.743996620178223, -10.580221176147461, -9.416446685791016, -8.252670288085938, -7.088895320892334, -5.9251203536987305, -4.761344909667969, -3.597569465637207, -2.4337940216064453, -1.2700188159942627, -0.10624361038208008, 1.0575318336486816, 2.2213072776794434, 3.385082244873047, 4.548857688903809, 5.712635040283203, 6.876410484313965, 8.040185928344727, 9.203960418701172, 10.36773681640625, 11.531511306762695, 12.695286750793457, 13.859062194824219, 15.02283763885498, 16.186613082885742, 17.350387573242188, 18.514163970947266, 19.67793846130371, 20.84171485900879, 22.005489349365234, 23.169265747070312, 24.333040237426758, 25.496814727783203, 26.66059112548828, 27.824365615844727, 28.988142013549805, 30.15191650390625, 31.315692901611328, 32.479469299316406, 33.64324188232422, 34.8070182800293, 35.97079086303711, 37.13456726074219, 38.298343658447266, 39.462120056152344, 40.625892639160156, 41.789669036865234, 42.95344543457031]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 8.0, 6.0, 10.0, 14.0, 18.0, 15.0, 11.0, 19.0, 16.0, 24.0, 24.0, 37.0, 35.0, 32.0, 52.0, 56.0, 44.0, 41.0, 47.0, 47.0, 36.0, 50.0, 39.0, 38.0, 35.0, 24.0, 34.0, 32.0, 26.0, 23.0, 15.0, 17.0, 8.0, 11.0, 8.0, 11.0, 9.0, 9.0, 5.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-48.62558364868164, -47.25917434692383, -45.89276885986328, -44.52635955810547, -43.159950256347656, -41.793540954589844, -40.42713165283203, -39.060726165771484, -37.69431686401367, -36.32790756225586, -34.96150207519531, -33.5950927734375, -32.22868347167969, -30.862274169921875, -29.495866775512695, -28.129459381103516, -26.763050079345703, -25.39664077758789, -24.03023338317871, -22.66382598876953, -21.29741668701172, -19.931007385253906, -18.564599990844727, -17.198192596435547, -15.831783294677734, -14.465374946594238, -13.098966598510742, -11.732558250427246, -10.36614990234375, -8.999741554260254, -7.633333206176758, -6.266924858093262, -4.900520324707031, -3.534111976623535, -2.167703628540039, -0.801295280456543, 0.5651130676269531, 1.9315214157104492, 3.2979297637939453, 4.664338111877441, 6.0307464599609375, 7.397154808044434, 8.76356315612793, 10.129971504211426, 11.496379852294922, 12.862788200378418, 14.229196548461914, 15.59560489654541, 16.962013244628906, 18.32842254638672, 19.6948299407959, 21.061237335205078, 22.42764663696289, 23.794055938720703, 25.160463333129883, 26.526870727539062, 27.893280029296875, 29.259689331054688, 30.626096725463867, 31.992504119873047, 33.35891342163086, 34.72532272338867, 36.09172821044922, 37.45813751220703, 38.824546813964844]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 10.0, 4.0, 13.0, 27.0, 26.0, 47.0, 50.0, 98.0, 142.0, 192.0, 290.0, 406.0, 529.0, 868.0, 1308.0, 2039.0, 3022.0, 5171.0, 8750.0, 15169.0, 27878.0, 54873.0, 117195.0, 286365.0, 286076.0, 117472.0, 54178.0, 28183.0, 15184.0, 8620.0, 5216.0, 3142.0, 1944.0, 1312.0, 854.0, 601.0, 405.0, 265.0, 192.0, 118.0, 84.0, 62.0, 56.0, 37.0, 26.0, 21.0, 13.0, 13.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.66796875, -7.43560791015625, -7.2032470703125, -6.97088623046875, -6.738525390625, -6.50616455078125, -6.2738037109375, -6.04144287109375, -5.80908203125, -5.57672119140625, -5.3443603515625, -5.11199951171875, -4.879638671875, -4.64727783203125, -4.4149169921875, -4.18255615234375, -3.9501953125, -3.71783447265625, -3.4854736328125, -3.25311279296875, -3.020751953125, -2.78839111328125, -2.5560302734375, -2.32366943359375, -2.09130859375, -1.85894775390625, -1.6265869140625, -1.39422607421875, -1.161865234375, -0.92950439453125, -0.6971435546875, -0.46478271484375, -0.232421875, -6.103515625e-05, 0.2322998046875, 0.46466064453125, 0.697021484375, 0.92938232421875, 1.1617431640625, 1.39410400390625, 1.62646484375, 1.85882568359375, 2.0911865234375, 2.32354736328125, 2.555908203125, 2.78826904296875, 3.0206298828125, 3.25299072265625, 3.4853515625, 3.71771240234375, 3.9500732421875, 4.18243408203125, 4.414794921875, 4.64715576171875, 4.8795166015625, 5.11187744140625, 5.34423828125, 5.57659912109375, 5.8089599609375, 6.04132080078125, 6.273681640625, 6.50604248046875, 6.7384033203125, 6.97076416015625, 7.203125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 9.0, 8.0, 5.0, 11.0, 14.0, 17.0, 15.0, 12.0, 16.0, 21.0, 22.0, 24.0, 36.0, 34.0, 34.0, 51.0, 57.0, 43.0, 44.0, 43.0, 48.0, 33.0, 51.0, 43.0, 38.0, 33.0, 24.0, 34.0, 30.0, 26.0, 25.0, 14.0, 18.0, 9.0, 8.0, 10.0, 11.0, 10.0, 9.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-48.5625, -47.205078125, -45.84765625, -44.490234375, -43.1328125, -41.775390625, -40.41796875, -39.060546875, -37.703125, -36.345703125, -34.98828125, -33.630859375, -32.2734375, -30.916015625, -29.55859375, -28.201171875, -26.84375, -25.486328125, -24.12890625, -22.771484375, -21.4140625, -20.056640625, -18.69921875, -17.341796875, -15.984375, -14.626953125, -13.26953125, -11.912109375, -10.5546875, -9.197265625, -7.83984375, -6.482421875, -5.125, -3.767578125, -2.41015625, -1.052734375, 0.3046875, 1.662109375, 3.01953125, 4.376953125, 5.734375, 7.091796875, 8.44921875, 9.806640625, 11.1640625, 12.521484375, 13.87890625, 15.236328125, 16.59375, 17.951171875, 19.30859375, 20.666015625, 22.0234375, 23.380859375, 24.73828125, 26.095703125, 27.453125, 28.810546875, 30.16796875, 31.525390625, 32.8828125, 34.240234375, 35.59765625, 36.955078125, 38.3125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 7.0, 5.0, 11.0, 11.0, 22.0, 28.0, 34.0, 61.0, 95.0, 155.0, 197.0, 315.0, 536.0, 918.0, 1713.0, 3122.0, 6540.0, 14150.0, 33553.0, 87732.0, 270462.0, 410230.0, 132310.0, 48616.0, 19534.0, 8789.0, 4201.0, 2140.0, 1165.0, 751.0, 441.0, 249.0, 159.0, 95.0, 66.0, 43.0, 30.0, 22.0, 20.0, 6.0, 6.0, 8.0, 2.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.359375, -8.0914306640625, -7.823486328125, -7.5555419921875, -7.28759765625, -7.0196533203125, -6.751708984375, -6.4837646484375, -6.2158203125, -5.9478759765625, -5.679931640625, -5.4119873046875, -5.14404296875, -4.8760986328125, -4.608154296875, -4.3402099609375, -4.072265625, -3.8043212890625, -3.536376953125, -3.2684326171875, -3.00048828125, -2.7325439453125, -2.464599609375, -2.1966552734375, -1.9287109375, -1.6607666015625, -1.392822265625, -1.1248779296875, -0.85693359375, -0.5889892578125, -0.321044921875, -0.0531005859375, 0.21484375, 0.4827880859375, 0.750732421875, 1.0186767578125, 1.28662109375, 1.5545654296875, 1.822509765625, 2.0904541015625, 2.3583984375, 2.6263427734375, 2.894287109375, 3.1622314453125, 3.43017578125, 3.6981201171875, 3.966064453125, 4.2340087890625, 4.501953125, 4.7698974609375, 5.037841796875, 5.3057861328125, 5.57373046875, 5.8416748046875, 6.109619140625, 6.3775634765625, 6.6455078125, 6.9134521484375, 7.181396484375, 7.4493408203125, 7.71728515625, 7.9852294921875, 8.253173828125, 8.5211181640625, 8.7890625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 1.0, 3.0, 2.0, 8.0, 5.0, 12.0, 11.0, 7.0, 17.0, 10.0, 26.0, 17.0, 24.0, 22.0, 30.0, 40.0, 30.0, 23.0, 44.0, 41.0, 35.0, 43.0, 44.0, 36.0, 58.0, 47.0, 35.0, 40.0, 34.0, 32.0, 35.0, 20.0, 31.0, 24.0, 24.0, 13.0, 8.0, 14.0, 8.0, 11.0, 6.0, 7.0, 7.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-27.171875, -26.339599609375, -25.50732421875, -24.675048828125, -23.8427734375, -23.010498046875, -22.17822265625, -21.345947265625, -20.513671875, -19.681396484375, -18.84912109375, -18.016845703125, -17.1845703125, -16.352294921875, -15.52001953125, -14.687744140625, -13.85546875, -13.023193359375, -12.19091796875, -11.358642578125, -10.5263671875, -9.694091796875, -8.86181640625, -8.029541015625, -7.197265625, -6.364990234375, -5.53271484375, -4.700439453125, -3.8681640625, -3.035888671875, -2.20361328125, -1.371337890625, -0.5390625, 0.293212890625, 1.12548828125, 1.957763671875, 2.7900390625, 3.622314453125, 4.45458984375, 5.286865234375, 6.119140625, 6.951416015625, 7.78369140625, 8.615966796875, 9.4482421875, 10.280517578125, 11.11279296875, 11.945068359375, 12.77734375, 13.609619140625, 14.44189453125, 15.274169921875, 16.1064453125, 16.938720703125, 17.77099609375, 18.603271484375, 19.435546875, 20.267822265625, 21.10009765625, 21.932373046875, 22.7646484375, 23.596923828125, 24.42919921875, 25.261474609375, 26.09375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 7.0, 8.0, 10.0, 16.0, 17.0, 28.0, 57.0, 61.0, 85.0, 121.0, 161.0, 246.0, 384.0, 496.0, 872.0, 1318.0, 2170.0, 3775.0, 7104.0, 15993.0, 49413.0, 300700.0, 543412.0, 79479.0, 21993.0, 9068.0, 4464.0, 2597.0, 1520.0, 912.0, 623.0, 401.0, 308.0, 184.0, 147.0, 102.0, 70.0, 58.0, 41.0, 29.0, 26.0, 24.0, 14.0, 11.0, 6.0, 5.0, 5.0, 2.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.884765625, -1.822265625, -1.759765625, -1.697265625, -1.634765625, -1.572265625, -1.509765625, -1.447265625, -1.384765625, -1.322265625, -1.259765625, -1.197265625, -1.134765625, -1.072265625, -1.009765625, -0.947265625, -0.884765625, -0.822265625, -0.759765625, -0.697265625, -0.634765625, -0.572265625, -0.509765625, -0.447265625, -0.384765625, -0.322265625, -0.259765625, -0.197265625, -0.134765625, -0.072265625, -0.009765625, 0.052734375, 0.115234375, 0.177734375, 0.240234375, 0.302734375, 0.365234375, 0.427734375, 0.490234375, 0.552734375, 0.615234375, 0.677734375, 0.740234375, 0.802734375, 0.865234375, 0.927734375, 0.990234375, 1.052734375, 1.115234375, 1.177734375, 1.240234375, 1.302734375, 1.365234375, 1.427734375, 1.490234375, 1.552734375, 1.615234375, 1.677734375, 1.740234375, 1.802734375, 1.865234375, 1.927734375, 1.990234375, 2.052734375, 2.115234375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 7.0, 13.0, 9.0, 14.0, 24.0, 23.0, 39.0, 53.0, 106.0, 128.0, 153.0, 116.0, 97.0, 61.0, 37.0, 29.0, 28.0, 16.0, 11.0, 10.0, 6.0, 11.0, 6.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002313852310180664, -0.0002242550253868103, -0.0002171248197555542, -0.0002099946141242981, -0.000202864408493042, -0.0001957342028617859, -0.00018860399723052979, -0.00018147379159927368, -0.00017434358596801758, -0.00016721338033676147, -0.00016008317470550537, -0.00015295296907424927, -0.00014582276344299316, -0.00013869255781173706, -0.00013156235218048096, -0.00012443214654922485, -0.00011730194091796875, -0.00011017173528671265, -0.00010304152965545654, -9.591132402420044e-05, -8.878111839294434e-05, -8.165091276168823e-05, -7.452070713043213e-05, -6.739050149917603e-05, -6.026029586791992e-05, -5.313009023666382e-05, -4.5999884605407715e-05, -3.886967897415161e-05, -3.173947334289551e-05, -2.4609267711639404e-05, -1.74790620803833e-05, -1.0348856449127197e-05, -3.2186508178710938e-06, 3.91155481338501e-06, 1.1041760444641113e-05, 1.8171966075897217e-05, 2.530217170715332e-05, 3.2432377338409424e-05, 3.956258296966553e-05, 4.669278860092163e-05, 5.3822994232177734e-05, 6.095319986343384e-05, 6.808340549468994e-05, 7.521361112594604e-05, 8.234381675720215e-05, 8.947402238845825e-05, 9.660422801971436e-05, 0.00010373443365097046, 0.00011086463928222656, 0.00011799484491348267, 0.00012512505054473877, 0.00013225525617599487, 0.00013938546180725098, 0.00014651566743850708, 0.00015364587306976318, 0.0001607760787010193, 0.0001679062843322754, 0.0001750364899635315, 0.0001821666955947876, 0.0001892969012260437, 0.0001964271068572998, 0.0002035573124885559, 0.000210687518119812, 0.00021781772375106812, 0.00022494792938232422]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 8.0, 16.0, 12.0, 24.0, 31.0, 35.0, 48.0, 70.0, 135.0, 160.0, 256.0, 323.0, 489.0, 695.0, 1074.0, 1682.0, 2519.0, 3808.0, 6166.0, 9961.0, 16621.0, 28162.0, 49784.0, 93573.0, 202014.0, 315859.0, 144711.0, 72045.0, 39387.0, 22751.0, 13373.0, 8152.0, 5184.0, 3192.0, 2056.0, 1380.0, 911.0, 582.0, 415.0, 267.0, 183.0, 140.0, 87.0, 65.0, 47.0, 38.0, 13.0, 15.0, 16.0, 2.0, 6.0, 9.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.6884765625, -1.6308441162109375, -1.573211669921875, -1.5155792236328125, -1.45794677734375, -1.4003143310546875, -1.342681884765625, -1.2850494384765625, -1.2274169921875, -1.1697845458984375, -1.112152099609375, -1.0545196533203125, -0.99688720703125, -0.9392547607421875, -0.881622314453125, -0.8239898681640625, -0.766357421875, -0.7087249755859375, -0.651092529296875, -0.5934600830078125, -0.53582763671875, -0.4781951904296875, -0.420562744140625, -0.3629302978515625, -0.3052978515625, -0.2476654052734375, -0.190032958984375, -0.1324005126953125, -0.07476806640625, -0.0171356201171875, 0.040496826171875, 0.0981292724609375, 0.15576171875, 0.2133941650390625, 0.271026611328125, 0.3286590576171875, 0.38629150390625, 0.4439239501953125, 0.501556396484375, 0.5591888427734375, 0.6168212890625, 0.6744537353515625, 0.732086181640625, 0.7897186279296875, 0.84735107421875, 0.9049835205078125, 0.962615966796875, 1.0202484130859375, 1.077880859375, 1.1355133056640625, 1.193145751953125, 1.2507781982421875, 1.30841064453125, 1.3660430908203125, 1.423675537109375, 1.4813079833984375, 1.5389404296875, 1.5965728759765625, 1.654205322265625, 1.7118377685546875, 1.76947021484375, 1.8271026611328125, 1.884735107421875, 1.9423675537109375, 2.0]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 10.0, 9.0, 13.0, 14.0, 21.0, 27.0, 29.0, 28.0, 31.0, 40.0, 31.0, 54.0, 46.0, 57.0, 37.0, 54.0, 40.0, 46.0, 43.0, 40.0, 39.0, 39.0, 29.0, 34.0, 39.0, 22.0, 33.0, 18.0, 20.0, 9.0, 5.0, 10.0, 8.0, 4.0, 5.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0], "bins": [-1.0673828125, -1.0367202758789062, -1.0060577392578125, -0.9753952026367188, -0.944732666015625, -0.9140701293945312, -0.8834075927734375, -0.8527450561523438, -0.82208251953125, -0.7914199829101562, -0.7607574462890625, -0.7300949096679688, -0.699432373046875, -0.6687698364257812, -0.6381072998046875, -0.6074447631835938, -0.5767822265625, -0.5461196899414062, -0.5154571533203125, -0.48479461669921875, -0.454132080078125, -0.42346954345703125, -0.3928070068359375, -0.36214447021484375, -0.33148193359375, -0.30081939697265625, -0.2701568603515625, -0.23949432373046875, -0.208831787109375, -0.17816925048828125, -0.1475067138671875, -0.11684417724609375, -0.086181640625, -0.05551910400390625, -0.0248565673828125, 0.00580596923828125, 0.036468505859375, 0.06713104248046875, 0.0977935791015625, 0.12845611572265625, 0.15911865234375, 0.18978118896484375, 0.2204437255859375, 0.25110626220703125, 0.281768798828125, 0.31243133544921875, 0.3430938720703125, 0.37375640869140625, 0.4044189453125, 0.43508148193359375, 0.4657440185546875, 0.49640655517578125, 0.527069091796875, 0.5577316284179688, 0.5883941650390625, 0.6190567016601562, 0.64971923828125, 0.6803817749023438, 0.7110443115234375, 0.7417068481445312, 0.772369384765625, 0.8030319213867188, 0.8336944580078125, 0.8643569946289062, 0.89501953125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 2.0, 10.0, 15.0, 14.0, 15.0, 18.0, 18.0, 33.0, 40.0, 35.0, 48.0, 49.0, 50.0, 53.0, 82.0, 61.0, 49.0, 49.0, 55.0, 48.0, 44.0, 34.0, 29.0, 27.0, 26.0, 13.0, 15.0, 12.0, 10.0, 11.0, 6.0, 5.0, 8.0, 8.0, 2.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.90285873413086, -31.75777816772461, -30.61269760131836, -29.46761703491211, -28.32253646850586, -27.17745590209961, -26.032377243041992, -24.887296676635742, -23.742216110229492, -22.597135543823242, -21.452054977416992, -20.306974411010742, -19.161895751953125, -18.016815185546875, -16.871734619140625, -15.726654052734375, -14.581573486328125, -13.436492919921875, -12.291412353515625, -11.146332740783691, -10.001252174377441, -8.856171607971191, -7.7110915184021, -6.566011428833008, -5.420930862426758, -4.275850296020508, -3.130770206451416, -1.9856898784637451, -0.8406095504760742, 0.3044710159301758, 1.4495511054992676, 2.5946311950683594, 3.739715576171875, 4.884796142578125, 6.029876232147217, 7.174956321716309, 8.320036888122559, 9.465117454528809, 10.610197067260742, 11.755277633666992, 12.900358200073242, 14.045438766479492, 15.190519332885742, 16.335599899291992, 17.48067855834961, 18.62575912475586, 19.77083969116211, 20.91592025756836, 22.06100082397461, 23.20608139038086, 24.35116195678711, 25.49624252319336, 26.64132308959961, 27.78640365600586, 28.931482315063477, 30.076562881469727, 31.221643447875977, 32.366722106933594, 33.511802673339844, 34.656883239746094, 35.801963806152344, 36.947044372558594, 38.092124938964844, 39.237205505371094, 40.382286071777344]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 9.0, 7.0, 7.0, 13.0, 16.0, 18.0, 13.0, 20.0, 15.0, 26.0, 27.0, 41.0, 29.0, 42.0, 44.0, 57.0, 46.0, 44.0, 48.0, 42.0, 43.0, 43.0, 40.0, 40.0, 36.0, 25.0, 33.0, 34.0, 22.0, 16.0, 15.0, 20.0, 7.0, 9.0, 11.0, 12.0, 9.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-49.199859619140625, -47.8168830871582, -46.43391036987305, -45.050933837890625, -43.6679573059082, -42.28498077392578, -40.902008056640625, -39.5190315246582, -38.13605499267578, -36.75307846069336, -35.3701057434082, -33.98712921142578, -32.60415267944336, -31.22117805480957, -29.83820343017578, -28.45522689819336, -27.072254180908203, -25.689279556274414, -24.306303024291992, -22.923328399658203, -21.54035186767578, -20.157377243041992, -18.774402618408203, -17.39142608642578, -16.008451461791992, -14.625475883483887, -13.242500305175781, -11.859525680541992, -10.476550102233887, -9.093574523925781, -7.710599899291992, -6.327624320983887, -4.944648742675781, -3.561673402786255, -2.1786980628967285, -0.7957229614257812, 0.5872526168823242, 1.9702281951904297, 3.3532028198242188, 4.736178398132324, 6.11915397644043, 7.502129554748535, 8.88510513305664, 10.26807975769043, 11.651055335998535, 13.03403091430664, 14.41700553894043, 15.799981117248535, 17.18295669555664, 18.56593132019043, 19.94890785217285, 21.33188247680664, 22.714859008789062, 24.09783363342285, 25.48080825805664, 26.863784790039062, 28.24675941467285, 29.62973403930664, 31.012710571289062, 32.39568328857422, 33.77865982055664, 35.16163635253906, 36.54460906982422, 37.92758560180664, 39.31056213378906]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 14.0, 16.0, 35.0, 46.0, 64.0, 83.0, 120.0, 212.0, 334.0, 474.0, 768.0, 1144.0, 1882.0, 2820.0, 4333.0, 6822.0, 10366.0, 16165.0, 25193.0, 38406.0, 55668.0, 78551.0, 102035.0, 120164.0, 126997.0, 119145.0, 100039.0, 76652.0, 54275.0, 36975.0, 24424.0, 15660.0, 10108.0, 6602.0, 4313.0, 2660.0, 1792.0, 1104.0, 746.0, 466.0, 297.0, 201.0, 143.0, 73.0, 54.0, 35.0, 27.0, 17.0, 12.0, 10.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0], "bins": [-25.09375, -24.296142578125, -23.49853515625, -22.700927734375, -21.9033203125, -21.105712890625, -20.30810546875, -19.510498046875, -18.712890625, -17.915283203125, -17.11767578125, -16.320068359375, -15.5224609375, -14.724853515625, -13.92724609375, -13.129638671875, -12.33203125, -11.534423828125, -10.73681640625, -9.939208984375, -9.1416015625, -8.343994140625, -7.54638671875, -6.748779296875, -5.951171875, -5.153564453125, -4.35595703125, -3.558349609375, -2.7607421875, -1.963134765625, -1.16552734375, -0.367919921875, 0.4296875, 1.227294921875, 2.02490234375, 2.822509765625, 3.6201171875, 4.417724609375, 5.21533203125, 6.012939453125, 6.810546875, 7.608154296875, 8.40576171875, 9.203369140625, 10.0009765625, 10.798583984375, 11.59619140625, 12.393798828125, 13.19140625, 13.989013671875, 14.78662109375, 15.584228515625, 16.3818359375, 17.179443359375, 17.97705078125, 18.774658203125, 19.572265625, 20.369873046875, 21.16748046875, 21.965087890625, 22.7626953125, 23.560302734375, 24.35791015625, 25.155517578125, 25.953125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 11.0, 6.0, 6.0, 12.0, 11.0, 18.0, 14.0, 13.0, 19.0, 21.0, 23.0, 27.0, 43.0, 28.0, 42.0, 46.0, 56.0, 44.0, 48.0, 42.0, 42.0, 49.0, 39.0, 41.0, 37.0, 41.0, 20.0, 39.0, 28.0, 21.0, 19.0, 13.0, 20.0, 6.0, 6.0, 14.0, 13.0, 8.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-47.0625, -45.7353515625, -44.408203125, -43.0810546875, -41.75390625, -40.4267578125, -39.099609375, -37.7724609375, -36.4453125, -35.1181640625, -33.791015625, -32.4638671875, -31.13671875, -29.8095703125, -28.482421875, -27.1552734375, -25.828125, -24.5009765625, -23.173828125, -21.8466796875, -20.51953125, -19.1923828125, -17.865234375, -16.5380859375, -15.2109375, -13.8837890625, -12.556640625, -11.2294921875, -9.90234375, -8.5751953125, -7.248046875, -5.9208984375, -4.59375, -3.2666015625, -1.939453125, -0.6123046875, 0.71484375, 2.0419921875, 3.369140625, 4.6962890625, 6.0234375, 7.3505859375, 8.677734375, 10.0048828125, 11.33203125, 12.6591796875, 13.986328125, 15.3134765625, 16.640625, 17.9677734375, 19.294921875, 20.6220703125, 21.94921875, 23.2763671875, 24.603515625, 25.9306640625, 27.2578125, 28.5849609375, 29.912109375, 31.2392578125, 32.56640625, 33.8935546875, 35.220703125, 36.5478515625, 37.875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 4.0, 7.0, 15.0, 27.0, 35.0, 60.0, 94.0, 124.0, 173.0, 271.0, 474.0, 755.0, 1132.0, 1901.0, 3166.0, 5182.0, 8351.0, 13795.0, 22338.0, 35710.0, 55007.0, 81466.0, 110910.0, 134327.0, 140852.0, 128330.0, 101956.0, 72844.0, 48465.0, 30999.0, 19156.0, 11757.0, 7266.0, 4391.0, 2681.0, 1673.0, 997.0, 668.0, 397.0, 288.0, 190.0, 112.0, 68.0, 55.0, 26.0, 21.0, 13.0, 8.0, 4.0, 5.0, 1.0, 3.0, 5.0, 2.0], "bins": [-30.53125, -29.642333984375, -28.75341796875, -27.864501953125, -26.9755859375, -26.086669921875, -25.19775390625, -24.308837890625, -23.419921875, -22.531005859375, -21.64208984375, -20.753173828125, -19.8642578125, -18.975341796875, -18.08642578125, -17.197509765625, -16.30859375, -15.419677734375, -14.53076171875, -13.641845703125, -12.7529296875, -11.864013671875, -10.97509765625, -10.086181640625, -9.197265625, -8.308349609375, -7.41943359375, -6.530517578125, -5.6416015625, -4.752685546875, -3.86376953125, -2.974853515625, -2.0859375, -1.197021484375, -0.30810546875, 0.580810546875, 1.4697265625, 2.358642578125, 3.24755859375, 4.136474609375, 5.025390625, 5.914306640625, 6.80322265625, 7.692138671875, 8.5810546875, 9.469970703125, 10.35888671875, 11.247802734375, 12.13671875, 13.025634765625, 13.91455078125, 14.803466796875, 15.6923828125, 16.581298828125, 17.47021484375, 18.359130859375, 19.248046875, 20.136962890625, 21.02587890625, 21.914794921875, 22.8037109375, 23.692626953125, 24.58154296875, 25.470458984375, 26.359375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 4.0, 2.0, 6.0, 4.0, 10.0, 12.0, 21.0, 21.0, 14.0, 30.0, 21.0, 26.0, 29.0, 39.0, 33.0, 33.0, 32.0, 39.0, 43.0, 36.0, 50.0, 41.0, 35.0, 45.0, 35.0, 26.0, 35.0, 39.0, 27.0, 28.0, 27.0, 32.0, 16.0, 13.0, 15.0, 12.0, 15.0, 7.0, 13.0, 7.0, 10.0, 8.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-26.0625, -25.2958984375, -24.529296875, -23.7626953125, -22.99609375, -22.2294921875, -21.462890625, -20.6962890625, -19.9296875, -19.1630859375, -18.396484375, -17.6298828125, -16.86328125, -16.0966796875, -15.330078125, -14.5634765625, -13.796875, -13.0302734375, -12.263671875, -11.4970703125, -10.73046875, -9.9638671875, -9.197265625, -8.4306640625, -7.6640625, -6.8974609375, -6.130859375, -5.3642578125, -4.59765625, -3.8310546875, -3.064453125, -2.2978515625, -1.53125, -0.7646484375, 0.001953125, 0.7685546875, 1.53515625, 2.3017578125, 3.068359375, 3.8349609375, 4.6015625, 5.3681640625, 6.134765625, 6.9013671875, 7.66796875, 8.4345703125, 9.201171875, 9.9677734375, 10.734375, 11.5009765625, 12.267578125, 13.0341796875, 13.80078125, 14.5673828125, 15.333984375, 16.1005859375, 16.8671875, 17.6337890625, 18.400390625, 19.1669921875, 19.93359375, 20.7001953125, 21.466796875, 22.2333984375, 23.0]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 6.0, 11.0, 15.0, 20.0, 41.0, 31.0, 75.0, 82.0, 135.0, 209.0, 290.0, 415.0, 690.0, 1011.0, 1441.0, 2243.0, 3575.0, 5614.0, 8619.0, 13469.0, 21401.0, 32553.0, 48804.0, 68928.0, 92964.0, 114903.0, 126245.0, 124075.0, 108727.0, 85741.0, 62712.0, 43166.0, 28523.0, 18422.0, 11914.0, 7626.0, 4891.0, 3079.0, 2019.0, 1283.0, 840.0, 609.0, 400.0, 221.0, 169.0, 122.0, 74.0, 58.0, 35.0, 25.0, 17.0, 12.0, 6.0, 7.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.359375, -6.138916015625, -5.91845703125, -5.697998046875, -5.4775390625, -5.257080078125, -5.03662109375, -4.816162109375, -4.595703125, -4.375244140625, -4.15478515625, -3.934326171875, -3.7138671875, -3.493408203125, -3.27294921875, -3.052490234375, -2.83203125, -2.611572265625, -2.39111328125, -2.170654296875, -1.9501953125, -1.729736328125, -1.50927734375, -1.288818359375, -1.068359375, -0.847900390625, -0.62744140625, -0.406982421875, -0.1865234375, 0.033935546875, 0.25439453125, 0.474853515625, 0.6953125, 0.915771484375, 1.13623046875, 1.356689453125, 1.5771484375, 1.797607421875, 2.01806640625, 2.238525390625, 2.458984375, 2.679443359375, 2.89990234375, 3.120361328125, 3.3408203125, 3.561279296875, 3.78173828125, 4.002197265625, 4.22265625, 4.443115234375, 4.66357421875, 4.884033203125, 5.1044921875, 5.324951171875, 5.54541015625, 5.765869140625, 5.986328125, 6.206787109375, 6.42724609375, 6.647705078125, 6.8681640625, 7.088623046875, 7.30908203125, 7.529541015625, 7.75]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 8.0, 5.0, 7.0, 9.0, 18.0, 12.0, 20.0, 15.0, 16.0, 27.0, 27.0, 36.0, 34.0, 35.0, 30.0, 51.0, 44.0, 46.0, 41.0, 46.0, 53.0, 36.0, 51.0, 40.0, 33.0, 24.0, 35.0, 32.0, 29.0, 20.0, 17.0, 19.0, 14.0, 17.0, 10.0, 8.0, 6.0, 6.0, 8.0, 2.0, 0.0, 7.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0005950927734375, -0.0005740076303482056, -0.0005529224872589111, -0.0005318373441696167, -0.0005107522010803223, -0.0004896670579910278, -0.0004685819149017334, -0.00044749677181243896, -0.00042641162872314453, -0.0004053264856338501, -0.00038424134254455566, -0.00036315619945526123, -0.0003420710563659668, -0.00032098591327667236, -0.00029990077018737793, -0.0002788156270980835, -0.00025773048400878906, -0.00023664534091949463, -0.0002155601978302002, -0.00019447505474090576, -0.00017338991165161133, -0.0001523047685623169, -0.00013121962547302246, -0.00011013448238372803, -8.90493392944336e-05, -6.796419620513916e-05, -4.6879053115844727e-05, -2.5793910026550293e-05, -4.708766937255859e-06, 1.6376376152038574e-05, 3.746151924133301e-05, 5.854666233062744e-05, 7.963180541992188e-05, 0.00010071694850921631, 0.00012180209159851074, 0.00014288723468780518, 0.0001639723777770996, 0.00018505752086639404, 0.00020614266395568848, 0.0002272278070449829, 0.00024831295013427734, 0.0002693980932235718, 0.0002904832363128662, 0.00031156837940216064, 0.0003326535224914551, 0.0003537386655807495, 0.00037482380867004395, 0.0003959089517593384, 0.0004169940948486328, 0.00043807923793792725, 0.0004591643810272217, 0.0004802495241165161, 0.0005013346672058105, 0.000522419810295105, 0.0005435049533843994, 0.0005645900964736938, 0.0005856752395629883, 0.0006067603826522827, 0.0006278455257415771, 0.0006489306688308716, 0.000670015811920166, 0.0006911009550094604, 0.0007121860980987549, 0.0007332712411880493, 0.0007543563842773438]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 9.0, 9.0, 11.0, 32.0, 27.0, 48.0, 85.0, 111.0, 194.0, 321.0, 459.0, 681.0, 1076.0, 1703.0, 2604.0, 4087.0, 6757.0, 10603.0, 17133.0, 27800.0, 44212.0, 67187.0, 96069.0, 124300.0, 141268.0, 138450.0, 116072.0, 86373.0, 59138.0, 38278.0, 23856.0, 14648.0, 9267.0, 5699.0, 3527.0, 2306.0, 1523.0, 923.0, 555.0, 414.0, 270.0, 158.0, 120.0, 65.0, 50.0, 26.0, 27.0, 7.0, 11.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.046875, -7.7772216796875, -7.507568359375, -7.2379150390625, -6.96826171875, -6.6986083984375, -6.428955078125, -6.1593017578125, -5.8896484375, -5.6199951171875, -5.350341796875, -5.0806884765625, -4.81103515625, -4.5413818359375, -4.271728515625, -4.0020751953125, -3.732421875, -3.4627685546875, -3.193115234375, -2.9234619140625, -2.65380859375, -2.3841552734375, -2.114501953125, -1.8448486328125, -1.5751953125, -1.3055419921875, -1.035888671875, -0.7662353515625, -0.49658203125, -0.2269287109375, 0.042724609375, 0.3123779296875, 0.58203125, 0.8516845703125, 1.121337890625, 1.3909912109375, 1.66064453125, 1.9302978515625, 2.199951171875, 2.4696044921875, 2.7392578125, 3.0089111328125, 3.278564453125, 3.5482177734375, 3.81787109375, 4.0875244140625, 4.357177734375, 4.6268310546875, 4.896484375, 5.1661376953125, 5.435791015625, 5.7054443359375, 5.97509765625, 6.2447509765625, 6.514404296875, 6.7840576171875, 7.0537109375, 7.3233642578125, 7.593017578125, 7.8626708984375, 8.13232421875, 8.4019775390625, 8.671630859375, 8.9412841796875, 9.2109375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 2.0, 7.0, 8.0, 13.0, 18.0, 16.0, 18.0, 13.0, 24.0, 37.0, 40.0, 47.0, 66.0, 42.0, 66.0, 55.0, 56.0, 62.0, 66.0, 70.0, 45.0, 45.0, 29.0, 33.0, 18.0, 23.0, 13.0, 19.0, 13.0, 4.0, 6.0, 6.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.46484375, -5.2960205078125, -5.127197265625, -4.9583740234375, -4.78955078125, -4.6207275390625, -4.451904296875, -4.2830810546875, -4.1142578125, -3.9454345703125, -3.776611328125, -3.6077880859375, -3.43896484375, -3.2701416015625, -3.101318359375, -2.9324951171875, -2.763671875, -2.5948486328125, -2.426025390625, -2.2572021484375, -2.08837890625, -1.9195556640625, -1.750732421875, -1.5819091796875, -1.4130859375, -1.2442626953125, -1.075439453125, -0.9066162109375, -0.73779296875, -0.5689697265625, -0.400146484375, -0.2313232421875, -0.0625, 0.1063232421875, 0.275146484375, 0.4439697265625, 0.61279296875, 0.7816162109375, 0.950439453125, 1.1192626953125, 1.2880859375, 1.4569091796875, 1.625732421875, 1.7945556640625, 1.96337890625, 2.1322021484375, 2.301025390625, 2.4698486328125, 2.638671875, 2.8074951171875, 2.976318359375, 3.1451416015625, 3.31396484375, 3.4827880859375, 3.651611328125, 3.8204345703125, 3.9892578125, 4.1580810546875, 4.326904296875, 4.4957275390625, 4.66455078125, 4.8333740234375, 5.002197265625, 5.1710205078125, 5.33984375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 4.0, 8.0, 5.0, 9.0, 14.0, 13.0, 9.0, 18.0, 23.0, 24.0, 25.0, 39.0, 44.0, 37.0, 40.0, 48.0, 50.0, 54.0, 50.0, 47.0, 46.0, 43.0, 40.0, 40.0, 36.0, 40.0, 25.0, 25.0, 21.0, 18.0, 13.0, 12.0, 21.0, 6.0, 8.0, 9.0, 10.0, 10.0, 4.0, 3.0, 0.0, 6.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-30.09133529663086, -29.15003204345703, -28.20872688293457, -27.267423629760742, -26.326120376586914, -25.384815216064453, -24.443511962890625, -23.502208709716797, -22.56090545654297, -21.61960220336914, -20.67829704284668, -19.73699378967285, -18.795690536499023, -17.854385375976562, -16.913082122802734, -15.971778869628906, -15.030473709106445, -14.0891695022583, -13.147866249084473, -12.206562042236328, -11.2652587890625, -10.323954582214355, -9.382650375366211, -8.441347122192383, -7.500042915344238, -6.558739185333252, -5.617435455322266, -4.676131248474121, -3.7348275184631348, -2.7935237884521484, -1.852219581604004, -0.9109158515930176, 0.030385971069335938, 0.9716898202896118, 1.9129936695098877, 2.854297637939453, 3.7956013679504395, 4.736905097961426, 5.67820930480957, 6.619513034820557, 7.560816764831543, 8.502120971679688, 9.443424224853516, 10.38472843170166, 11.326032638549805, 12.267335891723633, 13.208640098571777, 14.149944305419922, 15.09124755859375, 16.032550811767578, 16.97385597229004, 17.915159225463867, 18.856462478637695, 19.797767639160156, 20.739070892333984, 21.680374145507812, 22.62167739868164, 23.56298065185547, 24.50428581237793, 25.445589065551758, 26.386892318725586, 27.328197479248047, 28.269500732421875, 29.210803985595703, 30.152109146118164]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 10.0, 15.0, 25.0, 18.0, 16.0, 29.0, 27.0, 24.0, 33.0, 32.0, 47.0, 38.0, 53.0, 47.0, 47.0, 57.0, 56.0, 46.0, 46.0, 30.0, 47.0, 36.0, 26.0, 37.0, 24.0, 18.0, 16.0, 20.0, 14.0, 11.0, 8.0, 7.0, 9.0, 4.0, 6.0, 1.0, 3.0, 2.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-53.205692291259766, -51.65854263305664, -50.111392974853516, -48.56424331665039, -47.017093658447266, -45.46994400024414, -43.922794342041016, -42.37564468383789, -40.828495025634766, -39.28134536743164, -37.734195709228516, -36.18704605102539, -34.639896392822266, -33.09274673461914, -31.545597076416016, -29.99844741821289, -28.4512996673584, -26.904150009155273, -25.35700035095215, -23.809850692749023, -22.2627010345459, -20.715551376342773, -19.16840362548828, -17.621253967285156, -16.07410430908203, -14.526954650878906, -12.979804992675781, -11.432655334472656, -9.885505676269531, -8.338356018066406, -6.791207313537598, -5.244057655334473, -3.6969070434570312, -2.1497573852539062, -0.6026079654693604, 0.9445414543151855, 2.4916911125183105, 4.0388407707214355, 5.585989952087402, 7.133139610290527, 8.680289268493652, 10.227438926696777, 11.774588584899902, 13.321737289428711, 14.868886947631836, 16.41603660583496, 17.963186264038086, 19.51033592224121, 21.057485580444336, 22.60463523864746, 24.151784896850586, 25.69893455505371, 27.246084213256836, 28.79323387145996, 30.340381622314453, 31.887531280517578, 33.4346809387207, 34.98183059692383, 36.52898025512695, 38.07612991333008, 39.6232795715332, 41.17042922973633, 42.71757888793945, 44.26472854614258, 45.8118782043457]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 6.0, 10.0, 22.0, 36.0, 51.0, 71.0, 114.0, 191.0, 366.0, 656.0, 1159.0, 2159.0, 4176.0, 8009.0, 15949.0, 31578.0, 63133.0, 123341.0, 234990.0, 420770.0, 653340.0, 796523.0, 724815.0, 500262.0, 291041.0, 155564.0, 79970.0, 41033.0, 21262.0, 10951.0, 5864.0, 3169.0, 1643.0, 854.0, 523.0, 269.0, 183.0, 119.0, 38.0, 31.0, 21.0, 5.0, 8.0, 3.0, 1.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.0, -38.8466796875, -37.693359375, -36.5400390625, -35.38671875, -34.2333984375, -33.080078125, -31.9267578125, -30.7734375, -29.6201171875, -28.466796875, -27.3134765625, -26.16015625, -25.0068359375, -23.853515625, -22.7001953125, -21.546875, -20.3935546875, -19.240234375, -18.0869140625, -16.93359375, -15.7802734375, -14.626953125, -13.4736328125, -12.3203125, -11.1669921875, -10.013671875, -8.8603515625, -7.70703125, -6.5537109375, -5.400390625, -4.2470703125, -3.09375, -1.9404296875, -0.787109375, 0.3662109375, 1.51953125, 2.6728515625, 3.826171875, 4.9794921875, 6.1328125, 7.2861328125, 8.439453125, 9.5927734375, 10.74609375, 11.8994140625, 13.052734375, 14.2060546875, 15.359375, 16.5126953125, 17.666015625, 18.8193359375, 19.97265625, 21.1259765625, 22.279296875, 23.4326171875, 24.5859375, 25.7392578125, 26.892578125, 28.0458984375, 29.19921875, 30.3525390625, 31.505859375, 32.6591796875, 33.8125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 5.0, 13.0, 19.0, 23.0, 19.0, 21.0, 24.0, 29.0, 25.0, 38.0, 33.0, 44.0, 46.0, 51.0, 48.0, 46.0, 61.0, 59.0, 40.0, 41.0, 45.0, 31.0, 34.0, 32.0, 29.0, 20.0, 21.0, 16.0, 17.0, 9.0, 15.0, 5.0, 10.0, 5.0, 7.0, 3.0, 2.0, 3.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.9375, -39.7353515625, -38.533203125, -37.3310546875, -36.12890625, -34.9267578125, -33.724609375, -32.5224609375, -31.3203125, -30.1181640625, -28.916015625, -27.7138671875, -26.51171875, -25.3095703125, -24.107421875, -22.9052734375, -21.703125, -20.5009765625, -19.298828125, -18.0966796875, -16.89453125, -15.6923828125, -14.490234375, -13.2880859375, -12.0859375, -10.8837890625, -9.681640625, -8.4794921875, -7.27734375, -6.0751953125, -4.873046875, -3.6708984375, -2.46875, -1.2666015625, -0.064453125, 1.1376953125, 2.33984375, 3.5419921875, 4.744140625, 5.9462890625, 7.1484375, 8.3505859375, 9.552734375, 10.7548828125, 11.95703125, 13.1591796875, 14.361328125, 15.5634765625, 16.765625, 17.9677734375, 19.169921875, 20.3720703125, 21.57421875, 22.7763671875, 23.978515625, 25.1806640625, 26.3828125, 27.5849609375, 28.787109375, 29.9892578125, 31.19140625, 32.3935546875, 33.595703125, 34.7978515625, 36.0]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 2.0, 5.0, 12.0, 17.0, 37.0, 66.0, 112.0, 178.0, 273.0, 465.0, 772.0, 1338.0, 2173.0, 3709.0, 6216.0, 10194.0, 17053.0, 27806.0, 44956.0, 70515.0, 107746.0, 158446.0, 223997.0, 297787.0, 372687.0, 430311.0, 458470.0, 445729.0, 398219.0, 328305.0, 252966.0, 183438.0, 126555.0, 83542.0, 54193.0, 33577.0, 20926.0, 12513.0, 7639.0, 4598.0, 2723.0, 1611.0, 975.0, 567.0, 353.0, 218.0, 125.0, 63.0, 42.0, 24.0, 21.0, 9.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-21.90625, -21.236328125, -20.56640625, -19.896484375, -19.2265625, -18.556640625, -17.88671875, -17.216796875, -16.546875, -15.876953125, -15.20703125, -14.537109375, -13.8671875, -13.197265625, -12.52734375, -11.857421875, -11.1875, -10.517578125, -9.84765625, -9.177734375, -8.5078125, -7.837890625, -7.16796875, -6.498046875, -5.828125, -5.158203125, -4.48828125, -3.818359375, -3.1484375, -2.478515625, -1.80859375, -1.138671875, -0.46875, 0.201171875, 0.87109375, 1.541015625, 2.2109375, 2.880859375, 3.55078125, 4.220703125, 4.890625, 5.560546875, 6.23046875, 6.900390625, 7.5703125, 8.240234375, 8.91015625, 9.580078125, 10.25, 10.919921875, 11.58984375, 12.259765625, 12.9296875, 13.599609375, 14.26953125, 14.939453125, 15.609375, 16.279296875, 16.94921875, 17.619140625, 18.2890625, 18.958984375, 19.62890625, 20.298828125, 20.96875]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 4.0, 11.0, 12.0, 11.0, 19.0, 26.0, 24.0, 29.0, 35.0, 61.0, 67.0, 75.0, 97.0, 133.0, 136.0, 165.0, 172.0, 184.0, 201.0, 210.0, 216.0, 232.0, 220.0, 248.0, 168.0, 190.0, 183.0, 145.0, 146.0, 118.0, 116.0, 73.0, 68.0, 54.0, 50.0, 41.0, 33.0, 29.0, 19.0, 11.0, 11.0, 12.0, 8.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0], "bins": [-15.578125, -15.1051025390625, -14.632080078125, -14.1590576171875, -13.68603515625, -13.2130126953125, -12.739990234375, -12.2669677734375, -11.7939453125, -11.3209228515625, -10.847900390625, -10.3748779296875, -9.90185546875, -9.4288330078125, -8.955810546875, -8.4827880859375, -8.009765625, -7.5367431640625, -7.063720703125, -6.5906982421875, -6.11767578125, -5.6446533203125, -5.171630859375, -4.6986083984375, -4.2255859375, -3.7525634765625, -3.279541015625, -2.8065185546875, -2.33349609375, -1.8604736328125, -1.387451171875, -0.9144287109375, -0.44140625, 0.0316162109375, 0.504638671875, 0.9776611328125, 1.45068359375, 1.9237060546875, 2.396728515625, 2.8697509765625, 3.3427734375, 3.8157958984375, 4.288818359375, 4.7618408203125, 5.23486328125, 5.7078857421875, 6.180908203125, 6.6539306640625, 7.126953125, 7.5999755859375, 8.072998046875, 8.5460205078125, 9.01904296875, 9.4920654296875, 9.965087890625, 10.4381103515625, 10.9111328125, 11.3841552734375, 11.857177734375, 12.3302001953125, 12.80322265625, 13.2762451171875, 13.749267578125, 14.2222900390625, 14.6953125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 8.0, 4.0, 7.0, 12.0, 14.0, 16.0, 12.0, 18.0, 29.0, 22.0, 34.0, 27.0, 40.0, 41.0, 51.0, 42.0, 40.0, 48.0, 37.0, 43.0, 49.0, 41.0, 44.0, 39.0, 29.0, 26.0, 26.0, 25.0, 26.0, 27.0, 19.0, 17.0, 11.0, 12.0, 7.0, 12.0, 9.0, 8.0, 8.0, 2.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.570873260498047, -21.74411392211914, -20.917354583740234, -20.090595245361328, -19.263835906982422, -18.437076568603516, -17.61031723022461, -16.783557891845703, -15.95679759979248, -15.130038261413574, -14.303278923034668, -13.476518630981445, -12.649759292602539, -11.822999954223633, -10.996240615844727, -10.16948127746582, -9.342721939086914, -8.515962600708008, -7.689203262329102, -6.862443447113037, -6.035684108734131, -5.208924770355225, -4.38216495513916, -3.555405616760254, -2.7286462783813477, -1.9018868207931519, -1.075127363204956, -0.2483677864074707, 0.5783915519714355, 1.4051508903503418, 2.2319107055664062, 3.0586700439453125, 3.885427474975586, 4.712186813354492, 5.538946151733398, 6.365705966949463, 7.192465305328369, 8.019224166870117, 8.84598445892334, 9.672743797302246, 10.499503135681152, 11.326262474060059, 12.153021812438965, 12.979782104492188, 13.806541442871094, 14.63330078125, 15.460060119628906, 16.286819458007812, 17.11357879638672, 17.940338134765625, 18.76709747314453, 19.593856811523438, 20.420616149902344, 21.24737548828125, 22.074134826660156, 22.900894165039062, 23.72765350341797, 24.554412841796875, 25.38117218017578, 26.207931518554688, 27.034690856933594, 27.8614501953125, 28.688209533691406, 29.514968872070312, 30.34173011779785]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 10.0, 6.0, 8.0, 12.0, 18.0, 22.0, 21.0, 27.0, 26.0, 38.0, 33.0, 38.0, 41.0, 32.0, 48.0, 58.0, 42.0, 50.0, 53.0, 50.0, 45.0, 48.0, 24.0, 30.0, 35.0, 27.0, 28.0, 28.0, 27.0, 16.0, 12.0, 17.0, 9.0, 6.0, 7.0, 1.0, 7.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.06928634643555, -41.649688720703125, -40.2300910949707, -38.81049346923828, -37.390899658203125, -35.9713020324707, -34.55170440673828, -33.13210678100586, -31.712509155273438, -30.292911529541016, -28.873315811157227, -27.453718185424805, -26.034120559692383, -24.614524841308594, -23.194927215576172, -21.77532958984375, -20.35573387145996, -18.93613624572754, -17.51654052734375, -16.096942901611328, -14.677345275878906, -13.2577486038208, -11.838151931762695, -10.418554306030273, -8.998957633972168, -7.579360485076904, -6.159763336181641, -4.740166664123535, -3.3205695152282715, -1.9009723663330078, -0.48137569427490234, 0.9382219314575195, 2.357818603515625, 3.7774157524108887, 5.197012901306152, 6.616609573364258, 8.03620719909668, 9.455803871154785, 10.87540054321289, 12.294998168945312, 13.714594841003418, 15.134191513061523, 16.553789138793945, 17.973384857177734, 19.392982482910156, 20.812580108642578, 22.232177734375, 23.651775360107422, 25.07137107849121, 26.490968704223633, 27.910564422607422, 29.330162048339844, 30.749759674072266, 32.16935729980469, 33.588951110839844, 35.00855255126953, 36.42814636230469, 37.84774398803711, 39.26734161376953, 40.68693542480469, 42.10653305053711, 43.52613067626953, 44.94572830200195, 46.365325927734375, 47.7849235534668]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 6.0, 7.0, 15.0, 22.0, 46.0, 33.0, 42.0, 81.0, 106.0, 181.0, 200.0, 311.0, 503.0, 701.0, 991.0, 1493.0, 2238.0, 3349.0, 5247.0, 7920.0, 12560.0, 20478.0, 34008.0, 58460.0, 106894.0, 224530.0, 266576.0, 129314.0, 68879.0, 39216.0, 23394.0, 14575.0, 9044.0, 5736.0, 3762.0, 2463.0, 1654.0, 1097.0, 711.0, 521.0, 364.0, 260.0, 168.0, 117.0, 101.0, 55.0, 45.0, 24.0, 20.0, 13.0, 8.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0], "bins": [-5.51953125, -5.3477783203125, -5.176025390625, -5.0042724609375, -4.83251953125, -4.6607666015625, -4.489013671875, -4.3172607421875, -4.1455078125, -3.9737548828125, -3.802001953125, -3.6302490234375, -3.45849609375, -3.2867431640625, -3.114990234375, -2.9432373046875, -2.771484375, -2.5997314453125, -2.427978515625, -2.2562255859375, -2.08447265625, -1.9127197265625, -1.740966796875, -1.5692138671875, -1.3974609375, -1.2257080078125, -1.053955078125, -0.8822021484375, -0.71044921875, -0.5386962890625, -0.366943359375, -0.1951904296875, -0.0234375, 0.1483154296875, 0.320068359375, 0.4918212890625, 0.66357421875, 0.8353271484375, 1.007080078125, 1.1788330078125, 1.3505859375, 1.5223388671875, 1.694091796875, 1.8658447265625, 2.03759765625, 2.2093505859375, 2.381103515625, 2.5528564453125, 2.724609375, 2.8963623046875, 3.068115234375, 3.2398681640625, 3.41162109375, 3.5833740234375, 3.755126953125, 3.9268798828125, 4.0986328125, 4.2703857421875, 4.442138671875, 4.6138916015625, 4.78564453125, 4.9573974609375, 5.129150390625, 5.3009033203125, 5.47265625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 10.0, 6.0, 8.0, 14.0, 17.0, 23.0, 22.0, 25.0, 26.0, 39.0, 34.0, 36.0, 40.0, 33.0, 50.0, 58.0, 43.0, 48.0, 54.0, 50.0, 42.0, 51.0, 22.0, 29.0, 38.0, 26.0, 29.0, 28.0, 24.0, 17.0, 14.0, 14.0, 12.0, 4.0, 6.0, 1.0, 7.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.03125, -41.61572265625, -40.2001953125, -38.78466796875, -37.369140625, -35.95361328125, -34.5380859375, -33.12255859375, -31.70703125, -30.29150390625, -28.8759765625, -27.46044921875, -26.044921875, -24.62939453125, -23.2138671875, -21.79833984375, -20.3828125, -18.96728515625, -17.5517578125, -16.13623046875, -14.720703125, -13.30517578125, -11.8896484375, -10.47412109375, -9.05859375, -7.64306640625, -6.2275390625, -4.81201171875, -3.396484375, -1.98095703125, -0.5654296875, 0.85009765625, 2.265625, 3.68115234375, 5.0966796875, 6.51220703125, 7.927734375, 9.34326171875, 10.7587890625, 12.17431640625, 13.58984375, 15.00537109375, 16.4208984375, 17.83642578125, 19.251953125, 20.66748046875, 22.0830078125, 23.49853515625, 24.9140625, 26.32958984375, 27.7451171875, 29.16064453125, 30.576171875, 31.99169921875, 33.4072265625, 34.82275390625, 36.23828125, 37.65380859375, 39.0693359375, 40.48486328125, 41.900390625, 43.31591796875, 44.7314453125, 46.14697265625, 47.5625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 1.0, 15.0, 13.0, 19.0, 26.0, 40.0, 65.0, 106.0, 133.0, 221.0, 321.0, 426.0, 679.0, 1093.0, 1822.0, 3084.0, 5281.0, 9377.0, 16918.0, 33962.0, 69191.0, 159923.0, 361904.0, 209398.0, 85956.0, 41132.0, 20959.0, 11247.0, 6051.0, 3490.0, 1984.0, 1330.0, 834.0, 550.0, 310.0, 206.0, 147.0, 95.0, 62.0, 66.0, 39.0, 27.0, 14.0, 16.0, 9.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.546875, -5.35321044921875, -5.1595458984375, -4.96588134765625, -4.772216796875, -4.57855224609375, -4.3848876953125, -4.19122314453125, -3.99755859375, -3.80389404296875, -3.6102294921875, -3.41656494140625, -3.222900390625, -3.02923583984375, -2.8355712890625, -2.64190673828125, -2.4482421875, -2.25457763671875, -2.0609130859375, -1.86724853515625, -1.673583984375, -1.47991943359375, -1.2862548828125, -1.09259033203125, -0.89892578125, -0.70526123046875, -0.5115966796875, -0.31793212890625, -0.124267578125, 0.06939697265625, 0.2630615234375, 0.45672607421875, 0.650390625, 0.84405517578125, 1.0377197265625, 1.23138427734375, 1.425048828125, 1.61871337890625, 1.8123779296875, 2.00604248046875, 2.19970703125, 2.39337158203125, 2.5870361328125, 2.78070068359375, 2.974365234375, 3.16802978515625, 3.3616943359375, 3.55535888671875, 3.7490234375, 3.94268798828125, 4.1363525390625, 4.33001708984375, 4.523681640625, 4.71734619140625, 4.9110107421875, 5.10467529296875, 5.29833984375, 5.49200439453125, 5.6856689453125, 5.87933349609375, 6.072998046875, 6.26666259765625, 6.4603271484375, 6.65399169921875, 6.84765625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 9.0, 1.0, 5.0, 4.0, 10.0, 13.0, 7.0, 8.0, 21.0, 16.0, 23.0, 25.0, 22.0, 32.0, 17.0, 36.0, 29.0, 33.0, 33.0, 43.0, 42.0, 45.0, 38.0, 57.0, 45.0, 35.0, 34.0, 38.0, 43.0, 32.0, 20.0, 39.0, 25.0, 21.0, 17.0, 16.0, 22.0, 11.0, 6.0, 11.0, 4.0, 7.0, 1.0, 3.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-29.53125, -28.69970703125, -27.8681640625, -27.03662109375, -26.205078125, -25.37353515625, -24.5419921875, -23.71044921875, -22.87890625, -22.04736328125, -21.2158203125, -20.38427734375, -19.552734375, -18.72119140625, -17.8896484375, -17.05810546875, -16.2265625, -15.39501953125, -14.5634765625, -13.73193359375, -12.900390625, -12.06884765625, -11.2373046875, -10.40576171875, -9.57421875, -8.74267578125, -7.9111328125, -7.07958984375, -6.248046875, -5.41650390625, -4.5849609375, -3.75341796875, -2.921875, -2.09033203125, -1.2587890625, -0.42724609375, 0.404296875, 1.23583984375, 2.0673828125, 2.89892578125, 3.73046875, 4.56201171875, 5.3935546875, 6.22509765625, 7.056640625, 7.88818359375, 8.7197265625, 9.55126953125, 10.3828125, 11.21435546875, 12.0458984375, 12.87744140625, 13.708984375, 14.54052734375, 15.3720703125, 16.20361328125, 17.03515625, 17.86669921875, 18.6982421875, 19.52978515625, 20.361328125, 21.19287109375, 22.0244140625, 22.85595703125, 23.6875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 2.0, 3.0, 10.0, 3.0, 11.0, 16.0, 13.0, 28.0, 39.0, 47.0, 71.0, 75.0, 107.0, 154.0, 198.0, 306.0, 473.0, 684.0, 1006.0, 1615.0, 2969.0, 6562.0, 24676.0, 352374.0, 607004.0, 33787.0, 7671.0, 3342.0, 1841.0, 1035.0, 703.0, 492.0, 328.0, 229.0, 176.0, 127.0, 92.0, 75.0, 46.0, 40.0, 25.0, 19.0, 19.0, 17.0, 9.0, 11.0, 8.0, 6.0, 5.0, 7.0, 0.0, 3.0, 1.0, 1.0], "bins": [-2.49609375, -2.4228515625, -2.349609375, -2.2763671875, -2.203125, -2.1298828125, -2.056640625, -1.9833984375, -1.91015625, -1.8369140625, -1.763671875, -1.6904296875, -1.6171875, -1.5439453125, -1.470703125, -1.3974609375, -1.32421875, -1.2509765625, -1.177734375, -1.1044921875, -1.03125, -0.9580078125, -0.884765625, -0.8115234375, -0.73828125, -0.6650390625, -0.591796875, -0.5185546875, -0.4453125, -0.3720703125, -0.298828125, -0.2255859375, -0.15234375, -0.0791015625, -0.005859375, 0.0673828125, 0.140625, 0.2138671875, 0.287109375, 0.3603515625, 0.43359375, 0.5068359375, 0.580078125, 0.6533203125, 0.7265625, 0.7998046875, 0.873046875, 0.9462890625, 1.01953125, 1.0927734375, 1.166015625, 1.2392578125, 1.3125, 1.3857421875, 1.458984375, 1.5322265625, 1.60546875, 1.6787109375, 1.751953125, 1.8251953125, 1.8984375, 1.9716796875, 2.044921875, 2.1181640625, 2.19140625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 3.0, 5.0, 5.0, 23.0, 46.0, 120.0, 284.0, 249.0, 130.0, 57.0, 30.0, 9.0, 7.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002760887145996094, -0.00026689842343330383, -0.0002577081322669983, -0.00024851784110069275, -0.0002393275499343872, -0.00023013725876808167, -0.00022094696760177612, -0.00021175667643547058, -0.00020256638526916504, -0.0001933760941028595, -0.00018418580293655396, -0.0001749955117702484, -0.00016580522060394287, -0.00015661492943763733, -0.0001474246382713318, -0.00013823434710502625, -0.0001290440559387207, -0.00011985376477241516, -0.00011066347360610962, -0.00010147318243980408, -9.228289127349854e-05, -8.309260010719299e-05, -7.390230894088745e-05, -6.471201777458191e-05, -5.552172660827637e-05, -4.6331435441970825e-05, -3.714114427566528e-05, -2.795085310935974e-05, -1.87605619430542e-05, -9.570270776748657e-06, -3.7997961044311523e-07, 8.810311555862427e-06, 1.800060272216797e-05, 2.719089388847351e-05, 3.638118505477905e-05, 4.5571476221084595e-05, 5.476176738739014e-05, 6.395205855369568e-05, 7.314234972000122e-05, 8.233264088630676e-05, 9.15229320526123e-05, 0.00010071322321891785, 0.00010990351438522339, 0.00011909380555152893, 0.00012828409671783447, 0.00013747438788414001, 0.00014666467905044556, 0.0001558549702167511, 0.00016504526138305664, 0.00017423555254936218, 0.00018342584371566772, 0.00019261613488197327, 0.0002018064260482788, 0.00021099671721458435, 0.0002201870083808899, 0.00022937729954719543, 0.00023856759071350098, 0.0002477578818798065, 0.00025694817304611206, 0.0002661384642124176, 0.00027532875537872314, 0.0002845190465450287, 0.00029370933771133423, 0.00030289962887763977, 0.0003120899200439453]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 8.0, 20.0, 23.0, 41.0, 41.0, 50.0, 61.0, 79.0, 124.0, 170.0, 223.0, 336.0, 450.0, 661.0, 971.0, 1501.0, 2617.0, 4293.0, 8013.0, 15282.0, 31322.0, 65117.0, 142675.0, 343962.0, 233562.0, 100628.0, 46793.0, 22652.0, 11479.0, 5961.0, 3359.0, 2076.0, 1310.0, 800.0, 498.0, 365.0, 282.0, 207.0, 149.0, 94.0, 73.0, 56.0, 41.0, 37.0, 23.0, 14.0, 12.0, 8.0, 6.0, 8.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0], "bins": [-1.3544921875, -1.3090057373046875, -1.263519287109375, -1.2180328369140625, -1.17254638671875, -1.1270599365234375, -1.081573486328125, -1.0360870361328125, -0.9906005859375, -0.9451141357421875, -0.899627685546875, -0.8541412353515625, -0.80865478515625, -0.7631683349609375, -0.717681884765625, -0.6721954345703125, -0.626708984375, -0.5812225341796875, -0.535736083984375, -0.4902496337890625, -0.44476318359375, -0.3992767333984375, -0.353790283203125, -0.3083038330078125, -0.2628173828125, -0.2173309326171875, -0.171844482421875, -0.1263580322265625, -0.08087158203125, -0.0353851318359375, 0.010101318359375, 0.0555877685546875, 0.10107421875, 0.1465606689453125, 0.192047119140625, 0.2375335693359375, 0.28302001953125, 0.3285064697265625, 0.373992919921875, 0.4194793701171875, 0.4649658203125, 0.5104522705078125, 0.555938720703125, 0.6014251708984375, 0.64691162109375, 0.6923980712890625, 0.737884521484375, 0.7833709716796875, 0.828857421875, 0.8743438720703125, 0.919830322265625, 0.9653167724609375, 1.01080322265625, 1.0562896728515625, 1.101776123046875, 1.1472625732421875, 1.1927490234375, 1.2382354736328125, 1.283721923828125, 1.3292083740234375, 1.37469482421875, 1.4201812744140625, 1.465667724609375, 1.5111541748046875, 1.556640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 10.0, 2.0, 14.0, 14.0, 21.0, 42.0, 37.0, 46.0, 52.0, 54.0, 42.0, 47.0, 40.0, 45.0, 47.0, 36.0, 43.0, 55.0, 69.0, 47.0, 61.0, 35.0, 42.0, 18.0, 20.0, 9.0, 9.0, 9.0, 4.0, 8.0, 6.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.83447265625, -0.810150146484375, -0.78582763671875, -0.761505126953125, -0.7371826171875, -0.712860107421875, -0.68853759765625, -0.664215087890625, -0.639892578125, -0.615570068359375, -0.59124755859375, -0.566925048828125, -0.5426025390625, -0.518280029296875, -0.49395751953125, -0.469635009765625, -0.4453125, -0.420989990234375, -0.39666748046875, -0.372344970703125, -0.3480224609375, -0.323699951171875, -0.29937744140625, -0.275054931640625, -0.250732421875, -0.226409912109375, -0.20208740234375, -0.177764892578125, -0.1534423828125, -0.129119873046875, -0.10479736328125, -0.080474853515625, -0.05615234375, -0.031829833984375, -0.00750732421875, 0.016815185546875, 0.0411376953125, 0.065460205078125, 0.08978271484375, 0.114105224609375, 0.138427734375, 0.162750244140625, 0.18707275390625, 0.211395263671875, 0.2357177734375, 0.260040283203125, 0.28436279296875, 0.308685302734375, 0.3330078125, 0.357330322265625, 0.38165283203125, 0.405975341796875, 0.4302978515625, 0.454620361328125, 0.47894287109375, 0.503265380859375, 0.527587890625, 0.551910400390625, 0.57623291015625, 0.600555419921875, 0.6248779296875, 0.649200439453125, 0.67352294921875, 0.697845458984375, 0.72216796875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 11.0, 3.0, 8.0, 9.0, 16.0, 12.0, 14.0, 20.0, 22.0, 29.0, 36.0, 22.0, 44.0, 40.0, 50.0, 42.0, 43.0, 51.0, 35.0, 44.0, 51.0, 40.0, 40.0, 44.0, 23.0, 32.0, 25.0, 30.0, 16.0, 25.0, 23.0, 18.0, 15.0, 7.0, 11.0, 8.0, 10.0, 8.0, 8.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.526639938354492, -21.700138092041016, -20.873638153076172, -20.047136306762695, -19.22063446044922, -18.394132614135742, -17.567630767822266, -16.741130828857422, -15.914628982543945, -15.088127136230469, -14.261626243591309, -13.435125350952148, -12.608623504638672, -11.782121658325195, -10.955620765686035, -10.129119873046875, -9.302618026733398, -8.476116180419922, -7.649615287780762, -6.823113918304443, -5.996612548828125, -5.170111179351807, -4.343609809875488, -3.51710844039917, -2.6906070709228516, -1.8641057014465332, -1.0376043319702148, -0.21110296249389648, 0.6153984069824219, 1.4418997764587402, 2.2684011459350586, 3.094902515411377, 3.921405792236328, 4.7479071617126465, 5.574408531188965, 6.400909900665283, 7.227411270141602, 8.053913116455078, 8.880414009094238, 9.706914901733398, 10.533416748046875, 11.359918594360352, 12.186419486999512, 13.012920379638672, 13.839422225952148, 14.665924072265625, 15.492424964904785, 16.318925857543945, 17.145427703857422, 17.9719295501709, 18.798431396484375, 19.62493133544922, 20.451433181762695, 21.277935028076172, 22.104434967041016, 22.930936813354492, 23.75743865966797, 24.583940505981445, 25.410442352294922, 26.236942291259766, 27.063444137573242, 27.88994598388672, 28.716445922851562, 29.54294776916504, 30.369449615478516]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 9.0, 8.0, 7.0, 11.0, 17.0, 23.0, 22.0, 25.0, 25.0, 39.0, 30.0, 45.0, 39.0, 34.0, 49.0, 52.0, 47.0, 51.0, 51.0, 49.0, 44.0, 54.0, 23.0, 28.0, 35.0, 29.0, 26.0, 28.0, 26.0, 16.0, 13.0, 16.0, 11.0, 6.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.374454498291016, -41.950809478759766, -40.527164459228516, -39.103519439697266, -37.67987060546875, -36.2562255859375, -34.83258056640625, -33.408935546875, -31.98529052734375, -30.5616455078125, -29.13800048828125, -27.714353561401367, -26.290708541870117, -24.867063522338867, -23.443416595458984, -22.019771575927734, -20.596126556396484, -19.172481536865234, -17.748836517333984, -16.3251895904541, -14.901544570922852, -13.477899551391602, -12.054253578186035, -10.630607604980469, -9.206962585449219, -7.7833170890808105, -6.359671592712402, -4.936026096343994, -3.512380599975586, -2.0887351036071777, -0.6650896072387695, 0.7585563659667969, 2.182201385498047, 3.605846881866455, 5.029492378234863, 6.4531378746032715, 7.87678337097168, 9.30042839050293, 10.724074363708496, 12.147720336914062, 13.571365356445312, 14.995010375976562, 16.418655395507812, 17.842302322387695, 19.265947341918945, 20.689592361450195, 22.113239288330078, 23.536884307861328, 24.960529327392578, 26.384174346923828, 27.807819366455078, 29.23146629333496, 30.65511131286621, 32.078758239746094, 33.502403259277344, 34.926048278808594, 36.349693298339844, 37.773338317871094, 39.196983337402344, 40.620628356933594, 42.044273376464844, 43.46792221069336, 44.89156723022461, 46.31521224975586, 47.73885726928711]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 8.0, 9.0, 5.0, 13.0, 17.0, 21.0, 38.0, 43.0, 80.0, 124.0, 169.0, 238.0, 376.0, 613.0, 987.0, 1432.0, 2194.0, 3584.0, 5834.0, 9159.0, 14848.0, 23303.0, 36005.0, 53580.0, 75999.0, 100593.0, 120965.0, 129663.0, 123230.0, 103837.0, 79952.0, 56642.0, 38105.0, 24452.0, 15925.0, 9944.0, 6049.0, 3813.0, 2333.0, 1529.0, 972.0, 621.0, 399.0, 263.0, 202.0, 130.0, 80.0, 47.0, 47.0, 32.0, 24.0, 14.0, 10.0, 7.0, 3.0, 1.0, 1.0, 3.0], "bins": [-24.5625, -23.830810546875, -23.09912109375, -22.367431640625, -21.6357421875, -20.904052734375, -20.17236328125, -19.440673828125, -18.708984375, -17.977294921875, -17.24560546875, -16.513916015625, -15.7822265625, -15.050537109375, -14.31884765625, -13.587158203125, -12.85546875, -12.123779296875, -11.39208984375, -10.660400390625, -9.9287109375, -9.197021484375, -8.46533203125, -7.733642578125, -7.001953125, -6.270263671875, -5.53857421875, -4.806884765625, -4.0751953125, -3.343505859375, -2.61181640625, -1.880126953125, -1.1484375, -0.416748046875, 0.31494140625, 1.046630859375, 1.7783203125, 2.510009765625, 3.24169921875, 3.973388671875, 4.705078125, 5.436767578125, 6.16845703125, 6.900146484375, 7.6318359375, 8.363525390625, 9.09521484375, 9.826904296875, 10.55859375, 11.290283203125, 12.02197265625, 12.753662109375, 13.4853515625, 14.217041015625, 14.94873046875, 15.680419921875, 16.412109375, 17.143798828125, 17.87548828125, 18.607177734375, 19.3388671875, 20.070556640625, 20.80224609375, 21.533935546875, 22.265625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 10.0, 7.0, 9.0, 9.0, 17.0, 24.0, 23.0, 26.0, 22.0, 37.0, 35.0, 46.0, 37.0, 35.0, 51.0, 52.0, 47.0, 50.0, 50.0, 51.0, 45.0, 49.0, 22.0, 29.0, 34.0, 29.0, 30.0, 27.0, 25.0, 15.0, 14.0, 14.0, 13.0, 6.0, 4.0, 2.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.90625, -40.52685546875, -39.1474609375, -37.76806640625, -36.388671875, -35.00927734375, -33.6298828125, -32.25048828125, -30.87109375, -29.49169921875, -28.1123046875, -26.73291015625, -25.353515625, -23.97412109375, -22.5947265625, -21.21533203125, -19.8359375, -18.45654296875, -17.0771484375, -15.69775390625, -14.318359375, -12.93896484375, -11.5595703125, -10.18017578125, -8.80078125, -7.42138671875, -6.0419921875, -4.66259765625, -3.283203125, -1.90380859375, -0.5244140625, 0.85498046875, 2.234375, 3.61376953125, 4.9931640625, 6.37255859375, 7.751953125, 9.13134765625, 10.5107421875, 11.89013671875, 13.26953125, 14.64892578125, 16.0283203125, 17.40771484375, 18.787109375, 20.16650390625, 21.5458984375, 22.92529296875, 24.3046875, 25.68408203125, 27.0634765625, 28.44287109375, 29.822265625, 31.20166015625, 32.5810546875, 33.96044921875, 35.33984375, 36.71923828125, 38.0986328125, 39.47802734375, 40.857421875, 42.23681640625, 43.6162109375, 44.99560546875, 46.375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 5.0, 11.0, 12.0, 19.0, 28.0, 41.0, 64.0, 101.0, 164.0, 224.0, 366.0, 622.0, 1023.0, 1560.0, 2607.0, 4176.0, 6886.0, 11152.0, 18242.0, 29395.0, 46081.0, 69423.0, 98410.0, 125698.0, 139458.0, 135097.0, 114162.0, 85001.0, 58801.0, 37993.0, 23820.0, 14631.0, 8928.0, 5502.0, 3315.0, 2003.0, 1316.0, 846.0, 514.0, 315.0, 189.0, 146.0, 87.0, 42.0, 35.0, 12.0, 13.0, 5.0, 7.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.953125, -22.155517578125, -21.35791015625, -20.560302734375, -19.7626953125, -18.965087890625, -18.16748046875, -17.369873046875, -16.572265625, -15.774658203125, -14.97705078125, -14.179443359375, -13.3818359375, -12.584228515625, -11.78662109375, -10.989013671875, -10.19140625, -9.393798828125, -8.59619140625, -7.798583984375, -7.0009765625, -6.203369140625, -5.40576171875, -4.608154296875, -3.810546875, -3.012939453125, -2.21533203125, -1.417724609375, -0.6201171875, 0.177490234375, 0.97509765625, 1.772705078125, 2.5703125, 3.367919921875, 4.16552734375, 4.963134765625, 5.7607421875, 6.558349609375, 7.35595703125, 8.153564453125, 8.951171875, 9.748779296875, 10.54638671875, 11.343994140625, 12.1416015625, 12.939208984375, 13.73681640625, 14.534423828125, 15.33203125, 16.129638671875, 16.92724609375, 17.724853515625, 18.5224609375, 19.320068359375, 20.11767578125, 20.915283203125, 21.712890625, 22.510498046875, 23.30810546875, 24.105712890625, 24.9033203125, 25.700927734375, 26.49853515625, 27.296142578125, 28.09375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 3.0, 9.0, 9.0, 6.0, 20.0, 20.0, 9.0, 16.0, 20.0, 24.0, 24.0, 35.0, 18.0, 33.0, 32.0, 31.0, 32.0, 35.0, 47.0, 51.0, 54.0, 41.0, 48.0, 37.0, 36.0, 32.0, 37.0, 40.0, 40.0, 21.0, 14.0, 26.0, 12.0, 12.0, 14.0, 8.0, 8.0, 11.0, 6.0, 6.0, 4.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-26.578125, -25.843994140625, -25.10986328125, -24.375732421875, -23.6416015625, -22.907470703125, -22.17333984375, -21.439208984375, -20.705078125, -19.970947265625, -19.23681640625, -18.502685546875, -17.7685546875, -17.034423828125, -16.30029296875, -15.566162109375, -14.83203125, -14.097900390625, -13.36376953125, -12.629638671875, -11.8955078125, -11.161376953125, -10.42724609375, -9.693115234375, -8.958984375, -8.224853515625, -7.49072265625, -6.756591796875, -6.0224609375, -5.288330078125, -4.55419921875, -3.820068359375, -3.0859375, -2.351806640625, -1.61767578125, -0.883544921875, -0.1494140625, 0.584716796875, 1.31884765625, 2.052978515625, 2.787109375, 3.521240234375, 4.25537109375, 4.989501953125, 5.7236328125, 6.457763671875, 7.19189453125, 7.926025390625, 8.66015625, 9.394287109375, 10.12841796875, 10.862548828125, 11.5966796875, 12.330810546875, 13.06494140625, 13.799072265625, 14.533203125, 15.267333984375, 16.00146484375, 16.735595703125, 17.4697265625, 18.203857421875, 18.93798828125, 19.672119140625, 20.40625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 9.0, 2.0, 6.0, 10.0, 15.0, 15.0, 32.0, 45.0, 65.0, 79.0, 137.0, 201.0, 313.0, 404.0, 631.0, 923.0, 1320.0, 2095.0, 3228.0, 5176.0, 8444.0, 14438.0, 24398.0, 40667.0, 66327.0, 100343.0, 134199.0, 154477.0, 148465.0, 120461.0, 84337.0, 54742.0, 32531.0, 19538.0, 11367.0, 6917.0, 4252.0, 2787.0, 1727.0, 1145.0, 733.0, 500.0, 329.0, 225.0, 172.0, 114.0, 60.0, 55.0, 33.0, 29.0, 18.0, 8.0, 10.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0], "bins": [-7.80078125, -7.55535888671875, -7.3099365234375, -7.06451416015625, -6.819091796875, -6.57366943359375, -6.3282470703125, -6.08282470703125, -5.83740234375, -5.59197998046875, -5.3465576171875, -5.10113525390625, -4.855712890625, -4.61029052734375, -4.3648681640625, -4.11944580078125, -3.8740234375, -3.62860107421875, -3.3831787109375, -3.13775634765625, -2.892333984375, -2.64691162109375, -2.4014892578125, -2.15606689453125, -1.91064453125, -1.66522216796875, -1.4197998046875, -1.17437744140625, -0.928955078125, -0.68353271484375, -0.4381103515625, -0.19268798828125, 0.052734375, 0.29815673828125, 0.5435791015625, 0.78900146484375, 1.034423828125, 1.27984619140625, 1.5252685546875, 1.77069091796875, 2.01611328125, 2.26153564453125, 2.5069580078125, 2.75238037109375, 2.997802734375, 3.24322509765625, 3.4886474609375, 3.73406982421875, 3.9794921875, 4.22491455078125, 4.4703369140625, 4.71575927734375, 4.961181640625, 5.20660400390625, 5.4520263671875, 5.69744873046875, 5.94287109375, 6.18829345703125, 6.4337158203125, 6.67913818359375, 6.924560546875, 7.16998291015625, 7.4154052734375, 7.66082763671875, 7.90625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 10.0, 8.0, 6.0, 5.0, 14.0, 17.0, 21.0, 21.0, 34.0, 30.0, 35.0, 39.0, 52.0, 50.0, 55.0, 57.0, 54.0, 56.0, 52.0, 46.0, 46.0, 55.0, 42.0, 31.0, 26.0, 27.0, 29.0, 14.0, 17.0, 18.0, 10.0, 8.0, 6.0, 6.0, 1.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006937980651855469, -0.0006708577275276184, -0.0006479173898696899, -0.0006249770522117615, -0.000602036714553833, -0.0005790963768959045, -0.0005561560392379761, -0.0005332157015800476, -0.0005102753639221191, -0.0004873350262641907, -0.0004643946886062622, -0.00044145435094833374, -0.0004185140132904053, -0.0003955736756324768, -0.00037263333797454834, -0.0003496930003166199, -0.0003267526626586914, -0.00030381232500076294, -0.00028087198734283447, -0.000257931649684906, -0.00023499131202697754, -0.00021205097436904907, -0.0001891106367111206, -0.00016617029905319214, -0.00014322996139526367, -0.0001202896237373352, -9.734928607940674e-05, -7.440894842147827e-05, -5.1468610763549805e-05, -2.8528273105621338e-05, -5.587935447692871e-06, 1.7352402210235596e-05, 4.029273986816406e-05, 6.323307752609253e-05, 8.6173415184021e-05, 0.00010911375284194946, 0.00013205409049987793, 0.0001549944281578064, 0.00017793476581573486, 0.00020087510347366333, 0.0002238154411315918, 0.00024675577878952026, 0.00026969611644744873, 0.0002926364541053772, 0.00031557679176330566, 0.00033851712942123413, 0.0003614574670791626, 0.00038439780473709106, 0.00040733814239501953, 0.000430278480052948, 0.00045321881771087646, 0.00047615915536880493, 0.0004990994930267334, 0.0005220398306846619, 0.0005449801683425903, 0.0005679205060005188, 0.0005908608436584473, 0.0006138011813163757, 0.0006367415189743042, 0.0006596818566322327, 0.0006826221942901611, 0.0007055625319480896, 0.0007285028696060181, 0.0007514432072639465, 0.000774383544921875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 9.0, 8.0, 18.0, 24.0, 22.0, 42.0, 35.0, 66.0, 137.0, 185.0, 301.0, 482.0, 853.0, 1829.0, 3757.0, 8535.0, 20750.0, 53688.0, 133044.0, 252736.0, 278024.0, 171327.0, 73141.0, 28373.0, 11337.0, 4837.0, 2318.0, 1132.0, 577.0, 365.0, 209.0, 123.0, 69.0, 51.0, 47.0, 25.0, 18.0, 14.0, 17.0, 4.0, 7.0, 4.0, 1.0, 6.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.0703125, -14.5706787109375, -14.071044921875, -13.5714111328125, -13.07177734375, -12.5721435546875, -12.072509765625, -11.5728759765625, -11.0732421875, -10.5736083984375, -10.073974609375, -9.5743408203125, -9.07470703125, -8.5750732421875, -8.075439453125, -7.5758056640625, -7.076171875, -6.5765380859375, -6.076904296875, -5.5772705078125, -5.07763671875, -4.5780029296875, -4.078369140625, -3.5787353515625, -3.0791015625, -2.5794677734375, -2.079833984375, -1.5802001953125, -1.08056640625, -0.5809326171875, -0.081298828125, 0.4183349609375, 0.91796875, 1.4176025390625, 1.917236328125, 2.4168701171875, 2.91650390625, 3.4161376953125, 3.915771484375, 4.4154052734375, 4.9150390625, 5.4146728515625, 5.914306640625, 6.4139404296875, 6.91357421875, 7.4132080078125, 7.912841796875, 8.4124755859375, 8.912109375, 9.4117431640625, 9.911376953125, 10.4110107421875, 10.91064453125, 11.4102783203125, 11.909912109375, 12.4095458984375, 12.9091796875, 13.4088134765625, 13.908447265625, 14.4080810546875, 14.90771484375, 15.4073486328125, 15.906982421875, 16.4066162109375, 16.90625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 1.0, 6.0, 9.0, 15.0, 23.0, 17.0, 29.0, 33.0, 46.0, 59.0, 96.0, 102.0, 74.0, 76.0, 79.0, 83.0, 51.0, 36.0, 35.0, 38.0, 23.0, 20.0, 5.0, 9.0, 12.0, 4.0, 9.0, 6.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.37890625, -5.16058349609375, -4.9422607421875, -4.72393798828125, -4.505615234375, -4.28729248046875, -4.0689697265625, -3.85064697265625, -3.63232421875, -3.41400146484375, -3.1956787109375, -2.97735595703125, -2.759033203125, -2.54071044921875, -2.3223876953125, -2.10406494140625, -1.8857421875, -1.66741943359375, -1.4490966796875, -1.23077392578125, -1.012451171875, -0.79412841796875, -0.5758056640625, -0.35748291015625, -0.13916015625, 0.07916259765625, 0.2974853515625, 0.51580810546875, 0.734130859375, 0.95245361328125, 1.1707763671875, 1.38909912109375, 1.607421875, 1.82574462890625, 2.0440673828125, 2.26239013671875, 2.480712890625, 2.69903564453125, 2.9173583984375, 3.13568115234375, 3.35400390625, 3.57232666015625, 3.7906494140625, 4.00897216796875, 4.227294921875, 4.44561767578125, 4.6639404296875, 4.88226318359375, 5.1005859375, 5.31890869140625, 5.5372314453125, 5.75555419921875, 5.973876953125, 6.19219970703125, 6.4105224609375, 6.62884521484375, 6.84716796875, 7.06549072265625, 7.2838134765625, 7.50213623046875, 7.720458984375, 7.93878173828125, 8.1571044921875, 8.37542724609375, 8.59375]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 3.0, 5.0, 4.0, 4.0, 7.0, 6.0, 8.0, 11.0, 12.0, 16.0, 7.0, 13.0, 20.0, 28.0, 38.0, 33.0, 27.0, 28.0, 35.0, 46.0, 38.0, 38.0, 43.0, 40.0, 33.0, 35.0, 29.0, 34.0, 25.0, 46.0, 37.0, 32.0, 29.0, 18.0, 25.0, 17.0, 19.0, 14.0, 18.0, 14.0, 9.0, 13.0, 8.0, 3.0, 7.0, 9.0, 6.0, 4.0, 4.0, 2.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-19.822050094604492, -19.09874153137207, -18.37543296813965, -17.652124404907227, -16.928815841674805, -16.205507278442383, -15.482198715209961, -14.758890151977539, -14.035581588745117, -13.312273025512695, -12.588964462280273, -11.865655899047852, -11.14234733581543, -10.419038772583008, -9.695730209350586, -8.972421646118164, -8.249113082885742, -7.52580451965332, -6.802495956420898, -6.079187393188477, -5.355878829956055, -4.632570266723633, -3.909261703491211, -3.185953140258789, -2.462644577026367, -1.7393360137939453, -1.0160274505615234, -0.29271888732910156, 0.4305896759033203, 1.1538982391357422, 1.877206802368164, 2.600515365600586, 3.323823928833008, 4.04713249206543, 4.770441055297852, 5.493749618530273, 6.217058181762695, 6.940366744995117, 7.663675308227539, 8.386983871459961, 9.110292434692383, 9.833600997924805, 10.556909561157227, 11.280218124389648, 12.00352668762207, 12.726835250854492, 13.450143814086914, 14.173452377319336, 14.896760940551758, 15.62006950378418, 16.3433780670166, 17.066686630249023, 17.789995193481445, 18.513303756713867, 19.23661231994629, 19.95992088317871, 20.683229446411133, 21.406538009643555, 22.129846572875977, 22.8531551361084, 23.57646369934082, 24.299772262573242, 25.023080825805664, 25.746389389038086, 26.469697952270508]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 10.0, 7.0, 8.0, 12.0, 21.0, 15.0, 24.0, 21.0, 38.0, 23.0, 38.0, 31.0, 48.0, 43.0, 44.0, 62.0, 50.0, 44.0, 41.0, 50.0, 42.0, 47.0, 42.0, 36.0, 31.0, 20.0, 25.0, 28.0, 13.0, 18.0, 13.0, 12.0, 11.0, 10.0, 8.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.42231369018555, -40.96422576904297, -39.506141662597656, -38.04805374145508, -36.589969635009766, -35.13188171386719, -33.673797607421875, -32.2157096862793, -30.75762367248535, -29.299537658691406, -27.84145164489746, -26.383365631103516, -24.925277709960938, -23.467193603515625, -22.009105682373047, -20.5510196685791, -19.092933654785156, -17.63484764099121, -16.176761627197266, -14.718674659729004, -13.260588645935059, -11.802502632141113, -10.344415664672852, -8.886329650878906, -7.428243637084961, -5.970157623291016, -4.512071132659912, -3.0539846420288086, -1.5958986282348633, -0.13781261444091797, 1.3202743530273438, 2.778360366821289, 4.2364501953125, 5.694536209106445, 7.152622699737549, 8.610709190368652, 10.068795204162598, 11.526881217956543, 12.984968185424805, 14.44305419921875, 15.901140213012695, 17.35922622680664, 18.817312240600586, 20.27539825439453, 21.73348617553711, 23.191570281982422, 24.649658203125, 26.107744216918945, 27.56583023071289, 29.023916244506836, 30.48200225830078, 31.94009017944336, 33.39817428588867, 34.85626220703125, 36.31434631347656, 37.77243423461914, 39.23052215576172, 40.6886100769043, 42.14669418334961, 43.60478210449219, 45.0628662109375, 46.52095413208008, 47.979042053222656, 49.43712615966797, 50.89521026611328]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 5.0, 6.0, 9.0, 8.0, 17.0, 29.0, 38.0, 66.0, 88.0, 150.0, 236.0, 356.0, 607.0, 921.0, 1583.0, 2565.0, 4210.0, 6756.0, 11410.0, 17906.0, 29436.0, 47756.0, 75251.0, 119466.0, 182139.0, 266527.0, 367607.0, 463450.0, 525102.0, 522004.0, 456864.0, 355631.0, 256682.0, 173697.0, 113190.0, 71952.0, 45323.0, 28545.0, 17744.0, 10846.0, 6701.0, 4337.0, 2600.0, 1662.0, 1073.0, 661.0, 418.0, 229.0, 155.0, 105.0, 74.0, 37.0, 29.0, 18.0, 9.0, 3.0, 2.0, 6.0, 0.0, 2.0], "bins": [-24.3125, -23.57470703125, -22.8369140625, -22.09912109375, -21.361328125, -20.62353515625, -19.8857421875, -19.14794921875, -18.41015625, -17.67236328125, -16.9345703125, -16.19677734375, -15.458984375, -14.72119140625, -13.9833984375, -13.24560546875, -12.5078125, -11.77001953125, -11.0322265625, -10.29443359375, -9.556640625, -8.81884765625, -8.0810546875, -7.34326171875, -6.60546875, -5.86767578125, -5.1298828125, -4.39208984375, -3.654296875, -2.91650390625, -2.1787109375, -1.44091796875, -0.703125, 0.03466796875, 0.7724609375, 1.51025390625, 2.248046875, 2.98583984375, 3.7236328125, 4.46142578125, 5.19921875, 5.93701171875, 6.6748046875, 7.41259765625, 8.150390625, 8.88818359375, 9.6259765625, 10.36376953125, 11.1015625, 11.83935546875, 12.5771484375, 13.31494140625, 14.052734375, 14.79052734375, 15.5283203125, 16.26611328125, 17.00390625, 17.74169921875, 18.4794921875, 19.21728515625, 19.955078125, 20.69287109375, 21.4306640625, 22.16845703125, 22.90625]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 10.0, 7.0, 9.0, 13.0, 20.0, 13.0, 27.0, 21.0, 31.0, 24.0, 38.0, 40.0, 41.0, 46.0, 49.0, 54.0, 59.0, 37.0, 43.0, 48.0, 48.0, 49.0, 37.0, 37.0, 26.0, 29.0, 21.0, 21.0, 20.0, 17.0, 14.0, 11.0, 10.0, 14.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.71875, -32.564453125, -31.41015625, -30.255859375, -29.1015625, -27.947265625, -26.79296875, -25.638671875, -24.484375, -23.330078125, -22.17578125, -21.021484375, -19.8671875, -18.712890625, -17.55859375, -16.404296875, -15.25, -14.095703125, -12.94140625, -11.787109375, -10.6328125, -9.478515625, -8.32421875, -7.169921875, -6.015625, -4.861328125, -3.70703125, -2.552734375, -1.3984375, -0.244140625, 0.91015625, 2.064453125, 3.21875, 4.373046875, 5.52734375, 6.681640625, 7.8359375, 8.990234375, 10.14453125, 11.298828125, 12.453125, 13.607421875, 14.76171875, 15.916015625, 17.0703125, 18.224609375, 19.37890625, 20.533203125, 21.6875, 22.841796875, 23.99609375, 25.150390625, 26.3046875, 27.458984375, 28.61328125, 29.767578125, 30.921875, 32.076171875, 33.23046875, 34.384765625, 35.5390625, 36.693359375, 37.84765625, 39.001953125, 40.15625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 4.0, 12.0, 12.0, 24.0, 37.0, 51.0, 90.0, 162.0, 227.0, 401.0, 680.0, 1053.0, 1778.0, 2806.0, 4535.0, 7266.0, 11645.0, 18414.0, 28724.0, 44178.0, 65568.0, 95617.0, 134604.0, 182902.0, 238473.0, 295041.0, 346923.0, 384362.0, 398507.0, 387122.0, 354811.0, 304864.0, 247467.0, 191515.0, 142374.0, 101378.0, 69606.0, 47147.0, 30851.0, 19744.0, 12586.0, 7981.0, 5109.0, 2896.0, 1820.0, 1151.0, 661.0, 415.0, 257.0, 166.0, 101.0, 71.0, 40.0, 25.0, 18.0, 11.0, 7.0, 5.0], "bins": [-19.359375, -18.799560546875, -18.23974609375, -17.679931640625, -17.1201171875, -16.560302734375, -16.00048828125, -15.440673828125, -14.880859375, -14.321044921875, -13.76123046875, -13.201416015625, -12.6416015625, -12.081787109375, -11.52197265625, -10.962158203125, -10.40234375, -9.842529296875, -9.28271484375, -8.722900390625, -8.1630859375, -7.603271484375, -7.04345703125, -6.483642578125, -5.923828125, -5.364013671875, -4.80419921875, -4.244384765625, -3.6845703125, -3.124755859375, -2.56494140625, -2.005126953125, -1.4453125, -0.885498046875, -0.32568359375, 0.234130859375, 0.7939453125, 1.353759765625, 1.91357421875, 2.473388671875, 3.033203125, 3.593017578125, 4.15283203125, 4.712646484375, 5.2724609375, 5.832275390625, 6.39208984375, 6.951904296875, 7.51171875, 8.071533203125, 8.63134765625, 9.191162109375, 9.7509765625, 10.310791015625, 10.87060546875, 11.430419921875, 11.990234375, 12.550048828125, 13.10986328125, 13.669677734375, 14.2294921875, 14.789306640625, 15.34912109375, 15.908935546875, 16.46875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 10.0, 8.0, 14.0, 13.0, 13.0, 17.0, 34.0, 31.0, 42.0, 50.0, 64.0, 64.0, 77.0, 92.0, 97.0, 121.0, 136.0, 152.0, 161.0, 157.0, 184.0, 187.0, 191.0, 203.0, 197.0, 191.0, 205.0, 168.0, 171.0, 142.0, 122.0, 112.0, 121.0, 85.0, 64.0, 72.0, 54.0, 49.0, 38.0, 38.0, 26.0, 18.0, 22.0, 11.0, 8.0, 11.0, 5.0, 11.0, 10.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-12.3984375, -11.9932861328125, -11.588134765625, -11.1829833984375, -10.77783203125, -10.3726806640625, -9.967529296875, -9.5623779296875, -9.1572265625, -8.7520751953125, -8.346923828125, -7.9417724609375, -7.53662109375, -7.1314697265625, -6.726318359375, -6.3211669921875, -5.916015625, -5.5108642578125, -5.105712890625, -4.7005615234375, -4.29541015625, -3.8902587890625, -3.485107421875, -3.0799560546875, -2.6748046875, -2.2696533203125, -1.864501953125, -1.4593505859375, -1.05419921875, -0.6490478515625, -0.243896484375, 0.1612548828125, 0.56640625, 0.9715576171875, 1.376708984375, 1.7818603515625, 2.18701171875, 2.5921630859375, 2.997314453125, 3.4024658203125, 3.8076171875, 4.2127685546875, 4.617919921875, 5.0230712890625, 5.42822265625, 5.8333740234375, 6.238525390625, 6.6436767578125, 7.048828125, 7.4539794921875, 7.859130859375, 8.2642822265625, 8.66943359375, 9.0745849609375, 9.479736328125, 9.8848876953125, 10.2900390625, 10.6951904296875, 11.100341796875, 11.5054931640625, 11.91064453125, 12.3157958984375, 12.720947265625, 13.1260986328125, 13.53125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 5.0, 3.0, 8.0, 6.0, 14.0, 19.0, 24.0, 21.0, 29.0, 20.0, 37.0, 36.0, 35.0, 35.0, 39.0, 49.0, 45.0, 56.0, 53.0, 38.0, 41.0, 43.0, 26.0, 45.0, 37.0, 35.0, 28.0, 24.0, 13.0, 17.0, 19.0, 11.0, 11.0, 12.0, 8.0, 9.0, 4.0, 13.0, 6.0, 8.0, 2.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-25.411588668823242, -24.619050979614258, -23.82651138305664, -23.033973693847656, -22.24143409729004, -21.448896408081055, -20.656356811523438, -19.863819122314453, -19.071279525756836, -18.27874183654785, -17.486202239990234, -16.69366455078125, -15.901124954223633, -15.108586311340332, -14.316047668457031, -13.523509979248047, -12.730971336364746, -11.938432693481445, -11.145894050598145, -10.353355407714844, -9.560816764831543, -8.768278121948242, -7.9757399559021, -7.183201313018799, -6.390662670135498, -5.598124027252197, -4.8055853843688965, -4.013047218322754, -3.220508337020874, -2.4279696941375732, -1.6354312896728516, -0.8428926467895508, -0.05035400390625, 0.742184579372406, 1.534723162651062, 2.3272616863250732, 3.119800329208374, 3.912338972091675, 4.7048773765563965, 5.497416019439697, 6.289954662322998, 7.082493305206299, 7.8750319480896, 8.667570114135742, 9.460108757019043, 10.252647399902344, 11.045186042785645, 11.837724685668945, 12.630263328552246, 13.422801971435547, 14.215340614318848, 15.007879257202148, 15.80041790008545, 16.59295654296875, 17.385494232177734, 18.17803382873535, 18.970571517944336, 19.76310920715332, 20.555648803710938, 21.348186492919922, 22.14072608947754, 22.933263778686523, 23.72580337524414, 24.518341064453125, 25.310880661010742]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 11.0, 9.0, 3.0, 7.0, 6.0, 16.0, 10.0, 20.0, 21.0, 28.0, 16.0, 31.0, 18.0, 40.0, 29.0, 30.0, 32.0, 41.0, 40.0, 45.0, 53.0, 49.0, 53.0, 41.0, 38.0, 40.0, 38.0, 37.0, 30.0, 27.0, 26.0, 19.0, 17.0, 16.0, 13.0, 12.0, 8.0, 7.0, 13.0, 3.0, 4.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.79808044433594, -33.544334411621094, -32.290592193603516, -31.036846160888672, -29.78310203552246, -28.52935791015625, -27.275611877441406, -26.021867752075195, -24.768123626708984, -23.514379501342773, -22.260635375976562, -21.00688934326172, -19.753145217895508, -18.499401092529297, -17.245655059814453, -15.991910934448242, -14.738166809082031, -13.48442268371582, -12.230677604675293, -10.976932525634766, -9.723188400268555, -8.469444274902344, -7.215699195861816, -5.961954116821289, -4.708209991455078, -3.454465389251709, -2.20072078704834, -0.9469761848449707, 0.30676841735839844, 1.5605130195617676, 2.8142576217651367, 4.068002700805664, 5.321746826171875, 6.575491428375244, 7.829236030578613, 9.08298110961914, 10.336725234985352, 11.590469360351562, 12.84421443939209, 14.097959518432617, 15.351703643798828, 16.60544776916504, 17.85919189453125, 19.112937927246094, 20.366682052612305, 21.620426177978516, 22.87417221069336, 24.12791633605957, 25.38166046142578, 26.635404586791992, 27.889148712158203, 29.142894744873047, 30.396638870239258, 31.65038299560547, 32.90412902832031, 34.157875061035156, 35.411617279052734, 36.66536331176758, 37.919105529785156, 39.1728515625, 40.426597595214844, 41.68033981323242, 42.934085845947266, 44.187828063964844, 45.44157409667969]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 6.0, 4.0, 2.0, 7.0, 6.0, 15.0, 22.0, 28.0, 42.0, 52.0, 63.0, 80.0, 132.0, 153.0, 224.0, 292.0, 446.0, 645.0, 885.0, 1230.0, 1885.0, 2756.0, 4079.0, 6244.0, 9127.0, 14431.0, 23376.0, 39125.0, 67096.0, 121603.0, 230223.0, 229883.0, 121700.0, 67309.0, 39187.0, 23222.0, 14564.0, 9285.0, 6067.0, 4158.0, 2673.0, 1873.0, 1269.0, 907.0, 588.0, 443.0, 333.0, 215.0, 157.0, 138.0, 97.0, 81.0, 51.0, 35.0, 20.0, 10.0, 10.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0], "bins": [-4.44140625, -4.3026123046875, -4.163818359375, -4.0250244140625, -3.88623046875, -3.7474365234375, -3.608642578125, -3.4698486328125, -3.3310546875, -3.1922607421875, -3.053466796875, -2.9146728515625, -2.77587890625, -2.6370849609375, -2.498291015625, -2.3594970703125, -2.220703125, -2.0819091796875, -1.943115234375, -1.8043212890625, -1.66552734375, -1.5267333984375, -1.387939453125, -1.2491455078125, -1.1103515625, -0.9715576171875, -0.832763671875, -0.6939697265625, -0.55517578125, -0.4163818359375, -0.277587890625, -0.1387939453125, 0.0, 0.1387939453125, 0.277587890625, 0.4163818359375, 0.55517578125, 0.6939697265625, 0.832763671875, 0.9715576171875, 1.1103515625, 1.2491455078125, 1.387939453125, 1.5267333984375, 1.66552734375, 1.8043212890625, 1.943115234375, 2.0819091796875, 2.220703125, 2.3594970703125, 2.498291015625, 2.6370849609375, 2.77587890625, 2.9146728515625, 3.053466796875, 3.1922607421875, 3.3310546875, 3.4698486328125, 3.608642578125, 3.7474365234375, 3.88623046875, 4.0250244140625, 4.163818359375, 4.3026123046875, 4.44140625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 11.0, 8.0, 3.0, 7.0, 5.0, 17.0, 11.0, 19.0, 22.0, 27.0, 17.0, 31.0, 18.0, 40.0, 30.0, 29.0, 34.0, 40.0, 39.0, 46.0, 54.0, 46.0, 54.0, 44.0, 35.0, 41.0, 37.0, 39.0, 28.0, 28.0, 26.0, 17.0, 20.0, 13.0, 13.0, 12.0, 9.0, 6.0, 14.0, 2.0, 4.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.53125, -33.28125, -32.03125, -30.78125, -29.53125, -28.28125, -27.03125, -25.78125, -24.53125, -23.28125, -22.03125, -20.78125, -19.53125, -18.28125, -17.03125, -15.78125, -14.53125, -13.28125, -12.03125, -10.78125, -9.53125, -8.28125, -7.03125, -5.78125, -4.53125, -3.28125, -2.03125, -0.78125, 0.46875, 1.71875, 2.96875, 4.21875, 5.46875, 6.71875, 7.96875, 9.21875, 10.46875, 11.71875, 12.96875, 14.21875, 15.46875, 16.71875, 17.96875, 19.21875, 20.46875, 21.71875, 22.96875, 24.21875, 25.46875, 26.71875, 27.96875, 29.21875, 30.46875, 31.71875, 32.96875, 34.21875, 35.46875, 36.71875, 37.96875, 39.21875, 40.46875, 41.71875, 42.96875, 44.21875, 45.46875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 8.0, 6.0, 7.0, 10.0, 19.0, 31.0, 47.0, 55.0, 100.0, 137.0, 205.0, 326.0, 525.0, 840.0, 1340.0, 2110.0, 3548.0, 6659.0, 12307.0, 23015.0, 45199.0, 94378.0, 233184.0, 344640.0, 145189.0, 64656.0, 32124.0, 16739.0, 9014.0, 4940.0, 2822.0, 1695.0, 983.0, 598.0, 366.0, 251.0, 174.0, 99.0, 71.0, 42.0, 38.0, 22.0, 16.0, 6.0, 7.0, 3.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6875, -5.51116943359375, -5.3348388671875, -5.15850830078125, -4.982177734375, -4.80584716796875, -4.6295166015625, -4.45318603515625, -4.27685546875, -4.10052490234375, -3.9241943359375, -3.74786376953125, -3.571533203125, -3.39520263671875, -3.2188720703125, -3.04254150390625, -2.8662109375, -2.68988037109375, -2.5135498046875, -2.33721923828125, -2.160888671875, -1.98455810546875, -1.8082275390625, -1.63189697265625, -1.45556640625, -1.27923583984375, -1.1029052734375, -0.92657470703125, -0.750244140625, -0.57391357421875, -0.3975830078125, -0.22125244140625, -0.044921875, 0.13140869140625, 0.3077392578125, 0.48406982421875, 0.660400390625, 0.83673095703125, 1.0130615234375, 1.18939208984375, 1.36572265625, 1.54205322265625, 1.7183837890625, 1.89471435546875, 2.071044921875, 2.24737548828125, 2.4237060546875, 2.60003662109375, 2.7763671875, 2.95269775390625, 3.1290283203125, 3.30535888671875, 3.481689453125, 3.65802001953125, 3.8343505859375, 4.01068115234375, 4.18701171875, 4.36334228515625, 4.5396728515625, 4.71600341796875, 4.892333984375, 5.06866455078125, 5.2449951171875, 5.42132568359375, 5.59765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 10.0, 1.0, 4.0, 7.0, 9.0, 9.0, 14.0, 8.0, 10.0, 25.0, 28.0, 24.0, 20.0, 24.0, 25.0, 26.0, 39.0, 34.0, 24.0, 43.0, 25.0, 45.0, 17.0, 44.0, 30.0, 40.0, 37.0, 38.0, 20.0, 46.0, 29.0, 38.0, 27.0, 22.0, 20.0, 19.0, 18.0, 17.0, 12.0, 18.0, 8.0, 13.0, 5.0, 5.0, 8.0, 6.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-23.703125, -22.99462890625, -22.2861328125, -21.57763671875, -20.869140625, -20.16064453125, -19.4521484375, -18.74365234375, -18.03515625, -17.32666015625, -16.6181640625, -15.90966796875, -15.201171875, -14.49267578125, -13.7841796875, -13.07568359375, -12.3671875, -11.65869140625, -10.9501953125, -10.24169921875, -9.533203125, -8.82470703125, -8.1162109375, -7.40771484375, -6.69921875, -5.99072265625, -5.2822265625, -4.57373046875, -3.865234375, -3.15673828125, -2.4482421875, -1.73974609375, -1.03125, -0.32275390625, 0.3857421875, 1.09423828125, 1.802734375, 2.51123046875, 3.2197265625, 3.92822265625, 4.63671875, 5.34521484375, 6.0537109375, 6.76220703125, 7.470703125, 8.17919921875, 8.8876953125, 9.59619140625, 10.3046875, 11.01318359375, 11.7216796875, 12.43017578125, 13.138671875, 13.84716796875, 14.5556640625, 15.26416015625, 15.97265625, 16.68115234375, 17.3896484375, 18.09814453125, 18.806640625, 19.51513671875, 20.2236328125, 20.93212890625, 21.640625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 6.0, 3.0, 10.0, 5.0, 12.0, 14.0, 18.0, 21.0, 33.0, 33.0, 39.0, 61.0, 73.0, 94.0, 134.0, 197.0, 287.0, 394.0, 568.0, 838.0, 1311.0, 2125.0, 3843.0, 7865.0, 19760.0, 73609.0, 461023.0, 379424.0, 62283.0, 17967.0, 7081.0, 3579.0, 2010.0, 1207.0, 779.0, 553.0, 368.0, 239.0, 206.0, 128.0, 86.0, 78.0, 51.0, 52.0, 22.0, 19.0, 10.0, 12.0, 9.0, 6.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.171875, -1.13519287109375, -1.0985107421875, -1.06182861328125, -1.025146484375, -0.98846435546875, -0.9517822265625, -0.91510009765625, -0.87841796875, -0.84173583984375, -0.8050537109375, -0.76837158203125, -0.731689453125, -0.69500732421875, -0.6583251953125, -0.62164306640625, -0.5849609375, -0.54827880859375, -0.5115966796875, -0.47491455078125, -0.438232421875, -0.40155029296875, -0.3648681640625, -0.32818603515625, -0.29150390625, -0.25482177734375, -0.2181396484375, -0.18145751953125, -0.144775390625, -0.10809326171875, -0.0714111328125, -0.03472900390625, 0.001953125, 0.03863525390625, 0.0753173828125, 0.11199951171875, 0.148681640625, 0.18536376953125, 0.2220458984375, 0.25872802734375, 0.29541015625, 0.33209228515625, 0.3687744140625, 0.40545654296875, 0.442138671875, 0.47882080078125, 0.5155029296875, 0.55218505859375, 0.5888671875, 0.62554931640625, 0.6622314453125, 0.69891357421875, 0.735595703125, 0.77227783203125, 0.8089599609375, 0.84564208984375, 0.88232421875, 0.91900634765625, 0.9556884765625, 0.99237060546875, 1.029052734375, 1.06573486328125, 1.1024169921875, 1.13909912109375, 1.17578125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 3.0, 0.0, 3.0, 5.0, 5.0, 3.0, 4.0, 7.0, 14.0, 12.0, 23.0, 30.0, 37.0, 58.0, 67.0, 69.0, 81.0, 90.0, 98.0, 82.0, 72.0, 57.0, 38.0, 34.0, 26.0, 14.0, 18.0, 12.0, 14.0, 4.0, 10.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.071826934814453e-05, -8.78702849149704e-05, -8.502230048179626e-05, -8.217431604862213e-05, -7.9326331615448e-05, -7.647834718227386e-05, -7.363036274909973e-05, -7.07823783159256e-05, -6.793439388275146e-05, -6.508640944957733e-05, -6.22384250164032e-05, -5.9390440583229065e-05, -5.654245615005493e-05, -5.36944717168808e-05, -5.0846487283706665e-05, -4.799850285053253e-05, -4.51505184173584e-05, -4.2302533984184265e-05, -3.945454955101013e-05, -3.6606565117836e-05, -3.3758580684661865e-05, -3.091059625148773e-05, -2.80626118183136e-05, -2.5214627385139465e-05, -2.2366642951965332e-05, -1.95186585187912e-05, -1.6670674085617065e-05, -1.3822689652442932e-05, -1.0974705219268799e-05, -8.126720786094666e-06, -5.278736352920532e-06, -2.430751919746399e-06, 4.172325134277344e-07, 3.2652169466018677e-06, 6.113201379776001e-06, 8.961185812950134e-06, 1.1809170246124268e-05, 1.4657154679298401e-05, 1.7505139112472534e-05, 2.0353123545646667e-05, 2.32011079788208e-05, 2.6049092411994934e-05, 2.8897076845169067e-05, 3.17450612783432e-05, 3.4593045711517334e-05, 3.744103014469147e-05, 4.02890145778656e-05, 4.3136999011039734e-05, 4.598498344421387e-05, 4.8832967877388e-05, 5.1680952310562134e-05, 5.452893674373627e-05, 5.73769211769104e-05, 6.0224905610084534e-05, 6.307289004325867e-05, 6.59208744764328e-05, 6.876885890960693e-05, 7.161684334278107e-05, 7.44648277759552e-05, 7.731281220912933e-05, 8.016079664230347e-05, 8.30087810754776e-05, 8.585676550865173e-05, 8.870474994182587e-05, 9.1552734375e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 17.0, 12.0, 23.0, 26.0, 46.0, 64.0, 102.0, 166.0, 229.0, 361.0, 536.0, 833.0, 1293.0, 2102.0, 3377.0, 5598.0, 8912.0, 14729.0, 24227.0, 40981.0, 70465.0, 131274.0, 264298.0, 220105.0, 108896.0, 60369.0, 35129.0, 20974.0, 12656.0, 7749.0, 4739.0, 3034.0, 1860.0, 1198.0, 714.0, 515.0, 323.0, 199.0, 128.0, 92.0, 66.0, 44.0, 35.0, 17.0, 17.0, 7.0, 7.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0986328125, -1.06414794921875, -1.0296630859375, -0.99517822265625, -0.960693359375, -0.92620849609375, -0.8917236328125, -0.85723876953125, -0.82275390625, -0.78826904296875, -0.7537841796875, -0.71929931640625, -0.684814453125, -0.65032958984375, -0.6158447265625, -0.58135986328125, -0.546875, -0.51239013671875, -0.4779052734375, -0.44342041015625, -0.408935546875, -0.37445068359375, -0.3399658203125, -0.30548095703125, -0.27099609375, -0.23651123046875, -0.2020263671875, -0.16754150390625, -0.133056640625, -0.09857177734375, -0.0640869140625, -0.02960205078125, 0.0048828125, 0.03936767578125, 0.0738525390625, 0.10833740234375, 0.142822265625, 0.17730712890625, 0.2117919921875, 0.24627685546875, 0.28076171875, 0.31524658203125, 0.3497314453125, 0.38421630859375, 0.418701171875, 0.45318603515625, 0.4876708984375, 0.52215576171875, 0.556640625, 0.59112548828125, 0.6256103515625, 0.66009521484375, 0.694580078125, 0.72906494140625, 0.7635498046875, 0.79803466796875, 0.83251953125, 0.86700439453125, 0.9014892578125, 0.93597412109375, 0.970458984375, 1.00494384765625, 1.0394287109375, 1.07391357421875, 1.1083984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 8.0, 3.0, 2.0, 9.0, 4.0, 8.0, 7.0, 23.0, 18.0, 15.0, 23.0, 31.0, 32.0, 48.0, 35.0, 32.0, 42.0, 40.0, 44.0, 40.0, 22.0, 36.0, 36.0, 35.0, 44.0, 37.0, 32.0, 29.0, 41.0, 37.0, 32.0, 26.0, 23.0, 21.0, 21.0, 7.0, 15.0, 8.0, 4.0, 11.0, 3.0, 6.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.68603515625, -0.6642074584960938, -0.6423797607421875, -0.6205520629882812, -0.598724365234375, -0.5768966674804688, -0.5550689697265625, -0.5332412719726562, -0.51141357421875, -0.48958587646484375, -0.4677581787109375, -0.44593048095703125, -0.424102783203125, -0.40227508544921875, -0.3804473876953125, -0.35861968994140625, -0.3367919921875, -0.31496429443359375, -0.2931365966796875, -0.27130889892578125, -0.249481201171875, -0.22765350341796875, -0.2058258056640625, -0.18399810791015625, -0.16217041015625, -0.14034271240234375, -0.1185150146484375, -0.09668731689453125, -0.074859619140625, -0.05303192138671875, -0.0312042236328125, -0.00937652587890625, 0.012451171875, 0.03427886962890625, 0.0561065673828125, 0.07793426513671875, 0.099761962890625, 0.12158966064453125, 0.1434173583984375, 0.16524505615234375, 0.18707275390625, 0.20890045166015625, 0.2307281494140625, 0.25255584716796875, 0.274383544921875, 0.29621124267578125, 0.3180389404296875, 0.33986663818359375, 0.3616943359375, 0.38352203369140625, 0.4053497314453125, 0.42717742919921875, 0.449005126953125, 0.47083282470703125, 0.4926605224609375, 0.5144882202148438, 0.53631591796875, 0.5581436157226562, 0.5799713134765625, 0.6017990112304688, 0.623626708984375, 0.6454544067382812, 0.6672821044921875, 0.6891098022460938, 0.7109375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 7.0, 3.0, 7.0, 8.0, 15.0, 14.0, 15.0, 29.0, 28.0, 22.0, 32.0, 32.0, 34.0, 40.0, 33.0, 42.0, 47.0, 58.0, 45.0, 41.0, 39.0, 51.0, 28.0, 33.0, 42.0, 39.0, 28.0, 25.0, 23.0, 17.0, 21.0, 14.0, 6.0, 12.0, 12.0, 4.0, 11.0, 9.0, 7.0, 8.0, 5.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0], "bins": [-25.356735229492188, -24.57654571533203, -23.796358108520508, -23.01616859436035, -22.235979080200195, -21.455791473388672, -20.675601959228516, -19.89541244506836, -19.115222930908203, -18.335033416748047, -17.554845809936523, -16.774656295776367, -15.994466781616211, -15.214278221130371, -14.434089660644531, -13.653900146484375, -12.873712539672852, -12.093523979187012, -11.313334465026855, -10.533145904541016, -9.75295639038086, -8.97276782989502, -8.19257926940918, -7.412390232086182, -6.632201194763184, -5.8520121574401855, -5.0718231201171875, -4.291634559631348, -3.5114455223083496, -2.7312564849853516, -1.9510679244995117, -1.1708788871765137, -0.3906898498535156, 0.38949906826019287, 1.1696879863739014, 1.9498767852783203, 2.7300658226013184, 3.5102548599243164, 4.290443420410156, 5.070632457733154, 5.850821495056152, 6.63101053237915, 7.411199569702148, 8.191388130187988, 8.971576690673828, 9.751766204833984, 10.531954765319824, 11.312143325805664, 12.09233283996582, 12.87252140045166, 13.652710914611816, 14.432899475097656, 15.213088989257812, 15.993277549743652, 16.773466110229492, 17.55365562438965, 18.333843231201172, 19.114032745361328, 19.89422035217285, 20.674409866333008, 21.454599380493164, 22.234786987304688, 23.014976501464844, 23.795166015625, 24.575355529785156]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 9.0, 9.0, 3.0, 7.0, 8.0, 14.0, 13.0, 19.0, 27.0, 25.0, 17.0, 23.0, 30.0, 39.0, 26.0, 28.0, 40.0, 36.0, 39.0, 49.0, 50.0, 52.0, 47.0, 44.0, 43.0, 34.0, 38.0, 41.0, 21.0, 30.0, 26.0, 19.0, 18.0, 13.0, 18.0, 5.0, 11.0, 5.0, 12.0, 3.0, 4.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.350311279296875, -33.10089111328125, -31.851470947265625, -30.602048873901367, -29.352628707885742, -28.103208541870117, -26.85378646850586, -25.604366302490234, -24.35494613647461, -23.105525970458984, -21.85610580444336, -20.6066837310791, -19.357263565063477, -18.10784339904785, -16.858421325683594, -15.609001159667969, -14.359580993652344, -13.110160827636719, -11.860739707946777, -10.611318588256836, -9.361898422241211, -8.112478256225586, -6.8630571365356445, -5.613636016845703, -4.364215850830078, -3.114795207977295, -1.8653745651245117, -0.6159539222717285, 0.6334667205810547, 1.882887363433838, 3.132308006286621, 4.3817291259765625, 5.631145477294922, 6.880566120147705, 8.129986763000488, 9.37940788269043, 10.628828048706055, 11.87824821472168, 13.127669334411621, 14.377090454101562, 15.626510620117188, 16.875930786132812, 18.125350952148438, 19.374773025512695, 20.62419319152832, 21.873613357543945, 23.123035430908203, 24.372455596923828, 25.621875762939453, 26.871295928955078, 28.120716094970703, 29.37013816833496, 30.619558334350586, 31.86897850036621, 33.11840057373047, 34.367820739746094, 35.61724090576172, 36.866661071777344, 38.11608123779297, 39.365501403808594, 40.61492156982422, 41.86434555053711, 43.113765716552734, 44.36318588256836, 45.612606048583984]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 7.0, 6.0, 7.0, 16.0, 26.0, 30.0, 45.0, 86.0, 130.0, 185.0, 310.0, 464.0, 727.0, 1239.0, 1930.0, 3078.0, 4985.0, 8371.0, 13626.0, 22279.0, 35698.0, 54563.0, 78687.0, 104799.0, 127010.0, 135149.0, 126442.0, 104709.0, 77909.0, 54019.0, 34981.0, 22039.0, 13584.0, 8286.0, 4940.0, 2995.0, 1919.0, 1214.0, 744.0, 477.0, 288.0, 223.0, 131.0, 66.0, 54.0, 32.0, 25.0, 11.0, 10.0, 6.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-19.453125, -18.770263671875, -18.08740234375, -17.404541015625, -16.7216796875, -16.038818359375, -15.35595703125, -14.673095703125, -13.990234375, -13.307373046875, -12.62451171875, -11.941650390625, -11.2587890625, -10.575927734375, -9.89306640625, -9.210205078125, -8.52734375, -7.844482421875, -7.16162109375, -6.478759765625, -5.7958984375, -5.113037109375, -4.43017578125, -3.747314453125, -3.064453125, -2.381591796875, -1.69873046875, -1.015869140625, -0.3330078125, 0.349853515625, 1.03271484375, 1.715576171875, 2.3984375, 3.081298828125, 3.76416015625, 4.447021484375, 5.1298828125, 5.812744140625, 6.49560546875, 7.178466796875, 7.861328125, 8.544189453125, 9.22705078125, 9.909912109375, 10.5927734375, 11.275634765625, 11.95849609375, 12.641357421875, 13.32421875, 14.007080078125, 14.68994140625, 15.372802734375, 16.0556640625, 16.738525390625, 17.42138671875, 18.104248046875, 18.787109375, 19.469970703125, 20.15283203125, 20.835693359375, 21.5185546875, 22.201416015625, 22.88427734375, 23.567138671875, 24.25]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 10.0, 7.0, 4.0, 7.0, 6.0, 16.0, 13.0, 21.0, 26.0, 25.0, 15.0, 27.0, 30.0, 33.0, 28.0, 31.0, 38.0, 36.0, 43.0, 51.0, 49.0, 50.0, 46.0, 45.0, 41.0, 42.0, 34.0, 40.0, 21.0, 31.0, 23.0, 18.0, 17.0, 12.0, 18.0, 7.0, 11.0, 6.0, 10.0, 3.0, 4.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.5, -32.2783203125, -31.056640625, -29.8349609375, -28.61328125, -27.3916015625, -26.169921875, -24.9482421875, -23.7265625, -22.5048828125, -21.283203125, -20.0615234375, -18.83984375, -17.6181640625, -16.396484375, -15.1748046875, -13.953125, -12.7314453125, -11.509765625, -10.2880859375, -9.06640625, -7.8447265625, -6.623046875, -5.4013671875, -4.1796875, -2.9580078125, -1.736328125, -0.5146484375, 0.70703125, 1.9287109375, 3.150390625, 4.3720703125, 5.59375, 6.8154296875, 8.037109375, 9.2587890625, 10.48046875, 11.7021484375, 12.923828125, 14.1455078125, 15.3671875, 16.5888671875, 17.810546875, 19.0322265625, 20.25390625, 21.4755859375, 22.697265625, 23.9189453125, 25.140625, 26.3623046875, 27.583984375, 28.8056640625, 30.02734375, 31.2490234375, 32.470703125, 33.6923828125, 34.9140625, 36.1357421875, 37.357421875, 38.5791015625, 39.80078125, 41.0224609375, 42.244140625, 43.4658203125, 44.6875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 6.0, 9.0, 8.0, 15.0, 22.0, 31.0, 51.0, 88.0, 150.0, 167.0, 314.0, 418.0, 712.0, 1046.0, 1667.0, 2754.0, 4425.0, 7310.0, 12171.0, 19916.0, 32614.0, 50782.0, 75944.0, 104970.0, 130066.0, 141420.0, 132664.0, 107755.0, 79110.0, 53702.0, 34042.0, 21124.0, 12769.0, 7720.0, 4661.0, 2845.0, 1798.0, 1132.0, 719.0, 519.0, 261.0, 218.0, 152.0, 93.0, 62.0, 49.0, 23.0, 21.0, 18.0, 11.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0], "bins": [-24.59375, -23.86083984375, -23.1279296875, -22.39501953125, -21.662109375, -20.92919921875, -20.1962890625, -19.46337890625, -18.73046875, -17.99755859375, -17.2646484375, -16.53173828125, -15.798828125, -15.06591796875, -14.3330078125, -13.60009765625, -12.8671875, -12.13427734375, -11.4013671875, -10.66845703125, -9.935546875, -9.20263671875, -8.4697265625, -7.73681640625, -7.00390625, -6.27099609375, -5.5380859375, -4.80517578125, -4.072265625, -3.33935546875, -2.6064453125, -1.87353515625, -1.140625, -0.40771484375, 0.3251953125, 1.05810546875, 1.791015625, 2.52392578125, 3.2568359375, 3.98974609375, 4.72265625, 5.45556640625, 6.1884765625, 6.92138671875, 7.654296875, 8.38720703125, 9.1201171875, 9.85302734375, 10.5859375, 11.31884765625, 12.0517578125, 12.78466796875, 13.517578125, 14.25048828125, 14.9833984375, 15.71630859375, 16.44921875, 17.18212890625, 17.9150390625, 18.64794921875, 19.380859375, 20.11376953125, 20.8466796875, 21.57958984375, 22.3125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 7.0, 4.0, 5.0, 9.0, 15.0, 8.0, 13.0, 8.0, 16.0, 15.0, 23.0, 29.0, 20.0, 30.0, 24.0, 25.0, 29.0, 26.0, 37.0, 46.0, 45.0, 40.0, 43.0, 55.0, 46.0, 37.0, 40.0, 28.0, 53.0, 37.0, 26.0, 24.0, 25.0, 21.0, 15.0, 20.0, 13.0, 13.0, 5.0, 5.0, 8.0, 4.0, 3.0, 4.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.234375, -23.434814453125, -22.63525390625, -21.835693359375, -21.0361328125, -20.236572265625, -19.43701171875, -18.637451171875, -17.837890625, -17.038330078125, -16.23876953125, -15.439208984375, -14.6396484375, -13.840087890625, -13.04052734375, -12.240966796875, -11.44140625, -10.641845703125, -9.84228515625, -9.042724609375, -8.2431640625, -7.443603515625, -6.64404296875, -5.844482421875, -5.044921875, -4.245361328125, -3.44580078125, -2.646240234375, -1.8466796875, -1.047119140625, -0.24755859375, 0.552001953125, 1.3515625, 2.151123046875, 2.95068359375, 3.750244140625, 4.5498046875, 5.349365234375, 6.14892578125, 6.948486328125, 7.748046875, 8.547607421875, 9.34716796875, 10.146728515625, 10.9462890625, 11.745849609375, 12.54541015625, 13.344970703125, 14.14453125, 14.944091796875, 15.74365234375, 16.543212890625, 17.3427734375, 18.142333984375, 18.94189453125, 19.741455078125, 20.541015625, 21.340576171875, 22.14013671875, 22.939697265625, 23.7392578125, 24.538818359375, 25.33837890625, 26.137939453125, 26.9375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 15.0, 5.0, 10.0, 16.0, 24.0, 33.0, 64.0, 84.0, 102.0, 186.0, 252.0, 364.0, 613.0, 933.0, 1445.0, 2270.0, 3672.0, 5922.0, 9382.0, 15118.0, 24283.0, 38316.0, 58938.0, 84795.0, 110471.0, 130231.0, 135307.0, 123041.0, 98646.0, 72294.0, 48553.0, 30978.0, 19578.0, 12311.0, 7491.0, 4614.0, 2956.0, 1855.0, 1154.0, 768.0, 473.0, 338.0, 214.0, 148.0, 96.0, 70.0, 46.0, 27.0, 21.0, 12.0, 9.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.36328125, -6.16607666015625, -5.9688720703125, -5.77166748046875, -5.574462890625, -5.37725830078125, -5.1800537109375, -4.98284912109375, -4.78564453125, -4.58843994140625, -4.3912353515625, -4.19403076171875, -3.996826171875, -3.79962158203125, -3.6024169921875, -3.40521240234375, -3.2080078125, -3.01080322265625, -2.8135986328125, -2.61639404296875, -2.419189453125, -2.22198486328125, -2.0247802734375, -1.82757568359375, -1.63037109375, -1.43316650390625, -1.2359619140625, -1.03875732421875, -0.841552734375, -0.64434814453125, -0.4471435546875, -0.24993896484375, -0.052734375, 0.14447021484375, 0.3416748046875, 0.53887939453125, 0.736083984375, 0.93328857421875, 1.1304931640625, 1.32769775390625, 1.52490234375, 1.72210693359375, 1.9193115234375, 2.11651611328125, 2.313720703125, 2.51092529296875, 2.7081298828125, 2.90533447265625, 3.1025390625, 3.29974365234375, 3.4969482421875, 3.69415283203125, 3.891357421875, 4.08856201171875, 4.2857666015625, 4.48297119140625, 4.68017578125, 4.87738037109375, 5.0745849609375, 5.27178955078125, 5.468994140625, 5.66619873046875, 5.8634033203125, 6.06060791015625, 6.2578125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 11.0, 5.0, 9.0, 14.0, 14.0, 9.0, 13.0, 28.0, 22.0, 28.0, 39.0, 46.0, 36.0, 44.0, 46.0, 45.0, 67.0, 41.0, 72.0, 56.0, 47.0, 47.0, 40.0, 38.0, 52.0, 21.0, 32.0, 15.0, 21.0, 6.0, 10.0, 9.0, 8.0, 3.0, 7.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006341934204101562, -0.0006134212017059326, -0.000592648983001709, -0.0005718767642974854, -0.0005511045455932617, -0.0005303323268890381, -0.0005095601081848145, -0.0004887878894805908, -0.0004680156707763672, -0.00044724345207214355, -0.0004264712333679199, -0.0004056990146636963, -0.00038492679595947266, -0.000364154577255249, -0.0003433823585510254, -0.00032261013984680176, -0.0003018379211425781, -0.0002810657024383545, -0.00026029348373413086, -0.00023952126502990723, -0.0002187490463256836, -0.00019797682762145996, -0.00017720460891723633, -0.0001564323902130127, -0.00013566017150878906, -0.00011488795280456543, -9.41157341003418e-05, -7.334351539611816e-05, -5.257129669189453e-05, -3.17990779876709e-05, -1.1026859283447266e-05, 9.745359420776367e-06, 3.0517578125e-05, 5.128979682922363e-05, 7.206201553344727e-05, 9.28342342376709e-05, 0.00011360645294189453, 0.00013437867164611816, 0.0001551508903503418, 0.00017592310905456543, 0.00019669532775878906, 0.0002174675464630127, 0.00023823976516723633, 0.00025901198387145996, 0.0002797842025756836, 0.0003005564212799072, 0.00032132863998413086, 0.0003421008586883545, 0.0003628730773925781, 0.00038364529609680176, 0.0004044175148010254, 0.000425189733505249, 0.00044596195220947266, 0.0004667341709136963, 0.0004875063896179199, 0.0005082786083221436, 0.0005290508270263672, 0.0005498230457305908, 0.0005705952644348145, 0.0005913674831390381, 0.0006121397018432617, 0.0006329119205474854, 0.000653684139251709, 0.0006744563579559326, 0.0006952285766601562]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 8.0, 13.0, 15.0, 20.0, 45.0, 53.0, 79.0, 112.0, 155.0, 218.0, 314.0, 537.0, 794.0, 1117.0, 1676.0, 2762.0, 4189.0, 6831.0, 11174.0, 18482.0, 31104.0, 51782.0, 82291.0, 119996.0, 151117.0, 158146.0, 136953.0, 100587.0, 66158.0, 40130.0, 23931.0, 14245.0, 8472.0, 5332.0, 3396.0, 2008.0, 1389.0, 952.0, 627.0, 429.0, 303.0, 184.0, 127.0, 100.0, 62.0, 46.0, 41.0, 20.0, 12.0, 8.0, 10.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-8.171875, -7.91845703125, -7.6650390625, -7.41162109375, -7.158203125, -6.90478515625, -6.6513671875, -6.39794921875, -6.14453125, -5.89111328125, -5.6376953125, -5.38427734375, -5.130859375, -4.87744140625, -4.6240234375, -4.37060546875, -4.1171875, -3.86376953125, -3.6103515625, -3.35693359375, -3.103515625, -2.85009765625, -2.5966796875, -2.34326171875, -2.08984375, -1.83642578125, -1.5830078125, -1.32958984375, -1.076171875, -0.82275390625, -0.5693359375, -0.31591796875, -0.0625, 0.19091796875, 0.4443359375, 0.69775390625, 0.951171875, 1.20458984375, 1.4580078125, 1.71142578125, 1.96484375, 2.21826171875, 2.4716796875, 2.72509765625, 2.978515625, 3.23193359375, 3.4853515625, 3.73876953125, 3.9921875, 4.24560546875, 4.4990234375, 4.75244140625, 5.005859375, 5.25927734375, 5.5126953125, 5.76611328125, 6.01953125, 6.27294921875, 6.5263671875, 6.77978515625, 7.033203125, 7.28662109375, 7.5400390625, 7.79345703125, 8.046875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 5.0, 5.0, 6.0, 6.0, 4.0, 12.0, 12.0, 19.0, 22.0, 22.0, 38.0, 51.0, 59.0, 75.0, 73.0, 87.0, 85.0, 67.0, 58.0, 57.0, 44.0, 44.0, 31.0, 26.0, 20.0, 19.0, 12.0, 6.0, 5.0, 8.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.21875, -5.0557861328125, -4.892822265625, -4.7298583984375, -4.56689453125, -4.4039306640625, -4.240966796875, -4.0780029296875, -3.9150390625, -3.7520751953125, -3.589111328125, -3.4261474609375, -3.26318359375, -3.1002197265625, -2.937255859375, -2.7742919921875, -2.611328125, -2.4483642578125, -2.285400390625, -2.1224365234375, -1.95947265625, -1.7965087890625, -1.633544921875, -1.4705810546875, -1.3076171875, -1.1446533203125, -0.981689453125, -0.8187255859375, -0.65576171875, -0.4927978515625, -0.329833984375, -0.1668701171875, -0.00390625, 0.1590576171875, 0.322021484375, 0.4849853515625, 0.64794921875, 0.8109130859375, 0.973876953125, 1.1368408203125, 1.2998046875, 1.4627685546875, 1.625732421875, 1.7886962890625, 1.95166015625, 2.1146240234375, 2.277587890625, 2.4405517578125, 2.603515625, 2.7664794921875, 2.929443359375, 3.0924072265625, 3.25537109375, 3.4183349609375, 3.581298828125, 3.7442626953125, 3.9072265625, 4.0701904296875, 4.233154296875, 4.3961181640625, 4.55908203125, 4.7220458984375, 4.885009765625, 5.0479736328125, 5.2109375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 3.0, 8.0, 1.0, 14.0, 16.0, 14.0, 12.0, 23.0, 30.0, 32.0, 25.0, 41.0, 41.0, 42.0, 48.0, 39.0, 40.0, 55.0, 38.0, 43.0, 48.0, 49.0, 38.0, 42.0, 29.0, 42.0, 25.0, 28.0, 25.0, 18.0, 14.0, 10.0, 14.0, 4.0, 11.0, 4.0, 7.0, 8.0, 4.0, 5.0, 3.0, 3.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-26.093250274658203, -25.272445678710938, -24.451641082763672, -23.630836486816406, -22.810033798217773, -21.989229202270508, -21.168424606323242, -20.347620010375977, -19.526817321777344, -18.706012725830078, -17.885208129882812, -17.064403533935547, -16.243600845336914, -15.422796249389648, -14.601991653442383, -13.781187057495117, -12.960382461547852, -12.139577865600586, -11.318774223327637, -10.497969627380371, -9.677165985107422, -8.856361389160156, -8.03555679321289, -7.214752674102783, -6.393948554992676, -5.573144435882568, -4.752340316772461, -3.9315357208251953, -3.110731601715088, -2.2899274826049805, -1.4691228866577148, -0.6483187675476074, 0.1724834442138672, 0.9932876825332642, 1.8140919208526611, 2.6348962783813477, 3.455700397491455, 4.2765045166015625, 5.097309112548828, 5.9181132316589355, 6.738917350769043, 7.55972146987915, 8.380525588989258, 9.201330184936523, 10.022134780883789, 10.842938423156738, 11.663743019104004, 12.484546661376953, 13.305351257324219, 14.126155853271484, 14.946959495544434, 15.7677640914917, 16.58856773376465, 17.409372329711914, 18.23017692565918, 19.050981521606445, 19.871784210205078, 20.692588806152344, 21.51339340209961, 22.334197998046875, 23.155000686645508, 23.975805282592773, 24.79660987854004, 25.617414474487305, 26.43821907043457]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 1.0, 5.0, 6.0, 5.0, 9.0, 10.0, 10.0, 14.0, 14.0, 12.0, 19.0, 25.0, 16.0, 20.0, 30.0, 27.0, 26.0, 35.0, 27.0, 42.0, 40.0, 42.0, 44.0, 38.0, 45.0, 35.0, 43.0, 42.0, 30.0, 31.0, 43.0, 27.0, 24.0, 26.0, 26.0, 18.0, 22.0, 10.0, 16.0, 8.0, 13.0, 3.0, 6.0, 7.0, 2.0, 5.0, 3.0, 2.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.659465789794922, -30.462419509887695, -29.265371322631836, -28.06832504272461, -26.87127685546875, -25.674230575561523, -24.477184295654297, -23.280136108398438, -22.08308982849121, -20.886043548583984, -19.688995361328125, -18.4919490814209, -17.294902801513672, -16.097854614257812, -14.900808334350586, -13.703761100769043, -12.5067138671875, -11.309666633605957, -10.112619400024414, -8.915573120117188, -7.7185258865356445, -6.521478652954102, -5.324431896209717, -4.127385139465332, -2.930337905883789, -1.7332909107208252, -0.5362439155578613, 0.6608030796051025, 1.8578500747680664, 3.0548973083496094, 4.251944065093994, 5.448990821838379, 6.6460418701171875, 7.8430891036987305, 9.040136337280273, 10.2371826171875, 11.434229850769043, 12.631277084350586, 13.828323364257812, 15.025370597839355, 16.2224178314209, 17.419464111328125, 18.616512298583984, 19.81355857849121, 21.010604858398438, 22.207653045654297, 23.404699325561523, 24.60174560546875, 25.79879379272461, 26.995840072631836, 28.192888259887695, 29.389934539794922, 30.58698272705078, 31.784029006958008, 32.981075286865234, 34.178123474121094, 35.37516784667969, 36.57221603393555, 37.76926040649414, 38.96630859375, 40.16335678100586, 41.36040496826172, 42.55744934082031, 43.75449752807617, 44.95154571533203]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 8.0, 11.0, 10.0, 22.0, 44.0, 73.0, 119.0, 167.0, 295.0, 489.0, 774.0, 1360.0, 2069.0, 3393.0, 5279.0, 8310.0, 13250.0, 20587.0, 32106.0, 48843.0, 75428.0, 111451.0, 162269.0, 227732.0, 303391.0, 380049.0, 441205.0, 464856.0, 445886.0, 390007.0, 314659.0, 236628.0, 169136.0, 116785.0, 77359.0, 50871.0, 32659.0, 20826.0, 13271.0, 8408.0, 5269.0, 3224.0, 2123.0, 1319.0, 851.0, 512.0, 316.0, 190.0, 169.0, 92.0, 57.0, 30.0, 22.0, 18.0, 6.0, 4.0, 4.0, 4.0, 0.0, 1.0], "bins": [-20.171875, -19.532470703125, -18.89306640625, -18.253662109375, -17.6142578125, -16.974853515625, -16.33544921875, -15.696044921875, -15.056640625, -14.417236328125, -13.77783203125, -13.138427734375, -12.4990234375, -11.859619140625, -11.22021484375, -10.580810546875, -9.94140625, -9.302001953125, -8.66259765625, -8.023193359375, -7.3837890625, -6.744384765625, -6.10498046875, -5.465576171875, -4.826171875, -4.186767578125, -3.54736328125, -2.907958984375, -2.2685546875, -1.629150390625, -0.98974609375, -0.350341796875, 0.2890625, 0.928466796875, 1.56787109375, 2.207275390625, 2.8466796875, 3.486083984375, 4.12548828125, 4.764892578125, 5.404296875, 6.043701171875, 6.68310546875, 7.322509765625, 7.9619140625, 8.601318359375, 9.24072265625, 9.880126953125, 10.51953125, 11.158935546875, 11.79833984375, 12.437744140625, 13.0771484375, 13.716552734375, 14.35595703125, 14.995361328125, 15.634765625, 16.274169921875, 16.91357421875, 17.552978515625, 18.1923828125, 18.831787109375, 19.47119140625, 20.110595703125, 20.75]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 1.0, 4.0, 9.0, 7.0, 6.0, 8.0, 15.0, 11.0, 12.0, 19.0, 24.0, 15.0, 19.0, 25.0, 29.0, 28.0, 24.0, 41.0, 34.0, 39.0, 43.0, 41.0, 42.0, 43.0, 41.0, 34.0, 48.0, 39.0, 35.0, 30.0, 35.0, 28.0, 20.0, 26.0, 22.0, 23.0, 14.0, 16.0, 10.0, 11.0, 6.0, 5.0, 8.0, 3.0, 2.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.328125, -24.355712890625, -23.38330078125, -22.410888671875, -21.4384765625, -20.466064453125, -19.49365234375, -18.521240234375, -17.548828125, -16.576416015625, -15.60400390625, -14.631591796875, -13.6591796875, -12.686767578125, -11.71435546875, -10.741943359375, -9.76953125, -8.797119140625, -7.82470703125, -6.852294921875, -5.8798828125, -4.907470703125, -3.93505859375, -2.962646484375, -1.990234375, -1.017822265625, -0.04541015625, 0.927001953125, 1.8994140625, 2.871826171875, 3.84423828125, 4.816650390625, 5.7890625, 6.761474609375, 7.73388671875, 8.706298828125, 9.6787109375, 10.651123046875, 11.62353515625, 12.595947265625, 13.568359375, 14.540771484375, 15.51318359375, 16.485595703125, 17.4580078125, 18.430419921875, 19.40283203125, 20.375244140625, 21.34765625, 22.320068359375, 23.29248046875, 24.264892578125, 25.2373046875, 26.209716796875, 27.18212890625, 28.154541015625, 29.126953125, 30.099365234375, 31.07177734375, 32.044189453125, 33.0166015625, 33.989013671875, 34.96142578125, 35.933837890625, 36.90625]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 8.0, 11.0, 22.0, 33.0, 44.0, 81.0, 154.0, 233.0, 461.0, 788.0, 1311.0, 2175.0, 3722.0, 5994.0, 9899.0, 16112.0, 25538.0, 40079.0, 60181.0, 89201.0, 126655.0, 174185.0, 229232.0, 285807.0, 339997.0, 379909.0, 398993.0, 391606.0, 363729.0, 317013.0, 260881.0, 201119.0, 151202.0, 107991.0, 74393.0, 49998.0, 32210.0, 20879.0, 12987.0, 7815.0, 4731.0, 2843.0, 1730.0, 965.0, 573.0, 333.0, 202.0, 118.0, 64.0, 33.0, 23.0, 17.0, 4.0, 6.0, 1.0, 5.0], "bins": [-19.34375, -18.787353515625, -18.23095703125, -17.674560546875, -17.1181640625, -16.561767578125, -16.00537109375, -15.448974609375, -14.892578125, -14.336181640625, -13.77978515625, -13.223388671875, -12.6669921875, -12.110595703125, -11.55419921875, -10.997802734375, -10.44140625, -9.885009765625, -9.32861328125, -8.772216796875, -8.2158203125, -7.659423828125, -7.10302734375, -6.546630859375, -5.990234375, -5.433837890625, -4.87744140625, -4.321044921875, -3.7646484375, -3.208251953125, -2.65185546875, -2.095458984375, -1.5390625, -0.982666015625, -0.42626953125, 0.130126953125, 0.6865234375, 1.242919921875, 1.79931640625, 2.355712890625, 2.912109375, 3.468505859375, 4.02490234375, 4.581298828125, 5.1376953125, 5.694091796875, 6.25048828125, 6.806884765625, 7.36328125, 7.919677734375, 8.47607421875, 9.032470703125, 9.5888671875, 10.145263671875, 10.70166015625, 11.258056640625, 11.814453125, 12.370849609375, 12.92724609375, 13.483642578125, 14.0400390625, 14.596435546875, 15.15283203125, 15.709228515625, 16.265625]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 9.0, 2.0, 7.0, 11.0, 15.0, 24.0, 31.0, 34.0, 30.0, 43.0, 49.0, 70.0, 90.0, 98.0, 115.0, 110.0, 139.0, 162.0, 181.0, 165.0, 184.0, 197.0, 177.0, 182.0, 189.0, 193.0, 180.0, 194.0, 171.0, 136.0, 131.0, 137.0, 112.0, 82.0, 81.0, 62.0, 63.0, 48.0, 37.0, 23.0, 31.0, 26.0, 14.0, 12.0, 9.0, 11.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-12.90625, -12.498779296875, -12.09130859375, -11.683837890625, -11.2763671875, -10.868896484375, -10.46142578125, -10.053955078125, -9.646484375, -9.239013671875, -8.83154296875, -8.424072265625, -8.0166015625, -7.609130859375, -7.20166015625, -6.794189453125, -6.38671875, -5.979248046875, -5.57177734375, -5.164306640625, -4.7568359375, -4.349365234375, -3.94189453125, -3.534423828125, -3.126953125, -2.719482421875, -2.31201171875, -1.904541015625, -1.4970703125, -1.089599609375, -0.68212890625, -0.274658203125, 0.1328125, 0.540283203125, 0.94775390625, 1.355224609375, 1.7626953125, 2.170166015625, 2.57763671875, 2.985107421875, 3.392578125, 3.800048828125, 4.20751953125, 4.614990234375, 5.0224609375, 5.429931640625, 5.83740234375, 6.244873046875, 6.65234375, 7.059814453125, 7.46728515625, 7.874755859375, 8.2822265625, 8.689697265625, 9.09716796875, 9.504638671875, 9.912109375, 10.319580078125, 10.72705078125, 11.134521484375, 11.5419921875, 11.949462890625, 12.35693359375, 12.764404296875, 13.171875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 3.0, 10.0, 8.0, 7.0, 10.0, 13.0, 16.0, 23.0, 20.0, 28.0, 35.0, 31.0, 38.0, 42.0, 33.0, 44.0, 41.0, 57.0, 37.0, 37.0, 36.0, 52.0, 40.0, 36.0, 47.0, 34.0, 25.0, 29.0, 23.0, 18.0, 15.0, 16.0, 26.0, 15.0, 12.0, 10.0, 8.0, 4.0, 5.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-25.832704544067383, -25.061813354492188, -24.290922164916992, -23.520030975341797, -22.749141693115234, -21.97825050354004, -21.207359313964844, -20.43646812438965, -19.665576934814453, -18.894685745239258, -18.123794555664062, -17.3529052734375, -16.582014083862305, -15.81112289428711, -15.040231704711914, -14.269340515136719, -13.498451232910156, -12.727560043334961, -11.956669807434082, -11.185778617858887, -10.414888381958008, -9.643997192382812, -8.873106002807617, -8.102214813232422, -7.331324577331543, -6.560433864593506, -5.789543151855469, -5.018651962280273, -4.247761249542236, -3.476870536804199, -2.705979347229004, -1.9350886344909668, -1.1641960144042969, -0.3933051824569702, 0.37758564949035645, 1.1484766006469727, 1.9193673133850098, 2.690258026123047, 3.461149215698242, 4.232039928436279, 5.002930641174316, 5.7738213539123535, 6.544712066650391, 7.315603256225586, 8.086494445800781, 8.85738468170166, 9.628275871276855, 10.399166107177734, 11.17005729675293, 11.940948486328125, 12.711838722229004, 13.4827299118042, 14.253620147705078, 15.024511337280273, 15.795402526855469, 16.566293716430664, 17.33718490600586, 18.108076095581055, 18.87896728515625, 19.649856567382812, 20.420747756958008, 21.191638946533203, 21.9625301361084, 22.733421325683594, 23.504310607910156]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 3.0, 8.0, 7.0, 6.0, 9.0, 18.0, 16.0, 22.0, 10.0, 22.0, 23.0, 19.0, 24.0, 25.0, 23.0, 41.0, 37.0, 37.0, 40.0, 31.0, 45.0, 33.0, 36.0, 37.0, 39.0, 32.0, 40.0, 32.0, 26.0, 34.0, 25.0, 25.0, 32.0, 23.0, 19.0, 18.0, 14.0, 13.0, 11.0, 8.0, 7.0, 6.0, 7.0, 2.0, 4.0, 0.0, 6.0, 1.0, 1.0, 2.0, 3.0], "bins": [-38.8551139831543, -37.74711990356445, -36.63912582397461, -35.53113555908203, -34.42314147949219, -33.315147399902344, -32.2071533203125, -31.099159240722656, -29.991167068481445, -28.8831729888916, -27.77518081665039, -26.667186737060547, -25.559192657470703, -24.451200485229492, -23.34320640563965, -22.235214233398438, -21.127220153808594, -20.01922607421875, -18.91123390197754, -17.803239822387695, -16.695247650146484, -15.58725357055664, -14.479259490966797, -13.37126636505127, -12.263273239135742, -11.155280113220215, -10.047286987304688, -8.939292907714844, -7.831299781799316, -6.723306655883789, -5.6153130531311035, -4.507319450378418, -3.399322509765625, -2.2913291454315186, -1.183335781097412, -0.07534241676330566, 1.0326509475708008, 2.140644073486328, 3.2486376762390137, 4.356631278991699, 5.464624404907227, 6.572617530822754, 7.6806111335754395, 8.788604736328125, 9.896597862243652, 11.00459098815918, 12.112585067749023, 13.22057819366455, 14.328571319580078, 15.436564445495605, 16.544557571411133, 17.652551651000977, 18.760543823242188, 19.86853790283203, 20.976531982421875, 22.08452606201172, 23.19251823425293, 24.300512313842773, 25.408504486083984, 26.516498565673828, 27.624492645263672, 28.732484817504883, 29.840478897094727, 30.948471069335938, 32.05646514892578]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 5.0, 1.0, 10.0, 7.0, 20.0, 23.0, 21.0, 33.0, 52.0, 59.0, 107.0, 126.0, 227.0, 310.0, 387.0, 610.0, 803.0, 1224.0, 1853.0, 2712.0, 4093.0, 6501.0, 10241.0, 16434.0, 28197.0, 49062.0, 93924.0, 192318.0, 290207.0, 161312.0, 79432.0, 42698.0, 24454.0, 14721.0, 8949.0, 5772.0, 3781.0, 2495.0, 1648.0, 1072.0, 827.0, 562.0, 379.0, 276.0, 176.0, 104.0, 99.0, 75.0, 56.0, 37.0, 22.0, 12.0, 15.0, 8.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 3.0], "bins": [-4.046875, -3.91790771484375, -3.7889404296875, -3.65997314453125, -3.531005859375, -3.40203857421875, -3.2730712890625, -3.14410400390625, -3.01513671875, -2.88616943359375, -2.7572021484375, -2.62823486328125, -2.499267578125, -2.37030029296875, -2.2413330078125, -2.11236572265625, -1.9833984375, -1.85443115234375, -1.7254638671875, -1.59649658203125, -1.467529296875, -1.33856201171875, -1.2095947265625, -1.08062744140625, -0.95166015625, -0.82269287109375, -0.6937255859375, -0.56475830078125, -0.435791015625, -0.30682373046875, -0.1778564453125, -0.04888916015625, 0.080078125, 0.20904541015625, 0.3380126953125, 0.46697998046875, 0.595947265625, 0.72491455078125, 0.8538818359375, 0.98284912109375, 1.11181640625, 1.24078369140625, 1.3697509765625, 1.49871826171875, 1.627685546875, 1.75665283203125, 1.8856201171875, 2.01458740234375, 2.1435546875, 2.27252197265625, 2.4014892578125, 2.53045654296875, 2.659423828125, 2.78839111328125, 2.9173583984375, 3.04632568359375, 3.17529296875, 3.30426025390625, 3.4332275390625, 3.56219482421875, 3.691162109375, 3.82012939453125, 3.9490966796875, 4.07806396484375, 4.20703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 3.0, 8.0, 7.0, 7.0, 9.0, 17.0, 17.0, 21.0, 10.0, 23.0, 22.0, 19.0, 26.0, 23.0, 25.0, 39.0, 37.0, 37.0, 40.0, 34.0, 44.0, 34.0, 36.0, 37.0, 38.0, 34.0, 37.0, 35.0, 23.0, 37.0, 23.0, 23.0, 34.0, 23.0, 19.0, 17.0, 14.0, 12.0, 11.0, 9.0, 6.0, 7.0, 6.0, 2.0, 4.0, 0.0, 6.0, 1.0, 0.0, 3.0, 3.0], "bins": [-38.375, -37.2685546875, -36.162109375, -35.0556640625, -33.94921875, -32.8427734375, -31.736328125, -30.6298828125, -29.5234375, -28.4169921875, -27.310546875, -26.2041015625, -25.09765625, -23.9912109375, -22.884765625, -21.7783203125, -20.671875, -19.5654296875, -18.458984375, -17.3525390625, -16.24609375, -15.1396484375, -14.033203125, -12.9267578125, -11.8203125, -10.7138671875, -9.607421875, -8.5009765625, -7.39453125, -6.2880859375, -5.181640625, -4.0751953125, -2.96875, -1.8623046875, -0.755859375, 0.3505859375, 1.45703125, 2.5634765625, 3.669921875, 4.7763671875, 5.8828125, 6.9892578125, 8.095703125, 9.2021484375, 10.30859375, 11.4150390625, 12.521484375, 13.6279296875, 14.734375, 15.8408203125, 16.947265625, 18.0537109375, 19.16015625, 20.2666015625, 21.373046875, 22.4794921875, 23.5859375, 24.6923828125, 25.798828125, 26.9052734375, 28.01171875, 29.1181640625, 30.224609375, 31.3310546875, 32.4375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 11.0, 15.0, 21.0, 25.0, 39.0, 71.0, 108.0, 170.0, 271.0, 444.0, 740.0, 1146.0, 2071.0, 3830.0, 7246.0, 14312.0, 28890.0, 61768.0, 147746.0, 371355.0, 236196.0, 90045.0, 40790.0, 20041.0, 9491.0, 4954.0, 2739.0, 1578.0, 981.0, 558.0, 326.0, 210.0, 126.0, 84.0, 52.0, 37.0, 20.0, 19.0, 7.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-6.34375, -6.16619873046875, -5.9886474609375, -5.81109619140625, -5.633544921875, -5.45599365234375, -5.2784423828125, -5.10089111328125, -4.92333984375, -4.74578857421875, -4.5682373046875, -4.39068603515625, -4.213134765625, -4.03558349609375, -3.8580322265625, -3.68048095703125, -3.5029296875, -3.32537841796875, -3.1478271484375, -2.97027587890625, -2.792724609375, -2.61517333984375, -2.4376220703125, -2.26007080078125, -2.08251953125, -1.90496826171875, -1.7274169921875, -1.54986572265625, -1.372314453125, -1.19476318359375, -1.0172119140625, -0.83966064453125, -0.662109375, -0.48455810546875, -0.3070068359375, -0.12945556640625, 0.048095703125, 0.22564697265625, 0.4031982421875, 0.58074951171875, 0.75830078125, 0.93585205078125, 1.1134033203125, 1.29095458984375, 1.468505859375, 1.64605712890625, 1.8236083984375, 2.00115966796875, 2.1787109375, 2.35626220703125, 2.5338134765625, 2.71136474609375, 2.888916015625, 3.06646728515625, 3.2440185546875, 3.42156982421875, 3.59912109375, 3.77667236328125, 3.9542236328125, 4.13177490234375, 4.309326171875, 4.48687744140625, 4.6644287109375, 4.84197998046875, 5.01953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 7.0, 8.0, 12.0, 13.0, 22.0, 20.0, 18.0, 27.0, 29.0, 35.0, 33.0, 29.0, 36.0, 37.0, 40.0, 49.0, 47.0, 52.0, 42.0, 46.0, 37.0, 43.0, 30.0, 38.0, 36.0, 33.0, 26.0, 30.0, 23.0, 23.0, 17.0, 13.0, 12.0, 7.0, 10.0, 5.0, 4.0, 3.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-32.65625, -31.787109375, -30.91796875, -30.048828125, -29.1796875, -28.310546875, -27.44140625, -26.572265625, -25.703125, -24.833984375, -23.96484375, -23.095703125, -22.2265625, -21.357421875, -20.48828125, -19.619140625, -18.75, -17.880859375, -17.01171875, -16.142578125, -15.2734375, -14.404296875, -13.53515625, -12.666015625, -11.796875, -10.927734375, -10.05859375, -9.189453125, -8.3203125, -7.451171875, -6.58203125, -5.712890625, -4.84375, -3.974609375, -3.10546875, -2.236328125, -1.3671875, -0.498046875, 0.37109375, 1.240234375, 2.109375, 2.978515625, 3.84765625, 4.716796875, 5.5859375, 6.455078125, 7.32421875, 8.193359375, 9.0625, 9.931640625, 10.80078125, 11.669921875, 12.5390625, 13.408203125, 14.27734375, 15.146484375, 16.015625, 16.884765625, 17.75390625, 18.623046875, 19.4921875, 20.361328125, 21.23046875, 22.099609375, 22.96875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 1.0, 3.0, 7.0, 12.0, 12.0, 13.0, 20.0, 24.0, 29.0, 52.0, 56.0, 102.0, 127.0, 217.0, 298.0, 455.0, 740.0, 1360.0, 2774.0, 6167.0, 17591.0, 65412.0, 347379.0, 479476.0, 89263.0, 22358.0, 7511.0, 3240.0, 1534.0, 829.0, 502.0, 321.0, 191.0, 143.0, 76.0, 78.0, 47.0, 28.0, 30.0, 19.0, 12.0, 12.0, 8.0, 6.0, 9.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.6748046875, -0.6544189453125, -0.634033203125, -0.6136474609375, -0.59326171875, -0.5728759765625, -0.552490234375, -0.5321044921875, -0.51171875, -0.4913330078125, -0.470947265625, -0.4505615234375, -0.43017578125, -0.4097900390625, -0.389404296875, -0.3690185546875, -0.3486328125, -0.3282470703125, -0.307861328125, -0.2874755859375, -0.26708984375, -0.2467041015625, -0.226318359375, -0.2059326171875, -0.185546875, -0.1651611328125, -0.144775390625, -0.1243896484375, -0.10400390625, -0.0836181640625, -0.063232421875, -0.0428466796875, -0.0224609375, -0.0020751953125, 0.018310546875, 0.0386962890625, 0.05908203125, 0.0794677734375, 0.099853515625, 0.1202392578125, 0.140625, 0.1610107421875, 0.181396484375, 0.2017822265625, 0.22216796875, 0.2425537109375, 0.262939453125, 0.2833251953125, 0.3037109375, 0.3240966796875, 0.344482421875, 0.3648681640625, 0.38525390625, 0.4056396484375, 0.426025390625, 0.4464111328125, 0.466796875, 0.4871826171875, 0.507568359375, 0.5279541015625, 0.54833984375, 0.5687255859375, 0.589111328125, 0.6094970703125, 0.6298828125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 14.0, 20.0, 21.0, 46.0, 60.0, 88.0, 120.0, 134.0, 125.0, 99.0, 85.0, 55.0, 38.0, 23.0, 16.0, 10.0, 9.0, 6.0, 4.0, 0.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7816505432128906e-05, -5.5577605962753296e-05, -5.3338706493377686e-05, -5.1099807024002075e-05, -4.8860907554626465e-05, -4.6622008085250854e-05, -4.4383108615875244e-05, -4.2144209146499634e-05, -3.9905309677124023e-05, -3.766641020774841e-05, -3.54275107383728e-05, -3.318861126899719e-05, -3.094971179962158e-05, -2.871081233024597e-05, -2.647191286087036e-05, -2.423301339149475e-05, -2.199411392211914e-05, -1.975521445274353e-05, -1.751631498336792e-05, -1.527741551399231e-05, -1.30385160446167e-05, -1.0799616575241089e-05, -8.560717105865479e-06, -6.321817636489868e-06, -4.082918167114258e-06, -1.8440186977386475e-06, 3.948807716369629e-07, 2.6337802410125732e-06, 4.872679710388184e-06, 7.111579179763794e-06, 9.350478649139404e-06, 1.1589378118515015e-05, 1.3828277587890625e-05, 1.6067177057266235e-05, 1.8306076526641846e-05, 2.0544975996017456e-05, 2.2783875465393066e-05, 2.5022774934768677e-05, 2.7261674404144287e-05, 2.9500573873519897e-05, 3.173947334289551e-05, 3.397837281227112e-05, 3.621727228164673e-05, 3.845617175102234e-05, 4.069507122039795e-05, 4.293397068977356e-05, 4.517287015914917e-05, 4.741176962852478e-05, 4.965066909790039e-05, 5.1889568567276e-05, 5.412846803665161e-05, 5.636736750602722e-05, 5.860626697540283e-05, 6.084516644477844e-05, 6.308406591415405e-05, 6.532296538352966e-05, 6.756186485290527e-05, 6.980076432228088e-05, 7.20396637916565e-05, 7.42785632610321e-05, 7.651746273040771e-05, 7.875636219978333e-05, 8.099526166915894e-05, 8.323416113853455e-05, 8.547306060791016e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 5.0, 4.0, 4.0, 7.0, 6.0, 21.0, 22.0, 46.0, 47.0, 90.0, 116.0, 177.0, 262.0, 430.0, 577.0, 934.0, 1310.0, 1871.0, 2831.0, 4260.0, 6253.0, 9482.0, 14339.0, 22520.0, 35486.0, 57884.0, 97960.0, 193890.0, 265732.0, 132487.0, 74194.0, 44838.0, 27931.0, 17801.0, 11523.0, 7498.0, 5030.0, 3510.0, 2273.0, 1542.0, 1070.0, 691.0, 535.0, 354.0, 237.0, 169.0, 101.0, 68.0, 46.0, 30.0, 18.0, 17.0, 14.0, 9.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.56201171875, -0.5440216064453125, -0.526031494140625, -0.5080413818359375, -0.49005126953125, -0.4720611572265625, -0.454071044921875, -0.4360809326171875, -0.4180908203125, -0.4001007080078125, -0.382110595703125, -0.3641204833984375, -0.34613037109375, -0.3281402587890625, -0.310150146484375, -0.2921600341796875, -0.274169921875, -0.2561798095703125, -0.238189697265625, -0.2201995849609375, -0.20220947265625, -0.1842193603515625, -0.166229248046875, -0.1482391357421875, -0.1302490234375, -0.1122589111328125, -0.094268798828125, -0.0762786865234375, -0.05828857421875, -0.0402984619140625, -0.022308349609375, -0.0043182373046875, 0.013671875, 0.0316619873046875, 0.049652099609375, 0.0676422119140625, 0.08563232421875, 0.1036224365234375, 0.121612548828125, 0.1396026611328125, 0.1575927734375, 0.1755828857421875, 0.193572998046875, 0.2115631103515625, 0.22955322265625, 0.2475433349609375, 0.265533447265625, 0.2835235595703125, 0.301513671875, 0.3195037841796875, 0.337493896484375, 0.3554840087890625, 0.37347412109375, 0.3914642333984375, 0.409454345703125, 0.4274444580078125, 0.4454345703125, 0.4634246826171875, 0.481414794921875, 0.4994049072265625, 0.51739501953125, 0.5353851318359375, 0.553375244140625, 0.5713653564453125, 0.58935546875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 6.0, 4.0, 5.0, 11.0, 11.0, 14.0, 16.0, 16.0, 32.0, 16.0, 25.0, 22.0, 28.0, 16.0, 34.0, 29.0, 22.0, 30.0, 35.0, 35.0, 31.0, 45.0, 47.0, 50.0, 40.0, 19.0, 28.0, 26.0, 41.0, 26.0, 32.0, 30.0, 33.0, 23.0, 29.0, 14.0, 11.0, 9.0, 9.0, 16.0, 14.0, 4.0, 5.0, 3.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.455322265625, -0.4417304992675781, -0.42813873291015625, -0.4145469665527344, -0.4009552001953125, -0.3873634338378906, -0.37377166748046875, -0.3601799011230469, -0.346588134765625, -0.3329963684082031, -0.31940460205078125, -0.3058128356933594, -0.2922210693359375, -0.2786293029785156, -0.26503753662109375, -0.2514457702636719, -0.23785400390625, -0.22426223754882812, -0.21067047119140625, -0.19707870483398438, -0.1834869384765625, -0.16989517211914062, -0.15630340576171875, -0.14271163940429688, -0.129119873046875, -0.11552810668945312, -0.10193634033203125, -0.08834457397460938, -0.0747528076171875, -0.061161041259765625, -0.04756927490234375, -0.033977508544921875, -0.0203857421875, -0.006793975830078125, 0.00679779052734375, 0.020389556884765625, 0.0339813232421875, 0.047573089599609375, 0.06116485595703125, 0.07475662231445312, 0.088348388671875, 0.10194015502929688, 0.11553192138671875, 0.12912368774414062, 0.1427154541015625, 0.15630722045898438, 0.16989898681640625, 0.18349075317382812, 0.19708251953125, 0.21067428588867188, 0.22426605224609375, 0.23785781860351562, 0.2514495849609375, 0.2650413513183594, 0.27863311767578125, 0.2922248840332031, 0.305816650390625, 0.3194084167480469, 0.33300018310546875, 0.3465919494628906, 0.3601837158203125, 0.3737754821777344, 0.38736724853515625, 0.4009590148925781, 0.41455078125]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 2.0, 6.0, 8.0, 10.0, 7.0, 10.0, 12.0, 21.0, 17.0, 33.0, 32.0, 25.0, 31.0, 44.0, 51.0, 27.0, 49.0, 38.0, 45.0, 44.0, 40.0, 40.0, 51.0, 42.0, 35.0, 40.0, 35.0, 24.0, 28.0, 18.0, 20.0, 12.0, 24.0, 21.0, 14.0, 8.0, 11.0, 4.0, 5.0, 3.0, 3.0, 6.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-26.424856185913086, -25.648263931274414, -24.871671676635742, -24.09507942199707, -23.31848907470703, -22.54189682006836, -21.765304565429688, -20.988712310791016, -20.212120056152344, -19.435527801513672, -18.658935546875, -17.882343292236328, -17.105751037597656, -16.329160690307617, -15.552568435668945, -14.775976181030273, -13.999383926391602, -13.22279167175293, -12.446199417114258, -11.669608116149902, -10.89301586151123, -10.116423606872559, -9.339832305908203, -8.563240051269531, -7.786647796630859, -7.0100555419921875, -6.233463764190674, -5.45687198638916, -4.680279731750488, -3.9036877155303955, -3.1270956993103027, -2.350503921508789, -1.57391357421875, -0.7973215579986572, -0.020729541778564453, 0.7558624744415283, 1.532454490661621, 2.309046506881714, 3.0856385231018066, 3.8622303009033203, 4.638822555541992, 5.415414810180664, 6.192006587982178, 6.968598365783691, 7.745190620422363, 8.521782875061035, 9.29837417602539, 10.074966430664062, 10.851558685302734, 11.628150939941406, 12.404743194580078, 13.181334495544434, 13.957926750183105, 14.734519004821777, 15.511110305786133, 16.287702560424805, 17.064294815063477, 17.84088706970215, 18.61747932434082, 19.394071578979492, 20.17066192626953, 20.947254180908203, 21.723846435546875, 22.500438690185547, 23.27703094482422]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 5.0, 7.0, 6.0, 8.0, 14.0, 14.0, 17.0, 20.0, 12.0, 20.0, 20.0, 24.0, 25.0, 25.0, 23.0, 38.0, 39.0, 38.0, 40.0, 33.0, 47.0, 34.0, 32.0, 38.0, 36.0, 37.0, 35.0, 30.0, 29.0, 32.0, 27.0, 24.0, 31.0, 23.0, 21.0, 16.0, 13.0, 12.0, 13.0, 7.0, 5.0, 9.0, 4.0, 2.0, 5.0, 0.0, 5.0, 2.0, 0.0, 3.0, 3.0], "bins": [-38.25230407714844, -37.147125244140625, -36.04194641113281, -34.936763763427734, -33.83158493041992, -32.72640609741211, -31.621225357055664, -30.51604461669922, -29.410865783691406, -28.305686950683594, -27.20050621032715, -26.095325469970703, -24.99014663696289, -23.884967803955078, -22.779787063598633, -21.674606323242188, -20.569427490234375, -19.464248657226562, -18.359067916870117, -17.253887176513672, -16.14870834350586, -15.04352855682373, -13.938348770141602, -12.833168983459473, -11.727989196777344, -10.622809410095215, -9.517629623413086, -8.412449836730957, -7.307270050048828, -6.202090263366699, -5.09691047668457, -3.9917306900024414, -2.886554718017578, -1.7813749313354492, -0.6761951446533203, 0.4289846420288086, 1.5341644287109375, 2.6393442153930664, 3.7445240020751953, 4.849703788757324, 5.954883575439453, 7.060063362121582, 8.165243148803711, 9.27042293548584, 10.375602722167969, 11.480782508850098, 12.585962295532227, 13.691142082214355, 14.796321868896484, 15.901501655578613, 17.006681442260742, 18.111862182617188, 19.217041015625, 20.322219848632812, 21.427400588989258, 22.532581329345703, 23.637760162353516, 24.742938995361328, 25.848119735717773, 26.95330047607422, 28.05847930908203, 29.163658142089844, 30.26883888244629, 31.374019622802734, 32.47919845581055]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 7.0, 7.0, 18.0, 14.0, 26.0, 22.0, 54.0, 78.0, 103.0, 160.0, 234.0, 381.0, 587.0, 943.0, 1382.0, 2201.0, 3287.0, 5374.0, 8461.0, 13485.0, 20059.0, 29955.0, 43753.0, 60407.0, 79471.0, 97561.0, 110204.0, 114339.0, 108439.0, 94145.0, 75509.0, 57141.0, 40690.0, 27885.0, 18491.0, 12090.0, 7501.0, 5077.0, 3260.0, 1988.0, 1301.0, 856.0, 568.0, 370.0, 223.0, 141.0, 94.0, 71.0, 53.0, 33.0, 19.0, 20.0, 13.0, 7.0, 1.0, 6.0, 2.0, 1.0, 2.0], "bins": [-18.203125, -17.641357421875, -17.07958984375, -16.517822265625, -15.9560546875, -15.394287109375, -14.83251953125, -14.270751953125, -13.708984375, -13.147216796875, -12.58544921875, -12.023681640625, -11.4619140625, -10.900146484375, -10.33837890625, -9.776611328125, -9.21484375, -8.653076171875, -8.09130859375, -7.529541015625, -6.9677734375, -6.406005859375, -5.84423828125, -5.282470703125, -4.720703125, -4.158935546875, -3.59716796875, -3.035400390625, -2.4736328125, -1.911865234375, -1.35009765625, -0.788330078125, -0.2265625, 0.335205078125, 0.89697265625, 1.458740234375, 2.0205078125, 2.582275390625, 3.14404296875, 3.705810546875, 4.267578125, 4.829345703125, 5.39111328125, 5.952880859375, 6.5146484375, 7.076416015625, 7.63818359375, 8.199951171875, 8.76171875, 9.323486328125, 9.88525390625, 10.447021484375, 11.0087890625, 11.570556640625, 12.13232421875, 12.694091796875, 13.255859375, 13.817626953125, 14.37939453125, 14.941162109375, 15.5029296875, 16.064697265625, 16.62646484375, 17.188232421875, 17.75]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 6.0, 7.0, 8.0, 5.0, 15.0, 16.0, 16.0, 19.0, 12.0, 20.0, 20.0, 25.0, 24.0, 26.0, 23.0, 44.0, 33.0, 40.0, 37.0, 35.0, 47.0, 33.0, 34.0, 37.0, 39.0, 35.0, 36.0, 28.0, 31.0, 30.0, 25.0, 27.0, 28.0, 26.0, 17.0, 18.0, 13.0, 11.0, 14.0, 7.0, 3.0, 10.0, 4.0, 2.0, 5.0, 1.0, 5.0, 1.0, 0.0, 3.0, 3.0], "bins": [-37.40625, -36.32373046875, -35.2412109375, -34.15869140625, -33.076171875, -31.99365234375, -30.9111328125, -29.82861328125, -28.74609375, -27.66357421875, -26.5810546875, -25.49853515625, -24.416015625, -23.33349609375, -22.2509765625, -21.16845703125, -20.0859375, -19.00341796875, -17.9208984375, -16.83837890625, -15.755859375, -14.67333984375, -13.5908203125, -12.50830078125, -11.42578125, -10.34326171875, -9.2607421875, -8.17822265625, -7.095703125, -6.01318359375, -4.9306640625, -3.84814453125, -2.765625, -1.68310546875, -0.6005859375, 0.48193359375, 1.564453125, 2.64697265625, 3.7294921875, 4.81201171875, 5.89453125, 6.97705078125, 8.0595703125, 9.14208984375, 10.224609375, 11.30712890625, 12.3896484375, 13.47216796875, 14.5546875, 15.63720703125, 16.7197265625, 17.80224609375, 18.884765625, 19.96728515625, 21.0498046875, 22.13232421875, 23.21484375, 24.29736328125, 25.3798828125, 26.46240234375, 27.544921875, 28.62744140625, 29.7099609375, 30.79248046875, 31.875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 4.0, 6.0, 7.0, 26.0, 37.0, 41.0, 64.0, 111.0, 152.0, 277.0, 423.0, 606.0, 932.0, 1521.0, 2321.0, 3755.0, 5788.0, 9059.0, 14046.0, 21257.0, 31810.0, 45533.0, 62591.0, 81149.0, 99152.0, 110669.0, 113278.0, 106583.0, 92100.0, 73408.0, 55112.0, 39439.0, 26867.0, 18021.0, 11668.0, 7443.0, 4925.0, 2992.0, 2004.0, 1172.0, 791.0, 491.0, 334.0, 208.0, 150.0, 79.0, 62.0, 29.0, 22.0, 23.0, 8.0, 5.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-18.3125, -17.745361328125, -17.17822265625, -16.611083984375, -16.0439453125, -15.476806640625, -14.90966796875, -14.342529296875, -13.775390625, -13.208251953125, -12.64111328125, -12.073974609375, -11.5068359375, -10.939697265625, -10.37255859375, -9.805419921875, -9.23828125, -8.671142578125, -8.10400390625, -7.536865234375, -6.9697265625, -6.402587890625, -5.83544921875, -5.268310546875, -4.701171875, -4.134033203125, -3.56689453125, -2.999755859375, -2.4326171875, -1.865478515625, -1.29833984375, -0.731201171875, -0.1640625, 0.403076171875, 0.97021484375, 1.537353515625, 2.1044921875, 2.671630859375, 3.23876953125, 3.805908203125, 4.373046875, 4.940185546875, 5.50732421875, 6.074462890625, 6.6416015625, 7.208740234375, 7.77587890625, 8.343017578125, 8.91015625, 9.477294921875, 10.04443359375, 10.611572265625, 11.1787109375, 11.745849609375, 12.31298828125, 12.880126953125, 13.447265625, 14.014404296875, 14.58154296875, 15.148681640625, 15.7158203125, 16.282958984375, 16.85009765625, 17.417236328125, 17.984375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 3.0, 6.0, 10.0, 12.0, 10.0, 14.0, 11.0, 14.0, 26.0, 21.0, 31.0, 29.0, 27.0, 26.0, 38.0, 33.0, 34.0, 42.0, 43.0, 41.0, 32.0, 44.0, 29.0, 45.0, 27.0, 44.0, 42.0, 33.0, 29.0, 30.0, 28.0, 24.0, 21.0, 13.0, 16.0, 18.0, 8.0, 9.0, 18.0, 6.0, 4.0, 2.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-25.03125, -24.30078125, -23.5703125, -22.83984375, -22.109375, -21.37890625, -20.6484375, -19.91796875, -19.1875, -18.45703125, -17.7265625, -16.99609375, -16.265625, -15.53515625, -14.8046875, -14.07421875, -13.34375, -12.61328125, -11.8828125, -11.15234375, -10.421875, -9.69140625, -8.9609375, -8.23046875, -7.5, -6.76953125, -6.0390625, -5.30859375, -4.578125, -3.84765625, -3.1171875, -2.38671875, -1.65625, -0.92578125, -0.1953125, 0.53515625, 1.265625, 1.99609375, 2.7265625, 3.45703125, 4.1875, 4.91796875, 5.6484375, 6.37890625, 7.109375, 7.83984375, 8.5703125, 9.30078125, 10.03125, 10.76171875, 11.4921875, 12.22265625, 12.953125, 13.68359375, 14.4140625, 15.14453125, 15.875, 16.60546875, 17.3359375, 18.06640625, 18.796875, 19.52734375, 20.2578125, 20.98828125, 21.71875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 4.0, 7.0, 4.0, 9.0, 12.0, 31.0, 34.0, 41.0, 72.0, 108.0, 205.0, 327.0, 593.0, 915.0, 1636.0, 2864.0, 5124.0, 9686.0, 17712.0, 31314.0, 52956.0, 84563.0, 120598.0, 149097.0, 156029.0, 138848.0, 106094.0, 70677.0, 43262.0, 24833.0, 13725.0, 7495.0, 4183.0, 2343.0, 1281.0, 738.0, 456.0, 225.0, 136.0, 107.0, 64.0, 45.0, 27.0, 17.0, 13.0, 14.0, 13.0, 6.0, 6.0, 4.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.0390625, -6.81414794921875, -6.5892333984375, -6.36431884765625, -6.139404296875, -5.91448974609375, -5.6895751953125, -5.46466064453125, -5.23974609375, -5.01483154296875, -4.7899169921875, -4.56500244140625, -4.340087890625, -4.11517333984375, -3.8902587890625, -3.66534423828125, -3.4404296875, -3.21551513671875, -2.9906005859375, -2.76568603515625, -2.540771484375, -2.31585693359375, -2.0909423828125, -1.86602783203125, -1.64111328125, -1.41619873046875, -1.1912841796875, -0.96636962890625, -0.741455078125, -0.51654052734375, -0.2916259765625, -0.06671142578125, 0.158203125, 0.38311767578125, 0.6080322265625, 0.83294677734375, 1.057861328125, 1.28277587890625, 1.5076904296875, 1.73260498046875, 1.95751953125, 2.18243408203125, 2.4073486328125, 2.63226318359375, 2.857177734375, 3.08209228515625, 3.3070068359375, 3.53192138671875, 3.7568359375, 3.98175048828125, 4.2066650390625, 4.43157958984375, 4.656494140625, 4.88140869140625, 5.1063232421875, 5.33123779296875, 5.55615234375, 5.78106689453125, 6.0059814453125, 6.23089599609375, 6.455810546875, 6.68072509765625, 6.9056396484375, 7.13055419921875, 7.35546875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 4.0, 8.0, 9.0, 7.0, 12.0, 22.0, 14.0, 17.0, 22.0, 27.0, 35.0, 42.0, 37.0, 30.0, 47.0, 52.0, 41.0, 44.0, 52.0, 45.0, 55.0, 38.0, 49.0, 42.0, 36.0, 32.0, 20.0, 28.0, 24.0, 20.0, 17.0, 14.0, 12.0, 10.0, 5.0, 9.0, 7.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0], "bins": [-0.0006847381591796875, -0.0006669424474239349, -0.0006491467356681824, -0.0006313510239124298, -0.0006135553121566772, -0.0005957596004009247, -0.0005779638886451721, -0.0005601681768894196, -0.000542372465133667, -0.0005245767533779144, -0.0005067810416221619, -0.0004889853298664093, -0.00047118961811065674, -0.0004533939063549042, -0.0004355981945991516, -0.00041780248284339905, -0.0004000067710876465, -0.0003822110593318939, -0.00036441534757614136, -0.0003466196358203888, -0.00032882392406463623, -0.00031102821230888367, -0.0002932325005531311, -0.00027543678879737854, -0.000257641077041626, -0.0002398453652858734, -0.00022204965353012085, -0.00020425394177436829, -0.00018645823001861572, -0.00016866251826286316, -0.0001508668065071106, -0.00013307109475135803, -0.00011527538299560547, -9.74796712398529e-05, -7.968395948410034e-05, -6.188824772834778e-05, -4.4092535972595215e-05, -2.629682421684265e-05, -8.501112461090088e-06, 9.294599294662476e-06, 2.709031105041504e-05, 4.48860228061676e-05, 6.268173456192017e-05, 8.047744631767273e-05, 9.827315807342529e-05, 0.00011606886982917786, 0.00013386458158493042, 0.00015166029334068298, 0.00016945600509643555, 0.0001872517168521881, 0.00020504742860794067, 0.00022284314036369324, 0.0002406388521194458, 0.00025843456387519836, 0.00027623027563095093, 0.0002940259873867035, 0.00031182169914245605, 0.0003296174108982086, 0.0003474131226539612, 0.00036520883440971375, 0.0003830045461654663, 0.00040080025792121887, 0.00041859596967697144, 0.000436391681432724, 0.00045418739318847656]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 4.0, 7.0, 18.0, 27.0, 46.0, 53.0, 72.0, 128.0, 196.0, 269.0, 473.0, 645.0, 1107.0, 1776.0, 2944.0, 4701.0, 7471.0, 12288.0, 19580.0, 30532.0, 46892.0, 67326.0, 91196.0, 113106.0, 126287.0, 125981.0, 112228.0, 90374.0, 66325.0, 45636.0, 30288.0, 19247.0, 11952.0, 7342.0, 4480.0, 2827.0, 1787.0, 1056.0, 671.0, 419.0, 277.0, 169.0, 122.0, 78.0, 50.0, 37.0, 18.0, 21.0, 5.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0], "bins": [-6.3359375, -6.143798828125, -5.95166015625, -5.759521484375, -5.5673828125, -5.375244140625, -5.18310546875, -4.990966796875, -4.798828125, -4.606689453125, -4.41455078125, -4.222412109375, -4.0302734375, -3.838134765625, -3.64599609375, -3.453857421875, -3.26171875, -3.069580078125, -2.87744140625, -2.685302734375, -2.4931640625, -2.301025390625, -2.10888671875, -1.916748046875, -1.724609375, -1.532470703125, -1.34033203125, -1.148193359375, -0.9560546875, -0.763916015625, -0.57177734375, -0.379638671875, -0.1875, 0.004638671875, 0.19677734375, 0.388916015625, 0.5810546875, 0.773193359375, 0.96533203125, 1.157470703125, 1.349609375, 1.541748046875, 1.73388671875, 1.926025390625, 2.1181640625, 2.310302734375, 2.50244140625, 2.694580078125, 2.88671875, 3.078857421875, 3.27099609375, 3.463134765625, 3.6552734375, 3.847412109375, 4.03955078125, 4.231689453125, 4.423828125, 4.615966796875, 4.80810546875, 5.000244140625, 5.1923828125, 5.384521484375, 5.57666015625, 5.768798828125, 5.9609375]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 7.0, 9.0, 7.0, 8.0, 19.0, 17.0, 13.0, 21.0, 25.0, 36.0, 46.0, 49.0, 45.0, 46.0, 56.0, 53.0, 61.0, 57.0, 60.0, 42.0, 47.0, 37.0, 43.0, 38.0, 31.0, 28.0, 22.0, 20.0, 13.0, 7.0, 7.0, 7.0, 7.0, 3.0, 5.0, 2.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.841796875, -3.718475341796875, -3.59515380859375, -3.471832275390625, -3.3485107421875, -3.225189208984375, -3.10186767578125, -2.978546142578125, -2.855224609375, -2.731903076171875, -2.60858154296875, -2.485260009765625, -2.3619384765625, -2.238616943359375, -2.11529541015625, -1.991973876953125, -1.86865234375, -1.745330810546875, -1.62200927734375, -1.498687744140625, -1.3753662109375, -1.252044677734375, -1.12872314453125, -1.005401611328125, -0.882080078125, -0.758758544921875, -0.63543701171875, -0.512115478515625, -0.3887939453125, -0.265472412109375, -0.14215087890625, -0.018829345703125, 0.1044921875, 0.227813720703125, 0.35113525390625, 0.474456787109375, 0.5977783203125, 0.721099853515625, 0.84442138671875, 0.967742919921875, 1.091064453125, 1.214385986328125, 1.33770751953125, 1.461029052734375, 1.5843505859375, 1.707672119140625, 1.83099365234375, 1.954315185546875, 2.07763671875, 2.200958251953125, 2.32427978515625, 2.447601318359375, 2.5709228515625, 2.694244384765625, 2.81756591796875, 2.940887451171875, 3.064208984375, 3.187530517578125, 3.31085205078125, 3.434173583984375, 3.5574951171875, 3.680816650390625, 3.80413818359375, 3.927459716796875, 4.05078125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 2.0, 6.0, 5.0, 8.0, 9.0, 11.0, 20.0, 18.0, 31.0, 31.0, 35.0, 41.0, 44.0, 44.0, 47.0, 53.0, 52.0, 51.0, 40.0, 57.0, 41.0, 45.0, 34.0, 43.0, 28.0, 28.0, 30.0, 26.0, 29.0, 17.0, 16.0, 15.0, 11.0, 12.0, 4.0, 6.0, 3.0, 2.0, 3.0, 1.0, 5.0, 1.0, 1.0, 3.0, 1.0], "bins": [-32.187217712402344, -31.323226928710938, -30.45923614501953, -29.595245361328125, -28.73125457763672, -27.867263793945312, -27.00327491760254, -26.139284133911133, -25.275293350219727, -24.41130256652832, -23.547311782836914, -22.683320999145508, -21.819332122802734, -20.955341339111328, -20.091350555419922, -19.227359771728516, -18.36336898803711, -17.499378204345703, -16.635387420654297, -15.771397590637207, -14.9074068069458, -14.043416023254395, -13.179426193237305, -12.315435409545898, -11.451444625854492, -10.587453842163086, -9.72346305847168, -8.85947322845459, -7.995482444763184, -7.131491661071777, -6.267501354217529, -5.403511047363281, -4.539520263671875, -3.675529718399048, -2.8115391731262207, -1.9475486278533936, -1.0835580825805664, -0.21956729888916016, 0.6444230079650879, 1.508413314819336, 2.372404098510742, 3.2363946437835693, 4.1003851890563965, 4.9643754959106445, 5.828366279602051, 6.692357063293457, 7.556347370147705, 8.420337677001953, 9.28432846069336, 10.148319244384766, 11.012310028076172, 11.876299858093262, 12.740290641784668, 13.604281425476074, 14.468271255493164, 15.33226203918457, 16.196252822875977, 17.060243606567383, 17.92423439025879, 18.788225173950195, 19.65221405029297, 20.516204833984375, 21.38019561767578, 22.244186401367188, 23.108177185058594]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 0.0, 9.0, 10.0, 11.0, 13.0, 12.0, 17.0, 14.0, 19.0, 22.0, 19.0, 31.0, 33.0, 27.0, 27.0, 27.0, 38.0, 39.0, 42.0, 32.0, 35.0, 45.0, 38.0, 41.0, 34.0, 44.0, 36.0, 37.0, 21.0, 27.0, 26.0, 16.0, 33.0, 28.0, 22.0, 14.0, 9.0, 10.0, 9.0, 4.0, 3.0, 6.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 5.0], "bins": [-41.57878494262695, -40.39208221435547, -39.20538330078125, -38.018680572509766, -36.83197784423828, -35.6452751159668, -34.45857238769531, -33.271873474121094, -32.08517074584961, -30.898468017578125, -29.711767196655273, -28.525066375732422, -27.338363647460938, -26.151660919189453, -24.9649600982666, -23.77825927734375, -22.591556549072266, -21.40485382080078, -20.21815299987793, -19.031452178955078, -17.844749450683594, -16.65804672241211, -15.471345901489258, -14.28464412689209, -13.097942352294922, -11.911240577697754, -10.724538803100586, -9.537837028503418, -8.35113525390625, -7.164433479309082, -5.977731704711914, -4.791029930114746, -3.6043243408203125, -2.4176225662231445, -1.2309207916259766, -0.044219017028808594, 1.1424827575683594, 2.3291845321655273, 3.5158863067626953, 4.702588081359863, 5.889289855957031, 7.075991630554199, 8.262693405151367, 9.449395179748535, 10.636096954345703, 11.822798728942871, 13.009500503540039, 14.196202278137207, 15.382904052734375, 16.56960678100586, 17.75630760192871, 18.943008422851562, 20.129711151123047, 21.31641387939453, 22.503114700317383, 23.689815521240234, 24.87651824951172, 26.063220977783203, 27.249921798706055, 28.436622619628906, 29.62332534790039, 30.810028076171875, 31.996728897094727, 33.18342971801758, 34.37013244628906]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 7.0, 6.0, 10.0, 12.0, 16.0, 37.0, 62.0, 110.0, 158.0, 290.0, 495.0, 862.0, 1394.0, 2557.0, 4307.0, 7206.0, 12380.0, 20287.0, 33760.0, 55662.0, 87762.0, 135485.0, 200773.0, 283922.0, 373644.0, 451627.0, 496179.0, 488751.0, 432704.0, 348046.0, 259056.0, 179970.0, 120098.0, 76654.0, 48129.0, 29330.0, 17379.0, 10375.0, 6183.0, 3550.0, 2126.0, 1255.0, 688.0, 414.0, 235.0, 138.0, 82.0, 40.0, 29.0, 24.0, 14.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-23.828125, -23.124267578125, -22.42041015625, -21.716552734375, -21.0126953125, -20.308837890625, -19.60498046875, -18.901123046875, -18.197265625, -17.493408203125, -16.78955078125, -16.085693359375, -15.3818359375, -14.677978515625, -13.97412109375, -13.270263671875, -12.56640625, -11.862548828125, -11.15869140625, -10.454833984375, -9.7509765625, -9.047119140625, -8.34326171875, -7.639404296875, -6.935546875, -6.231689453125, -5.52783203125, -4.823974609375, -4.1201171875, -3.416259765625, -2.71240234375, -2.008544921875, -1.3046875, -0.600830078125, 0.10302734375, 0.806884765625, 1.5107421875, 2.214599609375, 2.91845703125, 3.622314453125, 4.326171875, 5.030029296875, 5.73388671875, 6.437744140625, 7.1416015625, 7.845458984375, 8.54931640625, 9.253173828125, 9.95703125, 10.660888671875, 11.36474609375, 12.068603515625, 12.7724609375, 13.476318359375, 14.18017578125, 14.884033203125, 15.587890625, 16.291748046875, 16.99560546875, 17.699462890625, 18.4033203125, 19.107177734375, 19.81103515625, 20.514892578125, 21.21875]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 3.0, 0.0, 8.0, 11.0, 12.0, 16.0, 10.0, 17.0, 12.0, 23.0, 16.0, 26.0, 28.0, 33.0, 33.0, 19.0, 31.0, 40.0, 36.0, 40.0, 38.0, 37.0, 40.0, 42.0, 39.0, 41.0, 37.0, 41.0, 27.0, 25.0, 29.0, 20.0, 22.0, 39.0, 18.0, 23.0, 13.0, 11.0, 7.0, 8.0, 5.0, 3.0, 7.0, 5.0, 4.0, 1.0, 5.0, 1.0, 2.0, 1.0, 4.0], "bins": [-34.375, -33.39453125, -32.4140625, -31.43359375, -30.453125, -29.47265625, -28.4921875, -27.51171875, -26.53125, -25.55078125, -24.5703125, -23.58984375, -22.609375, -21.62890625, -20.6484375, -19.66796875, -18.6875, -17.70703125, -16.7265625, -15.74609375, -14.765625, -13.78515625, -12.8046875, -11.82421875, -10.84375, -9.86328125, -8.8828125, -7.90234375, -6.921875, -5.94140625, -4.9609375, -3.98046875, -3.0, -2.01953125, -1.0390625, -0.05859375, 0.921875, 1.90234375, 2.8828125, 3.86328125, 4.84375, 5.82421875, 6.8046875, 7.78515625, 8.765625, 9.74609375, 10.7265625, 11.70703125, 12.6875, 13.66796875, 14.6484375, 15.62890625, 16.609375, 17.58984375, 18.5703125, 19.55078125, 20.53125, 21.51171875, 22.4921875, 23.47265625, 24.453125, 25.43359375, 26.4140625, 27.39453125, 28.375]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 13.0, 15.0, 29.0, 52.0, 104.0, 177.0, 330.0, 607.0, 914.0, 1786.0, 2935.0, 4921.0, 8606.0, 14005.0, 22263.0, 35652.0, 54955.0, 82518.0, 119090.0, 165180.0, 219760.0, 277958.0, 332709.0, 376801.0, 399028.0, 397398.0, 372299.0, 327090.0, 271088.0, 213379.0, 159525.0, 114142.0, 78578.0, 52791.0, 33881.0, 21296.0, 13207.0, 7980.0, 4815.0, 2710.0, 1609.0, 901.0, 514.0, 331.0, 149.0, 100.0, 55.0, 23.0, 10.0, 8.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.640625, -16.065673828125, -15.49072265625, -14.915771484375, -14.3408203125, -13.765869140625, -13.19091796875, -12.615966796875, -12.041015625, -11.466064453125, -10.89111328125, -10.316162109375, -9.7412109375, -9.166259765625, -8.59130859375, -8.016357421875, -7.44140625, -6.866455078125, -6.29150390625, -5.716552734375, -5.1416015625, -4.566650390625, -3.99169921875, -3.416748046875, -2.841796875, -2.266845703125, -1.69189453125, -1.116943359375, -0.5419921875, 0.032958984375, 0.60791015625, 1.182861328125, 1.7578125, 2.332763671875, 2.90771484375, 3.482666015625, 4.0576171875, 4.632568359375, 5.20751953125, 5.782470703125, 6.357421875, 6.932373046875, 7.50732421875, 8.082275390625, 8.6572265625, 9.232177734375, 9.80712890625, 10.382080078125, 10.95703125, 11.531982421875, 12.10693359375, 12.681884765625, 13.2568359375, 13.831787109375, 14.40673828125, 14.981689453125, 15.556640625, 16.131591796875, 16.70654296875, 17.281494140625, 17.8564453125, 18.431396484375, 19.00634765625, 19.581298828125, 20.15625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 8.0, 3.0, 2.0, 4.0, 8.0, 15.0, 21.0, 15.0, 24.0, 29.0, 47.0, 47.0, 49.0, 69.0, 82.0, 94.0, 108.0, 128.0, 132.0, 144.0, 178.0, 188.0, 183.0, 171.0, 181.0, 192.0, 229.0, 170.0, 193.0, 173.0, 155.0, 136.0, 135.0, 117.0, 106.0, 100.0, 87.0, 71.0, 55.0, 40.0, 43.0, 29.0, 21.0, 24.0, 21.0, 17.0, 8.0, 9.0, 6.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.03125, -12.6170654296875, -12.202880859375, -11.7886962890625, -11.37451171875, -10.9603271484375, -10.546142578125, -10.1319580078125, -9.7177734375, -9.3035888671875, -8.889404296875, -8.4752197265625, -8.06103515625, -7.6468505859375, -7.232666015625, -6.8184814453125, -6.404296875, -5.9901123046875, -5.575927734375, -5.1617431640625, -4.74755859375, -4.3333740234375, -3.919189453125, -3.5050048828125, -3.0908203125, -2.6766357421875, -2.262451171875, -1.8482666015625, -1.43408203125, -1.0198974609375, -0.605712890625, -0.1915283203125, 0.22265625, 0.6368408203125, 1.051025390625, 1.4652099609375, 1.87939453125, 2.2935791015625, 2.707763671875, 3.1219482421875, 3.5361328125, 3.9503173828125, 4.364501953125, 4.7786865234375, 5.19287109375, 5.6070556640625, 6.021240234375, 6.4354248046875, 6.849609375, 7.2637939453125, 7.677978515625, 8.0921630859375, 8.50634765625, 8.9205322265625, 9.334716796875, 9.7489013671875, 10.1630859375, 10.5772705078125, 10.991455078125, 11.4056396484375, 11.81982421875, 12.2340087890625, 12.648193359375, 13.0623779296875, 13.4765625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 6.0, 11.0, 8.0, 10.0, 12.0, 14.0, 14.0, 20.0, 22.0, 26.0, 28.0, 26.0, 31.0, 42.0, 32.0, 37.0, 30.0, 34.0, 55.0, 35.0, 45.0, 42.0, 38.0, 30.0, 37.0, 38.0, 32.0, 28.0, 32.0, 27.0, 27.0, 27.0, 17.0, 9.0, 16.0, 13.0, 7.0, 10.0, 4.0, 6.0, 7.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-21.883691787719727, -21.15606689453125, -20.428442001342773, -19.70081901550293, -18.973194122314453, -18.245569229125977, -17.5179443359375, -16.790321350097656, -16.06269645690918, -15.335071563720703, -14.607447624206543, -13.879822731018066, -13.152198791503906, -12.42457389831543, -11.696949005126953, -10.969325065612793, -10.241700172424316, -9.51407527923584, -8.78645133972168, -8.058826446533203, -7.331202507019043, -6.603577613830566, -5.875953197479248, -5.14832878112793, -4.420704364776611, -3.693079948425293, -2.9654555320739746, -2.237830877304077, -1.5102064609527588, -0.7825820446014404, -0.05495738983154297, 0.6726670265197754, 1.4002914428710938, 2.127915859222412, 2.8555402755737305, 3.583164930343628, 4.310789108276367, 5.038414001464844, 5.766038417816162, 6.4936628341674805, 7.221287250518799, 7.948911666870117, 8.676536560058594, 9.404160499572754, 10.13178539276123, 10.85940933227539, 11.587034225463867, 12.314659118652344, 13.042283058166504, 13.76990795135498, 14.49753189086914, 15.225156784057617, 15.952780723571777, 16.680404663085938, 17.408029556274414, 18.13565444946289, 18.863279342651367, 19.590904235839844, 20.31852912902832, 21.046152114868164, 21.77377700805664, 22.501401901245117, 23.229026794433594, 23.956649780273438, 24.684274673461914]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 11.0, 10.0, 5.0, 6.0, 9.0, 11.0, 15.0, 13.0, 12.0, 23.0, 21.0, 21.0, 26.0, 25.0, 36.0, 31.0, 29.0, 37.0, 37.0, 45.0, 48.0, 36.0, 38.0, 42.0, 40.0, 38.0, 30.0, 29.0, 38.0, 24.0, 40.0, 32.0, 22.0, 22.0, 17.0, 14.0, 13.0, 9.0, 6.0, 10.0, 9.0, 4.0, 6.0, 4.0, 6.0, 4.0, 2.0, 4.0, 0.0, 1.0], "bins": [-42.06842041015625, -40.89487075805664, -39.7213249206543, -38.54777526855469, -37.37422561645508, -36.20067596435547, -35.027130126953125, -33.853580474853516, -32.680030822753906, -31.50648307800293, -30.33293342590332, -29.159385681152344, -27.985836029052734, -26.812288284301758, -25.63874053955078, -24.465190887451172, -23.291645050048828, -22.11809730529785, -20.944547653198242, -19.770999908447266, -18.597450256347656, -17.42390251159668, -16.250354766845703, -15.07680606842041, -13.903257369995117, -12.729708671569824, -11.556159973144531, -10.382612228393555, -9.209063529968262, -8.035514831542969, -6.861966609954834, -5.688418388366699, -4.514873504638672, -3.341325044631958, -2.167776584625244, -0.9942281246185303, 0.1793203353881836, 1.3528690338134766, 2.5264172554016113, 3.699965476989746, 4.873514175415039, 6.047062873840332, 7.220611095428467, 8.394159317016602, 9.567708015441895, 10.741256713867188, 11.914804458618164, 13.088353157043457, 14.26190185546875, 15.435450553894043, 16.608999252319336, 17.782546997070312, 18.956096649169922, 20.1296443939209, 21.303192138671875, 22.476741790771484, 23.65028953552246, 24.823837280273438, 25.997386932373047, 27.170934677124023, 28.344482421875, 29.51803207397461, 30.691579818725586, 31.865127563476562, 33.03867721557617]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 7.0, 4.0, 20.0, 14.0, 36.0, 45.0, 61.0, 106.0, 155.0, 234.0, 338.0, 528.0, 855.0, 1258.0, 2004.0, 3321.0, 5575.0, 9428.0, 16631.0, 31271.0, 61834.0, 129105.0, 287506.0, 260320.0, 115763.0, 55839.0, 28567.0, 15384.0, 8737.0, 5249.0, 3101.0, 1959.0, 1146.0, 743.0, 489.0, 299.0, 205.0, 140.0, 79.0, 60.0, 45.0, 33.0, 24.0, 12.0, 7.0, 11.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.38671875, -4.24932861328125, -4.1119384765625, -3.97454833984375, -3.837158203125, -3.69976806640625, -3.5623779296875, -3.42498779296875, -3.28759765625, -3.15020751953125, -3.0128173828125, -2.87542724609375, -2.738037109375, -2.60064697265625, -2.4632568359375, -2.32586669921875, -2.1884765625, -2.05108642578125, -1.9136962890625, -1.77630615234375, -1.638916015625, -1.50152587890625, -1.3641357421875, -1.22674560546875, -1.08935546875, -0.95196533203125, -0.8145751953125, -0.67718505859375, -0.539794921875, -0.40240478515625, -0.2650146484375, -0.12762451171875, 0.009765625, 0.14715576171875, 0.2845458984375, 0.42193603515625, 0.559326171875, 0.69671630859375, 0.8341064453125, 0.97149658203125, 1.10888671875, 1.24627685546875, 1.3836669921875, 1.52105712890625, 1.658447265625, 1.79583740234375, 1.9332275390625, 2.07061767578125, 2.2080078125, 2.34539794921875, 2.4827880859375, 2.62017822265625, 2.757568359375, 2.89495849609375, 3.0323486328125, 3.16973876953125, 3.30712890625, 3.44451904296875, 3.5819091796875, 3.71929931640625, 3.856689453125, 3.99407958984375, 4.1314697265625, 4.26885986328125, 4.40625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 11.0, 10.0, 4.0, 7.0, 9.0, 11.0, 15.0, 13.0, 12.0, 23.0, 20.0, 22.0, 27.0, 24.0, 35.0, 32.0, 30.0, 37.0, 37.0, 43.0, 49.0, 36.0, 38.0, 42.0, 40.0, 39.0, 29.0, 30.0, 36.0, 26.0, 38.0, 32.0, 25.0, 20.0, 17.0, 14.0, 14.0, 8.0, 6.0, 10.0, 9.0, 4.0, 6.0, 4.0, 6.0, 4.0, 2.0, 4.0, 0.0, 1.0], "bins": [-42.0, -40.82666015625, -39.6533203125, -38.47998046875, -37.306640625, -36.13330078125, -34.9599609375, -33.78662109375, -32.61328125, -31.43994140625, -30.2666015625, -29.09326171875, -27.919921875, -26.74658203125, -25.5732421875, -24.39990234375, -23.2265625, -22.05322265625, -20.8798828125, -19.70654296875, -18.533203125, -17.35986328125, -16.1865234375, -15.01318359375, -13.83984375, -12.66650390625, -11.4931640625, -10.31982421875, -9.146484375, -7.97314453125, -6.7998046875, -5.62646484375, -4.453125, -3.27978515625, -2.1064453125, -0.93310546875, 0.240234375, 1.41357421875, 2.5869140625, 3.76025390625, 4.93359375, 6.10693359375, 7.2802734375, 8.45361328125, 9.626953125, 10.80029296875, 11.9736328125, 13.14697265625, 14.3203125, 15.49365234375, 16.6669921875, 17.84033203125, 19.013671875, 20.18701171875, 21.3603515625, 22.53369140625, 23.70703125, 24.88037109375, 26.0537109375, 27.22705078125, 28.400390625, 29.57373046875, 30.7470703125, 31.92041015625, 33.09375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 9.0, 8.0, 6.0, 20.0, 26.0, 33.0, 52.0, 65.0, 109.0, 182.0, 309.0, 419.0, 731.0, 1116.0, 1911.0, 3226.0, 6031.0, 11337.0, 22498.0, 46711.0, 105858.0, 290617.0, 331700.0, 120746.0, 51615.0, 25114.0, 12602.0, 6616.0, 3616.0, 2019.0, 1280.0, 716.0, 446.0, 277.0, 170.0, 130.0, 80.0, 55.0, 35.0, 23.0, 15.0, 6.0, 7.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.04296875, -5.87066650390625, -5.6983642578125, -5.52606201171875, -5.353759765625, -5.18145751953125, -5.0091552734375, -4.83685302734375, -4.66455078125, -4.49224853515625, -4.3199462890625, -4.14764404296875, -3.975341796875, -3.80303955078125, -3.6307373046875, -3.45843505859375, -3.2861328125, -3.11383056640625, -2.9415283203125, -2.76922607421875, -2.596923828125, -2.42462158203125, -2.2523193359375, -2.08001708984375, -1.90771484375, -1.73541259765625, -1.5631103515625, -1.39080810546875, -1.218505859375, -1.04620361328125, -0.8739013671875, -0.70159912109375, -0.529296875, -0.35699462890625, -0.1846923828125, -0.01239013671875, 0.159912109375, 0.33221435546875, 0.5045166015625, 0.67681884765625, 0.84912109375, 1.02142333984375, 1.1937255859375, 1.36602783203125, 1.538330078125, 1.71063232421875, 1.8829345703125, 2.05523681640625, 2.2275390625, 2.39984130859375, 2.5721435546875, 2.74444580078125, 2.916748046875, 3.08905029296875, 3.2613525390625, 3.43365478515625, 3.60595703125, 3.77825927734375, 3.9505615234375, 4.12286376953125, 4.295166015625, 4.46746826171875, 4.6397705078125, 4.81207275390625, 4.984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 4.0, 8.0, 7.0, 16.0, 12.0, 20.0, 19.0, 19.0, 25.0, 21.0, 35.0, 29.0, 37.0, 31.0, 44.0, 36.0, 38.0, 33.0, 47.0, 46.0, 39.0, 40.0, 47.0, 35.0, 34.0, 38.0, 37.0, 22.0, 21.0, 24.0, 20.0, 17.0, 13.0, 12.0, 17.0, 11.0, 10.0, 9.0, 3.0, 6.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.25, -23.451171875, -22.65234375, -21.853515625, -21.0546875, -20.255859375, -19.45703125, -18.658203125, -17.859375, -17.060546875, -16.26171875, -15.462890625, -14.6640625, -13.865234375, -13.06640625, -12.267578125, -11.46875, -10.669921875, -9.87109375, -9.072265625, -8.2734375, -7.474609375, -6.67578125, -5.876953125, -5.078125, -4.279296875, -3.48046875, -2.681640625, -1.8828125, -1.083984375, -0.28515625, 0.513671875, 1.3125, 2.111328125, 2.91015625, 3.708984375, 4.5078125, 5.306640625, 6.10546875, 6.904296875, 7.703125, 8.501953125, 9.30078125, 10.099609375, 10.8984375, 11.697265625, 12.49609375, 13.294921875, 14.09375, 14.892578125, 15.69140625, 16.490234375, 17.2890625, 18.087890625, 18.88671875, 19.685546875, 20.484375, 21.283203125, 22.08203125, 22.880859375, 23.6796875, 24.478515625, 25.27734375, 26.076171875, 26.875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 4.0, 3.0, 4.0, 4.0, 4.0, 7.0, 5.0, 12.0, 8.0, 26.0, 29.0, 46.0, 58.0, 62.0, 104.0, 127.0, 206.0, 328.0, 479.0, 794.0, 1365.0, 2327.0, 4272.0, 8138.0, 16937.0, 39772.0, 108391.0, 351324.0, 337784.0, 103181.0, 38132.0, 16547.0, 8074.0, 4285.0, 2254.0, 1340.0, 755.0, 469.0, 282.0, 194.0, 123.0, 97.0, 60.0, 51.0, 23.0, 31.0, 11.0, 4.0, 19.0, 5.0, 5.0, 0.0, 2.0, 1.0, 3.0, 1.0], "bins": [-0.40283203125, -0.3916358947753906, -0.38043975830078125, -0.3692436218261719, -0.3580474853515625, -0.3468513488769531, -0.33565521240234375, -0.3244590759277344, -0.313262939453125, -0.3020668029785156, -0.29087066650390625, -0.2796745300292969, -0.2684783935546875, -0.2572822570800781, -0.24608612060546875, -0.23488998413085938, -0.22369384765625, -0.21249771118164062, -0.20130157470703125, -0.19010543823242188, -0.1789093017578125, -0.16771316528320312, -0.15651702880859375, -0.14532089233398438, -0.134124755859375, -0.12292861938476562, -0.11173248291015625, -0.10053634643554688, -0.0893402099609375, -0.07814407348632812, -0.06694793701171875, -0.055751800537109375, -0.0445556640625, -0.033359527587890625, -0.02216339111328125, -0.010967254638671875, 0.0002288818359375, 0.011425018310546875, 0.02262115478515625, 0.033817291259765625, 0.045013427734375, 0.056209564208984375, 0.06740570068359375, 0.07860183715820312, 0.0897979736328125, 0.10099411010742188, 0.11219024658203125, 0.12338638305664062, 0.13458251953125, 0.14577865600585938, 0.15697479248046875, 0.16817092895507812, 0.1793670654296875, 0.19056320190429688, 0.20175933837890625, 0.21295547485351562, 0.224151611328125, 0.23534774780273438, 0.24654388427734375, 0.2577400207519531, 0.2689361572265625, 0.2801322937011719, 0.29132843017578125, 0.3025245666503906, 0.313720703125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 5.0, 13.0, 8.0, 11.0, 31.0, 25.0, 35.0, 30.0, 37.0, 47.0, 63.0, 76.0, 82.0, 74.0, 79.0, 74.0, 70.0, 52.0, 42.0, 30.0, 32.0, 28.0, 13.0, 10.0, 9.0, 8.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.845857620239258e-05, -4.7186389565467834e-05, -4.591420292854309e-05, -4.464201629161835e-05, -4.3369829654693604e-05, -4.209764301776886e-05, -4.0825456380844116e-05, -3.955326974391937e-05, -3.828108310699463e-05, -3.7008896470069885e-05, -3.573670983314514e-05, -3.44645231962204e-05, -3.3192336559295654e-05, -3.192014992237091e-05, -3.064796328544617e-05, -2.9375776648521423e-05, -2.810359001159668e-05, -2.6831403374671936e-05, -2.5559216737747192e-05, -2.428703010082245e-05, -2.3014843463897705e-05, -2.174265682697296e-05, -2.0470470190048218e-05, -1.9198283553123474e-05, -1.792609691619873e-05, -1.6653910279273987e-05, -1.5381723642349243e-05, -1.41095370054245e-05, -1.2837350368499756e-05, -1.1565163731575012e-05, -1.0292977094650269e-05, -9.020790457725525e-06, -7.748603820800781e-06, -6.476417183876038e-06, -5.204230546951294e-06, -3.93204391002655e-06, -2.6598572731018066e-06, -1.387670636177063e-06, -1.1548399925231934e-07, 1.1567026376724243e-06, 2.428889274597168e-06, 3.7010759115219116e-06, 4.973262548446655e-06, 6.245449185371399e-06, 7.517635822296143e-06, 8.789822459220886e-06, 1.006200909614563e-05, 1.1334195733070374e-05, 1.2606382369995117e-05, 1.387856900691986e-05, 1.5150755643844604e-05, 1.6422942280769348e-05, 1.7695128917694092e-05, 1.8967315554618835e-05, 2.023950219154358e-05, 2.1511688828468323e-05, 2.2783875465393066e-05, 2.405606210231781e-05, 2.5328248739242554e-05, 2.6600435376167297e-05, 2.787262201309204e-05, 2.9144808650016785e-05, 3.041699528694153e-05, 3.168918192386627e-05, 3.2961368560791016e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 6.0, 9.0, 5.0, 16.0, 24.0, 38.0, 55.0, 61.0, 95.0, 149.0, 201.0, 330.0, 457.0, 650.0, 978.0, 1418.0, 2107.0, 3338.0, 5002.0, 7603.0, 11679.0, 18428.0, 29417.0, 49162.0, 86014.0, 163850.0, 278916.0, 167254.0, 87497.0, 49940.0, 30299.0, 18863.0, 11874.0, 7623.0, 5027.0, 3373.0, 2222.0, 1475.0, 1005.0, 703.0, 394.0, 318.0, 209.0, 159.0, 108.0, 67.0, 53.0, 37.0, 17.0, 14.0, 8.0, 7.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.445556640625, -0.4304618835449219, -0.41536712646484375, -0.4002723693847656, -0.3851776123046875, -0.3700828552246094, -0.35498809814453125, -0.3398933410644531, -0.324798583984375, -0.3097038269042969, -0.29460906982421875, -0.2795143127441406, -0.2644195556640625, -0.24932479858398438, -0.23423004150390625, -0.21913528442382812, -0.20404052734375, -0.18894577026367188, -0.17385101318359375, -0.15875625610351562, -0.1436614990234375, -0.12856674194335938, -0.11347198486328125, -0.09837722778320312, -0.083282470703125, -0.06818771362304688, -0.05309295654296875, -0.037998199462890625, -0.0229034423828125, -0.007808685302734375, 0.00728607177734375, 0.022380828857421875, 0.0374755859375, 0.052570343017578125, 0.06766510009765625, 0.08275985717773438, 0.0978546142578125, 0.11294937133789062, 0.12804412841796875, 0.14313888549804688, 0.158233642578125, 0.17332839965820312, 0.18842315673828125, 0.20351791381835938, 0.2186126708984375, 0.23370742797851562, 0.24880218505859375, 0.2638969421386719, 0.27899169921875, 0.2940864562988281, 0.30918121337890625, 0.3242759704589844, 0.3393707275390625, 0.3544654846191406, 0.36956024169921875, 0.3846549987792969, 0.399749755859375, 0.4148445129394531, 0.42993927001953125, 0.4450340270996094, 0.4601287841796875, 0.4752235412597656, 0.49031829833984375, 0.5054130554199219, 0.5205078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 4.0, 5.0, 8.0, 4.0, 7.0, 7.0, 12.0, 16.0, 14.0, 14.0, 22.0, 27.0, 20.0, 30.0, 40.0, 43.0, 41.0, 52.0, 47.0, 52.0, 48.0, 47.0, 44.0, 39.0, 43.0, 49.0, 47.0, 29.0, 26.0, 31.0, 21.0, 16.0, 16.0, 20.0, 17.0, 5.0, 16.0, 8.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.44921875, -0.4351158142089844, -0.42101287841796875, -0.4069099426269531, -0.3928070068359375, -0.3787040710449219, -0.36460113525390625, -0.3504981994628906, -0.336395263671875, -0.3222923278808594, -0.30818939208984375, -0.2940864562988281, -0.2799835205078125, -0.2658805847167969, -0.25177764892578125, -0.23767471313476562, -0.22357177734375, -0.20946884155273438, -0.19536590576171875, -0.18126296997070312, -0.1671600341796875, -0.15305709838867188, -0.13895416259765625, -0.12485122680664062, -0.110748291015625, -0.09664535522460938, -0.08254241943359375, -0.06843948364257812, -0.0543365478515625, -0.040233612060546875, -0.02613067626953125, -0.012027740478515625, 0.0020751953125, 0.016178131103515625, 0.03028106689453125, 0.044384002685546875, 0.0584869384765625, 0.07258987426757812, 0.08669281005859375, 0.10079574584960938, 0.114898681640625, 0.12900161743164062, 0.14310455322265625, 0.15720748901367188, 0.1713104248046875, 0.18541336059570312, 0.19951629638671875, 0.21361923217773438, 0.22772216796875, 0.24182510375976562, 0.25592803955078125, 0.2700309753417969, 0.2841339111328125, 0.2982368469238281, 0.31233978271484375, 0.3264427185058594, 0.340545654296875, 0.3546485900878906, 0.36875152587890625, 0.3828544616699219, 0.3969573974609375, 0.4110603332519531, 0.42516326904296875, 0.4392662048339844, 0.453369140625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 4.0, 11.0, 8.0, 11.0, 11.0, 14.0, 16.0, 13.0, 21.0, 29.0, 26.0, 27.0, 32.0, 34.0, 36.0, 27.0, 34.0, 34.0, 45.0, 50.0, 34.0, 46.0, 32.0, 37.0, 35.0, 43.0, 33.0, 23.0, 27.0, 30.0, 25.0, 32.0, 22.0, 15.0, 10.0, 12.0, 13.0, 8.0, 9.0, 5.0, 6.0, 4.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-21.71767807006836, -21.006126403808594, -20.294574737548828, -19.583023071289062, -18.871471405029297, -18.15991973876953, -17.448368072509766, -16.73681640625, -16.025264739990234, -15.313713073730469, -14.602161407470703, -13.890609741210938, -13.179058074951172, -12.467506408691406, -11.755955696105957, -11.044404029846191, -10.332853317260742, -9.621301651000977, -8.909749984741211, -8.198198318481445, -7.486647129058838, -6.775095462799072, -6.063544273376465, -5.351992607116699, -4.640440940856934, -3.928889274597168, -3.2173378467559814, -2.505786418914795, -1.7942347526550293, -1.0826830863952637, -0.37113189697265625, 0.3404197692871094, 1.0519733428955078, 1.7635248899459839, 2.47507643699646, 3.1866278648376465, 3.898179531097412, 4.609731197357178, 5.321282386779785, 6.032834053039551, 6.744385719299316, 7.455937385559082, 8.167489051818848, 8.879039764404297, 9.590591430664062, 10.302143096923828, 11.013694763183594, 11.72524642944336, 12.436798095703125, 13.14834976196289, 13.859901428222656, 14.571453094482422, 15.283004760742188, 15.994556427001953, 16.70610809326172, 17.417659759521484, 18.12921142578125, 18.840763092041016, 19.55231475830078, 20.263866424560547, 20.975418090820312, 21.686969757080078, 22.398521423339844, 23.11007308959961, 23.821622848510742]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 7.0, 8.0, 7.0, 10.0, 5.0, 10.0, 13.0, 13.0, 18.0, 15.0, 21.0, 25.0, 27.0, 24.0, 32.0, 32.0, 29.0, 35.0, 38.0, 38.0, 49.0, 42.0, 40.0, 45.0, 35.0, 39.0, 30.0, 34.0, 32.0, 27.0, 38.0, 34.0, 24.0, 26.0, 13.0, 16.0, 13.0, 11.0, 4.0, 8.0, 10.0, 5.0, 6.0, 6.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0], "bins": [-42.43125915527344, -41.25423812866211, -40.07722091674805, -38.90019989013672, -37.72317886352539, -36.54616165161133, -35.369140625, -34.19212341308594, -33.01510238647461, -31.838083267211914, -30.661062240600586, -29.48404312133789, -28.307024002075195, -27.1300048828125, -25.952983856201172, -24.775964736938477, -23.59894371032715, -22.421924591064453, -21.244903564453125, -20.06788444519043, -18.890865325927734, -17.713844299316406, -16.53682518005371, -15.359806060791016, -14.182785987854004, -13.005765914916992, -11.828746795654297, -10.651726722717285, -9.474706649780273, -8.297687530517578, -7.120667457580566, -5.943648338317871, -4.766628265380859, -3.589608669281006, -2.4125888347625732, -1.2355690002441406, -0.05854940414428711, 1.1184701919555664, 2.295490264892578, 3.4725093841552734, 4.649529457092285, 5.826549053192139, 7.003568649291992, 8.180588722229004, 9.357608795166016, 10.534627914428711, 11.711647987365723, 12.888667106628418, 14.06568717956543, 15.242707252502441, 16.419727325439453, 17.59674644470215, 18.773765563964844, 19.950786590576172, 21.127805709838867, 22.304824829101562, 23.48184585571289, 24.658864974975586, 25.835886001586914, 27.01290512084961, 28.189924240112305, 29.366943359375, 30.543964385986328, 31.720983505249023, 32.89800262451172]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 7.0, 9.0, 17.0, 34.0, 57.0, 75.0, 114.0, 168.0, 263.0, 421.0, 712.0, 1146.0, 1840.0, 2950.0, 4695.0, 7778.0, 11946.0, 18909.0, 29003.0, 42821.0, 60626.0, 81149.0, 101441.0, 115333.0, 119514.0, 111858.0, 95958.0, 75116.0, 55549.0, 38313.0, 25781.0, 16578.0, 10689.0, 6711.0, 4135.0, 2582.0, 1671.0, 986.0, 579.0, 366.0, 240.0, 142.0, 101.0, 66.0, 36.0, 27.0, 21.0, 12.0, 6.0, 1.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.1875, -16.621337890625, -16.05517578125, -15.489013671875, -14.9228515625, -14.356689453125, -13.79052734375, -13.224365234375, -12.658203125, -12.092041015625, -11.52587890625, -10.959716796875, -10.3935546875, -9.827392578125, -9.26123046875, -8.695068359375, -8.12890625, -7.562744140625, -6.99658203125, -6.430419921875, -5.8642578125, -5.298095703125, -4.73193359375, -4.165771484375, -3.599609375, -3.033447265625, -2.46728515625, -1.901123046875, -1.3349609375, -0.768798828125, -0.20263671875, 0.363525390625, 0.9296875, 1.495849609375, 2.06201171875, 2.628173828125, 3.1943359375, 3.760498046875, 4.32666015625, 4.892822265625, 5.458984375, 6.025146484375, 6.59130859375, 7.157470703125, 7.7236328125, 8.289794921875, 8.85595703125, 9.422119140625, 9.98828125, 10.554443359375, 11.12060546875, 11.686767578125, 12.2529296875, 12.819091796875, 13.38525390625, 13.951416015625, 14.517578125, 15.083740234375, 15.64990234375, 16.216064453125, 16.7822265625, 17.348388671875, 17.91455078125, 18.480712890625, 19.046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 6.0, 10.0, 6.0, 10.0, 6.0, 9.0, 14.0, 14.0, 16.0, 15.0, 23.0, 23.0, 28.0, 24.0, 34.0, 29.0, 31.0, 32.0, 42.0, 40.0, 48.0, 39.0, 43.0, 41.0, 36.0, 42.0, 32.0, 28.0, 41.0, 23.0, 33.0, 35.0, 26.0, 23.0, 16.0, 16.0, 10.0, 13.0, 3.0, 7.0, 12.0, 4.0, 5.0, 7.0, 4.0, 4.0, 3.0, 4.0, 0.0, 1.0], "bins": [-41.5625, -40.4072265625, -39.251953125, -38.0966796875, -36.94140625, -35.7861328125, -34.630859375, -33.4755859375, -32.3203125, -31.1650390625, -30.009765625, -28.8544921875, -27.69921875, -26.5439453125, -25.388671875, -24.2333984375, -23.078125, -21.9228515625, -20.767578125, -19.6123046875, -18.45703125, -17.3017578125, -16.146484375, -14.9912109375, -13.8359375, -12.6806640625, -11.525390625, -10.3701171875, -9.21484375, -8.0595703125, -6.904296875, -5.7490234375, -4.59375, -3.4384765625, -2.283203125, -1.1279296875, 0.02734375, 1.1826171875, 2.337890625, 3.4931640625, 4.6484375, 5.8037109375, 6.958984375, 8.1142578125, 9.26953125, 10.4248046875, 11.580078125, 12.7353515625, 13.890625, 15.0458984375, 16.201171875, 17.3564453125, 18.51171875, 19.6669921875, 20.822265625, 21.9775390625, 23.1328125, 24.2880859375, 25.443359375, 26.5986328125, 27.75390625, 28.9091796875, 30.064453125, 31.2197265625, 32.375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 6.0, 6.0, 5.0, 15.0, 23.0, 31.0, 56.0, 68.0, 123.0, 146.0, 247.0, 354.0, 545.0, 836.0, 1323.0, 1815.0, 2753.0, 4169.0, 6327.0, 9391.0, 13387.0, 19308.0, 27837.0, 38283.0, 51478.0, 66892.0, 81845.0, 94245.0, 101610.0, 100976.0, 94080.0, 82322.0, 67226.0, 52145.0, 38872.0, 28103.0, 19712.0, 13577.0, 9266.0, 6387.0, 4297.0, 2860.0, 1877.0, 1281.0, 822.0, 517.0, 376.0, 262.0, 163.0, 107.0, 70.0, 51.0, 28.0, 28.0, 17.0, 11.0, 5.0, 6.0, 1.0, 1.0, 2.0], "bins": [-15.921875, -15.424560546875, -14.92724609375, -14.429931640625, -13.9326171875, -13.435302734375, -12.93798828125, -12.440673828125, -11.943359375, -11.446044921875, -10.94873046875, -10.451416015625, -9.9541015625, -9.456787109375, -8.95947265625, -8.462158203125, -7.96484375, -7.467529296875, -6.97021484375, -6.472900390625, -5.9755859375, -5.478271484375, -4.98095703125, -4.483642578125, -3.986328125, -3.489013671875, -2.99169921875, -2.494384765625, -1.9970703125, -1.499755859375, -1.00244140625, -0.505126953125, -0.0078125, 0.489501953125, 0.98681640625, 1.484130859375, 1.9814453125, 2.478759765625, 2.97607421875, 3.473388671875, 3.970703125, 4.468017578125, 4.96533203125, 5.462646484375, 5.9599609375, 6.457275390625, 6.95458984375, 7.451904296875, 7.94921875, 8.446533203125, 8.94384765625, 9.441162109375, 9.9384765625, 10.435791015625, 10.93310546875, 11.430419921875, 11.927734375, 12.425048828125, 12.92236328125, 13.419677734375, 13.9169921875, 14.414306640625, 14.91162109375, 15.408935546875, 15.90625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 8.0, 7.0, 3.0, 2.0, 5.0, 5.0, 9.0, 12.0, 11.0, 22.0, 14.0, 10.0, 17.0, 25.0, 16.0, 34.0, 25.0, 25.0, 28.0, 49.0, 26.0, 32.0, 29.0, 40.0, 44.0, 33.0, 31.0, 27.0, 41.0, 39.0, 27.0, 39.0, 22.0, 39.0, 32.0, 26.0, 23.0, 21.0, 16.0, 16.0, 14.0, 11.0, 13.0, 6.0, 9.0, 7.0, 9.0, 2.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-23.671875, -22.97412109375, -22.2763671875, -21.57861328125, -20.880859375, -20.18310546875, -19.4853515625, -18.78759765625, -18.08984375, -17.39208984375, -16.6943359375, -15.99658203125, -15.298828125, -14.60107421875, -13.9033203125, -13.20556640625, -12.5078125, -11.81005859375, -11.1123046875, -10.41455078125, -9.716796875, -9.01904296875, -8.3212890625, -7.62353515625, -6.92578125, -6.22802734375, -5.5302734375, -4.83251953125, -4.134765625, -3.43701171875, -2.7392578125, -2.04150390625, -1.34375, -0.64599609375, 0.0517578125, 0.74951171875, 1.447265625, 2.14501953125, 2.8427734375, 3.54052734375, 4.23828125, 4.93603515625, 5.6337890625, 6.33154296875, 7.029296875, 7.72705078125, 8.4248046875, 9.12255859375, 9.8203125, 10.51806640625, 11.2158203125, 11.91357421875, 12.611328125, 13.30908203125, 14.0068359375, 14.70458984375, 15.40234375, 16.10009765625, 16.7978515625, 17.49560546875, 18.193359375, 18.89111328125, 19.5888671875, 20.28662109375, 20.984375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 3.0, 9.0, 5.0, 4.0, 4.0, 20.0, 36.0, 32.0, 40.0, 81.0, 114.0, 188.0, 270.0, 446.0, 668.0, 1011.0, 1412.0, 2160.0, 3478.0, 5351.0, 8078.0, 12529.0, 18981.0, 28135.0, 40705.0, 56463.0, 74368.0, 91378.0, 105843.0, 111264.0, 108079.0, 96145.0, 80321.0, 62020.0, 45288.0, 31663.0, 21349.0, 14151.0, 9211.0, 5985.0, 3943.0, 2472.0, 1705.0, 1062.0, 738.0, 468.0, 287.0, 190.0, 142.0, 100.0, 64.0, 38.0, 22.0, 19.0, 8.0, 8.0, 9.0, 2.0, 2.0, 1.0, 4.0], "bins": [-5.19140625, -5.03240966796875, -4.8734130859375, -4.71441650390625, -4.555419921875, -4.39642333984375, -4.2374267578125, -4.07843017578125, -3.91943359375, -3.76043701171875, -3.6014404296875, -3.44244384765625, -3.283447265625, -3.12445068359375, -2.9654541015625, -2.80645751953125, -2.6474609375, -2.48846435546875, -2.3294677734375, -2.17047119140625, -2.011474609375, -1.85247802734375, -1.6934814453125, -1.53448486328125, -1.37548828125, -1.21649169921875, -1.0574951171875, -0.89849853515625, -0.739501953125, -0.58050537109375, -0.4215087890625, -0.26251220703125, -0.103515625, 0.05548095703125, 0.2144775390625, 0.37347412109375, 0.532470703125, 0.69146728515625, 0.8504638671875, 1.00946044921875, 1.16845703125, 1.32745361328125, 1.4864501953125, 1.64544677734375, 1.804443359375, 1.96343994140625, 2.1224365234375, 2.28143310546875, 2.4404296875, 2.59942626953125, 2.7584228515625, 2.91741943359375, 3.076416015625, 3.23541259765625, 3.3944091796875, 3.55340576171875, 3.71240234375, 3.87139892578125, 4.0303955078125, 4.18939208984375, 4.348388671875, 4.50738525390625, 4.6663818359375, 4.82537841796875, 4.984375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 8.0, 9.0, 8.0, 16.0, 9.0, 19.0, 14.0, 19.0, 24.0, 20.0, 33.0, 39.0, 43.0, 47.0, 37.0, 45.0, 47.0, 34.0, 40.0, 41.0, 56.0, 35.0, 45.0, 37.0, 44.0, 37.0, 41.0, 33.0, 24.0, 9.0, 21.0, 14.0, 16.0, 10.0, 9.0, 3.0, 3.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00064849853515625, -0.0006296336650848389, -0.0006107687950134277, -0.0005919039249420166, -0.0005730390548706055, -0.0005541741847991943, -0.0005353093147277832, -0.0005164444446563721, -0.0004975795745849609, -0.0004787147045135498, -0.00045984983444213867, -0.00044098496437072754, -0.0004221200942993164, -0.0004032552242279053, -0.00038439035415649414, -0.000365525484085083, -0.0003466606140136719, -0.00032779574394226074, -0.0003089308738708496, -0.0002900660037994385, -0.00027120113372802734, -0.0002523362636566162, -0.00023347139358520508, -0.00021460652351379395, -0.0001957416534423828, -0.00017687678337097168, -0.00015801191329956055, -0.00013914704322814941, -0.00012028217315673828, -0.00010141730308532715, -8.255243301391602e-05, -6.368756294250488e-05, -4.482269287109375e-05, -2.5957822799682617e-05, -7.092952728271484e-06, 1.1771917343139648e-05, 3.063678741455078e-05, 4.9501657485961914e-05, 6.836652755737305e-05, 8.723139762878418e-05, 0.00010609626770019531, 0.00012496113777160645, 0.00014382600784301758, 0.0001626908779144287, 0.00018155574798583984, 0.00020042061805725098, 0.0002192854881286621, 0.00023815035820007324, 0.0002570152282714844, 0.0002758800983428955, 0.00029474496841430664, 0.0003136098384857178, 0.0003324747085571289, 0.00035133957862854004, 0.00037020444869995117, 0.0003890693187713623, 0.00040793418884277344, 0.00042679905891418457, 0.0004456639289855957, 0.00046452879905700684, 0.00048339366912841797, 0.0005022585391998291, 0.0005211234092712402, 0.0005399882793426514, 0.0005588531494140625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 6.0, 11.0, 16.0, 24.0, 27.0, 51.0, 75.0, 130.0, 207.0, 319.0, 548.0, 804.0, 1368.0, 2260.0, 3771.0, 6396.0, 10933.0, 19495.0, 32739.0, 53148.0, 82032.0, 114112.0, 140178.0, 148191.0, 135080.0, 106222.0, 74097.0, 47431.0, 28475.0, 16643.0, 9646.0, 5616.0, 3368.0, 2022.0, 1201.0, 695.0, 443.0, 271.0, 200.0, 98.0, 80.0, 35.0, 27.0, 28.0, 12.0, 7.0, 5.0, 8.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.96484375, -6.73553466796875, -6.5062255859375, -6.27691650390625, -6.047607421875, -5.81829833984375, -5.5889892578125, -5.35968017578125, -5.13037109375, -4.90106201171875, -4.6717529296875, -4.44244384765625, -4.213134765625, -3.98382568359375, -3.7545166015625, -3.52520751953125, -3.2958984375, -3.06658935546875, -2.8372802734375, -2.60797119140625, -2.378662109375, -2.14935302734375, -1.9200439453125, -1.69073486328125, -1.46142578125, -1.23211669921875, -1.0028076171875, -0.77349853515625, -0.544189453125, -0.31488037109375, -0.0855712890625, 0.14373779296875, 0.373046875, 0.60235595703125, 0.8316650390625, 1.06097412109375, 1.290283203125, 1.51959228515625, 1.7489013671875, 1.97821044921875, 2.20751953125, 2.43682861328125, 2.6661376953125, 2.89544677734375, 3.124755859375, 3.35406494140625, 3.5833740234375, 3.81268310546875, 4.0419921875, 4.27130126953125, 4.5006103515625, 4.72991943359375, 4.959228515625, 5.18853759765625, 5.4178466796875, 5.64715576171875, 5.87646484375, 6.10577392578125, 6.3350830078125, 6.56439208984375, 6.793701171875, 7.02301025390625, 7.2523193359375, 7.48162841796875, 7.7109375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 7.0, 5.0, 5.0, 10.0, 9.0, 21.0, 21.0, 24.0, 42.0, 37.0, 38.0, 68.0, 59.0, 54.0, 44.0, 62.0, 46.0, 65.0, 65.0, 48.0, 50.0, 46.0, 45.0, 27.0, 28.0, 12.0, 18.0, 9.0, 8.0, 11.0, 3.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.26953125, -5.121337890625, -4.97314453125, -4.824951171875, -4.6767578125, -4.528564453125, -4.38037109375, -4.232177734375, -4.083984375, -3.935791015625, -3.78759765625, -3.639404296875, -3.4912109375, -3.343017578125, -3.19482421875, -3.046630859375, -2.8984375, -2.750244140625, -2.60205078125, -2.453857421875, -2.3056640625, -2.157470703125, -2.00927734375, -1.861083984375, -1.712890625, -1.564697265625, -1.41650390625, -1.268310546875, -1.1201171875, -0.971923828125, -0.82373046875, -0.675537109375, -0.52734375, -0.379150390625, -0.23095703125, -0.082763671875, 0.0654296875, 0.213623046875, 0.36181640625, 0.510009765625, 0.658203125, 0.806396484375, 0.95458984375, 1.102783203125, 1.2509765625, 1.399169921875, 1.54736328125, 1.695556640625, 1.84375, 1.991943359375, 2.14013671875, 2.288330078125, 2.4365234375, 2.584716796875, 2.73291015625, 2.881103515625, 3.029296875, 3.177490234375, 3.32568359375, 3.473876953125, 3.6220703125, 3.770263671875, 3.91845703125, 4.066650390625, 4.21484375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 5.0, 4.0, 8.0, 7.0, 10.0, 9.0, 15.0, 13.0, 27.0, 18.0, 28.0, 33.0, 21.0, 17.0, 43.0, 35.0, 37.0, 49.0, 37.0, 38.0, 43.0, 51.0, 42.0, 37.0, 31.0, 39.0, 40.0, 42.0, 39.0, 25.0, 20.0, 21.0, 13.0, 20.0, 13.0, 14.0, 7.0, 11.0, 8.0, 6.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-22.897541046142578, -22.153785705566406, -21.410030364990234, -20.666275024414062, -19.92251968383789, -19.17876434326172, -18.435009002685547, -17.691253662109375, -16.947498321533203, -16.20374298095703, -15.45998764038086, -14.716232299804688, -13.972476959228516, -13.228721618652344, -12.484966278076172, -11.7412109375, -10.997456550598145, -10.253701210021973, -9.5099458694458, -8.766190528869629, -8.022435188293457, -7.278679847717285, -6.5349249839782715, -5.7911696434021, -5.047414302825928, -4.303658962249756, -3.559903621673584, -2.816148519515991, -2.0723931789398193, -1.3286378383636475, -0.5848827362060547, 0.1588726043701172, 0.9026279449462891, 1.646383285522461, 2.390138626098633, 3.1338937282562256, 3.8776490688323975, 4.621404647827148, 5.365159511566162, 6.108914852142334, 6.852670192718506, 7.596425533294678, 8.340180397033691, 9.083935737609863, 9.827691078186035, 10.571446418762207, 11.315201759338379, 12.05895709991455, 12.802712440490723, 13.546467781066895, 14.290223121643066, 15.033978462219238, 15.77773380279541, 16.521488189697266, 17.265243530273438, 18.00899887084961, 18.75275421142578, 19.496509552001953, 20.240264892578125, 20.984020233154297, 21.72777557373047, 22.47153091430664, 23.215286254882812, 23.959041595458984, 24.702796936035156]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 6.0, 5.0, 7.0, 9.0, 11.0, 17.0, 9.0, 16.0, 11.0, 14.0, 28.0, 28.0, 33.0, 32.0, 28.0, 35.0, 23.0, 31.0, 43.0, 37.0, 39.0, 48.0, 44.0, 35.0, 38.0, 34.0, 30.0, 37.0, 32.0, 34.0, 23.0, 21.0, 28.0, 21.0, 16.0, 19.0, 11.0, 11.0, 14.0, 12.0, 9.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-39.788150787353516, -38.56487274169922, -37.341590881347656, -36.11831283569336, -34.89503479003906, -33.6717529296875, -32.4484748840332, -31.225196838378906, -30.001916885375977, -28.778636932373047, -27.55535888671875, -26.33207893371582, -25.10879898071289, -23.885520935058594, -22.662240982055664, -21.438961029052734, -20.215682983398438, -18.992403030395508, -17.76912498474121, -16.54584503173828, -15.322566032409668, -14.099287033081055, -12.876007080078125, -11.652728080749512, -10.429449081420898, -9.206170082092285, -7.982890605926514, -6.759611129760742, -5.536332130432129, -4.313053131103516, -3.089773654937744, -1.8664941787719727, -0.643218994140625, 0.5800602436065674, 1.8033394813537598, 3.026618719100952, 4.2498979568481445, 5.473176956176758, 6.696456432342529, 7.919735908508301, 9.143014907836914, 10.366293907165527, 11.58957290649414, 12.81285285949707, 14.036131858825684, 15.259410858154297, 16.482690811157227, 17.705970764160156, 18.929248809814453, 20.152528762817383, 21.37580680847168, 22.59908676147461, 23.822364807128906, 25.045644760131836, 26.268924713134766, 27.492202758789062, 28.715482711791992, 29.938762664794922, 31.16204071044922, 32.385318756103516, 33.60860061645508, 34.831878662109375, 36.05515670776367, 37.278438568115234, 38.50171661376953]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [3.0, 15.0, 16.0, 33.0, 54.0, 67.0, 101.0, 172.0, 292.0, 515.0, 791.0, 1417.0, 2205.0, 3564.0, 5592.0, 8924.0, 14850.0, 23125.0, 35631.0, 54970.0, 81823.0, 118211.0, 165832.0, 225102.0, 287856.0, 348199.0, 396678.0, 420325.0, 413413.0, 378537.0, 321499.0, 257801.0, 196479.0, 142795.0, 99841.0, 67296.0, 44588.0, 28659.0, 18118.0, 11313.0, 7093.0, 4126.0, 2596.0, 1475.0, 926.0, 556.0, 345.0, 196.0, 100.0, 75.0, 49.0, 29.0, 16.0, 5.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.421875, -16.794189453125, -16.16650390625, -15.538818359375, -14.9111328125, -14.283447265625, -13.65576171875, -13.028076171875, -12.400390625, -11.772705078125, -11.14501953125, -10.517333984375, -9.8896484375, -9.261962890625, -8.63427734375, -8.006591796875, -7.37890625, -6.751220703125, -6.12353515625, -5.495849609375, -4.8681640625, -4.240478515625, -3.61279296875, -2.985107421875, -2.357421875, -1.729736328125, -1.10205078125, -0.474365234375, 0.1533203125, 0.781005859375, 1.40869140625, 2.036376953125, 2.6640625, 3.291748046875, 3.91943359375, 4.547119140625, 5.1748046875, 5.802490234375, 6.43017578125, 7.057861328125, 7.685546875, 8.313232421875, 8.94091796875, 9.568603515625, 10.1962890625, 10.823974609375, 11.45166015625, 12.079345703125, 12.70703125, 13.334716796875, 13.96240234375, 14.590087890625, 15.2177734375, 15.845458984375, 16.47314453125, 17.100830078125, 17.728515625, 18.356201171875, 18.98388671875, 19.611572265625, 20.2392578125, 20.866943359375, 21.49462890625, 22.122314453125, 22.75]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 5.0, 5.0, 8.0, 9.0, 11.0, 16.0, 10.0, 15.0, 12.0, 19.0, 25.0, 33.0, 37.0, 26.0, 34.0, 26.0, 23.0, 36.0, 42.0, 39.0, 49.0, 39.0, 40.0, 40.0, 32.0, 40.0, 30.0, 34.0, 36.0, 31.0, 25.0, 23.0, 24.0, 22.0, 11.0, 16.0, 13.0, 14.0, 12.0, 9.0, 9.0, 5.0, 4.0, 6.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-33.3125, -32.2822265625, -31.251953125, -30.2216796875, -29.19140625, -28.1611328125, -27.130859375, -26.1005859375, -25.0703125, -24.0400390625, -23.009765625, -21.9794921875, -20.94921875, -19.9189453125, -18.888671875, -17.8583984375, -16.828125, -15.7978515625, -14.767578125, -13.7373046875, -12.70703125, -11.6767578125, -10.646484375, -9.6162109375, -8.5859375, -7.5556640625, -6.525390625, -5.4951171875, -4.46484375, -3.4345703125, -2.404296875, -1.3740234375, -0.34375, 0.6865234375, 1.716796875, 2.7470703125, 3.77734375, 4.8076171875, 5.837890625, 6.8681640625, 7.8984375, 8.9287109375, 9.958984375, 10.9892578125, 12.01953125, 13.0498046875, 14.080078125, 15.1103515625, 16.140625, 17.1708984375, 18.201171875, 19.2314453125, 20.26171875, 21.2919921875, 22.322265625, 23.3525390625, 24.3828125, 25.4130859375, 26.443359375, 27.4736328125, 28.50390625, 29.5341796875, 30.564453125, 31.5947265625, 32.625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 8.0, 13.0, 27.0, 39.0, 73.0, 107.0, 198.0, 341.0, 575.0, 960.0, 1519.0, 2586.0, 4220.0, 6580.0, 10601.0, 16251.0, 24883.0, 36479.0, 53408.0, 75942.0, 103999.0, 140324.0, 179085.0, 223803.0, 266620.0, 305937.0, 334317.0, 348563.0, 345719.0, 328956.0, 296149.0, 258263.0, 213342.0, 171086.0, 131181.0, 97048.0, 70358.0, 49392.0, 33083.0, 22409.0, 14760.0, 9280.0, 5996.0, 3826.0, 2377.0, 1507.0, 849.0, 503.0, 308.0, 188.0, 92.0, 69.0, 39.0, 35.0, 12.0, 4.0, 1.0, 3.0, 2.0], "bins": [-17.390625, -16.86181640625, -16.3330078125, -15.80419921875, -15.275390625, -14.74658203125, -14.2177734375, -13.68896484375, -13.16015625, -12.63134765625, -12.1025390625, -11.57373046875, -11.044921875, -10.51611328125, -9.9873046875, -9.45849609375, -8.9296875, -8.40087890625, -7.8720703125, -7.34326171875, -6.814453125, -6.28564453125, -5.7568359375, -5.22802734375, -4.69921875, -4.17041015625, -3.6416015625, -3.11279296875, -2.583984375, -2.05517578125, -1.5263671875, -0.99755859375, -0.46875, 0.06005859375, 0.5888671875, 1.11767578125, 1.646484375, 2.17529296875, 2.7041015625, 3.23291015625, 3.76171875, 4.29052734375, 4.8193359375, 5.34814453125, 5.876953125, 6.40576171875, 6.9345703125, 7.46337890625, 7.9921875, 8.52099609375, 9.0498046875, 9.57861328125, 10.107421875, 10.63623046875, 11.1650390625, 11.69384765625, 12.22265625, 12.75146484375, 13.2802734375, 13.80908203125, 14.337890625, 14.86669921875, 15.3955078125, 15.92431640625, 16.453125]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 5.0, 4.0, 8.0, 11.0, 18.0, 13.0, 27.0, 26.0, 28.0, 39.0, 42.0, 54.0, 60.0, 67.0, 84.0, 94.0, 94.0, 118.0, 126.0, 146.0, 158.0, 158.0, 167.0, 157.0, 180.0, 185.0, 171.0, 176.0, 162.0, 179.0, 146.0, 172.0, 139.0, 130.0, 93.0, 94.0, 76.0, 67.0, 84.0, 55.0, 43.0, 51.0, 36.0, 34.0, 26.0, 22.0, 15.0, 11.0, 6.0, 10.0, 2.0, 5.0, 8.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.7890625, -12.3843994140625, -11.979736328125, -11.5750732421875, -11.17041015625, -10.7657470703125, -10.361083984375, -9.9564208984375, -9.5517578125, -9.1470947265625, -8.742431640625, -8.3377685546875, -7.93310546875, -7.5284423828125, -7.123779296875, -6.7191162109375, -6.314453125, -5.9097900390625, -5.505126953125, -5.1004638671875, -4.69580078125, -4.2911376953125, -3.886474609375, -3.4818115234375, -3.0771484375, -2.6724853515625, -2.267822265625, -1.8631591796875, -1.45849609375, -1.0538330078125, -0.649169921875, -0.2445068359375, 0.16015625, 0.5648193359375, 0.969482421875, 1.3741455078125, 1.77880859375, 2.1834716796875, 2.588134765625, 2.9927978515625, 3.3974609375, 3.8021240234375, 4.206787109375, 4.6114501953125, 5.01611328125, 5.4207763671875, 5.825439453125, 6.2301025390625, 6.634765625, 7.0394287109375, 7.444091796875, 7.8487548828125, 8.25341796875, 8.6580810546875, 9.062744140625, 9.4674072265625, 9.8720703125, 10.2767333984375, 10.681396484375, 11.0860595703125, 11.49072265625, 11.8953857421875, 12.300048828125, 12.7047119140625, 13.109375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 7.0, 7.0, 8.0, 8.0, 8.0, 13.0, 9.0, 16.0, 12.0, 19.0, 19.0, 22.0, 28.0, 27.0, 21.0, 30.0, 37.0, 38.0, 34.0, 38.0, 42.0, 35.0, 47.0, 44.0, 42.0, 48.0, 33.0, 28.0, 32.0, 27.0, 27.0, 29.0, 27.0, 20.0, 22.0, 17.0, 13.0, 10.0, 12.0, 11.0, 9.0, 9.0, 3.0, 6.0, 1.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-24.19637107849121, -23.421733856201172, -22.647098541259766, -21.872461318969727, -21.097824096679688, -20.32318687438965, -19.54854965209961, -18.773914337158203, -17.999277114868164, -17.224639892578125, -16.45000457763672, -15.67536735534668, -14.90073013305664, -14.126092910766602, -13.351456642150879, -12.576820373535156, -11.802183151245117, -11.027545928955078, -10.252909660339355, -9.478273391723633, -8.703636169433594, -7.928999423980713, -7.154362678527832, -6.379725933074951, -5.60508918762207, -4.8304524421691895, -4.055815696716309, -3.2811789512634277, -2.506542205810547, -1.731905460357666, -0.9572687149047852, -0.1826319694519043, 0.5920066833496094, 1.3666434288024902, 2.141280174255371, 2.915916919708252, 3.690553665161133, 4.465190410614014, 5.2398271560668945, 6.014463901519775, 6.789100646972656, 7.563737392425537, 8.338374137878418, 9.11301040649414, 9.88764762878418, 10.662284851074219, 11.436921119689941, 12.211557388305664, 12.986194610595703, 13.760831832885742, 14.535468101501465, 15.310104370117188, 16.084741592407227, 16.859378814697266, 17.634014129638672, 18.40865135192871, 19.18328857421875, 19.95792579650879, 20.732563018798828, 21.507198333740234, 22.281835556030273, 23.056472778320312, 23.83110809326172, 24.605745315551758, 25.380382537841797]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 6.0, 5.0, 4.0, 6.0, 12.0, 9.0, 8.0, 16.0, 11.0, 15.0, 19.0, 29.0, 20.0, 26.0, 21.0, 26.0, 25.0, 38.0, 29.0, 44.0, 45.0, 39.0, 31.0, 43.0, 37.0, 32.0, 30.0, 42.0, 32.0, 32.0, 44.0, 26.0, 27.0, 27.0, 25.0, 17.0, 10.0, 15.0, 14.0, 17.0, 10.0, 11.0, 5.0, 6.0, 5.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-40.0294303894043, -38.8283576965332, -37.627288818359375, -36.42621612548828, -35.22514343261719, -34.024070739746094, -32.822998046875, -31.621929168701172, -30.420856475830078, -29.219783782958984, -28.018712997436523, -26.817642211914062, -25.61656951904297, -24.415496826171875, -23.214426040649414, -22.013355255126953, -20.81228256225586, -19.611209869384766, -18.410139083862305, -17.209068298339844, -16.00799560546875, -14.806923866271973, -13.605852127075195, -12.404780387878418, -11.20370864868164, -10.002636909484863, -8.801565170288086, -7.600493431091309, -6.399421691894531, -5.198349952697754, -3.9972782135009766, -2.796206474304199, -1.5951347351074219, -0.39406299591064453, 0.8070087432861328, 2.00808048248291, 3.2091522216796875, 4.410223960876465, 5.611295700073242, 6.8123674392700195, 8.013439178466797, 9.214510917663574, 10.415582656860352, 11.616654396057129, 12.817726135253906, 14.018797874450684, 15.219869613647461, 16.420940399169922, 17.622013092041016, 18.82308578491211, 20.02415657043457, 21.22522735595703, 22.426300048828125, 23.62737274169922, 24.82844352722168, 26.02951431274414, 27.230587005615234, 28.431659698486328, 29.63273048400879, 30.83380126953125, 32.034873962402344, 33.23594665527344, 34.43701934814453, 35.63808822631836, 36.83916091918945]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 9.0, 12.0, 28.0, 28.0, 35.0, 71.0, 96.0, 151.0, 246.0, 357.0, 583.0, 972.0, 1651.0, 2704.0, 4473.0, 7641.0, 14068.0, 26678.0, 54463.0, 121774.0, 278204.0, 287224.0, 127760.0, 57212.0, 27852.0, 14407.0, 8007.0, 4622.0, 2706.0, 1712.0, 995.0, 625.0, 445.0, 263.0, 161.0, 106.0, 68.0, 55.0, 26.0, 25.0, 17.0, 7.0, 5.0, 3.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.2734375, -4.1400146484375, -4.006591796875, -3.8731689453125, -3.73974609375, -3.6063232421875, -3.472900390625, -3.3394775390625, -3.2060546875, -3.0726318359375, -2.939208984375, -2.8057861328125, -2.67236328125, -2.5389404296875, -2.405517578125, -2.2720947265625, -2.138671875, -2.0052490234375, -1.871826171875, -1.7384033203125, -1.60498046875, -1.4715576171875, -1.338134765625, -1.2047119140625, -1.0712890625, -0.9378662109375, -0.804443359375, -0.6710205078125, -0.53759765625, -0.4041748046875, -0.270751953125, -0.1373291015625, -0.00390625, 0.1295166015625, 0.262939453125, 0.3963623046875, 0.52978515625, 0.6632080078125, 0.796630859375, 0.9300537109375, 1.0634765625, 1.1968994140625, 1.330322265625, 1.4637451171875, 1.59716796875, 1.7305908203125, 1.864013671875, 1.9974365234375, 2.130859375, 2.2642822265625, 2.397705078125, 2.5311279296875, 2.66455078125, 2.7979736328125, 2.931396484375, 3.0648193359375, 3.1982421875, 3.3316650390625, 3.465087890625, 3.5985107421875, 3.73193359375, 3.8653564453125, 3.998779296875, 4.1322021484375, 4.265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 7.0, 4.0, 4.0, 6.0, 12.0, 9.0, 8.0, 16.0, 12.0, 15.0, 18.0, 30.0, 20.0, 27.0, 20.0, 27.0, 25.0, 40.0, 24.0, 46.0, 44.0, 41.0, 31.0, 43.0, 35.0, 33.0, 28.0, 44.0, 31.0, 32.0, 45.0, 27.0, 26.0, 28.0, 23.0, 18.0, 8.0, 16.0, 13.0, 18.0, 11.0, 10.0, 5.0, 6.0, 6.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.8125, -38.61279296875, -37.4130859375, -36.21337890625, -35.013671875, -33.81396484375, -32.6142578125, -31.41455078125, -30.21484375, -29.01513671875, -27.8154296875, -26.61572265625, -25.416015625, -24.21630859375, -23.0166015625, -21.81689453125, -20.6171875, -19.41748046875, -18.2177734375, -17.01806640625, -15.818359375, -14.61865234375, -13.4189453125, -12.21923828125, -11.01953125, -9.81982421875, -8.6201171875, -7.42041015625, -6.220703125, -5.02099609375, -3.8212890625, -2.62158203125, -1.421875, -0.22216796875, 0.9775390625, 2.17724609375, 3.376953125, 4.57666015625, 5.7763671875, 6.97607421875, 8.17578125, 9.37548828125, 10.5751953125, 11.77490234375, 12.974609375, 14.17431640625, 15.3740234375, 16.57373046875, 17.7734375, 18.97314453125, 20.1728515625, 21.37255859375, 22.572265625, 23.77197265625, 24.9716796875, 26.17138671875, 27.37109375, 28.57080078125, 29.7705078125, 30.97021484375, 32.169921875, 33.36962890625, 34.5693359375, 35.76904296875, 36.96875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 6.0, 14.0, 19.0, 23.0, 49.0, 53.0, 84.0, 129.0, 171.0, 253.0, 374.0, 598.0, 1011.0, 1662.0, 2629.0, 4639.0, 8465.0, 15495.0, 30138.0, 61448.0, 138330.0, 336899.0, 248315.0, 99245.0, 46530.0, 23443.0, 12190.0, 6570.0, 3795.0, 2191.0, 1346.0, 833.0, 561.0, 346.0, 235.0, 158.0, 91.0, 72.0, 45.0, 27.0, 21.0, 12.0, 17.0, 9.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-5.54296875, -5.38372802734375, -5.2244873046875, -5.06524658203125, -4.906005859375, -4.74676513671875, -4.5875244140625, -4.42828369140625, -4.26904296875, -4.10980224609375, -3.9505615234375, -3.79132080078125, -3.632080078125, -3.47283935546875, -3.3135986328125, -3.15435791015625, -2.9951171875, -2.83587646484375, -2.6766357421875, -2.51739501953125, -2.358154296875, -2.19891357421875, -2.0396728515625, -1.88043212890625, -1.72119140625, -1.56195068359375, -1.4027099609375, -1.24346923828125, -1.084228515625, -0.92498779296875, -0.7657470703125, -0.60650634765625, -0.447265625, -0.28802490234375, -0.1287841796875, 0.03045654296875, 0.189697265625, 0.34893798828125, 0.5081787109375, 0.66741943359375, 0.82666015625, 0.98590087890625, 1.1451416015625, 1.30438232421875, 1.463623046875, 1.62286376953125, 1.7821044921875, 1.94134521484375, 2.1005859375, 2.25982666015625, 2.4190673828125, 2.57830810546875, 2.737548828125, 2.89678955078125, 3.0560302734375, 3.21527099609375, 3.37451171875, 3.53375244140625, 3.6929931640625, 3.85223388671875, 4.011474609375, 4.17071533203125, 4.3299560546875, 4.48919677734375, 4.6484375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 4.0, 2.0, 4.0, 2.0, 4.0, 8.0, 2.0, 5.0, 4.0, 9.0, 8.0, 23.0, 15.0, 20.0, 16.0, 22.0, 25.0, 21.0, 31.0, 33.0, 44.0, 28.0, 48.0, 42.0, 40.0, 44.0, 37.0, 33.0, 54.0, 40.0, 36.0, 39.0, 28.0, 34.0, 30.0, 22.0, 21.0, 21.0, 14.0, 12.0, 17.0, 8.0, 14.0, 10.0, 12.0, 6.0, 8.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.796875, -22.95263671875, -22.1083984375, -21.26416015625, -20.419921875, -19.57568359375, -18.7314453125, -17.88720703125, -17.04296875, -16.19873046875, -15.3544921875, -14.51025390625, -13.666015625, -12.82177734375, -11.9775390625, -11.13330078125, -10.2890625, -9.44482421875, -8.6005859375, -7.75634765625, -6.912109375, -6.06787109375, -5.2236328125, -4.37939453125, -3.53515625, -2.69091796875, -1.8466796875, -1.00244140625, -0.158203125, 0.68603515625, 1.5302734375, 2.37451171875, 3.21875, 4.06298828125, 4.9072265625, 5.75146484375, 6.595703125, 7.43994140625, 8.2841796875, 9.12841796875, 9.97265625, 10.81689453125, 11.6611328125, 12.50537109375, 13.349609375, 14.19384765625, 15.0380859375, 15.88232421875, 16.7265625, 17.57080078125, 18.4150390625, 19.25927734375, 20.103515625, 20.94775390625, 21.7919921875, 22.63623046875, 23.48046875, 24.32470703125, 25.1689453125, 26.01318359375, 26.857421875, 27.70166015625, 28.5458984375, 29.39013671875, 30.234375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 7.0, 6.0, 9.0, 10.0, 13.0, 12.0, 14.0, 20.0, 22.0, 24.0, 36.0, 46.0, 63.0, 87.0, 99.0, 175.0, 238.0, 343.0, 530.0, 820.0, 1345.0, 2292.0, 4129.0, 8054.0, 16595.0, 38301.0, 106808.0, 355625.0, 340131.0, 101752.0, 36962.0, 15952.0, 7877.0, 4073.0, 2277.0, 1323.0, 813.0, 473.0, 379.0, 254.0, 164.0, 111.0, 87.0, 60.0, 51.0, 31.0, 17.0, 13.0, 9.0, 7.0, 9.0, 7.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.3466796875, -0.33704376220703125, -0.3274078369140625, -0.31777191162109375, -0.308135986328125, -0.29850006103515625, -0.2888641357421875, -0.27922821044921875, -0.26959228515625, -0.25995635986328125, -0.2503204345703125, -0.24068450927734375, -0.231048583984375, -0.22141265869140625, -0.2117767333984375, -0.20214080810546875, -0.1925048828125, -0.18286895751953125, -0.1732330322265625, -0.16359710693359375, -0.153961181640625, -0.14432525634765625, -0.1346893310546875, -0.12505340576171875, -0.11541748046875, -0.10578155517578125, -0.0961456298828125, -0.08650970458984375, -0.076873779296875, -0.06723785400390625, -0.0576019287109375, -0.04796600341796875, -0.038330078125, -0.02869415283203125, -0.0190582275390625, -0.00942230224609375, 0.000213623046875, 0.00984954833984375, 0.0194854736328125, 0.02912139892578125, 0.03875732421875, 0.04839324951171875, 0.0580291748046875, 0.06766510009765625, 0.077301025390625, 0.08693695068359375, 0.0965728759765625, 0.10620880126953125, 0.1158447265625, 0.12548065185546875, 0.1351165771484375, 0.14475250244140625, 0.154388427734375, 0.16402435302734375, 0.1736602783203125, 0.18329620361328125, 0.19293212890625, 0.20256805419921875, 0.2122039794921875, 0.22183990478515625, 0.231475830078125, 0.24111175537109375, 0.2507476806640625, 0.26038360595703125, 0.27001953125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 0.0, 4.0, 2.0, 5.0, 7.0, 10.0, 12.0, 20.0, 23.0, 28.0, 30.0, 44.0, 52.0, 79.0, 68.0, 67.0, 76.0, 62.0, 64.0, 71.0, 53.0, 36.0, 42.0, 28.0, 19.0, 23.0, 11.0, 17.0, 9.0, 8.0, 3.0, 4.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.2782554626464844e-05, -3.172922879457474e-05, -3.067590296268463e-05, -2.9622577130794525e-05, -2.856925129890442e-05, -2.7515925467014313e-05, -2.6462599635124207e-05, -2.54092738032341e-05, -2.4355947971343994e-05, -2.3302622139453888e-05, -2.2249296307563782e-05, -2.1195970475673676e-05, -2.014264464378357e-05, -1.9089318811893463e-05, -1.8035992980003357e-05, -1.698266714811325e-05, -1.5929341316223145e-05, -1.4876015484333038e-05, -1.3822689652442932e-05, -1.2769363820552826e-05, -1.171603798866272e-05, -1.0662712156772614e-05, -9.609386324882507e-06, -8.556060492992401e-06, -7.502734661102295e-06, -6.449408829212189e-06, -5.3960829973220825e-06, -4.342757165431976e-06, -3.28943133354187e-06, -2.236105501651764e-06, -1.1827796697616577e-06, -1.2945383787155151e-07, 9.238719940185547e-07, 1.977197825908661e-06, 3.030523657798767e-06, 4.083849489688873e-06, 5.1371753215789795e-06, 6.190501153469086e-06, 7.243826985359192e-06, 8.297152817249298e-06, 9.350478649139404e-06, 1.040380448102951e-05, 1.1457130312919617e-05, 1.2510456144809723e-05, 1.3563781976699829e-05, 1.4617107808589935e-05, 1.567043364048004e-05, 1.6723759472370148e-05, 1.7777085304260254e-05, 1.883041113615036e-05, 1.9883736968040466e-05, 2.0937062799930573e-05, 2.199038863182068e-05, 2.3043714463710785e-05, 2.409704029560089e-05, 2.5150366127490997e-05, 2.6203691959381104e-05, 2.725701779127121e-05, 2.8310343623161316e-05, 2.9363669455051422e-05, 3.041699528694153e-05, 3.1470321118831635e-05, 3.252364695072174e-05, 3.357697278261185e-05, 3.463029861450195e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 8.0, 9.0, 8.0, 13.0, 27.0, 27.0, 45.0, 68.0, 123.0, 181.0, 265.0, 417.0, 701.0, 1007.0, 1602.0, 2553.0, 4103.0, 6533.0, 10699.0, 17317.0, 30160.0, 54205.0, 106913.0, 256848.0, 291579.0, 121150.0, 59288.0, 32801.0, 19163.0, 11678.0, 7125.0, 4465.0, 2722.0, 1739.0, 1070.0, 683.0, 473.0, 279.0, 177.0, 109.0, 88.0, 53.0, 30.0, 18.0, 15.0, 8.0, 5.0, 4.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.429931640625, -0.4156379699707031, -0.40134429931640625, -0.3870506286621094, -0.3727569580078125, -0.3584632873535156, -0.34416961669921875, -0.3298759460449219, -0.315582275390625, -0.3012886047363281, -0.28699493408203125, -0.2727012634277344, -0.2584075927734375, -0.24411392211914062, -0.22982025146484375, -0.21552658081054688, -0.20123291015625, -0.18693923950195312, -0.17264556884765625, -0.15835189819335938, -0.1440582275390625, -0.12976455688476562, -0.11547088623046875, -0.10117721557617188, -0.086883544921875, -0.07258987426757812, -0.05829620361328125, -0.044002532958984375, -0.0297088623046875, -0.015415191650390625, -0.00112152099609375, 0.013172149658203125, 0.0274658203125, 0.041759490966796875, 0.05605316162109375, 0.07034683227539062, 0.0846405029296875, 0.09893417358398438, 0.11322784423828125, 0.12752151489257812, 0.141815185546875, 0.15610885620117188, 0.17040252685546875, 0.18469619750976562, 0.1989898681640625, 0.21328353881835938, 0.22757720947265625, 0.24187088012695312, 0.25616455078125, 0.2704582214355469, 0.28475189208984375, 0.2990455627441406, 0.3133392333984375, 0.3276329040527344, 0.34192657470703125, 0.3562202453613281, 0.370513916015625, 0.3848075866699219, 0.39910125732421875, 0.4133949279785156, 0.4276885986328125, 0.4419822692871094, 0.45627593994140625, 0.4705696105957031, 0.48486328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 2.0, 5.0, 3.0, 3.0, 4.0, 8.0, 9.0, 15.0, 14.0, 12.0, 19.0, 18.0, 25.0, 21.0, 20.0, 37.0, 24.0, 26.0, 31.0, 49.0, 33.0, 48.0, 59.0, 63.0, 52.0, 39.0, 35.0, 42.0, 30.0, 37.0, 33.0, 26.0, 27.0, 19.0, 13.0, 17.0, 24.0, 11.0, 9.0, 10.0, 1.0, 9.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.362060546875, -0.3507881164550781, -0.33951568603515625, -0.3282432556152344, -0.3169708251953125, -0.3056983947753906, -0.29442596435546875, -0.2831535339355469, -0.271881103515625, -0.2606086730957031, -0.24933624267578125, -0.23806381225585938, -0.2267913818359375, -0.21551895141601562, -0.20424652099609375, -0.19297409057617188, -0.18170166015625, -0.17042922973632812, -0.15915679931640625, -0.14788436889648438, -0.1366119384765625, -0.12533950805664062, -0.11406707763671875, -0.10279464721679688, -0.091522216796875, -0.08024978637695312, -0.06897735595703125, -0.057704925537109375, -0.0464324951171875, -0.035160064697265625, -0.02388763427734375, -0.012615203857421875, -0.0013427734375, 0.009929656982421875, 0.02120208740234375, 0.032474517822265625, 0.0437469482421875, 0.055019378662109375, 0.06629180908203125, 0.07756423950195312, 0.088836669921875, 0.10010910034179688, 0.11138153076171875, 0.12265396118164062, 0.1339263916015625, 0.14519882202148438, 0.15647125244140625, 0.16774368286132812, 0.17901611328125, 0.19028854370117188, 0.20156097412109375, 0.21283340454101562, 0.2241058349609375, 0.23537826538085938, 0.24665069580078125, 0.2579231262207031, 0.269195556640625, 0.2804679870605469, 0.29174041748046875, 0.3030128479003906, 0.3142852783203125, 0.3255577087402344, 0.33683013916015625, 0.3481025695800781, 0.359375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 9.0, 10.0, 5.0, 11.0, 12.0, 13.0, 10.0, 12.0, 21.0, 18.0, 26.0, 27.0, 31.0, 22.0, 29.0, 36.0, 39.0, 32.0, 43.0, 39.0, 37.0, 47.0, 49.0, 38.0, 44.0, 38.0, 26.0, 30.0, 26.0, 31.0, 26.0, 25.0, 26.0, 17.0, 19.0, 12.0, 11.0, 13.0, 9.0, 7.0, 5.0, 6.0, 3.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-25.241376876831055, -24.456005096435547, -23.670635223388672, -22.885263442993164, -22.099891662597656, -21.31452178955078, -20.529150009155273, -19.743778228759766, -18.95840835571289, -18.173036575317383, -17.387666702270508, -16.602294921875, -15.816924095153809, -15.031553268432617, -14.24618148803711, -13.460810661315918, -12.675439834594727, -11.890069007873535, -11.104698181152344, -10.319326400756836, -9.533955574035645, -8.748584747314453, -7.9632134437561035, -7.177842140197754, -6.3924713134765625, -5.607100486755371, -4.8217291831970215, -4.036357879638672, -3.2509870529174805, -2.46561598777771, -1.6802449226379395, -0.8948736190795898, -0.10950469970703125, 0.6758663654327393, 1.4612374305725098, 2.2466084957122803, 3.031979560852051, 3.8173506259918213, 4.602721691131592, 5.388092994689941, 6.173463821411133, 6.958834648132324, 7.744205951690674, 8.529577255249023, 9.314948081970215, 10.100318908691406, 10.885690689086914, 11.671061515808105, 12.456432342529297, 13.241803169250488, 14.02717399597168, 14.812545776367188, 15.597916603088379, 16.38328742980957, 17.168659210205078, 17.954029083251953, 18.73940086364746, 19.52477264404297, 20.310142517089844, 21.09551429748535, 21.88088607788086, 22.666255950927734, 23.451627731323242, 24.23699951171875, 25.022369384765625]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 7.0, 2.0, 5.0, 7.0, 9.0, 11.0, 9.0, 16.0, 10.0, 14.0, 20.0, 28.0, 22.0, 26.0, 20.0, 27.0, 24.0, 40.0, 30.0, 44.0, 43.0, 37.0, 36.0, 40.0, 38.0, 29.0, 31.0, 42.0, 31.0, 36.0, 42.0, 28.0, 20.0, 31.0, 25.0, 18.0, 9.0, 16.0, 14.0, 17.0, 8.0, 13.0, 4.0, 6.0, 4.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.79856491088867, -38.59925079345703, -37.39993667602539, -36.20062255859375, -35.001312255859375, -33.801998138427734, -32.602684020996094, -31.403369903564453, -30.204055786132812, -29.004741668701172, -27.805429458618164, -26.606115341186523, -25.406801223754883, -24.207489013671875, -23.008174896240234, -21.808860778808594, -20.609548568725586, -19.410234451293945, -18.210922241210938, -17.011608123779297, -15.812294006347656, -14.612980842590332, -13.413667678833008, -12.214353561401367, -11.015040397644043, -9.815727233886719, -8.616413116455078, -7.417099952697754, -6.2177863121032715, -5.018472671508789, -3.819159507751465, -2.619845390319824, -1.4205322265625, -0.22121870517730713, 0.9780948162078857, 2.177408218383789, 3.3767218589782715, 4.576035499572754, 5.775348663330078, 6.974662780761719, 8.173975944519043, 9.373289108276367, 10.572603225708008, 11.771916389465332, 12.971229553222656, 14.170543670654297, 15.369856834411621, 16.569171905517578, 17.768484115600586, 18.967798233032227, 20.167110443115234, 21.366424560546875, 22.565738677978516, 23.765052795410156, 24.964365005493164, 26.163679122924805, 27.362991333007812, 28.562305450439453, 29.76161766052246, 30.9609317779541, 32.16024398803711, 33.35955810546875, 34.55887222290039, 35.75818634033203, 36.95750045776367]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 11.0, 11.0, 11.0, 15.0, 26.0, 36.0, 63.0, 122.0, 156.0, 323.0, 486.0, 868.0, 1576.0, 2606.0, 4553.0, 7560.0, 12158.0, 19973.0, 31181.0, 47581.0, 67404.0, 90449.0, 110471.0, 123016.0, 123287.0, 111906.0, 91616.0, 68601.0, 48515.0, 32162.0, 20544.0, 12535.0, 7664.0, 4532.0, 2716.0, 1595.0, 940.0, 544.0, 278.0, 185.0, 114.0, 62.0, 46.0, 23.0, 12.0, 10.0, 8.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-20.203125, -19.609375, -19.015625, -18.421875, -17.828125, -17.234375, -16.640625, -16.046875, -15.453125, -14.859375, -14.265625, -13.671875, -13.078125, -12.484375, -11.890625, -11.296875, -10.703125, -10.109375, -9.515625, -8.921875, -8.328125, -7.734375, -7.140625, -6.546875, -5.953125, -5.359375, -4.765625, -4.171875, -3.578125, -2.984375, -2.390625, -1.796875, -1.203125, -0.609375, -0.015625, 0.578125, 1.171875, 1.765625, 2.359375, 2.953125, 3.546875, 4.140625, 4.734375, 5.328125, 5.921875, 6.515625, 7.109375, 7.703125, 8.296875, 8.890625, 9.484375, 10.078125, 10.671875, 11.265625, 11.859375, 12.453125, 13.046875, 13.640625, 14.234375, 14.828125, 15.421875, 16.015625, 16.609375, 17.203125, 17.796875]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 8.0, 2.0, 5.0, 8.0, 9.0, 10.0, 11.0, 14.0, 10.0, 16.0, 23.0, 27.0, 23.0, 24.0, 20.0, 27.0, 33.0, 29.0, 32.0, 52.0, 37.0, 38.0, 35.0, 42.0, 37.0, 26.0, 31.0, 46.0, 27.0, 41.0, 41.0, 26.0, 27.0, 26.0, 21.0, 17.0, 10.0, 13.0, 16.0, 16.0, 10.0, 10.0, 5.0, 5.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-38.96875, -37.78857421875, -36.6083984375, -35.42822265625, -34.248046875, -33.06787109375, -31.8876953125, -30.70751953125, -29.52734375, -28.34716796875, -27.1669921875, -25.98681640625, -24.806640625, -23.62646484375, -22.4462890625, -21.26611328125, -20.0859375, -18.90576171875, -17.7255859375, -16.54541015625, -15.365234375, -14.18505859375, -13.0048828125, -11.82470703125, -10.64453125, -9.46435546875, -8.2841796875, -7.10400390625, -5.923828125, -4.74365234375, -3.5634765625, -2.38330078125, -1.203125, -0.02294921875, 1.1572265625, 2.33740234375, 3.517578125, 4.69775390625, 5.8779296875, 7.05810546875, 8.23828125, 9.41845703125, 10.5986328125, 11.77880859375, 12.958984375, 14.13916015625, 15.3193359375, 16.49951171875, 17.6796875, 18.85986328125, 20.0400390625, 21.22021484375, 22.400390625, 23.58056640625, 24.7607421875, 25.94091796875, 27.12109375, 28.30126953125, 29.4814453125, 30.66162109375, 31.841796875, 33.02197265625, 34.2021484375, 35.38232421875, 36.5625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 6.0, 3.0, 11.0, 20.0, 24.0, 39.0, 47.0, 88.0, 127.0, 199.0, 291.0, 393.0, 703.0, 990.0, 1502.0, 2125.0, 3370.0, 5037.0, 7777.0, 11365.0, 16910.0, 24383.0, 33978.0, 46625.0, 60987.0, 75712.0, 89798.0, 99080.0, 102308.0, 97595.0, 87936.0, 73736.0, 58410.0, 44463.0, 32377.0, 22609.0, 15676.0, 10589.0, 7136.0, 4703.0, 3172.0, 2136.0, 1351.0, 916.0, 594.0, 400.0, 288.0, 193.0, 117.0, 101.0, 67.0, 36.0, 25.0, 16.0, 4.0, 8.0, 7.0, 1.0, 2.0, 5.0], "bins": [-15.875, -15.38525390625, -14.8955078125, -14.40576171875, -13.916015625, -13.42626953125, -12.9365234375, -12.44677734375, -11.95703125, -11.46728515625, -10.9775390625, -10.48779296875, -9.998046875, -9.50830078125, -9.0185546875, -8.52880859375, -8.0390625, -7.54931640625, -7.0595703125, -6.56982421875, -6.080078125, -5.59033203125, -5.1005859375, -4.61083984375, -4.12109375, -3.63134765625, -3.1416015625, -2.65185546875, -2.162109375, -1.67236328125, -1.1826171875, -0.69287109375, -0.203125, 0.28662109375, 0.7763671875, 1.26611328125, 1.755859375, 2.24560546875, 2.7353515625, 3.22509765625, 3.71484375, 4.20458984375, 4.6943359375, 5.18408203125, 5.673828125, 6.16357421875, 6.6533203125, 7.14306640625, 7.6328125, 8.12255859375, 8.6123046875, 9.10205078125, 9.591796875, 10.08154296875, 10.5712890625, 11.06103515625, 11.55078125, 12.04052734375, 12.5302734375, 13.02001953125, 13.509765625, 13.99951171875, 14.4892578125, 14.97900390625, 15.46875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 4.0, 1.0, 9.0, 5.0, 7.0, 13.0, 18.0, 17.0, 14.0, 14.0, 16.0, 19.0, 21.0, 18.0, 32.0, 30.0, 29.0, 27.0, 47.0, 35.0, 49.0, 36.0, 43.0, 32.0, 46.0, 43.0, 37.0, 42.0, 36.0, 40.0, 25.0, 27.0, 30.0, 26.0, 10.0, 18.0, 21.0, 12.0, 9.0, 9.0, 6.0, 7.0, 2.0, 8.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.765625, -20.004638671875, -19.24365234375, -18.482666015625, -17.7216796875, -16.960693359375, -16.19970703125, -15.438720703125, -14.677734375, -13.916748046875, -13.15576171875, -12.394775390625, -11.6337890625, -10.872802734375, -10.11181640625, -9.350830078125, -8.58984375, -7.828857421875, -7.06787109375, -6.306884765625, -5.5458984375, -4.784912109375, -4.02392578125, -3.262939453125, -2.501953125, -1.740966796875, -0.97998046875, -0.218994140625, 0.5419921875, 1.302978515625, 2.06396484375, 2.824951171875, 3.5859375, 4.346923828125, 5.10791015625, 5.868896484375, 6.6298828125, 7.390869140625, 8.15185546875, 8.912841796875, 9.673828125, 10.434814453125, 11.19580078125, 11.956787109375, 12.7177734375, 13.478759765625, 14.23974609375, 15.000732421875, 15.76171875, 16.522705078125, 17.28369140625, 18.044677734375, 18.8056640625, 19.566650390625, 20.32763671875, 21.088623046875, 21.849609375, 22.610595703125, 23.37158203125, 24.132568359375, 24.8935546875, 25.654541015625, 26.41552734375, 27.176513671875, 27.9375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 11.0, 16.0, 14.0, 23.0, 35.0, 51.0, 59.0, 103.0, 143.0, 187.0, 326.0, 448.0, 727.0, 1116.0, 1856.0, 3323.0, 5457.0, 9891.0, 17466.0, 31091.0, 52468.0, 82921.0, 117712.0, 144372.0, 152389.0, 138007.0, 107339.0, 73816.0, 45573.0, 26514.0, 14581.0, 8444.0, 4806.0, 2751.0, 1665.0, 956.0, 619.0, 394.0, 288.0, 197.0, 125.0, 82.0, 67.0, 44.0, 25.0, 22.0, 15.0, 7.0, 5.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0], "bins": [-7.77734375, -7.544189453125, -7.31103515625, -7.077880859375, -6.8447265625, -6.611572265625, -6.37841796875, -6.145263671875, -5.912109375, -5.678955078125, -5.44580078125, -5.212646484375, -4.9794921875, -4.746337890625, -4.51318359375, -4.280029296875, -4.046875, -3.813720703125, -3.58056640625, -3.347412109375, -3.1142578125, -2.881103515625, -2.64794921875, -2.414794921875, -2.181640625, -1.948486328125, -1.71533203125, -1.482177734375, -1.2490234375, -1.015869140625, -0.78271484375, -0.549560546875, -0.31640625, -0.083251953125, 0.14990234375, 0.383056640625, 0.6162109375, 0.849365234375, 1.08251953125, 1.315673828125, 1.548828125, 1.781982421875, 2.01513671875, 2.248291015625, 2.4814453125, 2.714599609375, 2.94775390625, 3.180908203125, 3.4140625, 3.647216796875, 3.88037109375, 4.113525390625, 4.3466796875, 4.579833984375, 4.81298828125, 5.046142578125, 5.279296875, 5.512451171875, 5.74560546875, 5.978759765625, 6.2119140625, 6.445068359375, 6.67822265625, 6.911376953125, 7.14453125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 2.0, 6.0, 2.0, 9.0, 4.0, 12.0, 11.0, 14.0, 8.0, 12.0, 19.0, 18.0, 25.0, 24.0, 22.0, 32.0, 27.0, 47.0, 36.0, 32.0, 44.0, 38.0, 38.0, 26.0, 60.0, 47.0, 42.0, 33.0, 39.0, 32.0, 27.0, 22.0, 27.0, 19.0, 20.0, 21.0, 17.0, 21.0, 17.0, 10.0, 6.0, 6.0, 9.0, 8.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.000545501708984375, -0.000528581440448761, -0.000511661171913147, -0.000494740903377533, -0.00047782063484191895, -0.00046090036630630493, -0.0004439800977706909, -0.0004270598292350769, -0.0004101395606994629, -0.0003932192921638489, -0.00037629902362823486, -0.00035937875509262085, -0.00034245848655700684, -0.0003255382180213928, -0.0003086179494857788, -0.0002916976809501648, -0.0002747774124145508, -0.00025785714387893677, -0.00024093687534332275, -0.00022401660680770874, -0.00020709633827209473, -0.0001901760697364807, -0.0001732558012008667, -0.00015633553266525269, -0.00013941526412963867, -0.00012249499559402466, -0.00010557472705841064, -8.865445852279663e-05, -7.173418998718262e-05, -5.4813921451568604e-05, -3.789365291595459e-05, -2.0973384380340576e-05, -4.0531158447265625e-06, 1.2867152690887451e-05, 2.9787421226501465e-05, 4.670768976211548e-05, 6.362795829772949e-05, 8.05482268333435e-05, 9.746849536895752e-05, 0.00011438876390457153, 0.00013130903244018555, 0.00014822930097579956, 0.00016514956951141357, 0.0001820698380470276, 0.0001989901065826416, 0.00021591037511825562, 0.00023283064365386963, 0.00024975091218948364, 0.00026667118072509766, 0.00028359144926071167, 0.0003005117177963257, 0.0003174319863319397, 0.0003343522548675537, 0.0003512725234031677, 0.00036819279193878174, 0.00038511306047439575, 0.00040203332901000977, 0.0004189535975456238, 0.0004358738660812378, 0.0004527941346168518, 0.0004697144031524658, 0.00048663467168807983, 0.0005035549402236938, 0.0005204752087593079, 0.0005373954772949219]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 8.0, 8.0, 13.0, 20.0, 17.0, 26.0, 39.0, 56.0, 86.0, 129.0, 184.0, 300.0, 444.0, 632.0, 1012.0, 1662.0, 2611.0, 4542.0, 7858.0, 14356.0, 26869.0, 50386.0, 88696.0, 137330.0, 175854.0, 178561.0, 142843.0, 94470.0, 54252.0, 28972.0, 15494.0, 8446.0, 4679.0, 2801.0, 1736.0, 1098.0, 674.0, 429.0, 291.0, 199.0, 138.0, 104.0, 69.0, 45.0, 45.0, 26.0, 16.0, 9.0, 12.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-9.8671875, -9.5687255859375, -9.270263671875, -8.9718017578125, -8.67333984375, -8.3748779296875, -8.076416015625, -7.7779541015625, -7.4794921875, -7.1810302734375, -6.882568359375, -6.5841064453125, -6.28564453125, -5.9871826171875, -5.688720703125, -5.3902587890625, -5.091796875, -4.7933349609375, -4.494873046875, -4.1964111328125, -3.89794921875, -3.5994873046875, -3.301025390625, -3.0025634765625, -2.7041015625, -2.4056396484375, -2.107177734375, -1.8087158203125, -1.51025390625, -1.2117919921875, -0.913330078125, -0.6148681640625, -0.31640625, -0.0179443359375, 0.280517578125, 0.5789794921875, 0.87744140625, 1.1759033203125, 1.474365234375, 1.7728271484375, 2.0712890625, 2.3697509765625, 2.668212890625, 2.9666748046875, 3.26513671875, 3.5635986328125, 3.862060546875, 4.1605224609375, 4.458984375, 4.7574462890625, 5.055908203125, 5.3543701171875, 5.65283203125, 5.9512939453125, 6.249755859375, 6.5482177734375, 6.8466796875, 7.1451416015625, 7.443603515625, 7.7420654296875, 8.04052734375, 8.3389892578125, 8.637451171875, 8.9359130859375, 9.234375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 2.0, 6.0, 10.0, 10.0, 10.0, 18.0, 11.0, 16.0, 28.0, 24.0, 53.0, 61.0, 79.0, 77.0, 93.0, 75.0, 88.0, 87.0, 51.0, 44.0, 38.0, 16.0, 26.0, 13.0, 13.0, 12.0, 7.0, 7.0, 8.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.828125, -5.64215087890625, -5.4561767578125, -5.27020263671875, -5.084228515625, -4.89825439453125, -4.7122802734375, -4.52630615234375, -4.34033203125, -4.15435791015625, -3.9683837890625, -3.78240966796875, -3.596435546875, -3.41046142578125, -3.2244873046875, -3.03851318359375, -2.8525390625, -2.66656494140625, -2.4805908203125, -2.29461669921875, -2.108642578125, -1.92266845703125, -1.7366943359375, -1.55072021484375, -1.36474609375, -1.17877197265625, -0.9927978515625, -0.80682373046875, -0.620849609375, -0.43487548828125, -0.2489013671875, -0.06292724609375, 0.123046875, 0.30902099609375, 0.4949951171875, 0.68096923828125, 0.866943359375, 1.05291748046875, 1.2388916015625, 1.42486572265625, 1.61083984375, 1.79681396484375, 1.9827880859375, 2.16876220703125, 2.354736328125, 2.54071044921875, 2.7266845703125, 2.91265869140625, 3.0986328125, 3.28460693359375, 3.4705810546875, 3.65655517578125, 3.842529296875, 4.02850341796875, 4.2144775390625, 4.40045166015625, 4.58642578125, 4.77239990234375, 4.9583740234375, 5.14434814453125, 5.330322265625, 5.51629638671875, 5.7022705078125, 5.88824462890625, 6.07421875]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 2.0, 7.0, 5.0, 3.0, 9.0, 5.0, 14.0, 15.0, 16.0, 14.0, 15.0, 26.0, 30.0, 24.0, 21.0, 36.0, 30.0, 34.0, 30.0, 48.0, 44.0, 49.0, 43.0, 38.0, 43.0, 40.0, 47.0, 26.0, 32.0, 30.0, 37.0, 28.0, 21.0, 23.0, 24.0, 16.0, 19.0, 8.0, 11.0, 10.0, 6.0, 9.0, 3.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.88111114501953, -24.069246292114258, -23.257381439208984, -22.445514678955078, -21.633649826049805, -20.82178497314453, -20.009920120239258, -19.198055267333984, -18.386188507080078, -17.574323654174805, -16.76245880126953, -15.950592994689941, -15.138727188110352, -14.326862335205078, -13.514997482299805, -12.703132629394531, -11.891267776489258, -11.079402923583984, -10.267537117004395, -9.455672264099121, -8.643806457519531, -7.831941604614258, -7.020076751708984, -6.208211421966553, -5.396346092224121, -4.5844807624816895, -3.772615671157837, -2.9607505798339844, -2.1488852500915527, -1.337019920349121, -0.5251550674438477, 0.286710262298584, 1.0985736846923828, 1.910438895225525, 2.722304105758667, 3.5341691970825195, 4.346034526824951, 5.157899856567383, 5.969764709472656, 6.781630039215088, 7.5934953689575195, 8.405360221862793, 9.217226028442383, 10.029090881347656, 10.84095573425293, 11.65282154083252, 12.464686393737793, 13.276552200317383, 14.088417053222656, 14.90028190612793, 15.71214771270752, 16.52401351928711, 17.335878372192383, 18.147743225097656, 18.95960807800293, 19.771472930908203, 20.58333969116211, 21.395204544067383, 22.207069396972656, 23.018936157226562, 23.830801010131836, 24.64266586303711, 25.454530715942383, 26.266395568847656, 27.07826042175293]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 6.0, 4.0, 9.0, 7.0, 17.0, 19.0, 20.0, 14.0, 29.0, 32.0, 26.0, 23.0, 29.0, 37.0, 45.0, 41.0, 37.0, 32.0, 41.0, 50.0, 41.0, 44.0, 29.0, 36.0, 37.0, 35.0, 27.0, 28.0, 22.0, 26.0, 29.0, 22.0, 15.0, 13.0, 21.0, 10.0, 9.0, 8.0, 11.0, 3.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-48.78567886352539, -47.401756286621094, -46.0178337097168, -44.6339111328125, -43.2499885559082, -41.866065979003906, -40.482139587402344, -39.09822082519531, -37.71429443359375, -36.33037185668945, -34.946449279785156, -33.56252670288086, -32.17860412597656, -30.794681549072266, -29.410757064819336, -28.02683448791504, -26.642913818359375, -25.258991241455078, -23.87506866455078, -22.491146087646484, -21.107223510742188, -19.72330093383789, -18.33937644958496, -16.955453872680664, -15.571531295776367, -14.18760871887207, -12.803686141967773, -11.41976261138916, -10.035840034484863, -8.651917457580566, -7.267993927001953, -5.884071350097656, -4.500152587890625, -3.116229772567749, -1.732306957244873, -0.34838390350341797, 1.035538673400879, 2.419461250305176, 3.803384780883789, 5.187307357788086, 6.571229934692383, 7.95515251159668, 9.339075088500977, 10.72299861907959, 12.106921195983887, 13.490843772888184, 14.874767303466797, 16.258689880371094, 17.64261245727539, 19.026535034179688, 20.410457611083984, 21.79438018798828, 23.178302764892578, 24.562225341796875, 25.946149826049805, 27.3300724029541, 28.7139949798584, 30.097917556762695, 31.481840133666992, 32.86576461791992, 34.24968719482422, 35.633609771728516, 37.01753234863281, 38.40145492553711, 39.785377502441406]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 4.0, 11.0, 16.0, 21.0, 49.0, 78.0, 140.0, 216.0, 360.0, 536.0, 907.0, 1479.0, 2395.0, 3898.0, 6003.0, 9635.0, 15047.0, 23968.0, 35475.0, 53553.0, 78376.0, 112611.0, 153198.0, 205726.0, 260098.0, 314243.0, 360489.0, 387796.0, 392234.0, 372719.0, 333456.0, 282429.0, 224751.0, 172618.0, 126509.0, 89487.0, 61123.0, 41350.0, 26592.0, 17100.0, 10852.0, 6595.0, 3967.0, 2525.0, 1480.0, 925.0, 519.0, 293.0, 174.0, 114.0, 62.0, 33.0, 26.0, 13.0, 9.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.484375, -19.8271484375, -19.169921875, -18.5126953125, -17.85546875, -17.1982421875, -16.541015625, -15.8837890625, -15.2265625, -14.5693359375, -13.912109375, -13.2548828125, -12.59765625, -11.9404296875, -11.283203125, -10.6259765625, -9.96875, -9.3115234375, -8.654296875, -7.9970703125, -7.33984375, -6.6826171875, -6.025390625, -5.3681640625, -4.7109375, -4.0537109375, -3.396484375, -2.7392578125, -2.08203125, -1.4248046875, -0.767578125, -0.1103515625, 0.546875, 1.2041015625, 1.861328125, 2.5185546875, 3.17578125, 3.8330078125, 4.490234375, 5.1474609375, 5.8046875, 6.4619140625, 7.119140625, 7.7763671875, 8.43359375, 9.0908203125, 9.748046875, 10.4052734375, 11.0625, 11.7197265625, 12.376953125, 13.0341796875, 13.69140625, 14.3486328125, 15.005859375, 15.6630859375, 16.3203125, 16.9775390625, 17.634765625, 18.2919921875, 18.94921875, 19.6064453125, 20.263671875, 20.9208984375, 21.578125]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 5.0, 8.0, 14.0, 14.0, 22.0, 17.0, 27.0, 23.0, 26.0, 26.0, 27.0, 37.0, 42.0, 41.0, 38.0, 36.0, 34.0, 53.0, 41.0, 41.0, 36.0, 35.0, 38.0, 32.0, 30.0, 35.0, 23.0, 22.0, 34.0, 21.0, 18.0, 13.0, 18.0, 14.0, 11.0, 4.0, 12.0, 7.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-41.78125, -40.58447265625, -39.3876953125, -38.19091796875, -36.994140625, -35.79736328125, -34.6005859375, -33.40380859375, -32.20703125, -31.01025390625, -29.8134765625, -28.61669921875, -27.419921875, -26.22314453125, -25.0263671875, -23.82958984375, -22.6328125, -21.43603515625, -20.2392578125, -19.04248046875, -17.845703125, -16.64892578125, -15.4521484375, -14.25537109375, -13.05859375, -11.86181640625, -10.6650390625, -9.46826171875, -8.271484375, -7.07470703125, -5.8779296875, -4.68115234375, -3.484375, -2.28759765625, -1.0908203125, 0.10595703125, 1.302734375, 2.49951171875, 3.6962890625, 4.89306640625, 6.08984375, 7.28662109375, 8.4833984375, 9.68017578125, 10.876953125, 12.07373046875, 13.2705078125, 14.46728515625, 15.6640625, 16.86083984375, 18.0576171875, 19.25439453125, 20.451171875, 21.64794921875, 22.8447265625, 24.04150390625, 25.23828125, 26.43505859375, 27.6318359375, 28.82861328125, 30.025390625, 31.22216796875, 32.4189453125, 33.61572265625, 34.8125]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 13.0, 14.0, 16.0, 47.0, 65.0, 121.0, 189.0, 302.0, 511.0, 796.0, 1298.0, 2122.0, 3486.0, 5360.0, 8464.0, 12803.0, 19918.0, 29807.0, 44428.0, 63635.0, 87885.0, 119878.0, 156480.0, 198453.0, 242862.0, 282597.0, 316726.0, 337488.0, 345474.0, 337658.0, 313825.0, 280036.0, 239277.0, 195604.0, 154899.0, 117632.0, 86144.0, 61760.0, 43058.0, 28973.0, 19590.0, 12827.0, 8148.0, 5123.0, 3265.0, 2001.0, 1261.0, 799.0, 494.0, 236.0, 187.0, 104.0, 60.0, 39.0, 23.0, 13.0, 9.0, 9.0, 3.0], "bins": [-19.4375, -18.856689453125, -18.27587890625, -17.695068359375, -17.1142578125, -16.533447265625, -15.95263671875, -15.371826171875, -14.791015625, -14.210205078125, -13.62939453125, -13.048583984375, -12.4677734375, -11.886962890625, -11.30615234375, -10.725341796875, -10.14453125, -9.563720703125, -8.98291015625, -8.402099609375, -7.8212890625, -7.240478515625, -6.65966796875, -6.078857421875, -5.498046875, -4.917236328125, -4.33642578125, -3.755615234375, -3.1748046875, -2.593994140625, -2.01318359375, -1.432373046875, -0.8515625, -0.270751953125, 0.31005859375, 0.890869140625, 1.4716796875, 2.052490234375, 2.63330078125, 3.214111328125, 3.794921875, 4.375732421875, 4.95654296875, 5.537353515625, 6.1181640625, 6.698974609375, 7.27978515625, 7.860595703125, 8.44140625, 9.022216796875, 9.60302734375, 10.183837890625, 10.7646484375, 11.345458984375, 11.92626953125, 12.507080078125, 13.087890625, 13.668701171875, 14.24951171875, 14.830322265625, 15.4111328125, 15.991943359375, 16.57275390625, 17.153564453125, 17.734375]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 0.0, 4.0, 9.0, 9.0, 22.0, 31.0, 40.0, 47.0, 59.0, 55.0, 77.0, 101.0, 116.0, 139.0, 150.0, 202.0, 186.0, 179.0, 233.0, 206.0, 235.0, 250.0, 234.0, 217.0, 184.0, 189.0, 143.0, 136.0, 138.0, 89.0, 74.0, 69.0, 60.0, 50.0, 35.0, 32.0, 25.0, 18.0, 13.0, 5.0, 5.0, 9.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.4453125, -14.8629150390625, -14.280517578125, -13.6981201171875, -13.11572265625, -12.5333251953125, -11.950927734375, -11.3685302734375, -10.7861328125, -10.2037353515625, -9.621337890625, -9.0389404296875, -8.45654296875, -7.8741455078125, -7.291748046875, -6.7093505859375, -6.126953125, -5.5445556640625, -4.962158203125, -4.3797607421875, -3.79736328125, -3.2149658203125, -2.632568359375, -2.0501708984375, -1.4677734375, -0.8853759765625, -0.302978515625, 0.2794189453125, 0.86181640625, 1.4442138671875, 2.026611328125, 2.6090087890625, 3.19140625, 3.7738037109375, 4.356201171875, 4.9385986328125, 5.52099609375, 6.1033935546875, 6.685791015625, 7.2681884765625, 7.8505859375, 8.4329833984375, 9.015380859375, 9.5977783203125, 10.18017578125, 10.7625732421875, 11.344970703125, 11.9273681640625, 12.509765625, 13.0921630859375, 13.674560546875, 14.2569580078125, 14.83935546875, 15.4217529296875, 16.004150390625, 16.5865478515625, 17.1689453125, 17.7513427734375, 18.333740234375, 18.9161376953125, 19.49853515625, 20.0809326171875, 20.663330078125, 21.2457275390625, 21.828125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 6.0, 4.0, 3.0, 7.0, 13.0, 8.0, 16.0, 10.0, 9.0, 16.0, 23.0, 27.0, 20.0, 30.0, 31.0, 27.0, 32.0, 39.0, 45.0, 43.0, 37.0, 39.0, 52.0, 37.0, 45.0, 39.0, 36.0, 26.0, 25.0, 34.0, 33.0, 25.0, 23.0, 30.0, 25.0, 16.0, 15.0, 15.0, 5.0, 8.0, 8.0, 5.0, 8.0, 7.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-25.941373825073242, -25.001123428344727, -24.06087303161621, -23.120622634887695, -22.18037223815918, -21.240121841430664, -20.29987335205078, -19.359622955322266, -18.41937255859375, -17.479122161865234, -16.53887176513672, -15.598621368408203, -14.658370971679688, -13.718120574951172, -12.777871131896973, -11.837620735168457, -10.897369384765625, -9.95711898803711, -9.016868591308594, -8.076618194580078, -7.136368274688721, -6.196117877960205, -5.255867958068848, -4.315617561340332, -3.3753671646118164, -2.435116767883301, -1.4948666095733643, -0.5546164512634277, 0.3856339454650879, 1.3258843421936035, 2.266134262084961, 3.2063846588134766, 4.146636962890625, 5.086887359619141, 6.027137756347656, 6.967387676239014, 7.907638072967529, 8.847888946533203, 9.788138389587402, 10.728388786315918, 11.668639183044434, 12.60888957977295, 13.549139976501465, 14.489389419555664, 15.42963981628418, 16.369890213012695, 17.31014060974121, 18.250391006469727, 19.190641403198242, 20.130891799926758, 21.071142196655273, 22.01139259338379, 22.951642990112305, 23.89189338684082, 24.832141876220703, 25.77239227294922, 26.712642669677734, 27.65289306640625, 28.593143463134766, 29.53339385986328, 30.473644256591797, 31.413894653320312, 32.35414505004883, 33.294395446777344, 34.23464584350586]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 9.0, 5.0, 8.0, 11.0, 7.0, 12.0, 14.0, 17.0, 21.0, 22.0, 25.0, 27.0, 22.0, 23.0, 46.0, 33.0, 39.0, 43.0, 45.0, 41.0, 43.0, 42.0, 43.0, 43.0, 39.0, 38.0, 31.0, 28.0, 20.0, 30.0, 27.0, 22.0, 23.0, 19.0, 19.0, 9.0, 6.0, 14.0, 10.0, 7.0, 4.0, 6.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.83561325073242, -43.35862731933594, -41.88164138793945, -40.40465545654297, -38.927669525146484, -37.45068359375, -35.973697662353516, -34.49671173095703, -33.01972579956055, -31.542739868164062, -30.065753936767578, -28.588768005371094, -27.11178207397461, -25.634796142578125, -24.15781021118164, -22.680824279785156, -21.20383644104004, -19.726850509643555, -18.24986457824707, -16.772878646850586, -15.295892715454102, -13.818906784057617, -12.341919898986816, -10.864933967590332, -9.387948036193848, -7.910962104797363, -6.433976173400879, -4.956989765167236, -3.480003833770752, -2.0030179023742676, -0.526031494140625, 0.9509544372558594, 2.4279403686523438, 3.904926300048828, 5.3819122314453125, 6.858898639678955, 8.335884094238281, 9.812870025634766, 11.289856910705566, 12.76684284210205, 14.243828773498535, 15.72081470489502, 17.19780158996582, 18.674787521362305, 20.15177345275879, 21.628759384155273, 23.105745315551758, 24.582731246948242, 26.059717178344727, 27.53670310974121, 29.013689041137695, 30.49067497253418, 31.967660903930664, 33.44464874267578, 34.921634674072266, 36.39862060546875, 37.875606536865234, 39.35259246826172, 40.8295783996582, 42.30656433105469, 43.78355026245117, 45.260536193847656, 46.73752212524414, 48.214508056640625, 49.69149398803711]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 8.0, 10.0, 21.0, 20.0, 35.0, 56.0, 84.0, 116.0, 202.0, 301.0, 420.0, 687.0, 1041.0, 1757.0, 2747.0, 4551.0, 7846.0, 13715.0, 25422.0, 49033.0, 99748.0, 205138.0, 294646.0, 168478.0, 81768.0, 40461.0, 21165.0, 11707.0, 6744.0, 3996.0, 2468.0, 1413.0, 989.0, 604.0, 405.0, 238.0, 178.0, 129.0, 68.0, 48.0, 34.0, 18.0, 15.0, 9.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.734375, -3.61529541015625, -3.4962158203125, -3.37713623046875, -3.258056640625, -3.13897705078125, -3.0198974609375, -2.90081787109375, -2.78173828125, -2.66265869140625, -2.5435791015625, -2.42449951171875, -2.305419921875, -2.18634033203125, -2.0672607421875, -1.94818115234375, -1.8291015625, -1.71002197265625, -1.5909423828125, -1.47186279296875, -1.352783203125, -1.23370361328125, -1.1146240234375, -0.99554443359375, -0.87646484375, -0.75738525390625, -0.6383056640625, -0.51922607421875, -0.400146484375, -0.28106689453125, -0.1619873046875, -0.04290771484375, 0.076171875, 0.19525146484375, 0.3143310546875, 0.43341064453125, 0.552490234375, 0.67156982421875, 0.7906494140625, 0.90972900390625, 1.02880859375, 1.14788818359375, 1.2669677734375, 1.38604736328125, 1.505126953125, 1.62420654296875, 1.7432861328125, 1.86236572265625, 1.9814453125, 2.10052490234375, 2.2196044921875, 2.33868408203125, 2.457763671875, 2.57684326171875, 2.6959228515625, 2.81500244140625, 2.93408203125, 3.05316162109375, 3.1722412109375, 3.29132080078125, 3.410400390625, 3.52947998046875, 3.6485595703125, 3.76763916015625, 3.88671875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 8.0, 6.0, 8.0, 11.0, 7.0, 12.0, 14.0, 15.0, 22.0, 23.0, 25.0, 27.0, 22.0, 24.0, 43.0, 34.0, 39.0, 43.0, 45.0, 40.0, 44.0, 42.0, 45.0, 40.0, 41.0, 38.0, 30.0, 27.0, 21.0, 31.0, 26.0, 22.0, 22.0, 21.0, 18.0, 10.0, 6.0, 14.0, 9.0, 8.0, 4.0, 6.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.03125, -43.55517578125, -42.0791015625, -40.60302734375, -39.126953125, -37.65087890625, -36.1748046875, -34.69873046875, -33.22265625, -31.74658203125, -30.2705078125, -28.79443359375, -27.318359375, -25.84228515625, -24.3662109375, -22.89013671875, -21.4140625, -19.93798828125, -18.4619140625, -16.98583984375, -15.509765625, -14.03369140625, -12.5576171875, -11.08154296875, -9.60546875, -8.12939453125, -6.6533203125, -5.17724609375, -3.701171875, -2.22509765625, -0.7490234375, 0.72705078125, 2.203125, 3.67919921875, 5.1552734375, 6.63134765625, 8.107421875, 9.58349609375, 11.0595703125, 12.53564453125, 14.01171875, 15.48779296875, 16.9638671875, 18.43994140625, 19.916015625, 21.39208984375, 22.8681640625, 24.34423828125, 25.8203125, 27.29638671875, 28.7724609375, 30.24853515625, 31.724609375, 33.20068359375, 34.6767578125, 36.15283203125, 37.62890625, 39.10498046875, 40.5810546875, 42.05712890625, 43.533203125, 45.00927734375, 46.4853515625, 47.96142578125, 49.4375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 10.0, 17.0, 17.0, 19.0, 41.0, 59.0, 91.0, 150.0, 223.0, 367.0, 575.0, 893.0, 1512.0, 2687.0, 4818.0, 9399.0, 18315.0, 38435.0, 83823.0, 212181.0, 374328.0, 166625.0, 68543.0, 31948.0, 15307.0, 7946.0, 4263.0, 2400.0, 1381.0, 768.0, 514.0, 302.0, 210.0, 134.0, 85.0, 53.0, 43.0, 23.0, 17.0, 13.0, 5.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8671875, -5.69140625, -5.515625, -5.33984375, -5.1640625, -4.98828125, -4.8125, -4.63671875, -4.4609375, -4.28515625, -4.109375, -3.93359375, -3.7578125, -3.58203125, -3.40625, -3.23046875, -3.0546875, -2.87890625, -2.703125, -2.52734375, -2.3515625, -2.17578125, -2.0, -1.82421875, -1.6484375, -1.47265625, -1.296875, -1.12109375, -0.9453125, -0.76953125, -0.59375, -0.41796875, -0.2421875, -0.06640625, 0.109375, 0.28515625, 0.4609375, 0.63671875, 0.8125, 0.98828125, 1.1640625, 1.33984375, 1.515625, 1.69140625, 1.8671875, 2.04296875, 2.21875, 2.39453125, 2.5703125, 2.74609375, 2.921875, 3.09765625, 3.2734375, 3.44921875, 3.625, 3.80078125, 3.9765625, 4.15234375, 4.328125, 4.50390625, 4.6796875, 4.85546875, 5.03125, 5.20703125, 5.3828125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 7.0, 6.0, 2.0, 7.0, 7.0, 11.0, 13.0, 9.0, 13.0, 14.0, 15.0, 17.0, 18.0, 27.0, 22.0, 28.0, 38.0, 41.0, 30.0, 36.0, 42.0, 38.0, 39.0, 37.0, 43.0, 35.0, 29.0, 38.0, 27.0, 33.0, 30.0, 20.0, 36.0, 23.0, 23.0, 20.0, 12.0, 13.0, 16.0, 16.0, 13.0, 11.0, 10.0, 8.0, 8.0, 10.0, 7.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-26.453125, -25.602783203125, -24.75244140625, -23.902099609375, -23.0517578125, -22.201416015625, -21.35107421875, -20.500732421875, -19.650390625, -18.800048828125, -17.94970703125, -17.099365234375, -16.2490234375, -15.398681640625, -14.54833984375, -13.697998046875, -12.84765625, -11.997314453125, -11.14697265625, -10.296630859375, -9.4462890625, -8.595947265625, -7.74560546875, -6.895263671875, -6.044921875, -5.194580078125, -4.34423828125, -3.493896484375, -2.6435546875, -1.793212890625, -0.94287109375, -0.092529296875, 0.7578125, 1.608154296875, 2.45849609375, 3.308837890625, 4.1591796875, 5.009521484375, 5.85986328125, 6.710205078125, 7.560546875, 8.410888671875, 9.26123046875, 10.111572265625, 10.9619140625, 11.812255859375, 12.66259765625, 13.512939453125, 14.36328125, 15.213623046875, 16.06396484375, 16.914306640625, 17.7646484375, 18.614990234375, 19.46533203125, 20.315673828125, 21.166015625, 22.016357421875, 22.86669921875, 23.717041015625, 24.5673828125, 25.417724609375, 26.26806640625, 27.118408203125, 27.96875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 0.0, 7.0, 3.0, 8.0, 10.0, 16.0, 20.0, 36.0, 43.0, 55.0, 58.0, 90.0, 151.0, 188.0, 303.0, 475.0, 805.0, 1248.0, 2344.0, 4563.0, 10456.0, 28761.0, 104114.0, 494800.0, 301533.0, 63153.0, 19386.0, 7672.0, 3547.0, 1830.0, 1028.0, 628.0, 395.0, 245.0, 177.0, 111.0, 78.0, 61.0, 49.0, 22.0, 23.0, 14.0, 16.0, 8.0, 9.0, 6.0, 7.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.43798828125, -0.42464447021484375, -0.4113006591796875, -0.39795684814453125, -0.384613037109375, -0.37126922607421875, -0.3579254150390625, -0.34458160400390625, -0.33123779296875, -0.31789398193359375, -0.3045501708984375, -0.29120635986328125, -0.277862548828125, -0.26451873779296875, -0.2511749267578125, -0.23783111572265625, -0.2244873046875, -0.21114349365234375, -0.1977996826171875, -0.18445587158203125, -0.171112060546875, -0.15776824951171875, -0.1444244384765625, -0.13108062744140625, -0.11773681640625, -0.10439300537109375, -0.0910491943359375, -0.07770538330078125, -0.064361572265625, -0.05101776123046875, -0.0376739501953125, -0.02433013916015625, -0.010986328125, 0.00235748291015625, 0.0157012939453125, 0.02904510498046875, 0.042388916015625, 0.05573272705078125, 0.0690765380859375, 0.08242034912109375, 0.09576416015625, 0.10910797119140625, 0.1224517822265625, 0.13579559326171875, 0.149139404296875, 0.16248321533203125, 0.1758270263671875, 0.18917083740234375, 0.2025146484375, 0.21585845947265625, 0.2292022705078125, 0.24254608154296875, 0.255889892578125, 0.26923370361328125, 0.2825775146484375, 0.29592132568359375, 0.30926513671875, 0.32260894775390625, 0.3359527587890625, 0.34929656982421875, 0.362640380859375, 0.37598419189453125, 0.3893280029296875, 0.40267181396484375, 0.416015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 8.0, 13.0, 15.0, 24.0, 32.0, 45.0, 53.0, 67.0, 81.0, 74.0, 72.0, 83.0, 76.0, 75.0, 60.0, 65.0, 39.0, 31.0, 25.0, 24.0, 16.0, 10.0, 5.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0994415283203125e-05, -2.975575625896454e-05, -2.8517097234725952e-05, -2.7278438210487366e-05, -2.603977918624878e-05, -2.4801120162010193e-05, -2.3562461137771606e-05, -2.232380211353302e-05, -2.1085143089294434e-05, -1.9846484065055847e-05, -1.860782504081726e-05, -1.7369166016578674e-05, -1.6130506992340088e-05, -1.4891847968101501e-05, -1.3653188943862915e-05, -1.2414529919624329e-05, -1.1175870895385742e-05, -9.937211871147156e-06, -8.69855284690857e-06, -7.459893822669983e-06, -6.2212347984313965e-06, -4.98257577419281e-06, -3.7439167499542236e-06, -2.505257725715637e-06, -1.2665987014770508e-06, -2.7939677238464355e-08, 1.210719347000122e-06, 2.4493783712387085e-06, 3.688037395477295e-06, 4.926696419715881e-06, 6.165355443954468e-06, 7.404014468193054e-06, 8.64267349243164e-06, 9.881332516670227e-06, 1.1119991540908813e-05, 1.23586505651474e-05, 1.3597309589385986e-05, 1.4835968613624573e-05, 1.607462763786316e-05, 1.7313286662101746e-05, 1.8551945686340332e-05, 1.979060471057892e-05, 2.1029263734817505e-05, 2.226792275905609e-05, 2.3506581783294678e-05, 2.4745240807533264e-05, 2.598389983177185e-05, 2.7222558856010437e-05, 2.8461217880249023e-05, 2.969987690448761e-05, 3.0938535928726196e-05, 3.217719495296478e-05, 3.341585397720337e-05, 3.4654513001441956e-05, 3.589317202568054e-05, 3.713183104991913e-05, 3.8370490074157715e-05, 3.96091490983963e-05, 4.084780812263489e-05, 4.2086467146873474e-05, 4.332512617111206e-05, 4.456378519535065e-05, 4.5802444219589233e-05, 4.704110324382782e-05, 4.8279762268066406e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 6.0, 3.0, 10.0, 12.0, 21.0, 26.0, 34.0, 64.0, 82.0, 135.0, 243.0, 421.0, 574.0, 1064.0, 1703.0, 3026.0, 5357.0, 9899.0, 18656.0, 38799.0, 94153.0, 281260.0, 373676.0, 122483.0, 47917.0, 22333.0, 11727.0, 6209.0, 3541.0, 2092.0, 1140.0, 702.0, 438.0, 269.0, 155.0, 94.0, 78.0, 51.0, 33.0, 29.0, 18.0, 10.0, 6.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.505859375, -0.488494873046875, -0.47113037109375, -0.453765869140625, -0.4364013671875, -0.419036865234375, -0.40167236328125, -0.384307861328125, -0.366943359375, -0.349578857421875, -0.33221435546875, -0.314849853515625, -0.2974853515625, -0.280120849609375, -0.26275634765625, -0.245391845703125, -0.22802734375, -0.210662841796875, -0.19329833984375, -0.175933837890625, -0.1585693359375, -0.141204833984375, -0.12384033203125, -0.106475830078125, -0.089111328125, -0.071746826171875, -0.05438232421875, -0.037017822265625, -0.0196533203125, -0.002288818359375, 0.01507568359375, 0.032440185546875, 0.0498046875, 0.067169189453125, 0.08453369140625, 0.101898193359375, 0.1192626953125, 0.136627197265625, 0.15399169921875, 0.171356201171875, 0.188720703125, 0.206085205078125, 0.22344970703125, 0.240814208984375, 0.2581787109375, 0.275543212890625, 0.29290771484375, 0.310272216796875, 0.32763671875, 0.345001220703125, 0.36236572265625, 0.379730224609375, 0.3970947265625, 0.414459228515625, 0.43182373046875, 0.449188232421875, 0.466552734375, 0.483917236328125, 0.50128173828125, 0.518646240234375, 0.5360107421875, 0.553375244140625, 0.57073974609375, 0.588104248046875, 0.60546875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 4.0, 11.0, 9.0, 11.0, 10.0, 12.0, 12.0, 37.0, 38.0, 47.0, 61.0, 79.0, 84.0, 119.0, 96.0, 81.0, 65.0, 64.0, 49.0, 30.0, 14.0, 7.0, 12.0, 12.0, 11.0, 8.0, 9.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7177734375, -0.6976852416992188, -0.6775970458984375, -0.6575088500976562, -0.637420654296875, -0.6173324584960938, -0.5972442626953125, -0.5771560668945312, -0.55706787109375, -0.5369796752929688, -0.5168914794921875, -0.49680328369140625, -0.476715087890625, -0.45662689208984375, -0.4365386962890625, -0.41645050048828125, -0.3963623046875, -0.37627410888671875, -0.3561859130859375, -0.33609771728515625, -0.316009521484375, -0.29592132568359375, -0.2758331298828125, -0.25574493408203125, -0.23565673828125, -0.21556854248046875, -0.1954803466796875, -0.17539215087890625, -0.155303955078125, -0.13521575927734375, -0.1151275634765625, -0.09503936767578125, -0.074951171875, -0.05486297607421875, -0.0347747802734375, -0.01468658447265625, 0.005401611328125, 0.02548980712890625, 0.0455780029296875, 0.06566619873046875, 0.08575439453125, 0.10584259033203125, 0.1259307861328125, 0.14601898193359375, 0.166107177734375, 0.18619537353515625, 0.2062835693359375, 0.22637176513671875, 0.2464599609375, 0.26654815673828125, 0.2866363525390625, 0.30672454833984375, 0.326812744140625, 0.34690093994140625, 0.3669891357421875, 0.38707733154296875, 0.40716552734375, 0.42725372314453125, 0.4473419189453125, 0.46743011474609375, 0.487518310546875, 0.5076065063476562, 0.5276947021484375, 0.5477828979492188, 0.56787109375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 0.0, 4.0, 5.0, 6.0, 3.0, 14.0, 9.0, 15.0, 13.0, 5.0, 16.0, 22.0, 22.0, 28.0, 26.0, 35.0, 29.0, 28.0, 41.0, 38.0, 48.0, 32.0, 46.0, 45.0, 43.0, 41.0, 41.0, 41.0, 27.0, 23.0, 30.0, 36.0, 24.0, 27.0, 29.0, 23.0, 16.0, 19.0, 13.0, 4.0, 8.0, 9.0, 5.0, 7.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.16318130493164, -25.219078063964844, -24.274974822998047, -23.330869674682617, -22.38676643371582, -21.442663192749023, -20.498558044433594, -19.554454803466797, -18.6103515625, -17.666248321533203, -16.722145080566406, -15.778039932250977, -14.83393669128418, -13.889833450317383, -12.94572925567627, -12.001625061035156, -11.05752182006836, -10.113418579101562, -9.16931438446045, -8.225210189819336, -7.281106948852539, -6.337003231048584, -5.392899513244629, -4.448795795440674, -3.5046920776367188, -2.5605883598327637, -1.6164846420288086, -0.6723809242248535, 0.27172279357910156, 1.2158265113830566, 2.1599302291870117, 3.104033946990967, 4.048137664794922, 4.992241382598877, 5.936345100402832, 6.880448818206787, 7.824552536010742, 8.768655776977539, 9.712759971618652, 10.656864166259766, 11.600967407226562, 12.54507064819336, 13.489174842834473, 14.433279037475586, 15.377382278442383, 16.32148551940918, 17.26559066772461, 18.209693908691406, 19.153797149658203, 20.097900390625, 21.042003631591797, 21.986108779907227, 22.930212020874023, 23.87431526184082, 24.81842041015625, 25.762523651123047, 26.706626892089844, 27.65073013305664, 28.594833374023438, 29.538938522338867, 30.483041763305664, 31.42714500427246, 32.37125015258789, 33.31535339355469, 34.259456634521484]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 8.0, 6.0, 7.0, 12.0, 6.0, 12.0, 15.0, 16.0, 23.0, 21.0, 27.0, 26.0, 21.0, 26.0, 41.0, 35.0, 36.0, 45.0, 46.0, 41.0, 44.0, 40.0, 45.0, 42.0, 39.0, 36.0, 32.0, 30.0, 19.0, 30.0, 27.0, 21.0, 28.0, 14.0, 21.0, 8.0, 6.0, 14.0, 10.0, 7.0, 4.0, 7.0, 0.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.181785583496094, -43.699798583984375, -42.217811584472656, -40.73582458496094, -39.25383758544922, -37.7718505859375, -36.28986358642578, -34.80787658691406, -33.325889587402344, -31.843902587890625, -30.361915588378906, -28.879928588867188, -27.39794158935547, -25.91595458984375, -24.433969497680664, -22.951982498168945, -21.46999740600586, -19.98801040649414, -18.506023406982422, -17.024036407470703, -15.5420503616333, -14.060063362121582, -12.57807731628418, -11.096090316772461, -9.614103317260742, -8.132116317749023, -6.650129795074463, -5.168143272399902, -3.6861562728881836, -2.204169273376465, -0.7221832275390625, 0.7598037719726562, 2.2417945861816406, 3.7237813472747803, 5.20576810836792, 6.6877546310424805, 8.1697416305542, 9.651728630065918, 11.13371467590332, 12.615701675415039, 14.097688674926758, 15.579675674438477, 17.061662673950195, 18.54364776611328, 20.025634765625, 21.50762176513672, 22.989608764648438, 24.471595764160156, 25.953582763671875, 27.435569763183594, 28.917556762695312, 30.39954376220703, 31.88153076171875, 33.36351776123047, 34.84550476074219, 36.327491760253906, 37.809478759765625, 39.291465759277344, 40.77345275878906, 42.25543975830078, 43.7374267578125, 45.21941375732422, 46.70140075683594, 48.183387756347656, 49.66537094116211]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 3.0, 2.0, 6.0, 10.0, 21.0, 36.0, 52.0, 84.0, 132.0, 202.0, 354.0, 545.0, 891.0, 1395.0, 2238.0, 3659.0, 5972.0, 9270.0, 14340.0, 21545.0, 31799.0, 44929.0, 59991.0, 76242.0, 91069.0, 101570.0, 106547.0, 102953.0, 91799.0, 77881.0, 61131.0, 45793.0, 32803.0, 22373.0, 14790.0, 9584.0, 6248.0, 3955.0, 2494.0, 1471.0, 918.0, 560.0, 357.0, 212.0, 140.0, 73.0, 48.0, 27.0, 19.0, 10.0, 6.0, 4.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-15.8046875, -15.2872314453125, -14.769775390625, -14.2523193359375, -13.73486328125, -13.2174072265625, -12.699951171875, -12.1824951171875, -11.6650390625, -11.1475830078125, -10.630126953125, -10.1126708984375, -9.59521484375, -9.0777587890625, -8.560302734375, -8.0428466796875, -7.525390625, -7.0079345703125, -6.490478515625, -5.9730224609375, -5.45556640625, -4.9381103515625, -4.420654296875, -3.9031982421875, -3.3857421875, -2.8682861328125, -2.350830078125, -1.8333740234375, -1.31591796875, -0.7984619140625, -0.281005859375, 0.2364501953125, 0.75390625, 1.2713623046875, 1.788818359375, 2.3062744140625, 2.82373046875, 3.3411865234375, 3.858642578125, 4.3760986328125, 4.8935546875, 5.4110107421875, 5.928466796875, 6.4459228515625, 6.96337890625, 7.4808349609375, 7.998291015625, 8.5157470703125, 9.033203125, 9.5506591796875, 10.068115234375, 10.5855712890625, 11.10302734375, 11.6204833984375, 12.137939453125, 12.6553955078125, 13.1728515625, 13.6903076171875, 14.207763671875, 14.7252197265625, 15.24267578125, 15.7601318359375, 16.277587890625, 16.7950439453125, 17.3125]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 6.0, 7.0, 6.0, 14.0, 6.0, 11.0, 14.0, 16.0, 23.0, 22.0, 29.0, 22.0, 27.0, 21.0, 44.0, 33.0, 38.0, 47.0, 43.0, 44.0, 44.0, 37.0, 48.0, 41.0, 40.0, 35.0, 33.0, 29.0, 21.0, 30.0, 25.0, 24.0, 24.0, 16.0, 19.0, 8.0, 5.0, 14.0, 10.0, 7.0, 5.0, 6.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.625, -43.1591796875, -41.693359375, -40.2275390625, -38.76171875, -37.2958984375, -35.830078125, -34.3642578125, -32.8984375, -31.4326171875, -29.966796875, -28.5009765625, -27.03515625, -25.5693359375, -24.103515625, -22.6376953125, -21.171875, -19.7060546875, -18.240234375, -16.7744140625, -15.30859375, -13.8427734375, -12.376953125, -10.9111328125, -9.4453125, -7.9794921875, -6.513671875, -5.0478515625, -3.58203125, -2.1162109375, -0.650390625, 0.8154296875, 2.28125, 3.7470703125, 5.212890625, 6.6787109375, 8.14453125, 9.6103515625, 11.076171875, 12.5419921875, 14.0078125, 15.4736328125, 16.939453125, 18.4052734375, 19.87109375, 21.3369140625, 22.802734375, 24.2685546875, 25.734375, 27.2001953125, 28.666015625, 30.1318359375, 31.59765625, 33.0634765625, 34.529296875, 35.9951171875, 37.4609375, 38.9267578125, 40.392578125, 41.8583984375, 43.32421875, 44.7900390625, 46.255859375, 47.7216796875, 49.1875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 3.0, 10.0, 19.0, 38.0, 45.0, 76.0, 112.0, 176.0, 319.0, 484.0, 750.0, 1193.0, 1866.0, 2878.0, 4352.0, 6897.0, 10193.0, 15295.0, 22355.0, 31726.0, 43807.0, 58530.0, 73634.0, 88544.0, 98415.0, 103420.0, 100350.0, 91134.0, 76878.0, 61345.0, 46824.0, 34099.0, 24090.0, 16685.0, 11230.0, 7454.0, 4777.0, 3083.0, 1968.0, 1249.0, 788.0, 526.0, 365.0, 203.0, 140.0, 86.0, 61.0, 35.0, 21.0, 15.0, 7.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.890625, -16.37255859375, -15.8544921875, -15.33642578125, -14.818359375, -14.30029296875, -13.7822265625, -13.26416015625, -12.74609375, -12.22802734375, -11.7099609375, -11.19189453125, -10.673828125, -10.15576171875, -9.6376953125, -9.11962890625, -8.6015625, -8.08349609375, -7.5654296875, -7.04736328125, -6.529296875, -6.01123046875, -5.4931640625, -4.97509765625, -4.45703125, -3.93896484375, -3.4208984375, -2.90283203125, -2.384765625, -1.86669921875, -1.3486328125, -0.83056640625, -0.3125, 0.20556640625, 0.7236328125, 1.24169921875, 1.759765625, 2.27783203125, 2.7958984375, 3.31396484375, 3.83203125, 4.35009765625, 4.8681640625, 5.38623046875, 5.904296875, 6.42236328125, 6.9404296875, 7.45849609375, 7.9765625, 8.49462890625, 9.0126953125, 9.53076171875, 10.048828125, 10.56689453125, 11.0849609375, 11.60302734375, 12.12109375, 12.63916015625, 13.1572265625, 13.67529296875, 14.193359375, 14.71142578125, 15.2294921875, 15.74755859375, 16.265625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 2.0, 5.0, 0.0, 4.0, 3.0, 15.0, 13.0, 14.0, 15.0, 18.0, 17.0, 26.0, 18.0, 25.0, 43.0, 29.0, 44.0, 40.0, 46.0, 45.0, 50.0, 32.0, 45.0, 36.0, 40.0, 35.0, 30.0, 38.0, 41.0, 24.0, 34.0, 26.0, 28.0, 18.0, 24.0, 19.0, 8.0, 11.0, 7.0, 13.0, 5.0, 6.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.953125, -27.006103515625, -26.05908203125, -25.112060546875, -24.1650390625, -23.218017578125, -22.27099609375, -21.323974609375, -20.376953125, -19.429931640625, -18.48291015625, -17.535888671875, -16.5888671875, -15.641845703125, -14.69482421875, -13.747802734375, -12.80078125, -11.853759765625, -10.90673828125, -9.959716796875, -9.0126953125, -8.065673828125, -7.11865234375, -6.171630859375, -5.224609375, -4.277587890625, -3.33056640625, -2.383544921875, -1.4365234375, -0.489501953125, 0.45751953125, 1.404541015625, 2.3515625, 3.298583984375, 4.24560546875, 5.192626953125, 6.1396484375, 7.086669921875, 8.03369140625, 8.980712890625, 9.927734375, 10.874755859375, 11.82177734375, 12.768798828125, 13.7158203125, 14.662841796875, 15.60986328125, 16.556884765625, 17.50390625, 18.450927734375, 19.39794921875, 20.344970703125, 21.2919921875, 22.239013671875, 23.18603515625, 24.133056640625, 25.080078125, 26.027099609375, 26.97412109375, 27.921142578125, 28.8681640625, 29.815185546875, 30.76220703125, 31.709228515625, 32.65625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 16.0, 19.0, 20.0, 42.0, 55.0, 86.0, 132.0, 222.0, 371.0, 613.0, 929.0, 1442.0, 2419.0, 3770.0, 5897.0, 9205.0, 14022.0, 20679.0, 29627.0, 40594.0, 54131.0, 67814.0, 81032.0, 91937.0, 98201.0, 98129.0, 91608.0, 81711.0, 68614.0, 54110.0, 40694.0, 29578.0, 20795.0, 14264.0, 9425.0, 6006.0, 3893.0, 2343.0, 1571.0, 936.0, 586.0, 394.0, 258.0, 139.0, 94.0, 42.0, 37.0, 18.0, 18.0, 7.0, 6.0, 2.0, 2.0, 5.0, 0.0, 2.0], "bins": [-5.16015625, -5.00384521484375, -4.8475341796875, -4.69122314453125, -4.534912109375, -4.37860107421875, -4.2222900390625, -4.06597900390625, -3.90966796875, -3.75335693359375, -3.5970458984375, -3.44073486328125, -3.284423828125, -3.12811279296875, -2.9718017578125, -2.81549072265625, -2.6591796875, -2.50286865234375, -2.3465576171875, -2.19024658203125, -2.033935546875, -1.87762451171875, -1.7213134765625, -1.56500244140625, -1.40869140625, -1.25238037109375, -1.0960693359375, -0.93975830078125, -0.783447265625, -0.62713623046875, -0.4708251953125, -0.31451416015625, -0.158203125, -0.00189208984375, 0.1544189453125, 0.31072998046875, 0.467041015625, 0.62335205078125, 0.7796630859375, 0.93597412109375, 1.09228515625, 1.24859619140625, 1.4049072265625, 1.56121826171875, 1.717529296875, 1.87384033203125, 2.0301513671875, 2.18646240234375, 2.3427734375, 2.49908447265625, 2.6553955078125, 2.81170654296875, 2.968017578125, 3.12432861328125, 3.2806396484375, 3.43695068359375, 3.59326171875, 3.74957275390625, 3.9058837890625, 4.06219482421875, 4.218505859375, 4.37481689453125, 4.5311279296875, 4.68743896484375, 4.84375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 5.0, 5.0, 7.0, 13.0, 6.0, 11.0, 9.0, 18.0, 14.0, 28.0, 16.0, 35.0, 32.0, 38.0, 40.0, 50.0, 42.0, 52.0, 39.0, 38.0, 44.0, 43.0, 50.0, 39.0, 43.0, 29.0, 21.0, 37.0, 27.0, 31.0, 24.0, 19.0, 19.0, 14.0, 13.0, 13.0, 3.0, 10.0, 4.0, 5.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0006160736083984375, -0.0005959570407867432, -0.0005758404731750488, -0.0005557239055633545, -0.0005356073379516602, -0.0005154907703399658, -0.0004953742027282715, -0.00047525763511657715, -0.0004551410675048828, -0.0004350244998931885, -0.00041490793228149414, -0.0003947913646697998, -0.00037467479705810547, -0.00035455822944641113, -0.0003344416618347168, -0.00031432509422302246, -0.0002942085266113281, -0.0002740919589996338, -0.00025397539138793945, -0.00023385882377624512, -0.00021374225616455078, -0.00019362568855285645, -0.0001735091209411621, -0.00015339255332946777, -0.00013327598571777344, -0.0001131594181060791, -9.304285049438477e-05, -7.292628288269043e-05, -5.2809715270996094e-05, -3.269314765930176e-05, -1.2576580047607422e-05, 7.539987564086914e-06, 2.765655517578125e-05, 4.7773122787475586e-05, 6.788969039916992e-05, 8.800625801086426e-05, 0.0001081228256225586, 0.00012823939323425293, 0.00014835596084594727, 0.0001684725284576416, 0.00018858909606933594, 0.00020870566368103027, 0.0002288222312927246, 0.00024893879890441895, 0.0002690553665161133, 0.0002891719341278076, 0.00030928850173950195, 0.0003294050693511963, 0.0003495216369628906, 0.00036963820457458496, 0.0003897547721862793, 0.00040987133979797363, 0.00042998790740966797, 0.0004501044750213623, 0.00047022104263305664, 0.000490337610244751, 0.0005104541778564453, 0.0005305707454681396, 0.000550687313079834, 0.0005708038806915283, 0.0005909204483032227, 0.000611037015914917, 0.0006311535835266113, 0.0006512701511383057, 0.00067138671875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 19.0, 27.0, 30.0, 34.0, 71.0, 109.0, 173.0, 295.0, 432.0, 696.0, 1000.0, 1638.0, 2640.0, 4285.0, 6929.0, 11091.0, 17288.0, 26659.0, 38816.0, 54880.0, 73134.0, 91370.0, 105404.0, 112383.0, 110373.0, 99886.0, 82983.0, 65109.0, 47377.0, 33218.0, 22015.0, 14021.0, 9057.0, 5516.0, 3504.0, 2250.0, 1388.0, 910.0, 535.0, 338.0, 218.0, 173.0, 112.0, 51.0, 34.0, 36.0, 22.0, 7.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.86328125, -5.67279052734375, -5.4822998046875, -5.29180908203125, -5.101318359375, -4.91082763671875, -4.7203369140625, -4.52984619140625, -4.33935546875, -4.14886474609375, -3.9583740234375, -3.76788330078125, -3.577392578125, -3.38690185546875, -3.1964111328125, -3.00592041015625, -2.8154296875, -2.62493896484375, -2.4344482421875, -2.24395751953125, -2.053466796875, -1.86297607421875, -1.6724853515625, -1.48199462890625, -1.29150390625, -1.10101318359375, -0.9105224609375, -0.72003173828125, -0.529541015625, -0.33905029296875, -0.1485595703125, 0.04193115234375, 0.232421875, 0.42291259765625, 0.6134033203125, 0.80389404296875, 0.994384765625, 1.18487548828125, 1.3753662109375, 1.56585693359375, 1.75634765625, 1.94683837890625, 2.1373291015625, 2.32781982421875, 2.518310546875, 2.70880126953125, 2.8992919921875, 3.08978271484375, 3.2802734375, 3.47076416015625, 3.6612548828125, 3.85174560546875, 4.042236328125, 4.23272705078125, 4.4232177734375, 4.61370849609375, 4.80419921875, 4.99468994140625, 5.1851806640625, 5.37567138671875, 5.566162109375, 5.75665283203125, 5.9471435546875, 6.13763427734375, 6.328125]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 7.0, 10.0, 15.0, 12.0, 12.0, 18.0, 29.0, 31.0, 32.0, 40.0, 54.0, 35.0, 54.0, 56.0, 50.0, 50.0, 47.0, 57.0, 50.0, 54.0, 44.0, 39.0, 39.0, 29.0, 26.0, 24.0, 13.0, 12.0, 10.0, 13.0, 5.0, 7.0, 6.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0390625, -3.902587890625, -3.76611328125, -3.629638671875, -3.4931640625, -3.356689453125, -3.22021484375, -3.083740234375, -2.947265625, -2.810791015625, -2.67431640625, -2.537841796875, -2.4013671875, -2.264892578125, -2.12841796875, -1.991943359375, -1.85546875, -1.718994140625, -1.58251953125, -1.446044921875, -1.3095703125, -1.173095703125, -1.03662109375, -0.900146484375, -0.763671875, -0.627197265625, -0.49072265625, -0.354248046875, -0.2177734375, -0.081298828125, 0.05517578125, 0.191650390625, 0.328125, 0.464599609375, 0.60107421875, 0.737548828125, 0.8740234375, 1.010498046875, 1.14697265625, 1.283447265625, 1.419921875, 1.556396484375, 1.69287109375, 1.829345703125, 1.9658203125, 2.102294921875, 2.23876953125, 2.375244140625, 2.51171875, 2.648193359375, 2.78466796875, 2.921142578125, 3.0576171875, 3.194091796875, 3.33056640625, 3.467041015625, 3.603515625, 3.739990234375, 3.87646484375, 4.012939453125, 4.1494140625, 4.285888671875, 4.42236328125, 4.558837890625, 4.6953125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 4.0, 6.0, 7.0, 8.0, 13.0, 13.0, 13.0, 17.0, 11.0, 18.0, 22.0, 33.0, 31.0, 29.0, 36.0, 39.0, 42.0, 46.0, 39.0, 37.0, 51.0, 32.0, 48.0, 34.0, 40.0, 34.0, 35.0, 24.0, 36.0, 33.0, 24.0, 22.0, 20.0, 12.0, 20.0, 15.0, 13.0, 7.0, 8.0, 4.0, 8.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-26.285898208618164, -25.34469985961914, -24.403501510620117, -23.462303161621094, -22.52110481262207, -21.579906463623047, -20.638710021972656, -19.697509765625, -18.75631332397461, -17.815114974975586, -16.873916625976562, -15.932718276977539, -14.991519927978516, -14.050321578979492, -13.109124183654785, -12.167925834655762, -11.226726531982422, -10.285528182983398, -9.344329833984375, -8.403131484985352, -7.461933612823486, -6.520735263824463, -5.579537391662598, -4.638339042663574, -3.697140693664551, -2.7559423446655273, -1.814744234085083, -0.8735461235046387, 0.06765222549438477, 1.0088505744934082, 1.9500484466552734, 2.891246795654297, 3.832447052001953, 4.773645401000977, 5.71484375, 6.656041622161865, 7.597239971160889, 8.53843879699707, 9.479636192321777, 10.4208345413208, 11.362032890319824, 12.303231239318848, 13.244429588317871, 14.185626983642578, 15.126825332641602, 16.068023681640625, 17.00922203063965, 17.950420379638672, 18.891618728637695, 19.83281707763672, 20.774015426635742, 21.715213775634766, 22.65641212463379, 23.597610473632812, 24.538806915283203, 25.48000717163086, 26.42120361328125, 27.362401962280273, 28.303600311279297, 29.24479866027832, 30.185997009277344, 31.127195358276367, 32.06839370727539, 33.00959014892578, 33.95079040527344]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 5.0, 4.0, 7.0, 4.0, 5.0, 7.0, 11.0, 16.0, 17.0, 17.0, 22.0, 19.0, 35.0, 27.0, 27.0, 29.0, 30.0, 36.0, 36.0, 51.0, 54.0, 42.0, 38.0, 31.0, 53.0, 39.0, 39.0, 36.0, 31.0, 38.0, 22.0, 24.0, 28.0, 18.0, 22.0, 18.0, 17.0, 14.0, 11.0, 9.0, 3.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-53.528202056884766, -51.900970458984375, -50.27373504638672, -48.64650344848633, -47.01926803588867, -45.39203643798828, -43.764801025390625, -42.137569427490234, -40.510337829589844, -38.88310623168945, -37.2558708190918, -35.628639221191406, -34.00140380859375, -32.37417221069336, -30.746938705444336, -29.119705200195312, -27.49247169494629, -25.865238189697266, -24.238004684448242, -22.61077117919922, -20.983539581298828, -19.356306076049805, -17.72907257080078, -16.10184097290039, -14.47460651397705, -12.847373008728027, -11.22014045715332, -9.592906951904297, -7.965673923492432, -6.338440895080566, -4.711207389831543, -3.083974838256836, -1.4567413330078125, 0.17049181461334229, 1.797724962234497, 3.4249582290649414, 5.052191257476807, 6.679424285888672, 8.306657791137695, 9.933890342712402, 11.561123847961426, 13.18835735321045, 14.815589904785156, 16.44282341003418, 18.070056915283203, 19.697288513183594, 21.32452392578125, 22.95175552368164, 24.578989028930664, 26.206222534179688, 27.83345603942871, 29.460689544677734, 31.087921142578125, 32.71515655517578, 34.34238815307617, 35.96961975097656, 37.59685516357422, 39.22408676147461, 40.851322174072266, 42.478553771972656, 44.10578918457031, 45.7330207824707, 47.360252380371094, 48.98748779296875, 50.61471939086914]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 9.0, 13.0, 33.0, 43.0, 93.0, 126.0, 209.0, 389.0, 693.0, 1144.0, 1920.0, 3300.0, 5343.0, 8878.0, 14150.0, 23172.0, 36420.0, 56711.0, 85452.0, 124840.0, 175378.0, 235394.0, 297001.0, 356504.0, 398814.0, 417356.0, 408673.0, 372229.0, 318337.0, 254426.0, 192789.0, 138984.0, 96317.0, 63277.0, 40998.0, 25533.0, 15790.0, 9591.0, 5816.0, 3364.0, 1938.0, 1186.0, 732.0, 395.0, 226.0, 136.0, 62.0, 45.0, 30.0, 15.0, 14.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-26.75, -25.930419921875, -25.11083984375, -24.291259765625, -23.4716796875, -22.652099609375, -21.83251953125, -21.012939453125, -20.193359375, -19.373779296875, -18.55419921875, -17.734619140625, -16.9150390625, -16.095458984375, -15.27587890625, -14.456298828125, -13.63671875, -12.817138671875, -11.99755859375, -11.177978515625, -10.3583984375, -9.538818359375, -8.71923828125, -7.899658203125, -7.080078125, -6.260498046875, -5.44091796875, -4.621337890625, -3.8017578125, -2.982177734375, -2.16259765625, -1.343017578125, -0.5234375, 0.296142578125, 1.11572265625, 1.935302734375, 2.7548828125, 3.574462890625, 4.39404296875, 5.213623046875, 6.033203125, 6.852783203125, 7.67236328125, 8.491943359375, 9.3115234375, 10.131103515625, 10.95068359375, 11.770263671875, 12.58984375, 13.409423828125, 14.22900390625, 15.048583984375, 15.8681640625, 16.687744140625, 17.50732421875, 18.326904296875, 19.146484375, 19.966064453125, 20.78564453125, 21.605224609375, 22.4248046875, 23.244384765625, 24.06396484375, 24.883544921875, 25.703125]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 4.0, 9.0, 6.0, 2.0, 9.0, 12.0, 18.0, 15.0, 20.0, 20.0, 21.0, 34.0, 31.0, 23.0, 40.0, 25.0, 37.0, 39.0, 58.0, 48.0, 42.0, 37.0, 33.0, 48.0, 40.0, 36.0, 34.0, 38.0, 33.0, 20.0, 28.0, 22.0, 21.0, 21.0, 18.0, 15.0, 8.0, 12.0, 7.0, 4.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-47.96875, -46.501953125, -45.03515625, -43.568359375, -42.1015625, -40.634765625, -39.16796875, -37.701171875, -36.234375, -34.767578125, -33.30078125, -31.833984375, -30.3671875, -28.900390625, -27.43359375, -25.966796875, -24.5, -23.033203125, -21.56640625, -20.099609375, -18.6328125, -17.166015625, -15.69921875, -14.232421875, -12.765625, -11.298828125, -9.83203125, -8.365234375, -6.8984375, -5.431640625, -3.96484375, -2.498046875, -1.03125, 0.435546875, 1.90234375, 3.369140625, 4.8359375, 6.302734375, 7.76953125, 9.236328125, 10.703125, 12.169921875, 13.63671875, 15.103515625, 16.5703125, 18.037109375, 19.50390625, 20.970703125, 22.4375, 23.904296875, 25.37109375, 26.837890625, 28.3046875, 29.771484375, 31.23828125, 32.705078125, 34.171875, 35.638671875, 37.10546875, 38.572265625, 40.0390625, 41.505859375, 42.97265625, 44.439453125, 45.90625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 12.0, 21.0, 42.0, 84.0, 140.0, 284.0, 513.0, 835.0, 1574.0, 2699.0, 4824.0, 8420.0, 14773.0, 24847.0, 40696.0, 64670.0, 99124.0, 145815.0, 203848.0, 269010.0, 335236.0, 390488.0, 424949.0, 428556.0, 403485.0, 353390.0, 289083.0, 223121.0, 162431.0, 111977.0, 73868.0, 47075.0, 28578.0, 17054.0, 9801.0, 5722.0, 3235.0, 1798.0, 1053.0, 506.0, 297.0, 173.0, 82.0, 45.0, 25.0, 19.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-30.09375, -29.237548828125, -28.38134765625, -27.525146484375, -26.6689453125, -25.812744140625, -24.95654296875, -24.100341796875, -23.244140625, -22.387939453125, -21.53173828125, -20.675537109375, -19.8193359375, -18.963134765625, -18.10693359375, -17.250732421875, -16.39453125, -15.538330078125, -14.68212890625, -13.825927734375, -12.9697265625, -12.113525390625, -11.25732421875, -10.401123046875, -9.544921875, -8.688720703125, -7.83251953125, -6.976318359375, -6.1201171875, -5.263916015625, -4.40771484375, -3.551513671875, -2.6953125, -1.839111328125, -0.98291015625, -0.126708984375, 0.7294921875, 1.585693359375, 2.44189453125, 3.298095703125, 4.154296875, 5.010498046875, 5.86669921875, 6.722900390625, 7.5791015625, 8.435302734375, 9.29150390625, 10.147705078125, 11.00390625, 11.860107421875, 12.71630859375, 13.572509765625, 14.4287109375, 15.284912109375, 16.14111328125, 16.997314453125, 17.853515625, 18.709716796875, 19.56591796875, 20.422119140625, 21.2783203125, 22.134521484375, 22.99072265625, 23.846923828125, 24.703125]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 3.0, 7.0, 12.0, 22.0, 20.0, 25.0, 36.0, 43.0, 54.0, 69.0, 80.0, 85.0, 121.0, 112.0, 117.0, 156.0, 159.0, 167.0, 177.0, 183.0, 216.0, 208.0, 180.0, 186.0, 205.0, 165.0, 184.0, 160.0, 155.0, 127.0, 120.0, 99.0, 81.0, 82.0, 53.0, 33.0, 35.0, 32.0, 18.0, 23.0, 16.0, 6.0, 10.0, 6.0, 5.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-20.09375, -19.48046875, -18.8671875, -18.25390625, -17.640625, -17.02734375, -16.4140625, -15.80078125, -15.1875, -14.57421875, -13.9609375, -13.34765625, -12.734375, -12.12109375, -11.5078125, -10.89453125, -10.28125, -9.66796875, -9.0546875, -8.44140625, -7.828125, -7.21484375, -6.6015625, -5.98828125, -5.375, -4.76171875, -4.1484375, -3.53515625, -2.921875, -2.30859375, -1.6953125, -1.08203125, -0.46875, 0.14453125, 0.7578125, 1.37109375, 1.984375, 2.59765625, 3.2109375, 3.82421875, 4.4375, 5.05078125, 5.6640625, 6.27734375, 6.890625, 7.50390625, 8.1171875, 8.73046875, 9.34375, 9.95703125, 10.5703125, 11.18359375, 11.796875, 12.41015625, 13.0234375, 13.63671875, 14.25, 14.86328125, 15.4765625, 16.08984375, 16.703125, 17.31640625, 17.9296875, 18.54296875, 19.15625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 2.0, 1.0, 8.0, 2.0, 6.0, 10.0, 11.0, 9.0, 13.0, 13.0, 23.0, 26.0, 29.0, 30.0, 38.0, 39.0, 34.0, 51.0, 37.0, 46.0, 42.0, 47.0, 40.0, 49.0, 40.0, 36.0, 32.0, 28.0, 27.0, 26.0, 26.0, 23.0, 14.0, 23.0, 18.0, 12.0, 18.0, 13.0, 15.0, 11.0, 7.0, 6.0, 3.0, 3.0, 4.0, 0.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-35.503841400146484, -34.36326217651367, -33.22268295288086, -32.08210372924805, -30.941526412963867, -29.800947189331055, -28.660369873046875, -27.519790649414062, -26.37921142578125, -25.238632202148438, -24.098052978515625, -22.957475662231445, -21.816896438598633, -20.67631721496582, -19.53573989868164, -18.395160675048828, -17.254581451416016, -16.114002227783203, -14.973423957824707, -13.832845687866211, -12.692266464233398, -11.551687240600586, -10.41110897064209, -9.270530700683594, -8.129951477050781, -6.989372730255127, -5.848793983459473, -4.708215236663818, -3.567636489868164, -2.4270577430725098, -1.2864789962768555, -0.14590024948120117, 0.9946784973144531, 2.1352572441101074, 3.2758359909057617, 4.416414737701416, 5.55699348449707, 6.697572231292725, 7.838150978088379, 8.978729248046875, 10.119308471679688, 11.2598876953125, 12.400465965270996, 13.541044235229492, 14.681623458862305, 15.822202682495117, 16.962779998779297, 18.10335922241211, 19.243938446044922, 20.384517669677734, 21.525096893310547, 22.665674209594727, 23.80625343322754, 24.94683265686035, 26.08740997314453, 27.227989196777344, 28.368568420410156, 29.50914764404297, 30.64972686767578, 31.79030418395996, 32.930885314941406, 34.07146072387695, 35.212039947509766, 36.35261917114258, 37.49319839477539]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 6.0, 3.0, 5.0, 5.0, 6.0, 5.0, 14.0, 11.0, 13.0, 9.0, 17.0, 25.0, 22.0, 30.0, 32.0, 25.0, 46.0, 27.0, 37.0, 43.0, 54.0, 55.0, 29.0, 41.0, 48.0, 44.0, 38.0, 42.0, 33.0, 31.0, 35.0, 18.0, 32.0, 20.0, 16.0, 21.0, 18.0, 11.0, 11.0, 10.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.556190490722656, -59.65354537963867, -57.75090408325195, -55.84825897216797, -53.945613861083984, -52.04296875, -50.14032745361328, -48.2376823425293, -46.33503723144531, -44.43239212036133, -42.52975082397461, -40.627105712890625, -38.72446060180664, -36.821815490722656, -34.91917419433594, -33.01652908325195, -31.113887786865234, -29.211244583129883, -27.3085994720459, -25.405956268310547, -23.503311157226562, -21.60066795349121, -19.69802474975586, -17.795379638671875, -15.892736434936523, -13.990092277526855, -12.087448120117188, -10.184804916381836, -8.282160758972168, -6.3795166015625, -4.476873397827148, -2.5742292404174805, -0.6715850830078125, 1.2310588359832764, 3.1337027549743652, 5.036346435546875, 6.938990592956543, 8.841634750366211, 10.744277954101562, 12.64692211151123, 14.549566268920898, 16.45220947265625, 18.354854583740234, 20.257497787475586, 22.160140991210938, 24.062786102294922, 25.965429306030273, 27.868072509765625, 29.77071762084961, 31.67336082458496, 33.57600402832031, 35.4786491394043, 37.38129425048828, 39.283935546875, 41.186580657958984, 43.08922576904297, 44.99186706542969, 46.89451217651367, 48.79715347290039, 50.699798583984375, 52.60244369506836, 54.505088806152344, 56.40773010253906, 58.31037521362305, 60.21302032470703]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 5.0, 9.0, 8.0, 12.0, 15.0, 27.0, 39.0, 52.0, 81.0, 111.0, 143.0, 201.0, 287.0, 384.0, 534.0, 821.0, 1174.0, 1707.0, 2439.0, 3684.0, 5461.0, 8126.0, 12887.0, 21237.0, 35645.0, 64447.0, 119048.0, 213262.0, 235969.0, 138304.0, 74372.0, 41264.0, 24195.0, 14787.0, 9152.0, 5950.0, 3923.0, 2638.0, 1915.0, 1274.0, 873.0, 614.0, 426.0, 305.0, 244.0, 139.0, 94.0, 80.0, 58.0, 46.0, 31.0, 18.0, 17.0, 13.0, 8.0, 6.0, 2.0, 1.0, 2.0, 3.0], "bins": [-3.818359375, -3.699493408203125, -3.58062744140625, -3.461761474609375, -3.3428955078125, -3.224029541015625, -3.10516357421875, -2.986297607421875, -2.867431640625, -2.748565673828125, -2.62969970703125, -2.510833740234375, -2.3919677734375, -2.273101806640625, -2.15423583984375, -2.035369873046875, -1.91650390625, -1.797637939453125, -1.67877197265625, -1.559906005859375, -1.4410400390625, -1.322174072265625, -1.20330810546875, -1.084442138671875, -0.965576171875, -0.846710205078125, -0.72784423828125, -0.608978271484375, -0.4901123046875, -0.371246337890625, -0.25238037109375, -0.133514404296875, -0.0146484375, 0.104217529296875, 0.22308349609375, 0.341949462890625, 0.4608154296875, 0.579681396484375, 0.69854736328125, 0.817413330078125, 0.936279296875, 1.055145263671875, 1.17401123046875, 1.292877197265625, 1.4117431640625, 1.530609130859375, 1.64947509765625, 1.768341064453125, 1.88720703125, 2.006072998046875, 2.12493896484375, 2.243804931640625, 2.3626708984375, 2.481536865234375, 2.60040283203125, 2.719268798828125, 2.838134765625, 2.957000732421875, 3.07586669921875, 3.194732666015625, 3.3135986328125, 3.432464599609375, 3.55133056640625, 3.670196533203125, 3.7890625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 6.0, 3.0, 5.0, 5.0, 6.0, 5.0, 14.0, 11.0, 13.0, 9.0, 16.0, 27.0, 22.0, 30.0, 31.0, 28.0, 42.0, 28.0, 39.0, 42.0, 54.0, 54.0, 31.0, 42.0, 46.0, 45.0, 39.0, 39.0, 33.0, 34.0, 34.0, 17.0, 32.0, 19.0, 17.0, 21.0, 17.0, 11.0, 13.0, 8.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.90625, -59.99951171875, -58.0927734375, -56.18603515625, -54.279296875, -52.37255859375, -50.4658203125, -48.55908203125, -46.65234375, -44.74560546875, -42.8388671875, -40.93212890625, -39.025390625, -37.11865234375, -35.2119140625, -33.30517578125, -31.3984375, -29.49169921875, -27.5849609375, -25.67822265625, -23.771484375, -21.86474609375, -19.9580078125, -18.05126953125, -16.14453125, -14.23779296875, -12.3310546875, -10.42431640625, -8.517578125, -6.61083984375, -4.7041015625, -2.79736328125, -0.890625, 1.01611328125, 2.9228515625, 4.82958984375, 6.736328125, 8.64306640625, 10.5498046875, 12.45654296875, 14.36328125, 16.27001953125, 18.1767578125, 20.08349609375, 21.990234375, 23.89697265625, 25.8037109375, 27.71044921875, 29.6171875, 31.52392578125, 33.4306640625, 35.33740234375, 37.244140625, 39.15087890625, 41.0576171875, 42.96435546875, 44.87109375, 46.77783203125, 48.6845703125, 50.59130859375, 52.498046875, 54.40478515625, 56.3115234375, 58.21826171875, 60.125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 5.0, 5.0, 8.0, 10.0, 16.0, 22.0, 27.0, 37.0, 67.0, 107.0, 145.0, 204.0, 325.0, 497.0, 743.0, 1191.0, 1904.0, 3186.0, 5759.0, 10560.0, 19249.0, 37388.0, 77511.0, 179610.0, 352616.0, 190893.0, 81708.0, 39059.0, 20133.0, 10622.0, 5799.0, 3536.0, 2147.0, 1243.0, 760.0, 521.0, 307.0, 215.0, 139.0, 88.0, 65.0, 46.0, 30.0, 15.0, 20.0, 14.0, 6.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.96484375, -5.76947021484375, -5.5740966796875, -5.37872314453125, -5.183349609375, -4.98797607421875, -4.7926025390625, -4.59722900390625, -4.40185546875, -4.20648193359375, -4.0111083984375, -3.81573486328125, -3.620361328125, -3.42498779296875, -3.2296142578125, -3.03424072265625, -2.8388671875, -2.64349365234375, -2.4481201171875, -2.25274658203125, -2.057373046875, -1.86199951171875, -1.6666259765625, -1.47125244140625, -1.27587890625, -1.08050537109375, -0.8851318359375, -0.68975830078125, -0.494384765625, -0.29901123046875, -0.1036376953125, 0.09173583984375, 0.287109375, 0.48248291015625, 0.6778564453125, 0.87322998046875, 1.068603515625, 1.26397705078125, 1.4593505859375, 1.65472412109375, 1.85009765625, 2.04547119140625, 2.2408447265625, 2.43621826171875, 2.631591796875, 2.82696533203125, 3.0223388671875, 3.21771240234375, 3.4130859375, 3.60845947265625, 3.8038330078125, 3.99920654296875, 4.194580078125, 4.38995361328125, 4.5853271484375, 4.78070068359375, 4.97607421875, 5.17144775390625, 5.3668212890625, 5.56219482421875, 5.757568359375, 5.95294189453125, 6.1483154296875, 6.34368896484375, 6.5390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 6.0, 2.0, 2.0, 5.0, 10.0, 12.0, 12.0, 11.0, 21.0, 16.0, 13.0, 27.0, 19.0, 27.0, 22.0, 29.0, 33.0, 29.0, 38.0, 34.0, 41.0, 32.0, 41.0, 27.0, 35.0, 44.0, 41.0, 34.0, 37.0, 22.0, 35.0, 37.0, 35.0, 34.0, 24.0, 14.0, 11.0, 19.0, 9.0, 19.0, 8.0, 8.0, 8.0, 10.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-35.375, -34.271484375, -33.16796875, -32.064453125, -30.9609375, -29.857421875, -28.75390625, -27.650390625, -26.546875, -25.443359375, -24.33984375, -23.236328125, -22.1328125, -21.029296875, -19.92578125, -18.822265625, -17.71875, -16.615234375, -15.51171875, -14.408203125, -13.3046875, -12.201171875, -11.09765625, -9.994140625, -8.890625, -7.787109375, -6.68359375, -5.580078125, -4.4765625, -3.373046875, -2.26953125, -1.166015625, -0.0625, 1.041015625, 2.14453125, 3.248046875, 4.3515625, 5.455078125, 6.55859375, 7.662109375, 8.765625, 9.869140625, 10.97265625, 12.076171875, 13.1796875, 14.283203125, 15.38671875, 16.490234375, 17.59375, 18.697265625, 19.80078125, 20.904296875, 22.0078125, 23.111328125, 24.21484375, 25.318359375, 26.421875, 27.525390625, 28.62890625, 29.732421875, 30.8359375, 31.939453125, 33.04296875, 34.146484375, 35.25]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 5.0, 3.0, 12.0, 18.0, 19.0, 27.0, 33.0, 67.0, 76.0, 137.0, 141.0, 276.0, 429.0, 661.0, 1116.0, 1927.0, 3552.0, 7085.0, 15468.0, 37929.0, 112005.0, 396584.0, 322954.0, 89420.0, 31655.0, 13237.0, 6183.0, 3095.0, 1708.0, 999.0, 582.0, 408.0, 229.0, 148.0, 101.0, 80.0, 47.0, 43.0, 21.0, 27.0, 14.0, 8.0, 9.0, 3.0, 3.0, 9.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38525390625, -0.3723716735839844, -0.35948944091796875, -0.3466072082519531, -0.3337249755859375, -0.3208427429199219, -0.30796051025390625, -0.2950782775878906, -0.282196044921875, -0.2693138122558594, -0.25643157958984375, -0.24354934692382812, -0.2306671142578125, -0.21778488159179688, -0.20490264892578125, -0.19202041625976562, -0.17913818359375, -0.16625595092773438, -0.15337371826171875, -0.14049148559570312, -0.1276092529296875, -0.11472702026367188, -0.10184478759765625, -0.08896255493164062, -0.076080322265625, -0.06319808959960938, -0.05031585693359375, -0.037433624267578125, -0.0245513916015625, -0.011669158935546875, 0.00121307373046875, 0.014095306396484375, 0.0269775390625, 0.039859771728515625, 0.05274200439453125, 0.06562423706054688, 0.0785064697265625, 0.09138870239257812, 0.10427093505859375, 0.11715316772460938, 0.130035400390625, 0.14291763305664062, 0.15579986572265625, 0.16868209838867188, 0.1815643310546875, 0.19444656372070312, 0.20732879638671875, 0.22021102905273438, 0.23309326171875, 0.24597549438476562, 0.25885772705078125, 0.2717399597167969, 0.2846221923828125, 0.2975044250488281, 0.31038665771484375, 0.3232688903808594, 0.336151123046875, 0.3490333557128906, 0.36191558837890625, 0.3747978210449219, 0.3876800537109375, 0.4005622863769531, 0.41344451904296875, 0.4263267517089844, 0.439208984375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 5.0, 1.0, 5.0, 13.0, 9.0, 10.0, 21.0, 17.0, 17.0, 28.0, 40.0, 32.0, 46.0, 47.0, 67.0, 56.0, 66.0, 47.0, 55.0, 66.0, 54.0, 43.0, 41.0, 45.0, 34.0, 24.0, 22.0, 17.0, 10.0, 9.0, 18.0, 10.0, 7.0, 8.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.427267074584961e-05, -3.321748226881027e-05, -3.2162293791770935e-05, -3.11071053147316e-05, -3.005191683769226e-05, -2.8996728360652924e-05, -2.7941539883613586e-05, -2.688635140657425e-05, -2.5831162929534912e-05, -2.4775974452495575e-05, -2.3720785975456238e-05, -2.26655974984169e-05, -2.1610409021377563e-05, -2.0555220544338226e-05, -1.950003206729889e-05, -1.8444843590259552e-05, -1.7389655113220215e-05, -1.6334466636180878e-05, -1.527927815914154e-05, -1.4224089682102203e-05, -1.3168901205062866e-05, -1.2113712728023529e-05, -1.1058524250984192e-05, -1.0003335773944855e-05, -8.948147296905518e-06, -7.89295881986618e-06, -6.837770342826843e-06, -5.782581865787506e-06, -4.727393388748169e-06, -3.6722049117088318e-06, -2.6170164346694946e-06, -1.5618279576301575e-06, -5.066394805908203e-07, 5.485489964485168e-07, 1.603737473487854e-06, 2.658925950527191e-06, 3.7141144275665283e-06, 4.7693029046058655e-06, 5.824491381645203e-06, 6.87967985868454e-06, 7.934868335723877e-06, 8.990056812763214e-06, 1.0045245289802551e-05, 1.1100433766841888e-05, 1.2155622243881226e-05, 1.3210810720920563e-05, 1.42659991979599e-05, 1.5321187674999237e-05, 1.6376376152038574e-05, 1.743156462907791e-05, 1.848675310611725e-05, 1.9541941583156586e-05, 2.0597130060195923e-05, 2.165231853723526e-05, 2.2707507014274597e-05, 2.3762695491313934e-05, 2.481788396835327e-05, 2.587307244539261e-05, 2.6928260922431946e-05, 2.7983449399471283e-05, 2.903863787651062e-05, 3.0093826353549957e-05, 3.1149014830589294e-05, 3.220420330762863e-05, 3.325939178466797e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 14.0, 18.0, 21.0, 39.0, 43.0, 63.0, 90.0, 136.0, 185.0, 295.0, 465.0, 651.0, 1007.0, 1456.0, 2172.0, 3401.0, 5276.0, 8265.0, 13418.0, 22218.0, 38148.0, 69455.0, 134920.0, 267274.0, 225963.0, 110995.0, 58365.0, 32540.0, 19298.0, 11601.0, 7168.0, 4573.0, 3036.0, 1991.0, 1288.0, 873.0, 573.0, 382.0, 284.0, 194.0, 118.0, 93.0, 73.0, 34.0, 25.0, 21.0, 13.0, 5.0, 10.0, 5.0, 3.0, 5.0], "bins": [-0.484375, -0.4708671569824219, -0.45735931396484375, -0.4438514709472656, -0.4303436279296875, -0.4168357849121094, -0.40332794189453125, -0.3898200988769531, -0.376312255859375, -0.3628044128417969, -0.34929656982421875, -0.3357887268066406, -0.3222808837890625, -0.3087730407714844, -0.29526519775390625, -0.2817573547363281, -0.26824951171875, -0.2547416687011719, -0.24123382568359375, -0.22772598266601562, -0.2142181396484375, -0.20071029663085938, -0.18720245361328125, -0.17369461059570312, -0.160186767578125, -0.14667892456054688, -0.13317108154296875, -0.11966323852539062, -0.1061553955078125, -0.09264755249023438, -0.07913970947265625, -0.06563186645507812, -0.0521240234375, -0.038616180419921875, -0.02510833740234375, -0.011600494384765625, 0.0019073486328125, 0.015415191650390625, 0.02892303466796875, 0.042430877685546875, 0.055938720703125, 0.06944656372070312, 0.08295440673828125, 0.09646224975585938, 0.1099700927734375, 0.12347793579101562, 0.13698577880859375, 0.15049362182617188, 0.16400146484375, 0.17750930786132812, 0.19101715087890625, 0.20452499389648438, 0.2180328369140625, 0.23154067993164062, 0.24504852294921875, 0.2585563659667969, 0.272064208984375, 0.2855720520019531, 0.29907989501953125, 0.3125877380371094, 0.3260955810546875, 0.3396034240722656, 0.35311126708984375, 0.3666191101074219, 0.380126953125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 7.0, 4.0, 7.0, 12.0, 18.0, 15.0, 21.0, 32.0, 41.0, 39.0, 49.0, 50.0, 55.0, 57.0, 55.0, 71.0, 62.0, 61.0, 64.0, 59.0, 43.0, 44.0, 25.0, 26.0, 16.0, 10.0, 13.0, 10.0, 10.0, 7.0, 2.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53125, -0.5142593383789062, -0.4972686767578125, -0.48027801513671875, -0.463287353515625, -0.44629669189453125, -0.4293060302734375, -0.41231536865234375, -0.39532470703125, -0.37833404541015625, -0.3613433837890625, -0.34435272216796875, -0.327362060546875, -0.31037139892578125, -0.2933807373046875, -0.27639007568359375, -0.2593994140625, -0.24240875244140625, -0.2254180908203125, -0.20842742919921875, -0.191436767578125, -0.17444610595703125, -0.1574554443359375, -0.14046478271484375, -0.12347412109375, -0.10648345947265625, -0.0894927978515625, -0.07250213623046875, -0.055511474609375, -0.03852081298828125, -0.0215301513671875, -0.00453948974609375, 0.012451171875, 0.02944183349609375, 0.0464324951171875, 0.06342315673828125, 0.080413818359375, 0.09740447998046875, 0.1143951416015625, 0.13138580322265625, 0.14837646484375, 0.16536712646484375, 0.1823577880859375, 0.19934844970703125, 0.216339111328125, 0.23332977294921875, 0.2503204345703125, 0.26731109619140625, 0.2843017578125, 0.30129241943359375, 0.3182830810546875, 0.33527374267578125, 0.352264404296875, 0.36925506591796875, 0.3862457275390625, 0.40323638916015625, 0.42022705078125, 0.43721771240234375, 0.4542083740234375, 0.47119903564453125, 0.488189697265625, 0.5051803588867188, 0.5221710205078125, 0.5391616821289062, 0.55615234375]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 7.0, 2.0, 3.0, 12.0, 11.0, 12.0, 9.0, 15.0, 16.0, 27.0, 28.0, 34.0, 36.0, 41.0, 30.0, 51.0, 44.0, 39.0, 47.0, 47.0, 43.0, 44.0, 41.0, 37.0, 32.0, 29.0, 28.0, 26.0, 27.0, 26.0, 15.0, 20.0, 18.0, 15.0, 15.0, 15.0, 16.0, 8.0, 7.0, 6.0, 3.0, 4.0, 2.0, 0.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-36.02802658081055, -34.8749885559082, -33.72195053100586, -32.56890869140625, -31.415870666503906, -30.262832641601562, -29.10979461669922, -27.956754684448242, -26.803714752197266, -25.650676727294922, -24.497636795043945, -23.3445987701416, -22.191558837890625, -21.03852081298828, -19.885482788085938, -18.73244285583496, -17.579404830932617, -16.426366806030273, -15.273326873779297, -14.120288848876953, -12.967248916625977, -11.814210891723633, -10.661171913146973, -9.508132934570312, -8.355093955993652, -7.202054977416992, -6.049015998840332, -4.89597749710083, -3.74293851852417, -2.5898995399475098, -1.4368610382080078, -0.28382205963134766, 0.8692169189453125, 2.0222558975219727, 3.1752946376800537, 4.328333377838135, 5.481372356414795, 6.634411334991455, 7.787449836730957, 8.940488815307617, 10.093527793884277, 11.246566772460938, 12.399605751037598, 13.552644729614258, 14.705682754516602, 15.858722686767578, 17.011760711669922, 18.164798736572266, 19.317838668823242, 20.470876693725586, 21.623916625976562, 22.776954650878906, 23.929994583129883, 25.083032608032227, 26.236072540283203, 27.389110565185547, 28.54214859008789, 29.695186614990234, 30.84822654724121, 32.00126647949219, 33.15430450439453, 34.307342529296875, 35.46038055419922, 36.61341857910156, 37.76646041870117]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 6.0, 3.0, 5.0, 6.0, 5.0, 5.0, 14.0, 11.0, 14.0, 8.0, 16.0, 25.0, 24.0, 29.0, 31.0, 26.0, 45.0, 26.0, 39.0, 41.0, 56.0, 53.0, 31.0, 40.0, 48.0, 46.0, 38.0, 40.0, 33.0, 33.0, 34.0, 18.0, 31.0, 21.0, 15.0, 22.0, 17.0, 12.0, 10.0, 10.0, 8.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.99052429199219, -60.08445739746094, -58.17838668823242, -56.27231979370117, -54.366249084472656, -52.460182189941406, -50.55411148071289, -48.64804458618164, -46.741973876953125, -44.835906982421875, -42.92983627319336, -41.02376937866211, -39.117698669433594, -37.211631774902344, -35.30556106567383, -33.39949417114258, -31.493425369262695, -29.587356567382812, -27.68128776550293, -25.775218963623047, -23.869150161743164, -21.96308135986328, -20.05701446533203, -18.150943756103516, -16.244876861572266, -14.338808059692383, -12.4327392578125, -10.526670455932617, -8.620601654052734, -6.714533805847168, -4.808465003967285, -2.9023962020874023, -0.9963264465332031, 0.9097422361373901, 2.8158109188079834, 4.721879482269287, 6.62794828414917, 8.534016609191895, 10.440085411071777, 12.34615421295166, 14.252223014831543, 16.15829086303711, 18.064359664916992, 19.970428466796875, 21.876497268676758, 23.78256607055664, 25.688634872436523, 27.594703674316406, 29.50077247619629, 31.406841278076172, 33.31290817260742, 35.21897888183594, 37.12504577636719, 39.0311164855957, 40.93718338012695, 42.84325408935547, 44.74932098388672, 46.65538787841797, 48.561458587646484, 50.467525482177734, 52.37359619140625, 54.2796630859375, 56.185733795166016, 58.091800689697266, 59.99787139892578]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 8.0, 10.0, 12.0, 14.0, 13.0, 20.0, 47.0, 75.0, 96.0, 172.0, 235.0, 390.0, 587.0, 973.0, 1595.0, 2602.0, 4018.0, 6379.0, 9947.0, 15103.0, 22211.0, 32325.0, 45145.0, 59995.0, 75487.0, 89059.0, 99434.0, 103818.0, 100447.0, 91411.0, 77780.0, 61523.0, 46389.0, 33496.0, 23202.0, 15902.0, 10333.0, 6646.0, 4388.0, 2614.0, 1650.0, 1128.0, 651.0, 445.0, 283.0, 170.0, 124.0, 77.0, 43.0, 32.0, 28.0, 12.0, 15.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-18.671875, -18.098388671875, -17.52490234375, -16.951416015625, -16.3779296875, -15.804443359375, -15.23095703125, -14.657470703125, -14.083984375, -13.510498046875, -12.93701171875, -12.363525390625, -11.7900390625, -11.216552734375, -10.64306640625, -10.069580078125, -9.49609375, -8.922607421875, -8.34912109375, -7.775634765625, -7.2021484375, -6.628662109375, -6.05517578125, -5.481689453125, -4.908203125, -4.334716796875, -3.76123046875, -3.187744140625, -2.6142578125, -2.040771484375, -1.46728515625, -0.893798828125, -0.3203125, 0.253173828125, 0.82666015625, 1.400146484375, 1.9736328125, 2.547119140625, 3.12060546875, 3.694091796875, 4.267578125, 4.841064453125, 5.41455078125, 5.988037109375, 6.5615234375, 7.135009765625, 7.70849609375, 8.281982421875, 8.85546875, 9.428955078125, 10.00244140625, 10.575927734375, 11.1494140625, 11.722900390625, 12.29638671875, 12.869873046875, 13.443359375, 14.016845703125, 14.59033203125, 15.163818359375, 15.7373046875, 16.310791015625, 16.88427734375, 17.457763671875, 18.03125]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 0.0, 5.0, 7.0, 6.0, 6.0, 11.0, 13.0, 15.0, 6.0, 19.0, 24.0, 22.0, 30.0, 31.0, 28.0, 41.0, 30.0, 40.0, 43.0, 53.0, 52.0, 34.0, 38.0, 48.0, 48.0, 38.0, 39.0, 35.0, 32.0, 32.0, 18.0, 33.0, 18.0, 17.0, 21.0, 18.0, 9.0, 12.0, 10.0, 9.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.625, -59.72705078125, -57.8291015625, -55.93115234375, -54.033203125, -52.13525390625, -50.2373046875, -48.33935546875, -46.44140625, -44.54345703125, -42.6455078125, -40.74755859375, -38.849609375, -36.95166015625, -35.0537109375, -33.15576171875, -31.2578125, -29.35986328125, -27.4619140625, -25.56396484375, -23.666015625, -21.76806640625, -19.8701171875, -17.97216796875, -16.07421875, -14.17626953125, -12.2783203125, -10.38037109375, -8.482421875, -6.58447265625, -4.6865234375, -2.78857421875, -0.890625, 1.00732421875, 2.9052734375, 4.80322265625, 6.701171875, 8.59912109375, 10.4970703125, 12.39501953125, 14.29296875, 16.19091796875, 18.0888671875, 19.98681640625, 21.884765625, 23.78271484375, 25.6806640625, 27.57861328125, 29.4765625, 31.37451171875, 33.2724609375, 35.17041015625, 37.068359375, 38.96630859375, 40.8642578125, 42.76220703125, 44.66015625, 46.55810546875, 48.4560546875, 50.35400390625, 52.251953125, 54.14990234375, 56.0478515625, 57.94580078125, 59.84375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 9.0, 15.0, 37.0, 38.0, 60.0, 96.0, 140.0, 241.0, 384.0, 580.0, 933.0, 1587.0, 2669.0, 4469.0, 7030.0, 11919.0, 19062.0, 29616.0, 45208.0, 64580.0, 86477.0, 107017.0, 119744.0, 121624.0, 112608.0, 94166.0, 72375.0, 52017.0, 34476.0, 22634.0, 14536.0, 8783.0, 5276.0, 3063.0, 1937.0, 1184.0, 778.0, 435.0, 256.0, 174.0, 124.0, 63.0, 55.0, 26.0, 12.0, 11.0, 9.0, 5.0, 3.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0], "bins": [-22.984375, -22.270263671875, -21.55615234375, -20.842041015625, -20.1279296875, -19.413818359375, -18.69970703125, -17.985595703125, -17.271484375, -16.557373046875, -15.84326171875, -15.129150390625, -14.4150390625, -13.700927734375, -12.98681640625, -12.272705078125, -11.55859375, -10.844482421875, -10.13037109375, -9.416259765625, -8.7021484375, -7.988037109375, -7.27392578125, -6.559814453125, -5.845703125, -5.131591796875, -4.41748046875, -3.703369140625, -2.9892578125, -2.275146484375, -1.56103515625, -0.846923828125, -0.1328125, 0.581298828125, 1.29541015625, 2.009521484375, 2.7236328125, 3.437744140625, 4.15185546875, 4.865966796875, 5.580078125, 6.294189453125, 7.00830078125, 7.722412109375, 8.4365234375, 9.150634765625, 9.86474609375, 10.578857421875, 11.29296875, 12.007080078125, 12.72119140625, 13.435302734375, 14.1494140625, 14.863525390625, 15.57763671875, 16.291748046875, 17.005859375, 17.719970703125, 18.43408203125, 19.148193359375, 19.8623046875, 20.576416015625, 21.29052734375, 22.004638671875, 22.71875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 7.0, 3.0, 8.0, 6.0, 12.0, 16.0, 12.0, 14.0, 21.0, 27.0, 39.0, 41.0, 45.0, 54.0, 41.0, 51.0, 53.0, 47.0, 61.0, 64.0, 49.0, 50.0, 43.0, 48.0, 35.0, 27.0, 32.0, 31.0, 12.0, 15.0, 10.0, 15.0, 9.0, 7.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.5625, -44.0859375, -42.609375, -41.1328125, -39.65625, -38.1796875, -36.703125, -35.2265625, -33.75, -32.2734375, -30.796875, -29.3203125, -27.84375, -26.3671875, -24.890625, -23.4140625, -21.9375, -20.4609375, -18.984375, -17.5078125, -16.03125, -14.5546875, -13.078125, -11.6015625, -10.125, -8.6484375, -7.171875, -5.6953125, -4.21875, -2.7421875, -1.265625, 0.2109375, 1.6875, 3.1640625, 4.640625, 6.1171875, 7.59375, 9.0703125, 10.546875, 12.0234375, 13.5, 14.9765625, 16.453125, 17.9296875, 19.40625, 20.8828125, 22.359375, 23.8359375, 25.3125, 26.7890625, 28.265625, 29.7421875, 31.21875, 32.6953125, 34.171875, 35.6484375, 37.125, 38.6015625, 40.078125, 41.5546875, 43.03125, 44.5078125, 45.984375, 47.4609375, 48.9375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 6.0, 5.0, 9.0, 13.0, 18.0, 22.0, 44.0, 55.0, 89.0, 190.0, 257.0, 406.0, 652.0, 1104.0, 1899.0, 2812.0, 4511.0, 7133.0, 10962.0, 17014.0, 25603.0, 36723.0, 50765.0, 66082.0, 82140.0, 95107.0, 103630.0, 103970.0, 98903.0, 87175.0, 71647.0, 55555.0, 40845.0, 28772.0, 19192.0, 12821.0, 8382.0, 5284.0, 3307.0, 2105.0, 1251.0, 787.0, 490.0, 334.0, 175.0, 117.0, 76.0, 44.0, 36.0, 21.0, 14.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.3203125, -6.11749267578125, -5.9146728515625, -5.71185302734375, -5.509033203125, -5.30621337890625, -5.1033935546875, -4.90057373046875, -4.69775390625, -4.49493408203125, -4.2921142578125, -4.08929443359375, -3.886474609375, -3.68365478515625, -3.4808349609375, -3.27801513671875, -3.0751953125, -2.87237548828125, -2.6695556640625, -2.46673583984375, -2.263916015625, -2.06109619140625, -1.8582763671875, -1.65545654296875, -1.45263671875, -1.24981689453125, -1.0469970703125, -0.84417724609375, -0.641357421875, -0.43853759765625, -0.2357177734375, -0.03289794921875, 0.169921875, 0.37274169921875, 0.5755615234375, 0.77838134765625, 0.981201171875, 1.18402099609375, 1.3868408203125, 1.58966064453125, 1.79248046875, 1.99530029296875, 2.1981201171875, 2.40093994140625, 2.603759765625, 2.80657958984375, 3.0093994140625, 3.21221923828125, 3.4150390625, 3.61785888671875, 3.8206787109375, 4.02349853515625, 4.226318359375, 4.42913818359375, 4.6319580078125, 4.83477783203125, 5.03759765625, 5.24041748046875, 5.4432373046875, 5.64605712890625, 5.848876953125, 6.05169677734375, 6.2545166015625, 6.45733642578125, 6.66015625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 4.0, 12.0, 9.0, 13.0, 15.0, 16.0, 34.0, 20.0, 31.0, 31.0, 33.0, 39.0, 39.0, 51.0, 30.0, 55.0, 42.0, 52.0, 45.0, 39.0, 41.0, 37.0, 43.0, 54.0, 34.0, 38.0, 29.0, 21.0, 12.0, 12.0, 11.0, 15.0, 9.0, 6.0, 8.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007510185241699219, -0.0007246807217597961, -0.0006983429193496704, -0.0006720051169395447, -0.0006456673145294189, -0.0006193295121192932, -0.0005929917097091675, -0.0005666539072990417, -0.000540316104888916, -0.0005139783024787903, -0.00048764050006866455, -0.0004613026976585388, -0.0004349648952484131, -0.00040862709283828735, -0.0003822892904281616, -0.0003559514880180359, -0.00032961368560791016, -0.0003032758831977844, -0.0002769380807876587, -0.00025060027837753296, -0.00022426247596740723, -0.0001979246735572815, -0.00017158687114715576, -0.00014524906873703003, -0.0001189112663269043, -9.257346391677856e-05, -6.623566150665283e-05, -3.98978590965271e-05, -1.3560056686401367e-05, 1.2777745723724365e-05, 3.91155481338501e-05, 6.545335054397583e-05, 9.179115295410156e-05, 0.0001181289553642273, 0.00014446675777435303, 0.00017080456018447876, 0.0001971423625946045, 0.00022348016500473022, 0.00024981796741485596, 0.0002761557698249817, 0.0003024935722351074, 0.00032883137464523315, 0.0003551691770553589, 0.0003815069794654846, 0.00040784478187561035, 0.0004341825842857361, 0.0004605203866958618, 0.00048685818910598755, 0.0005131959915161133, 0.000539533793926239, 0.0005658715963363647, 0.0005922093987464905, 0.0006185472011566162, 0.0006448850035667419, 0.0006712228059768677, 0.0006975606083869934, 0.0007238984107971191, 0.0007502362132072449, 0.0007765740156173706, 0.0008029118180274963, 0.0008292496204376221, 0.0008555874228477478, 0.0008819252252578735, 0.0009082630276679993, 0.000934600830078125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 9.0, 11.0, 26.0, 35.0, 47.0, 80.0, 118.0, 207.0, 354.0, 568.0, 850.0, 1489.0, 2533.0, 4441.0, 7637.0, 12973.0, 21770.0, 34642.0, 53155.0, 75006.0, 99912.0, 119772.0, 129310.0, 124437.0, 108202.0, 84659.0, 61119.0, 41145.0, 25887.0, 15677.0, 9356.0, 5330.0, 3155.0, 1847.0, 1108.0, 645.0, 395.0, 213.0, 164.0, 100.0, 66.0, 33.0, 16.0, 24.0, 10.0, 7.0, 5.0, 6.0, 5.0, 1.0, 0.0, 2.0], "bins": [-9.0234375, -8.7633056640625, -8.503173828125, -8.2430419921875, -7.98291015625, -7.7227783203125, -7.462646484375, -7.2025146484375, -6.9423828125, -6.6822509765625, -6.422119140625, -6.1619873046875, -5.90185546875, -5.6417236328125, -5.381591796875, -5.1214599609375, -4.861328125, -4.6011962890625, -4.341064453125, -4.0809326171875, -3.82080078125, -3.5606689453125, -3.300537109375, -3.0404052734375, -2.7802734375, -2.5201416015625, -2.260009765625, -1.9998779296875, -1.73974609375, -1.4796142578125, -1.219482421875, -0.9593505859375, -0.69921875, -0.4390869140625, -0.178955078125, 0.0811767578125, 0.34130859375, 0.6014404296875, 0.861572265625, 1.1217041015625, 1.3818359375, 1.6419677734375, 1.902099609375, 2.1622314453125, 2.42236328125, 2.6824951171875, 2.942626953125, 3.2027587890625, 3.462890625, 3.7230224609375, 3.983154296875, 4.2432861328125, 4.50341796875, 4.7635498046875, 5.023681640625, 5.2838134765625, 5.5439453125, 5.8040771484375, 6.064208984375, 6.3243408203125, 6.58447265625, 6.8446044921875, 7.104736328125, 7.3648681640625, 7.625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 4.0, 5.0, 9.0, 11.0, 15.0, 23.0, 29.0, 26.0, 33.0, 42.0, 53.0, 70.0, 72.0, 64.0, 67.0, 65.0, 65.0, 71.0, 57.0, 38.0, 46.0, 32.0, 31.0, 9.0, 19.0, 11.0, 8.0, 8.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.41015625, -7.19537353515625, -6.9805908203125, -6.76580810546875, -6.551025390625, -6.33624267578125, -6.1214599609375, -5.90667724609375, -5.69189453125, -5.47711181640625, -5.2623291015625, -5.04754638671875, -4.832763671875, -4.61798095703125, -4.4031982421875, -4.18841552734375, -3.9736328125, -3.75885009765625, -3.5440673828125, -3.32928466796875, -3.114501953125, -2.89971923828125, -2.6849365234375, -2.47015380859375, -2.25537109375, -2.04058837890625, -1.8258056640625, -1.61102294921875, -1.396240234375, -1.18145751953125, -0.9666748046875, -0.75189208984375, -0.537109375, -0.32232666015625, -0.1075439453125, 0.10723876953125, 0.322021484375, 0.53680419921875, 0.7515869140625, 0.96636962890625, 1.18115234375, 1.39593505859375, 1.6107177734375, 1.82550048828125, 2.040283203125, 2.25506591796875, 2.4698486328125, 2.68463134765625, 2.8994140625, 3.11419677734375, 3.3289794921875, 3.54376220703125, 3.758544921875, 3.97332763671875, 4.1881103515625, 4.40289306640625, 4.61767578125, 4.83245849609375, 5.0472412109375, 5.26202392578125, 5.476806640625, 5.69158935546875, 5.9063720703125, 6.12115478515625, 6.3359375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 1.0, 4.0, 5.0, 5.0, 10.0, 11.0, 16.0, 21.0, 15.0, 23.0, 32.0, 24.0, 37.0, 40.0, 41.0, 43.0, 41.0, 58.0, 47.0, 46.0, 38.0, 34.0, 46.0, 45.0, 38.0, 33.0, 37.0, 21.0, 29.0, 19.0, 14.0, 24.0, 18.0, 10.0, 15.0, 6.0, 11.0, 11.0, 8.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.89731979370117, -34.66121292114258, -33.42510223388672, -32.188995361328125, -30.9528865814209, -29.716777801513672, -28.480670928955078, -27.24456214904785, -26.008453369140625, -24.7723445892334, -23.536235809326172, -22.300128936767578, -21.06402015686035, -19.827911376953125, -18.59180450439453, -17.355695724487305, -16.119586944580078, -14.883478164672852, -13.647370338439941, -12.411262512207031, -11.175153732299805, -9.939044952392578, -8.702937126159668, -7.466829299926758, -6.230720520019531, -4.994612216949463, -3.7585039138793945, -2.522395610809326, -1.2862873077392578, -0.05017900466918945, 1.185929298400879, 2.422037124633789, 3.65814208984375, 4.894250392913818, 6.130358695983887, 7.366466999053955, 8.602575302124023, 9.83868408203125, 11.07479190826416, 12.31089973449707, 13.547008514404297, 14.783117294311523, 16.01922607421875, 17.255332946777344, 18.49144172668457, 19.727550506591797, 20.96365737915039, 22.199766159057617, 23.435874938964844, 24.67198371887207, 25.908092498779297, 27.14419937133789, 28.380308151245117, 29.616416931152344, 30.852523803710938, 32.08863067626953, 33.32474136352539, 34.560848236083984, 35.796958923339844, 37.03306579589844, 38.26917266845703, 39.50528335571289, 40.741390228271484, 41.977500915527344, 43.21360778808594]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 1.0, 4.0, 4.0, 10.0, 11.0, 7.0, 10.0, 9.0, 19.0, 14.0, 15.0, 34.0, 23.0, 25.0, 23.0, 27.0, 31.0, 39.0, 46.0, 34.0, 41.0, 50.0, 45.0, 49.0, 40.0, 42.0, 34.0, 34.0, 41.0, 37.0, 18.0, 28.0, 21.0, 14.0, 24.0, 20.0, 16.0, 12.0, 12.0, 8.0, 13.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-72.7590103149414, -70.6967544555664, -68.63450622558594, -66.57225036621094, -64.51000213623047, -62.447750091552734, -60.385498046875, -58.3232421875, -56.26099395751953, -54.1987419128418, -52.13648986816406, -50.07423782348633, -48.011985778808594, -45.94973373413086, -43.887481689453125, -41.825225830078125, -39.76297378540039, -37.700721740722656, -35.63846969604492, -33.57621765136719, -31.513965606689453, -29.45171356201172, -27.38945960998535, -25.327207565307617, -23.264955520629883, -21.20270347595215, -19.140451431274414, -17.078197479248047, -15.015946388244629, -12.953694343566895, -10.891441345214844, -8.82918930053711, -6.766941070556641, -4.704689025878906, -2.6424365043640137, -0.5801839828491211, 1.4820680618286133, 3.5443201065063477, 5.606573104858398, 7.668825149536133, 9.731077194213867, 11.793329238891602, 13.855581283569336, 15.917834281921387, 17.980087280273438, 20.042339324951172, 22.104591369628906, 24.16684341430664, 26.229095458984375, 28.29134750366211, 30.353599548339844, 32.41585159301758, 34.47810363769531, 36.54035568237305, 38.60260772705078, 40.66486358642578, 42.72711181640625, 44.789363861083984, 46.85161590576172, 48.91386795043945, 50.97611999511719, 53.03837203979492, 55.100624084472656, 57.162879943847656, 59.22513198852539]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 0.0, 5.0, 14.0, 10.0, 22.0, 31.0, 39.0, 93.0, 121.0, 215.0, 320.0, 459.0, 805.0, 1322.0, 2132.0, 3528.0, 5564.0, 9192.0, 14583.0, 23370.0, 37265.0, 57809.0, 87649.0, 128408.0, 182728.0, 244841.0, 315133.0, 378602.0, 422749.0, 436763.0, 418153.0, 371829.0, 306914.0, 236445.0, 172922.0, 120472.0, 79831.0, 51484.0, 32687.0, 20114.0, 12139.0, 7214.0, 4286.0, 2479.0, 1486.0, 881.0, 503.0, 302.0, 147.0, 102.0, 54.0, 32.0, 18.0, 12.0, 7.0, 6.0, 4.0, 0.0, 0.0, 1.0], "bins": [-36.84375, -35.740234375, -34.63671875, -33.533203125, -32.4296875, -31.326171875, -30.22265625, -29.119140625, -28.015625, -26.912109375, -25.80859375, -24.705078125, -23.6015625, -22.498046875, -21.39453125, -20.291015625, -19.1875, -18.083984375, -16.98046875, -15.876953125, -14.7734375, -13.669921875, -12.56640625, -11.462890625, -10.359375, -9.255859375, -8.15234375, -7.048828125, -5.9453125, -4.841796875, -3.73828125, -2.634765625, -1.53125, -0.427734375, 0.67578125, 1.779296875, 2.8828125, 3.986328125, 5.08984375, 6.193359375, 7.296875, 8.400390625, 9.50390625, 10.607421875, 11.7109375, 12.814453125, 13.91796875, 15.021484375, 16.125, 17.228515625, 18.33203125, 19.435546875, 20.5390625, 21.642578125, 22.74609375, 23.849609375, 24.953125, 26.056640625, 27.16015625, 28.263671875, 29.3671875, 30.470703125, 31.57421875, 32.677734375, 33.78125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 4.0, 0.0, 5.0, 6.0, 8.0, 11.0, 6.0, 13.0, 12.0, 17.0, 14.0, 16.0, 33.0, 28.0, 25.0, 23.0, 25.0, 34.0, 42.0, 45.0, 31.0, 45.0, 52.0, 47.0, 42.0, 44.0, 40.0, 34.0, 37.0, 33.0, 33.0, 24.0, 27.0, 19.0, 15.0, 29.0, 13.0, 13.0, 13.0, 13.0, 7.0, 13.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-68.125, -66.181640625, -64.23828125, -62.294921875, -60.3515625, -58.408203125, -56.46484375, -54.521484375, -52.578125, -50.634765625, -48.69140625, -46.748046875, -44.8046875, -42.861328125, -40.91796875, -38.974609375, -37.03125, -35.087890625, -33.14453125, -31.201171875, -29.2578125, -27.314453125, -25.37109375, -23.427734375, -21.484375, -19.541015625, -17.59765625, -15.654296875, -13.7109375, -11.767578125, -9.82421875, -7.880859375, -5.9375, -3.994140625, -2.05078125, -0.107421875, 1.8359375, 3.779296875, 5.72265625, 7.666015625, 9.609375, 11.552734375, 13.49609375, 15.439453125, 17.3828125, 19.326171875, 21.26953125, 23.212890625, 25.15625, 27.099609375, 29.04296875, 30.986328125, 32.9296875, 34.873046875, 36.81640625, 38.759765625, 40.703125, 42.646484375, 44.58984375, 46.533203125, 48.4765625, 50.419921875, 52.36328125, 54.306640625, 56.25]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 14.0, 9.0, 23.0, 27.0, 58.0, 69.0, 124.0, 193.0, 316.0, 478.0, 802.0, 1206.0, 2058.0, 3242.0, 5010.0, 8104.0, 12766.0, 20031.0, 31149.0, 47042.0, 69977.0, 102235.0, 143620.0, 192747.0, 249864.0, 304986.0, 354689.0, 387015.0, 396239.0, 381426.0, 345905.0, 294796.0, 237992.0, 182610.0, 134413.0, 95518.0, 65240.0, 43443.0, 28680.0, 18375.0, 11949.0, 7534.0, 4655.0, 2881.0, 1804.0, 1078.0, 701.0, 490.0, 281.0, 168.0, 107.0, 57.0, 42.0, 21.0, 12.0, 14.0, 4.0, 2.0, 6.0], "bins": [-34.40625, -33.376220703125, -32.34619140625, -31.316162109375, -30.2861328125, -29.256103515625, -28.22607421875, -27.196044921875, -26.166015625, -25.135986328125, -24.10595703125, -23.075927734375, -22.0458984375, -21.015869140625, -19.98583984375, -18.955810546875, -17.92578125, -16.895751953125, -15.86572265625, -14.835693359375, -13.8056640625, -12.775634765625, -11.74560546875, -10.715576171875, -9.685546875, -8.655517578125, -7.62548828125, -6.595458984375, -5.5654296875, -4.535400390625, -3.50537109375, -2.475341796875, -1.4453125, -0.415283203125, 0.61474609375, 1.644775390625, 2.6748046875, 3.704833984375, 4.73486328125, 5.764892578125, 6.794921875, 7.824951171875, 8.85498046875, 9.885009765625, 10.9150390625, 11.945068359375, 12.97509765625, 14.005126953125, 15.03515625, 16.065185546875, 17.09521484375, 18.125244140625, 19.1552734375, 20.185302734375, 21.21533203125, 22.245361328125, 23.275390625, 24.305419921875, 25.33544921875, 26.365478515625, 27.3955078125, 28.425537109375, 29.45556640625, 30.485595703125, 31.515625]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 4.0, 10.0, 8.0, 9.0, 15.0, 17.0, 17.0, 22.0, 34.0, 47.0, 47.0, 66.0, 67.0, 77.0, 101.0, 109.0, 124.0, 163.0, 152.0, 167.0, 172.0, 184.0, 218.0, 195.0, 238.0, 179.0, 191.0, 162.0, 189.0, 152.0, 131.0, 130.0, 111.0, 99.0, 111.0, 79.0, 54.0, 33.0, 35.0, 41.0, 29.0, 29.0, 20.0, 12.0, 10.0, 11.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-24.171875, -23.365234375, -22.55859375, -21.751953125, -20.9453125, -20.138671875, -19.33203125, -18.525390625, -17.71875, -16.912109375, -16.10546875, -15.298828125, -14.4921875, -13.685546875, -12.87890625, -12.072265625, -11.265625, -10.458984375, -9.65234375, -8.845703125, -8.0390625, -7.232421875, -6.42578125, -5.619140625, -4.8125, -4.005859375, -3.19921875, -2.392578125, -1.5859375, -0.779296875, 0.02734375, 0.833984375, 1.640625, 2.447265625, 3.25390625, 4.060546875, 4.8671875, 5.673828125, 6.48046875, 7.287109375, 8.09375, 8.900390625, 9.70703125, 10.513671875, 11.3203125, 12.126953125, 12.93359375, 13.740234375, 14.546875, 15.353515625, 16.16015625, 16.966796875, 17.7734375, 18.580078125, 19.38671875, 20.193359375, 21.0, 21.806640625, 22.61328125, 23.419921875, 24.2265625, 25.033203125, 25.83984375, 26.646484375, 27.453125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 5.0, 5.0, 4.0, 8.0, 5.0, 17.0, 25.0, 24.0, 38.0, 40.0, 30.0, 56.0, 59.0, 51.0, 52.0, 46.0, 51.0, 60.0, 58.0, 46.0, 32.0, 39.0, 38.0, 36.0, 27.0, 27.0, 20.0, 28.0, 15.0, 9.0, 9.0, 9.0, 5.0, 5.0, 5.0, 6.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.76199722290039, -48.79849624633789, -46.83499526977539, -44.87149429321289, -42.907989501953125, -40.944488525390625, -38.980987548828125, -37.017486572265625, -35.053985595703125, -33.090484619140625, -31.126983642578125, -29.163480758666992, -27.199979782104492, -25.236478805541992, -23.27297592163086, -21.30947494506836, -19.34597396850586, -17.38247299194336, -15.418971061706543, -13.455469131469727, -11.491968154907227, -9.528467178344727, -7.56496524810791, -5.601463317871094, -3.6379623413085938, -1.6744608879089355, 0.28904056549072266, 2.252542018890381, 4.216043472290039, 6.179544448852539, 8.143046379089355, 10.106548309326172, 12.070045471191406, 14.033546447753906, 15.997048377990723, 17.96055030822754, 19.92405128479004, 21.88755226135254, 23.851055145263672, 25.814556121826172, 27.778057098388672, 29.741558074951172, 31.705059051513672, 33.66856002807617, 35.63206481933594, 37.59556579589844, 39.55906677246094, 41.52256774902344, 43.48606872558594, 45.44956970214844, 47.41307067871094, 49.37657165527344, 51.34007263183594, 53.30357360839844, 55.2670783996582, 57.2305793762207, 59.1940803527832, 61.1575813293457, 63.1210823059082, 65.08458709716797, 67.04808807373047, 69.01158905029297, 70.97509002685547, 72.93859100341797, 74.90209197998047]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 0.0, 5.0, 4.0, 6.0, 8.0, 6.0, 5.0, 6.0, 13.0, 20.0, 17.0, 17.0, 30.0, 27.0, 34.0, 35.0, 38.0, 35.0, 34.0, 41.0, 41.0, 47.0, 61.0, 47.0, 43.0, 43.0, 40.0, 35.0, 49.0, 32.0, 36.0, 35.0, 17.0, 22.0, 15.0, 17.0, 15.0, 9.0, 4.0, 6.0, 3.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.90772247314453, -90.9971694946289, -88.08661651611328, -85.17606353759766, -82.26551055908203, -79.3549575805664, -76.44441223144531, -73.53385925292969, -70.62330627441406, -67.71275329589844, -64.80220031738281, -61.89164733886719, -58.98109436035156, -56.07054138183594, -53.15999221801758, -50.24943923950195, -47.33888244628906, -44.42832946777344, -41.51777648925781, -38.60722351074219, -35.69667053222656, -32.78611755371094, -29.875568389892578, -26.965015411376953, -24.054462432861328, -21.143909454345703, -18.233356475830078, -15.322805404663086, -12.412252426147461, -9.501699447631836, -6.591148376464844, -3.6805953979492188, -0.7700347900390625, 2.1405177116394043, 5.051070213317871, 7.96162223815918, 10.872175216674805, 13.78272819519043, 16.693279266357422, 19.603832244873047, 22.514385223388672, 25.424938201904297, 28.335491180419922, 31.246042251586914, 34.156593322753906, 37.06714630126953, 39.977699279785156, 42.88825225830078, 45.798805236816406, 48.70935821533203, 51.619911193847656, 54.53046417236328, 57.441017150878906, 60.35157012939453, 63.26211929321289, 66.17266845703125, 69.08322143554688, 71.9937744140625, 74.90432739257812, 77.81488037109375, 80.72543334960938, 83.635986328125, 86.54653930664062, 89.45709228515625, 92.36764526367188]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 9.0, 5.0, 14.0, 15.0, 21.0, 32.0, 47.0, 77.0, 97.0, 118.0, 182.0, 281.0, 378.0, 565.0, 797.0, 1200.0, 1783.0, 2682.0, 4365.0, 6659.0, 11100.0, 18098.0, 31505.0, 56923.0, 108211.0, 199789.0, 252947.0, 158080.0, 83055.0, 44518.0, 24868.0, 14878.0, 8946.0, 5545.0, 3487.0, 2392.0, 1514.0, 1072.0, 686.0, 482.0, 332.0, 247.0, 152.0, 105.0, 98.0, 62.0, 46.0, 28.0, 24.0, 15.0, 11.0, 6.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0], "bins": [-5.50390625, -5.33349609375, -5.1630859375, -4.99267578125, -4.822265625, -4.65185546875, -4.4814453125, -4.31103515625, -4.140625, -3.97021484375, -3.7998046875, -3.62939453125, -3.458984375, -3.28857421875, -3.1181640625, -2.94775390625, -2.77734375, -2.60693359375, -2.4365234375, -2.26611328125, -2.095703125, -1.92529296875, -1.7548828125, -1.58447265625, -1.4140625, -1.24365234375, -1.0732421875, -0.90283203125, -0.732421875, -0.56201171875, -0.3916015625, -0.22119140625, -0.05078125, 0.11962890625, 0.2900390625, 0.46044921875, 0.630859375, 0.80126953125, 0.9716796875, 1.14208984375, 1.3125, 1.48291015625, 1.6533203125, 1.82373046875, 1.994140625, 2.16455078125, 2.3349609375, 2.50537109375, 2.67578125, 2.84619140625, 3.0166015625, 3.18701171875, 3.357421875, 3.52783203125, 3.6982421875, 3.86865234375, 4.0390625, 4.20947265625, 4.3798828125, 4.55029296875, 4.720703125, 4.89111328125, 5.0615234375, 5.23193359375, 5.40234375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 0.0, 5.0, 5.0, 5.0, 9.0, 5.0, 5.0, 6.0, 15.0, 19.0, 17.0, 20.0, 27.0, 29.0, 32.0, 36.0, 40.0, 35.0, 32.0, 44.0, 40.0, 51.0, 58.0, 46.0, 44.0, 43.0, 38.0, 39.0, 46.0, 32.0, 35.0, 35.0, 16.0, 22.0, 17.0, 16.0, 13.0, 9.0, 5.0, 4.0, 3.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.6875, -90.7724609375, -87.857421875, -84.9423828125, -82.02734375, -79.1123046875, -76.197265625, -73.2822265625, -70.3671875, -67.4521484375, -64.537109375, -61.6220703125, -58.70703125, -55.7919921875, -52.876953125, -49.9619140625, -47.046875, -44.1318359375, -41.216796875, -38.3017578125, -35.38671875, -32.4716796875, -29.556640625, -26.6416015625, -23.7265625, -20.8115234375, -17.896484375, -14.9814453125, -12.06640625, -9.1513671875, -6.236328125, -3.3212890625, -0.40625, 2.5087890625, 5.423828125, 8.3388671875, 11.25390625, 14.1689453125, 17.083984375, 19.9990234375, 22.9140625, 25.8291015625, 28.744140625, 31.6591796875, 34.57421875, 37.4892578125, 40.404296875, 43.3193359375, 46.234375, 49.1494140625, 52.064453125, 54.9794921875, 57.89453125, 60.8095703125, 63.724609375, 66.6396484375, 69.5546875, 72.4697265625, 75.384765625, 78.2998046875, 81.21484375, 84.1298828125, 87.044921875, 89.9599609375, 92.875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 6.0, 9.0, 14.0, 17.0, 29.0, 46.0, 68.0, 134.0, 184.0, 292.0, 481.0, 794.0, 1373.0, 2464.0, 4675.0, 8986.0, 19300.0, 41913.0, 100769.0, 283424.0, 358874.0, 127160.0, 51154.0, 23351.0, 11069.0, 5428.0, 2792.0, 1478.0, 899.0, 538.0, 284.0, 188.0, 121.0, 77.0, 43.0, 35.0, 30.0, 14.0, 15.0, 4.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.671875, -9.350830078125, -9.02978515625, -8.708740234375, -8.3876953125, -8.066650390625, -7.74560546875, -7.424560546875, -7.103515625, -6.782470703125, -6.46142578125, -6.140380859375, -5.8193359375, -5.498291015625, -5.17724609375, -4.856201171875, -4.53515625, -4.214111328125, -3.89306640625, -3.572021484375, -3.2509765625, -2.929931640625, -2.60888671875, -2.287841796875, -1.966796875, -1.645751953125, -1.32470703125, -1.003662109375, -0.6826171875, -0.361572265625, -0.04052734375, 0.280517578125, 0.6015625, 0.922607421875, 1.24365234375, 1.564697265625, 1.8857421875, 2.206787109375, 2.52783203125, 2.848876953125, 3.169921875, 3.490966796875, 3.81201171875, 4.133056640625, 4.4541015625, 4.775146484375, 5.09619140625, 5.417236328125, 5.73828125, 6.059326171875, 6.38037109375, 6.701416015625, 7.0224609375, 7.343505859375, 7.66455078125, 7.985595703125, 8.306640625, 8.627685546875, 8.94873046875, 9.269775390625, 9.5908203125, 9.911865234375, 10.23291015625, 10.553955078125, 10.875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 4.0, 4.0, 5.0, 11.0, 11.0, 6.0, 10.0, 12.0, 9.0, 23.0, 19.0, 24.0, 29.0, 28.0, 26.0, 32.0, 35.0, 34.0, 40.0, 43.0, 41.0, 53.0, 46.0, 37.0, 44.0, 31.0, 46.0, 34.0, 30.0, 28.0, 19.0, 26.0, 31.0, 22.0, 21.0, 17.0, 10.0, 13.0, 18.0, 9.0, 4.0, 3.0, 4.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-55.40625, -53.77490234375, -52.1435546875, -50.51220703125, -48.880859375, -47.24951171875, -45.6181640625, -43.98681640625, -42.35546875, -40.72412109375, -39.0927734375, -37.46142578125, -35.830078125, -34.19873046875, -32.5673828125, -30.93603515625, -29.3046875, -27.67333984375, -26.0419921875, -24.41064453125, -22.779296875, -21.14794921875, -19.5166015625, -17.88525390625, -16.25390625, -14.62255859375, -12.9912109375, -11.35986328125, -9.728515625, -8.09716796875, -6.4658203125, -4.83447265625, -3.203125, -1.57177734375, 0.0595703125, 1.69091796875, 3.322265625, 4.95361328125, 6.5849609375, 8.21630859375, 9.84765625, 11.47900390625, 13.1103515625, 14.74169921875, 16.373046875, 18.00439453125, 19.6357421875, 21.26708984375, 22.8984375, 24.52978515625, 26.1611328125, 27.79248046875, 29.423828125, 31.05517578125, 32.6865234375, 34.31787109375, 35.94921875, 37.58056640625, 39.2119140625, 40.84326171875, 42.474609375, 44.10595703125, 45.7373046875, 47.36865234375, 49.0]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 4.0, 11.0, 8.0, 11.0, 14.0, 19.0, 20.0, 21.0, 39.0, 58.0, 86.0, 128.0, 182.0, 280.0, 406.0, 636.0, 1079.0, 1913.0, 3773.0, 9010.0, 28583.0, 140399.0, 686134.0, 131278.0, 27061.0, 8778.0, 3666.0, 1852.0, 1086.0, 704.0, 421.0, 273.0, 183.0, 122.0, 86.0, 63.0, 43.0, 31.0, 24.0, 23.0, 11.0, 12.0, 5.0, 5.0, 6.0, 3.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2685546875, -1.2306671142578125, -1.192779541015625, -1.1548919677734375, -1.11700439453125, -1.0791168212890625, -1.041229248046875, -1.0033416748046875, -0.9654541015625, -0.9275665283203125, -0.889678955078125, -0.8517913818359375, -0.81390380859375, -0.7760162353515625, -0.738128662109375, -0.7002410888671875, -0.662353515625, -0.6244659423828125, -0.586578369140625, -0.5486907958984375, -0.51080322265625, -0.4729156494140625, -0.435028076171875, -0.3971405029296875, -0.3592529296875, -0.3213653564453125, -0.283477783203125, -0.2455902099609375, -0.20770263671875, -0.1698150634765625, -0.131927490234375, -0.0940399169921875, -0.05615234375, -0.0182647705078125, 0.019622802734375, 0.0575103759765625, 0.09539794921875, 0.1332855224609375, 0.171173095703125, 0.2090606689453125, 0.2469482421875, 0.2848358154296875, 0.322723388671875, 0.3606109619140625, 0.39849853515625, 0.4363861083984375, 0.474273681640625, 0.5121612548828125, 0.550048828125, 0.5879364013671875, 0.625823974609375, 0.6637115478515625, 0.70159912109375, 0.7394866943359375, 0.777374267578125, 0.8152618408203125, 0.8531494140625, 0.8910369873046875, 0.928924560546875, 0.9668121337890625, 1.00469970703125, 1.0425872802734375, 1.080474853515625, 1.1183624267578125, 1.15625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 11.0, 6.0, 13.0, 14.0, 21.0, 22.0, 31.0, 39.0, 43.0, 76.0, 86.0, 82.0, 68.0, 79.0, 68.0, 76.0, 57.0, 46.0, 44.0, 30.0, 20.0, 10.0, 22.0, 6.0, 8.0, 4.0, 2.0, 1.0, 4.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.693601608276367e-05, -6.467476487159729e-05, -6.241351366043091e-05, -6.0152262449264526e-05, -5.7891011238098145e-05, -5.562976002693176e-05, -5.336850881576538e-05, -5.1107257604599e-05, -4.884600639343262e-05, -4.6584755182266235e-05, -4.4323503971099854e-05, -4.206225275993347e-05, -3.980100154876709e-05, -3.753975033760071e-05, -3.5278499126434326e-05, -3.3017247915267944e-05, -3.075599670410156e-05, -2.849474549293518e-05, -2.62334942817688e-05, -2.3972243070602417e-05, -2.1710991859436035e-05, -1.9449740648269653e-05, -1.718848943710327e-05, -1.492723822593689e-05, -1.2665987014770508e-05, -1.0404735803604126e-05, -8.143484592437744e-06, -5.882233381271362e-06, -3.6209821701049805e-06, -1.3597309589385986e-06, 9.015202522277832e-07, 3.162771463394165e-06, 5.424022674560547e-06, 7.685273885726929e-06, 9.94652509689331e-06, 1.2207776308059692e-05, 1.4469027519226074e-05, 1.6730278730392456e-05, 1.8991529941558838e-05, 2.125278115272522e-05, 2.35140323638916e-05, 2.5775283575057983e-05, 2.8036534786224365e-05, 3.0297785997390747e-05, 3.255903720855713e-05, 3.482028841972351e-05, 3.708153963088989e-05, 3.9342790842056274e-05, 4.1604042053222656e-05, 4.386529326438904e-05, 4.612654447555542e-05, 4.83877956867218e-05, 5.0649046897888184e-05, 5.2910298109054565e-05, 5.517154932022095e-05, 5.743280053138733e-05, 5.969405174255371e-05, 6.195530295372009e-05, 6.421655416488647e-05, 6.647780537605286e-05, 6.873905658721924e-05, 7.100030779838562e-05, 7.3261559009552e-05, 7.552281022071838e-05, 7.778406143188477e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 4.0, 8.0, 8.0, 11.0, 15.0, 17.0, 26.0, 27.0, 31.0, 50.0, 59.0, 98.0, 119.0, 173.0, 218.0, 319.0, 393.0, 595.0, 880.0, 1346.0, 1981.0, 3479.0, 5993.0, 11087.0, 21815.0, 46031.0, 118580.0, 428318.0, 256068.0, 78887.0, 33663.0, 16740.0, 8612.0, 4703.0, 2680.0, 1749.0, 1068.0, 798.0, 504.0, 384.0, 258.0, 189.0, 157.0, 114.0, 69.0, 61.0, 49.0, 44.0, 25.0, 15.0, 13.0, 8.0, 8.0, 7.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0], "bins": [-1.2470703125, -1.207855224609375, -1.16864013671875, -1.129425048828125, -1.0902099609375, -1.050994873046875, -1.01177978515625, -0.972564697265625, -0.933349609375, -0.894134521484375, -0.85491943359375, -0.815704345703125, -0.7764892578125, -0.737274169921875, -0.69805908203125, -0.658843994140625, -0.61962890625, -0.580413818359375, -0.54119873046875, -0.501983642578125, -0.4627685546875, -0.423553466796875, -0.38433837890625, -0.345123291015625, -0.305908203125, -0.266693115234375, -0.22747802734375, -0.188262939453125, -0.1490478515625, -0.109832763671875, -0.07061767578125, -0.031402587890625, 0.0078125, 0.047027587890625, 0.08624267578125, 0.125457763671875, 0.1646728515625, 0.203887939453125, 0.24310302734375, 0.282318115234375, 0.321533203125, 0.360748291015625, 0.39996337890625, 0.439178466796875, 0.4783935546875, 0.517608642578125, 0.55682373046875, 0.596038818359375, 0.63525390625, 0.674468994140625, 0.71368408203125, 0.752899169921875, 0.7921142578125, 0.831329345703125, 0.87054443359375, 0.909759521484375, 0.948974609375, 0.988189697265625, 1.02740478515625, 1.066619873046875, 1.1058349609375, 1.145050048828125, 1.18426513671875, 1.223480224609375, 1.2626953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 5.0, 14.0, 14.0, 20.0, 30.0, 34.0, 51.0, 47.0, 75.0, 83.0, 76.0, 106.0, 93.0, 78.0, 64.0, 38.0, 38.0, 28.0, 20.0, 15.0, 18.0, 15.0, 6.0, 5.0, 4.0, 6.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4296875, -1.3879852294921875, -1.346282958984375, -1.3045806884765625, -1.26287841796875, -1.2211761474609375, -1.179473876953125, -1.1377716064453125, -1.0960693359375, -1.0543670654296875, -1.012664794921875, -0.9709625244140625, -0.92926025390625, -0.8875579833984375, -0.845855712890625, -0.8041534423828125, -0.762451171875, -0.7207489013671875, -0.679046630859375, -0.6373443603515625, -0.59564208984375, -0.5539398193359375, -0.512237548828125, -0.4705352783203125, -0.4288330078125, -0.3871307373046875, -0.345428466796875, -0.3037261962890625, -0.26202392578125, -0.2203216552734375, -0.178619384765625, -0.1369171142578125, -0.09521484375, -0.0535125732421875, -0.011810302734375, 0.0298919677734375, 0.07159423828125, 0.1132965087890625, 0.154998779296875, 0.1967010498046875, 0.2384033203125, 0.2801055908203125, 0.321807861328125, 0.3635101318359375, 0.40521240234375, 0.4469146728515625, 0.488616943359375, 0.5303192138671875, 0.572021484375, 0.6137237548828125, 0.655426025390625, 0.6971282958984375, 0.73883056640625, 0.7805328369140625, 0.822235107421875, 0.8639373779296875, 0.9056396484375, 0.9473419189453125, 0.989044189453125, 1.0307464599609375, 1.07244873046875, 1.1141510009765625, 1.155853271484375, 1.1975555419921875, 1.2392578125]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 10.0, 5.0, 4.0, 4.0, 7.0, 5.0, 15.0, 21.0, 29.0, 34.0, 40.0, 34.0, 54.0, 57.0, 54.0, 50.0, 48.0, 46.0, 55.0, 68.0, 43.0, 37.0, 36.0, 40.0, 34.0, 31.0, 24.0, 25.0, 22.0, 20.0, 10.0, 8.0, 9.0, 5.0, 5.0, 5.0, 5.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.4659309387207, -49.490482330322266, -47.515037536621094, -45.539588928222656, -43.56414031982422, -41.58869171142578, -39.613243103027344, -37.63779830932617, -35.662349700927734, -33.6869010925293, -31.711454391479492, -29.736007690429688, -27.76055908203125, -25.785110473632812, -23.809663772583008, -21.834217071533203, -19.858768463134766, -17.883319854736328, -15.907873153686523, -13.932425498962402, -11.956977844238281, -9.98153018951416, -8.006082534790039, -6.030634880065918, -4.055187225341797, -2.079739570617676, -0.10429191589355469, 1.8711557388305664, 3.8466033935546875, 5.822051048278809, 7.79749870300293, 9.77294635772705, 11.748397827148438, 13.723845481872559, 15.69929313659668, 17.674739837646484, 19.650188446044922, 21.62563705444336, 23.601083755493164, 25.57653045654297, 27.551979064941406, 29.527427673339844, 31.50287437438965, 33.47832107543945, 35.45376968383789, 37.42921829223633, 39.4046630859375, 41.38011169433594, 43.355560302734375, 45.33100891113281, 47.30645751953125, 49.28190231323242, 51.25735092163086, 53.2327995300293, 55.20824432373047, 57.183692932128906, 59.159141540527344, 61.13459014892578, 63.11003875732422, 65.08548736572266, 67.06092834472656, 69.036376953125, 71.01182556152344, 72.98727416992188, 74.96272277832031]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 6.0, 3.0, 6.0, 7.0, 7.0, 4.0, 7.0, 14.0, 19.0, 17.0, 19.0, 29.0, 26.0, 35.0, 30.0, 42.0, 36.0, 33.0, 45.0, 40.0, 49.0, 55.0, 48.0, 44.0, 45.0, 35.0, 40.0, 48.0, 32.0, 38.0, 31.0, 19.0, 20.0, 16.0, 15.0, 16.0, 9.0, 4.0, 6.0, 3.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.17234802246094, -91.24882507324219, -88.32530212402344, -85.40177917480469, -82.4782485961914, -79.55472564697266, -76.6312026977539, -73.70767974853516, -70.78414916992188, -67.86062622070312, -64.93710327148438, -62.01357650756836, -59.090049743652344, -56.166526794433594, -53.243003845214844, -50.319480895996094, -47.395957946777344, -44.472434997558594, -41.54890823364258, -38.62538528442383, -35.70185852050781, -32.77833557128906, -29.854812622070312, -26.93128776550293, -24.007762908935547, -21.084238052368164, -18.16071319580078, -15.237190246582031, -12.313665390014648, -9.390140533447266, -6.466617584228516, -3.543092727661133, -0.61956787109375, 2.3039565086364746, 5.227480888366699, 8.151004791259766, 11.074529647827148, 13.998054504394531, 16.92157745361328, 19.845102310180664, 22.768627166748047, 25.69215202331543, 28.615676879882812, 31.539199829101562, 34.46272277832031, 37.38624954223633, 40.30977249145508, 43.233299255371094, 46.156822204589844, 49.080345153808594, 52.00387191772461, 54.92739486694336, 57.850921630859375, 60.774444580078125, 63.697967529296875, 66.62149047851562, 69.54501342773438, 72.46853637695312, 75.39205932617188, 78.31558227539062, 81.2391128540039, 84.16263580322266, 87.0861587524414, 90.00968170166016, 92.93321228027344]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 4.0, 8.0, 15.0, 20.0, 20.0, 34.0, 52.0, 67.0, 109.0, 127.0, 211.0, 322.0, 453.0, 656.0, 969.0, 1434.0, 2245.0, 3632.0, 6147.0, 9805.0, 16086.0, 26375.0, 42434.0, 63740.0, 90968.0, 117432.0, 134947.0, 135300.0, 119577.0, 93316.0, 66311.0, 43775.0, 27546.0, 16824.0, 10356.0, 6238.0, 3884.0, 2389.0, 1588.0, 1016.0, 672.0, 470.0, 296.0, 219.0, 142.0, 99.0, 71.0, 49.0, 31.0, 24.0, 19.0, 6.0, 5.0, 8.0, 6.0, 7.0, 4.0, 2.0], "bins": [-35.09375, -34.03173828125, -32.9697265625, -31.90771484375, -30.845703125, -29.78369140625, -28.7216796875, -27.65966796875, -26.59765625, -25.53564453125, -24.4736328125, -23.41162109375, -22.349609375, -21.28759765625, -20.2255859375, -19.16357421875, -18.1015625, -17.03955078125, -15.9775390625, -14.91552734375, -13.853515625, -12.79150390625, -11.7294921875, -10.66748046875, -9.60546875, -8.54345703125, -7.4814453125, -6.41943359375, -5.357421875, -4.29541015625, -3.2333984375, -2.17138671875, -1.109375, -0.04736328125, 1.0146484375, 2.07666015625, 3.138671875, 4.20068359375, 5.2626953125, 6.32470703125, 7.38671875, 8.44873046875, 9.5107421875, 10.57275390625, 11.634765625, 12.69677734375, 13.7587890625, 14.82080078125, 15.8828125, 16.94482421875, 18.0068359375, 19.06884765625, 20.130859375, 21.19287109375, 22.2548828125, 23.31689453125, 24.37890625, 25.44091796875, 26.5029296875, 27.56494140625, 28.626953125, 29.68896484375, 30.7509765625, 31.81298828125, 32.875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 6.0, 4.0, 5.0, 8.0, 6.0, 4.0, 7.0, 16.0, 18.0, 17.0, 19.0, 29.0, 26.0, 35.0, 33.0, 40.0, 38.0, 34.0, 43.0, 39.0, 51.0, 56.0, 49.0, 42.0, 43.0, 37.0, 41.0, 51.0, 27.0, 40.0, 30.0, 15.0, 23.0, 16.0, 19.0, 10.0, 9.0, 5.0, 4.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.625, -91.6787109375, -88.732421875, -85.7861328125, -82.83984375, -79.8935546875, -76.947265625, -74.0009765625, -71.0546875, -68.1083984375, -65.162109375, -62.2158203125, -59.26953125, -56.3232421875, -53.376953125, -50.4306640625, -47.484375, -44.5380859375, -41.591796875, -38.6455078125, -35.69921875, -32.7529296875, -29.806640625, -26.8603515625, -23.9140625, -20.9677734375, -18.021484375, -15.0751953125, -12.12890625, -9.1826171875, -6.236328125, -3.2900390625, -0.34375, 2.6025390625, 5.548828125, 8.4951171875, 11.44140625, 14.3876953125, 17.333984375, 20.2802734375, 23.2265625, 26.1728515625, 29.119140625, 32.0654296875, 35.01171875, 37.9580078125, 40.904296875, 43.8505859375, 46.796875, 49.7431640625, 52.689453125, 55.6357421875, 58.58203125, 61.5283203125, 64.474609375, 67.4208984375, 70.3671875, 73.3134765625, 76.259765625, 79.2060546875, 82.15234375, 85.0986328125, 88.044921875, 90.9912109375, 93.9375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 10.0, 7.0, 16.0, 20.0, 38.0, 49.0, 67.0, 122.0, 163.0, 279.0, 413.0, 621.0, 970.0, 1343.0, 2023.0, 3032.0, 4701.0, 7002.0, 10926.0, 16832.0, 26270.0, 40211.0, 59052.0, 84769.0, 109132.0, 127771.0, 130431.0, 118454.0, 95460.0, 70160.0, 47844.0, 31947.0, 20237.0, 13033.0, 8505.0, 5669.0, 3646.0, 2437.0, 1664.0, 1059.0, 736.0, 488.0, 324.0, 216.0, 148.0, 86.0, 64.0, 36.0, 38.0, 11.0, 12.0, 7.0, 3.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-36.84375, -35.66357421875, -34.4833984375, -33.30322265625, -32.123046875, -30.94287109375, -29.7626953125, -28.58251953125, -27.40234375, -26.22216796875, -25.0419921875, -23.86181640625, -22.681640625, -21.50146484375, -20.3212890625, -19.14111328125, -17.9609375, -16.78076171875, -15.6005859375, -14.42041015625, -13.240234375, -12.06005859375, -10.8798828125, -9.69970703125, -8.51953125, -7.33935546875, -6.1591796875, -4.97900390625, -3.798828125, -2.61865234375, -1.4384765625, -0.25830078125, 0.921875, 2.10205078125, 3.2822265625, 4.46240234375, 5.642578125, 6.82275390625, 8.0029296875, 9.18310546875, 10.36328125, 11.54345703125, 12.7236328125, 13.90380859375, 15.083984375, 16.26416015625, 17.4443359375, 18.62451171875, 19.8046875, 20.98486328125, 22.1650390625, 23.34521484375, 24.525390625, 25.70556640625, 26.8857421875, 28.06591796875, 29.24609375, 30.42626953125, 31.6064453125, 32.78662109375, 33.966796875, 35.14697265625, 36.3271484375, 37.50732421875, 38.6875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 1.0, 2.0, 6.0, 8.0, 12.0, 15.0, 14.0, 13.0, 22.0, 16.0, 21.0, 29.0, 31.0, 26.0, 30.0, 27.0, 33.0, 46.0, 36.0, 36.0, 57.0, 44.0, 34.0, 46.0, 44.0, 42.0, 53.0, 33.0, 30.0, 27.0, 23.0, 18.0, 19.0, 19.0, 14.0, 14.0, 10.0, 11.0, 10.0, 7.0, 5.0, 4.0, 4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.5625, -42.9208984375, -41.279296875, -39.6376953125, -37.99609375, -36.3544921875, -34.712890625, -33.0712890625, -31.4296875, -29.7880859375, -28.146484375, -26.5048828125, -24.86328125, -23.2216796875, -21.580078125, -19.9384765625, -18.296875, -16.6552734375, -15.013671875, -13.3720703125, -11.73046875, -10.0888671875, -8.447265625, -6.8056640625, -5.1640625, -3.5224609375, -1.880859375, -0.2392578125, 1.40234375, 3.0439453125, 4.685546875, 6.3271484375, 7.96875, 9.6103515625, 11.251953125, 12.8935546875, 14.53515625, 16.1767578125, 17.818359375, 19.4599609375, 21.1015625, 22.7431640625, 24.384765625, 26.0263671875, 27.66796875, 29.3095703125, 30.951171875, 32.5927734375, 34.234375, 35.8759765625, 37.517578125, 39.1591796875, 40.80078125, 42.4423828125, 44.083984375, 45.7255859375, 47.3671875, 49.0087890625, 50.650390625, 52.2919921875, 53.93359375, 55.5751953125, 57.216796875, 58.8583984375, 60.5]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 6.0, 9.0, 22.0, 27.0, 36.0, 54.0, 78.0, 157.0, 192.0, 311.0, 522.0, 789.0, 1278.0, 2027.0, 3349.0, 5105.0, 8535.0, 13502.0, 21164.0, 31650.0, 46324.0, 63344.0, 81271.0, 98172.0, 109867.0, 112561.0, 105704.0, 92637.0, 75665.0, 57264.0, 40408.0, 27553.0, 18039.0, 11618.0, 7432.0, 4427.0, 2841.0, 1690.0, 1065.0, 596.0, 423.0, 278.0, 200.0, 133.0, 87.0, 43.0, 36.0, 25.0, 21.0, 5.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.4375, -9.13623046875, -8.8349609375, -8.53369140625, -8.232421875, -7.93115234375, -7.6298828125, -7.32861328125, -7.02734375, -6.72607421875, -6.4248046875, -6.12353515625, -5.822265625, -5.52099609375, -5.2197265625, -4.91845703125, -4.6171875, -4.31591796875, -4.0146484375, -3.71337890625, -3.412109375, -3.11083984375, -2.8095703125, -2.50830078125, -2.20703125, -1.90576171875, -1.6044921875, -1.30322265625, -1.001953125, -0.70068359375, -0.3994140625, -0.09814453125, 0.203125, 0.50439453125, 0.8056640625, 1.10693359375, 1.408203125, 1.70947265625, 2.0107421875, 2.31201171875, 2.61328125, 2.91455078125, 3.2158203125, 3.51708984375, 3.818359375, 4.11962890625, 4.4208984375, 4.72216796875, 5.0234375, 5.32470703125, 5.6259765625, 5.92724609375, 6.228515625, 6.52978515625, 6.8310546875, 7.13232421875, 7.43359375, 7.73486328125, 8.0361328125, 8.33740234375, 8.638671875, 8.93994140625, 9.2412109375, 9.54248046875, 9.84375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 5.0, 4.0, 6.0, 5.0, 10.0, 16.0, 13.0, 14.0, 19.0, 18.0, 21.0, 23.0, 24.0, 34.0, 39.0, 40.0, 39.0, 41.0, 42.0, 36.0, 47.0, 50.0, 46.0, 49.0, 42.0, 44.0, 35.0, 42.0, 34.0, 25.0, 23.0, 15.0, 19.0, 15.0, 10.0, 6.0, 8.0, 10.0, 8.0, 2.0, 8.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0011949539184570312, -0.001157909631729126, -0.0011208653450012207, -0.0010838210582733154, -0.0010467767715454102, -0.0010097324848175049, -0.0009726881980895996, -0.0009356439113616943, -0.0008985996246337891, -0.0008615553379058838, -0.0008245110511779785, -0.0007874667644500732, -0.000750422477722168, -0.0007133781909942627, -0.0006763339042663574, -0.0006392896175384521, -0.0006022453308105469, -0.0005652010440826416, -0.0005281567573547363, -0.0004911124706268311, -0.0004540681838989258, -0.0004170238971710205, -0.00037997961044311523, -0.00034293532371520996, -0.0003058910369873047, -0.0002688467502593994, -0.00023180246353149414, -0.00019475817680358887, -0.0001577138900756836, -0.00012066960334777832, -8.362531661987305e-05, -4.6581029891967773e-05, -9.5367431640625e-06, 2.7507543563842773e-05, 6.455183029174805e-05, 0.00010159611701965332, 0.0001386404037475586, 0.00017568469047546387, 0.00021272897720336914, 0.0002497732639312744, 0.0002868175506591797, 0.00032386183738708496, 0.00036090612411499023, 0.0003979504108428955, 0.0004349946975708008, 0.00047203898429870605, 0.0005090832710266113, 0.0005461275577545166, 0.0005831718444824219, 0.0006202161312103271, 0.0006572604179382324, 0.0006943047046661377, 0.000731348991394043, 0.0007683932781219482, 0.0008054375648498535, 0.0008424818515777588, 0.0008795261383056641, 0.0009165704250335693, 0.0009536147117614746, 0.0009906589984893799, 0.0010277032852172852, 0.0010647475719451904, 0.0011017918586730957, 0.001138836145401001, 0.0011758804321289062]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 1.0, 5.0, 6.0, 3.0, 7.0, 6.0, 18.0, 23.0, 26.0, 53.0, 84.0, 121.0, 182.0, 278.0, 470.0, 813.0, 1275.0, 2148.0, 3519.0, 6117.0, 10213.0, 16914.0, 26718.0, 41014.0, 59553.0, 80868.0, 102631.0, 117728.0, 123545.0, 115624.0, 100324.0, 78259.0, 57016.0, 38463.0, 25211.0, 15740.0, 9524.0, 5655.0, 3362.0, 1867.0, 1221.0, 718.0, 485.0, 265.0, 183.0, 99.0, 66.0, 46.0, 37.0, 22.0, 11.0, 13.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-11.15625, -10.812255859375, -10.46826171875, -10.124267578125, -9.7802734375, -9.436279296875, -9.09228515625, -8.748291015625, -8.404296875, -8.060302734375, -7.71630859375, -7.372314453125, -7.0283203125, -6.684326171875, -6.34033203125, -5.996337890625, -5.65234375, -5.308349609375, -4.96435546875, -4.620361328125, -4.2763671875, -3.932373046875, -3.58837890625, -3.244384765625, -2.900390625, -2.556396484375, -2.21240234375, -1.868408203125, -1.5244140625, -1.180419921875, -0.83642578125, -0.492431640625, -0.1484375, 0.195556640625, 0.53955078125, 0.883544921875, 1.2275390625, 1.571533203125, 1.91552734375, 2.259521484375, 2.603515625, 2.947509765625, 3.29150390625, 3.635498046875, 3.9794921875, 4.323486328125, 4.66748046875, 5.011474609375, 5.35546875, 5.699462890625, 6.04345703125, 6.387451171875, 6.7314453125, 7.075439453125, 7.41943359375, 7.763427734375, 8.107421875, 8.451416015625, 8.79541015625, 9.139404296875, 9.4833984375, 9.827392578125, 10.17138671875, 10.515380859375, 10.859375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 5.0, 2.0, 2.0, 6.0, 8.0, 9.0, 14.0, 16.0, 23.0, 15.0, 27.0, 19.0, 21.0, 28.0, 44.0, 42.0, 45.0, 55.0, 46.0, 50.0, 46.0, 54.0, 47.0, 36.0, 44.0, 34.0, 38.0, 36.0, 29.0, 25.0, 18.0, 23.0, 22.0, 14.0, 12.0, 10.0, 9.0, 6.0, 5.0, 5.0, 5.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.63671875, -4.4739990234375, -4.311279296875, -4.1485595703125, -3.98583984375, -3.8231201171875, -3.660400390625, -3.4976806640625, -3.3349609375, -3.1722412109375, -3.009521484375, -2.8468017578125, -2.68408203125, -2.5213623046875, -2.358642578125, -2.1959228515625, -2.033203125, -1.8704833984375, -1.707763671875, -1.5450439453125, -1.38232421875, -1.2196044921875, -1.056884765625, -0.8941650390625, -0.7314453125, -0.5687255859375, -0.406005859375, -0.2432861328125, -0.08056640625, 0.0821533203125, 0.244873046875, 0.4075927734375, 0.5703125, 0.7330322265625, 0.895751953125, 1.0584716796875, 1.22119140625, 1.3839111328125, 1.546630859375, 1.7093505859375, 1.8720703125, 2.0347900390625, 2.197509765625, 2.3602294921875, 2.52294921875, 2.6856689453125, 2.848388671875, 3.0111083984375, 3.173828125, 3.3365478515625, 3.499267578125, 3.6619873046875, 3.82470703125, 3.9874267578125, 4.150146484375, 4.3128662109375, 4.4755859375, 4.6383056640625, 4.801025390625, 4.9637451171875, 5.12646484375, 5.2891845703125, 5.451904296875, 5.6146240234375, 5.77734375]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 6.0, 6.0, 2.0, 6.0, 7.0, 11.0, 25.0, 17.0, 20.0, 40.0, 33.0, 47.0, 49.0, 53.0, 45.0, 60.0, 42.0, 44.0, 59.0, 52.0, 43.0, 33.0, 47.0, 36.0, 36.0, 20.0, 29.0, 24.0, 26.0, 17.0, 10.0, 12.0, 11.0, 10.0, 9.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.44633102416992, -51.46088409423828, -49.47543716430664, -47.489990234375, -45.504547119140625, -43.51909637451172, -41.533653259277344, -39.5482063293457, -37.56275939941406, -35.57731246948242, -33.59186553955078, -31.606420516967773, -29.620973587036133, -27.635526657104492, -25.650081634521484, -23.664634704589844, -21.679187774658203, -19.693740844726562, -17.708293914794922, -15.722848892211914, -13.737401962280273, -11.751955032348633, -9.766509056091309, -7.781063079833984, -5.795616149902344, -3.8101696968078613, -1.824723243713379, 0.16072320938110352, 2.146169662475586, 4.131616592407227, 6.117062568664551, 8.102508544921875, 10.08795166015625, 12.07339859008789, 14.058844566345215, 16.04429054260254, 18.02973747253418, 20.01518440246582, 22.000629425048828, 23.98607635498047, 25.97152328491211, 27.95697021484375, 29.94241714477539, 31.9278621673584, 33.913307189941406, 35.89875793457031, 37.88420104980469, 39.86964797973633, 41.85509490966797, 43.84054183959961, 45.82598876953125, 47.81143569946289, 49.79688262939453, 51.782325744628906, 53.76777267456055, 55.75321960449219, 57.73866653442383, 59.72411346435547, 61.70956039428711, 63.69500732421875, 65.68045043945312, 67.66590118408203, 69.6513442993164, 71.63679504394531, 73.62223815917969]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 5.0, 8.0, 9.0, 11.0, 9.0, 12.0, 17.0, 22.0, 16.0, 24.0, 30.0, 36.0, 37.0, 27.0, 38.0, 41.0, 38.0, 54.0, 50.0, 58.0, 42.0, 47.0, 34.0, 48.0, 42.0, 46.0, 38.0, 29.0, 22.0, 22.0, 17.0, 16.0, 13.0, 8.0, 12.0, 7.0, 4.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.47200012207031, -99.98099517822266, -96.489990234375, -92.99898529052734, -89.50798034667969, -86.01697540283203, -82.52597045898438, -79.03495788574219, -75.54396057128906, -72.0529556274414, -68.56195068359375, -65.0709457397461, -61.57994079589844, -58.08893585205078, -54.59792709350586, -51.1069221496582, -47.61591339111328, -44.124908447265625, -40.63390350341797, -37.14289855957031, -33.651893615722656, -30.160886764526367, -26.669879913330078, -23.178874969482422, -19.687870025634766, -16.19686508178711, -12.705859184265137, -9.214853286743164, -5.723848342895508, -2.2328433990478516, 1.2581634521484375, 4.749168395996094, 8.24017333984375, 11.731178283691406, 15.222184181213379, 18.71319007873535, 22.204195022583008, 25.695199966430664, 29.186206817626953, 32.67721176147461, 36.168216705322266, 39.65922164916992, 43.15022659301758, 46.6412353515625, 50.132240295410156, 53.62324523925781, 57.11425018310547, 60.605255126953125, 64.09626007080078, 67.58726501464844, 71.0782699584961, 74.56927490234375, 78.0602798461914, 81.55128479003906, 85.04229736328125, 88.53329467773438, 92.02430725097656, 95.51531219482422, 99.00631713867188, 102.49732208251953, 105.98832702636719, 109.47933197021484, 112.9703369140625, 116.46134948730469, 119.95234680175781]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 5.0, 13.0, 9.0, 12.0, 24.0, 30.0, 42.0, 52.0, 76.0, 109.0, 157.0, 204.0, 302.0, 354.0, 458.0, 593.0, 774.0, 978.0, 1242.0, 1668.0, 2066.0, 2455.0, 3116.0, 3629.0, 4616.0, 1000998.0, 5338.0, 4217.0, 3406.0, 2833.0, 2343.0, 1982.0, 1469.0, 1214.0, 945.0, 709.0, 542.0, 395.0, 347.0, 233.0, 182.0, 147.0, 86.0, 70.0, 47.0, 43.0, 24.0, 15.0, 10.0, 10.0, 7.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0], "bins": [-468.13397216796875, -453.87396240234375, -439.61395263671875, -425.35394287109375, -411.09393310546875, -396.83392333984375, -382.57391357421875, -368.3139343261719, -354.0539245605469, -339.7939147949219, -325.5339050292969, -311.2738952636719, -297.0138854980469, -282.75390625, -268.493896484375, -254.23388671875, -239.97386169433594, -225.71385192871094, -211.45384216308594, -197.19384765625, -182.933837890625, -168.673828125, -154.413818359375, -140.15380859375, -125.89380645751953, -111.63379669189453, -97.37379455566406, -83.11378479003906, -68.85377502441406, -54.593772888183594, -40.333763122558594, -26.073760986328125, -11.813751220703125, 2.446255683898926, 16.706262588500977, 30.966270446777344, 45.22627639770508, 59.48628234863281, 73.74629211425781, 88.00629425048828, 102.26630401611328, 116.52631378173828, 130.78631591796875, 145.04632568359375, 159.30633544921875, 173.56634521484375, 187.82635498046875, 202.0863494873047, 216.3463592529297, 230.6063690185547, 244.8663787841797, 259.1263732910156, 273.3863830566406, 287.6463928222656, 301.9064025878906, 316.1664123535156, 330.4264221191406, 344.6864318847656, 358.9464416503906, 373.2064514160156, 387.4664611816406, 401.7264404296875, 415.9864501953125, 430.2464599609375, 444.5064697265625]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 5.0, 8.0, 10.0, 13.0, 23.0, 42.0, 36.0, 52.0, 65.0, 107.0, 118.0, 169.0, 218.0, 306.0, 429.0, 604.0, 934.0, 1423.0, 2383.0, 4216.0, 7388.0, 13078.0, 21082.0, 31728.0, 165886.0, 51125692.0, 36164.0, 23198.0, 14684.0, 8550.0, 4881.0, 2787.0, 1645.0, 1059.0, 630.0, 466.0, 343.0, 229.0, 168.0, 134.0, 99.0, 66.0, 48.0, 43.0, 46.0, 25.0, 17.0, 8.0, 18.0, 9.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-742.552734375, -720.133056640625, -697.7133178710938, -675.2935791015625, -652.8739013671875, -630.4542236328125, -608.0344848632812, -585.61474609375, -563.195068359375, -540.775390625, -518.3556518554688, -495.9359436035156, -473.5162353515625, -451.0965270996094, -428.67681884765625, -406.2571105957031, -383.83740234375, -361.4176940917969, -338.99798583984375, -316.5782775878906, -294.1585693359375, -271.7388610839844, -249.31915283203125, -226.89944458007812, -204.479736328125, -182.06002807617188, -159.64031982421875, -137.22061157226562, -114.8009033203125, -92.38119506835938, -69.96148681640625, -47.541778564453125, -25.1220703125, -2.702362060546875, 19.71734619140625, 42.137054443359375, 64.5567626953125, 86.97647094726562, 109.39617919921875, 131.81588745117188, 154.235595703125, 176.65530395507812, 199.07501220703125, 221.49472045898438, 243.9144287109375, 266.3341369628906, 288.75384521484375, 311.1735534667969, 333.59326171875, 356.0129699707031, 378.43267822265625, 400.8523864746094, 423.2720947265625, 445.6918029785156, 468.11151123046875, 490.5312194824219, 512.950927734375, 535.37060546875, 557.7903442382812, 580.2100830078125, 602.6297607421875, 625.0494384765625, 647.4691772460938, 669.888916015625, 692.30859375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 5.0, 2.0, 8.0, 13.0, 18.0, 33.0, 48.0, 73.0, 131.0, 191.0, 278.0, 366.0, 514.0, 936.0, 1403.0, 2328.0, 3955.0, 6723.0, 11669.0, 22107.0, 43868.0, 94975.0, 227864.0, 638754.0, 3485099.0, 1144531.0, 345035.0, 135581.0, 60076.0, 28834.0, 15121.0, 8435.0, 4719.0, 2818.0, 1785.0, 1152.0, 708.0, 452.0, 276.0, 185.0, 114.0, 71.0, 58.0, 44.0, 17.0, 24.0, 17.0, 5.0, 6.0, 2.0, 7.0, 5.0], "bins": [-23.671875, -23.027099609375, -22.38232421875, -21.737548828125, -21.0927734375, -20.447998046875, -19.80322265625, -19.158447265625, -18.513671875, -17.868896484375, -17.22412109375, -16.579345703125, -15.9345703125, -15.289794921875, -14.64501953125, -14.000244140625, -13.35546875, -12.710693359375, -12.06591796875, -11.421142578125, -10.7763671875, -10.131591796875, -9.48681640625, -8.842041015625, -8.197265625, -7.552490234375, -6.90771484375, -6.262939453125, -5.6181640625, -4.973388671875, -4.32861328125, -3.683837890625, -3.0390625, -2.394287109375, -1.74951171875, -1.104736328125, -0.4599609375, 0.184814453125, 0.82958984375, 1.474365234375, 2.119140625, 2.763916015625, 3.40869140625, 4.053466796875, 4.6982421875, 5.343017578125, 5.98779296875, 6.632568359375, 7.27734375, 7.922119140625, 8.56689453125, 9.211669921875, 9.8564453125, 10.501220703125, 11.14599609375, 11.790771484375, 12.435546875, 13.080322265625, 13.72509765625, 14.369873046875, 15.0146484375, 15.659423828125, 16.30419921875, 16.948974609375, 17.59375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 9.0, 6.0, 10.0, 19.0, 12.0, 22.0, 33.0, 26.0, 28.0, 25.0, 28.0, 35.0, 37.0, 47.0, 39.0, 54.0, 131.0, 805.0, 198.0, 60.0, 61.0, 36.0, 35.0, 42.0, 32.0, 28.0, 25.0, 22.0, 24.0, 17.0, 17.0, 8.0, 11.0, 6.0, 4.0, 6.0, 3.0, 8.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-86.3125, -83.947265625, -81.58203125, -79.216796875, -76.8515625, -74.486328125, -72.12109375, -69.755859375, -67.390625, -65.025390625, -62.66015625, -60.294921875, -57.9296875, -55.564453125, -53.19921875, -50.833984375, -48.46875, -46.103515625, -43.73828125, -41.373046875, -39.0078125, -36.642578125, -34.27734375, -31.912109375, -29.546875, -27.181640625, -24.81640625, -22.451171875, -20.0859375, -17.720703125, -15.35546875, -12.990234375, -10.625, -8.259765625, -5.89453125, -3.529296875, -1.1640625, 1.201171875, 3.56640625, 5.931640625, 8.296875, 10.662109375, 13.02734375, 15.392578125, 17.7578125, 20.123046875, 22.48828125, 24.853515625, 27.21875, 29.583984375, 31.94921875, 34.314453125, 36.6796875, 39.044921875, 41.41015625, 43.775390625, 46.140625, 48.505859375, 50.87109375, 53.236328125, 55.6015625, 57.966796875, 60.33203125, 62.697265625, 65.0625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [4.0, 5.0, 4.0, 2.0, 7.0, 5.0, 17.0, 21.0, 35.0, 29.0, 38.0, 61.0, 94.0, 141.0, 178.0, 250.0, 409.0, 631.0, 912.0, 1521.0, 2480.0, 3939.0, 6436.0, 10920.0, 20960.0, 40489.0, 87845.0, 221485.0, 854947.0, 4203002.0, 523262.0, 164984.0, 70201.0, 34141.0, 17408.0, 9646.0, 5525.0, 3445.0, 2154.0, 1234.0, 857.0, 509.0, 403.0, 266.0, 166.0, 105.0, 78.0, 72.0, 48.0, 25.0, 15.0, 12.0, 6.0, 6.0, 7.0, 0.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-36.53125, -35.287109375, -34.04296875, -32.798828125, -31.5546875, -30.310546875, -29.06640625, -27.822265625, -26.578125, -25.333984375, -24.08984375, -22.845703125, -21.6015625, -20.357421875, -19.11328125, -17.869140625, -16.625, -15.380859375, -14.13671875, -12.892578125, -11.6484375, -10.404296875, -9.16015625, -7.916015625, -6.671875, -5.427734375, -4.18359375, -2.939453125, -1.6953125, -0.451171875, 0.79296875, 2.037109375, 3.28125, 4.525390625, 5.76953125, 7.013671875, 8.2578125, 9.501953125, 10.74609375, 11.990234375, 13.234375, 14.478515625, 15.72265625, 16.966796875, 18.2109375, 19.455078125, 20.69921875, 21.943359375, 23.1875, 24.431640625, 25.67578125, 26.919921875, 28.1640625, 29.408203125, 30.65234375, 31.896484375, 33.140625, 34.384765625, 35.62890625, 36.873046875, 38.1171875, 39.361328125, 40.60546875, 41.849609375, 43.09375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 3.0, 5.0, 7.0, 12.0, 20.0, 22.0, 22.0, 16.0, 39.0, 37.0, 38.0, 53.0, 56.0, 46.0, 224.0, 906.0, 104.0, 73.0, 60.0, 57.0, 43.0, 31.0, 35.0, 23.0, 22.0, 19.0, 10.0, 10.0, 4.0, 8.0, 5.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.4375, -100.97265625, -97.5078125, -94.04296875, -90.578125, -87.11328125, -83.6484375, -80.18359375, -76.71875, -73.25390625, -69.7890625, -66.32421875, -62.859375, -59.39453125, -55.9296875, -52.46484375, -49.0, -45.53515625, -42.0703125, -38.60546875, -35.140625, -31.67578125, -28.2109375, -24.74609375, -21.28125, -17.81640625, -14.3515625, -10.88671875, -7.421875, -3.95703125, -0.4921875, 2.97265625, 6.4375, 9.90234375, 13.3671875, 16.83203125, 20.296875, 23.76171875, 27.2265625, 30.69140625, 34.15625, 37.62109375, 41.0859375, 44.55078125, 48.015625, 51.48046875, 54.9453125, 58.41015625, 61.875, 65.33984375, 68.8046875, 72.26953125, 75.734375, 79.19921875, 82.6640625, 86.12890625, 89.59375, 93.05859375, 96.5234375, 99.98828125, 103.453125, 106.91796875, 110.3828125, 113.84765625, 117.3125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [4.0, 2.0, 5.0, 5.0, 8.0, 5.0, 11.0, 10.0, 10.0, 23.0, 28.0, 24.0, 38.0, 29.0, 49.0, 62.0, 79.0, 126.0, 145.0, 189.0, 234.0, 358.0, 462.0, 695.0, 1087.0, 1798.0, 3123.0, 5588.0, 11520.0, 30322.0, 140247.0, 5983915.0, 70325.0, 20532.0, 8692.0, 4494.0, 2420.0, 1462.0, 928.0, 620.0, 442.0, 300.0, 237.0, 177.0, 111.0, 114.0, 83.0, 70.0, 54.0, 26.0, 37.0, 30.0, 40.0, 4.0, 15.0, 13.0, 5.0, 5.0, 10.0, 3.0, 1.0, 2.0, 0.0, 3.0], "bins": [-281.0, -272.02734375, -263.0546875, -254.08203125, -245.109375, -236.13671875, -227.1640625, -218.19140625, -209.21875, -200.24609375, -191.2734375, -182.30078125, -173.328125, -164.35546875, -155.3828125, -146.41015625, -137.4375, -128.46484375, -119.4921875, -110.51953125, -101.546875, -92.57421875, -83.6015625, -74.62890625, -65.65625, -56.68359375, -47.7109375, -38.73828125, -29.765625, -20.79296875, -11.8203125, -2.84765625, 6.125, 15.09765625, 24.0703125, 33.04296875, 42.015625, 50.98828125, 59.9609375, 68.93359375, 77.90625, 86.87890625, 95.8515625, 104.82421875, 113.796875, 122.76953125, 131.7421875, 140.71484375, 149.6875, 158.66015625, 167.6328125, 176.60546875, 185.578125, 194.55078125, 203.5234375, 212.49609375, 221.46875, 230.44140625, 239.4140625, 248.38671875, 257.359375, 266.33203125, 275.3046875, 284.27734375, 293.25]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 7.0, 5.0, 8.0, 3.0, 8.0, 7.0, 9.0, 17.0, 19.0, 17.0, 28.0, 20.0, 33.0, 38.0, 52.0, 43.0, 64.0, 82.0, 306.0, 779.0, 120.0, 63.0, 50.0, 35.0, 31.0, 41.0, 31.0, 16.0, 13.0, 13.0, 8.0, 8.0, 7.0, 6.0, 6.0, 6.0, 6.0, 4.0, 2.0, 1.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.1875, -119.2333984375, -115.279296875, -111.3251953125, -107.37109375, -103.4169921875, -99.462890625, -95.5087890625, -91.5546875, -87.6005859375, -83.646484375, -79.6923828125, -75.73828125, -71.7841796875, -67.830078125, -63.8759765625, -59.921875, -55.9677734375, -52.013671875, -48.0595703125, -44.10546875, -40.1513671875, -36.197265625, -32.2431640625, -28.2890625, -24.3349609375, -20.380859375, -16.4267578125, -12.47265625, -8.5185546875, -4.564453125, -0.6103515625, 3.34375, 7.2978515625, 11.251953125, 15.2060546875, 19.16015625, 23.1142578125, 27.068359375, 31.0224609375, 34.9765625, 38.9306640625, 42.884765625, 46.8388671875, 50.79296875, 54.7470703125, 58.701171875, 62.6552734375, 66.609375, 70.5634765625, 74.517578125, 78.4716796875, 82.42578125, 86.3798828125, 90.333984375, 94.2880859375, 98.2421875, 102.1962890625, 106.150390625, 110.1044921875, 114.05859375, 118.0126953125, 121.966796875, 125.9208984375, 129.875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 7.0, 5.0, 8.0, 34.0, 131.0, 731.0, 40.0, 20.0, 10.0, 2.0, 9.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-423.29632568359375, -397.1758117675781, -371.0552978515625, -344.93475341796875, -318.81427001953125, -292.6937255859375, -266.5732116699219, -240.45269775390625, -214.33218383789062, -188.211669921875, -162.09115600585938, -135.9706268310547, -109.85011291503906, -83.72959899902344, -57.60906982421875, -31.488555908203125, -5.3680419921875, 20.75247573852539, 46.87299346923828, 72.99351501464844, 99.11402893066406, 125.23454284667969, 151.35507202148438, 177.4755859375, 203.59609985351562, 229.71661376953125, 255.83712768554688, 281.9576416015625, 308.07818603515625, 334.19866943359375, 360.3192138671875, 386.4397277832031, 412.5601806640625, 438.6806945800781, 464.80120849609375, 490.9217529296875, 517.042236328125, 543.1627807617188, 569.2833251953125, 595.40380859375, 621.5242919921875, 647.6448364257812, 673.7653198242188, 699.8858642578125, 726.00634765625, 752.1268920898438, 778.2474365234375, 804.367919921875, 830.4884643554688, 856.6090087890625, 882.7294921875, 908.8500366210938, 934.9705200195312, 961.091064453125, 987.2115478515625, 1013.3320922851562, 1039.45263671875, 1065.5731201171875, 1091.6937255859375, 1117.814208984375, 1143.9346923828125, 1170.05517578125, 1196.17578125, 1222.2962646484375, 1248.416748046875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 2.0, 15.0, 17.0, 24.0, 41.0, 335.0, 452.0, 46.0, 25.0, 19.0, 11.0, 5.0, 9.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-327.74530029296875, -295.1753234863281, -262.6053466796875, -230.0353546142578, -197.4653778076172, -164.89540100097656, -132.32540893554688, -99.75543212890625, -67.18545532226562, -34.615474700927734, -2.0454940795898438, 30.524490356445312, 63.09446716308594, 95.66444396972656, 128.23443603515625, 160.80441284179688, 193.3743896484375, 225.94436645507812, 258.51434326171875, 291.0843505859375, 323.654296875, 356.22430419921875, 388.7942810058594, 421.3642578125, 453.9342346191406, 486.50421142578125, 519.07421875, 551.6441650390625, 584.2141723632812, 616.7841186523438, 649.3541259765625, 681.924072265625, 714.4940185546875, 747.0640258789062, 779.6339721679688, 812.2039794921875, 844.77392578125, 877.3439331054688, 909.9139404296875, 942.48388671875, 975.0538330078125, 1007.6238403320312, 1040.19384765625, 1072.7637939453125, 1105.333740234375, 1137.9036865234375, 1170.4737548828125, 1203.043701171875, 1235.61376953125, 1268.1837158203125, 1300.7537841796875, 1333.32373046875, 1365.8936767578125, 1398.463623046875, 1431.03369140625, 1463.6036376953125, 1496.173583984375, 1528.7435302734375, 1561.3135986328125, 1593.883544921875, 1626.4534912109375, 1659.0234375, 1691.593505859375, 1724.1634521484375, 1756.7333984375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 8.0, 6.0, 9.0, 16.0, 18.0, 23.0, 31.0, 47.0, 68.0, 172.0, 218.0, 381.0, 536.0, 905.0, 1620.0, 2990.0, 7336.0, 24812.0, 321674.0, 3752777.0, 55674.0, 12703.0, 5512.0, 2785.0, 1499.0, 809.0, 467.0, 339.0, 199.0, 158.0, 106.0, 75.0, 74.0, 48.0, 38.0, 39.0, 37.0, 20.0, 14.0, 11.0, 8.0, 2.0, 4.0, 5.0, 0.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.046875, -4.82958984375, -4.6123046875, -4.39501953125, -4.177734375, -3.96044921875, -3.7431640625, -3.52587890625, -3.30859375, -3.09130859375, -2.8740234375, -2.65673828125, -2.439453125, -2.22216796875, -2.0048828125, -1.78759765625, -1.5703125, -1.35302734375, -1.1357421875, -0.91845703125, -0.701171875, -0.48388671875, -0.2666015625, -0.04931640625, 0.16796875, 0.38525390625, 0.6025390625, 0.81982421875, 1.037109375, 1.25439453125, 1.4716796875, 1.68896484375, 1.90625, 2.12353515625, 2.3408203125, 2.55810546875, 2.775390625, 2.99267578125, 3.2099609375, 3.42724609375, 3.64453125, 3.86181640625, 4.0791015625, 4.29638671875, 4.513671875, 4.73095703125, 4.9482421875, 5.16552734375, 5.3828125, 5.60009765625, 5.8173828125, 6.03466796875, 6.251953125, 6.46923828125, 6.6865234375, 6.90380859375, 7.12109375, 7.33837890625, 7.5556640625, 7.77294921875, 7.990234375, 8.20751953125, 8.4248046875, 8.64208984375, 8.859375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 7.0, 8.0, 10.0, 13.0, 47.0, 160.0, 338.0, 259.0, 102.0, 22.0, 10.0, 7.0, 7.0, 2.0, 0.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37890625, -0.3623199462890625, -0.345733642578125, -0.3291473388671875, -0.31256103515625, -0.2959747314453125, -0.279388427734375, -0.2628021240234375, -0.2462158203125, -0.2296295166015625, -0.213043212890625, -0.1964569091796875, -0.17987060546875, -0.1632843017578125, -0.146697998046875, -0.1301116943359375, -0.113525390625, -0.0969390869140625, -0.080352783203125, -0.0637664794921875, -0.04718017578125, -0.0305938720703125, -0.014007568359375, 0.0025787353515625, 0.0191650390625, 0.0357513427734375, 0.052337646484375, 0.0689239501953125, 0.08551025390625, 0.1020965576171875, 0.118682861328125, 0.1352691650390625, 0.15185546875, 0.1684417724609375, 0.185028076171875, 0.2016143798828125, 0.21820068359375, 0.2347869873046875, 0.251373291015625, 0.2679595947265625, 0.2845458984375, 0.3011322021484375, 0.317718505859375, 0.3343048095703125, 0.35089111328125, 0.3674774169921875, 0.384063720703125, 0.4006500244140625, 0.417236328125, 0.4338226318359375, 0.450408935546875, 0.4669952392578125, 0.48358154296875, 0.5001678466796875, 0.516754150390625, 0.5333404541015625, 0.5499267578125, 0.5665130615234375, 0.583099365234375, 0.5996856689453125, 0.61627197265625, 0.6328582763671875, 0.649444580078125, 0.6660308837890625, 0.6826171875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 4.0, 7.0, 6.0, 15.0, 20.0, 21.0, 39.0, 56.0, 86.0, 125.0, 157.0, 257.0, 426.0, 745.0, 1541.0, 3700.0, 12031.0, 56489.0, 967473.0, 3066349.0, 64541.0, 12395.0, 4006.0, 1659.0, 805.0, 454.0, 263.0, 183.0, 111.0, 82.0, 60.0, 43.0, 34.0, 25.0, 21.0, 13.0, 10.0, 6.0, 6.0, 4.0, 2.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.40234375, -5.21649169921875, -5.0306396484375, -4.84478759765625, -4.658935546875, -4.47308349609375, -4.2872314453125, -4.10137939453125, -3.91552734375, -3.72967529296875, -3.5438232421875, -3.35797119140625, -3.172119140625, -2.98626708984375, -2.8004150390625, -2.61456298828125, -2.4287109375, -2.24285888671875, -2.0570068359375, -1.87115478515625, -1.685302734375, -1.49945068359375, -1.3135986328125, -1.12774658203125, -0.94189453125, -0.75604248046875, -0.5701904296875, -0.38433837890625, -0.198486328125, -0.01263427734375, 0.1732177734375, 0.35906982421875, 0.544921875, 0.73077392578125, 0.9166259765625, 1.10247802734375, 1.288330078125, 1.47418212890625, 1.6600341796875, 1.84588623046875, 2.03173828125, 2.21759033203125, 2.4034423828125, 2.58929443359375, 2.775146484375, 2.96099853515625, 3.1468505859375, 3.33270263671875, 3.5185546875, 3.70440673828125, 3.8902587890625, 4.07611083984375, 4.261962890625, 4.44781494140625, 4.6336669921875, 4.81951904296875, 5.00537109375, 5.19122314453125, 5.3770751953125, 5.56292724609375, 5.748779296875, 5.93463134765625, 6.1204833984375, 6.30633544921875, 6.4921875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 5.0, 4.0, 4.0, 11.0, 6.0, 9.0, 14.0, 19.0, 27.0, 30.0, 31.0, 27.0, 36.0, 50.0, 63.0, 72.0, 82.0, 77.0, 134.0, 130.0, 193.0, 264.0, 622.0, 951.0, 361.0, 257.0, 138.0, 119.0, 95.0, 63.0, 43.0, 34.0, 28.0, 25.0, 15.0, 12.0, 9.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.82373046875, -0.8020858764648438, -0.7804412841796875, -0.7587966918945312, -0.737152099609375, -0.7155075073242188, -0.6938629150390625, -0.6722183227539062, -0.65057373046875, -0.6289291381835938, -0.6072845458984375, -0.5856399536132812, -0.563995361328125, -0.5423507690429688, -0.5207061767578125, -0.49906158447265625, -0.4774169921875, -0.45577239990234375, -0.4341278076171875, -0.41248321533203125, -0.390838623046875, -0.36919403076171875, -0.3475494384765625, -0.32590484619140625, -0.30426025390625, -0.28261566162109375, -0.2609710693359375, -0.23932647705078125, -0.217681884765625, -0.19603729248046875, -0.1743927001953125, -0.15274810791015625, -0.131103515625, -0.10945892333984375, -0.0878143310546875, -0.06616973876953125, -0.044525146484375, -0.02288055419921875, -0.0012359619140625, 0.02040863037109375, 0.04205322265625, 0.06369781494140625, 0.0853424072265625, 0.10698699951171875, 0.128631591796875, 0.15027618408203125, 0.1719207763671875, 0.19356536865234375, 0.2152099609375, 0.23685455322265625, 0.2584991455078125, 0.28014373779296875, 0.301788330078125, 0.32343292236328125, 0.3450775146484375, 0.36672210693359375, 0.38836669921875, 0.41001129150390625, 0.4316558837890625, 0.45330047607421875, 0.474945068359375, 0.49658966064453125, 0.5182342529296875, 0.5398788452148438, 0.5615234375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 8.0, 20.0, 35.0, 96.0, 199.0, 537.0, 88.0, 16.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.557106018066406, -41.3582763671875, -40.15944290161133, -38.960609436035156, -37.76177978515625, -36.562950134277344, -35.36411666870117, -34.165283203125, -32.966453552246094, -31.767621994018555, -30.568790435791016, -29.369958877563477, -28.171127319335938, -26.9722957611084, -25.77346420288086, -24.57463264465332, -23.37580108642578, -22.176969528198242, -20.978137969970703, -19.779306411743164, -18.580474853515625, -17.381643295288086, -16.182811737060547, -14.983980178833008, -13.785148620605469, -12.58631706237793, -11.38748550415039, -10.188653945922852, -8.989822387695312, -7.790990829467773, -6.592159271240234, -5.393327713012695, -4.194492340087891, -2.9956607818603516, -1.7968292236328125, -0.5979976654052734, 0.6008338928222656, 1.7996654510498047, 2.9984970092773438, 4.197328567504883, 5.396160125732422, 6.594991683959961, 7.7938232421875, 8.992654800415039, 10.191486358642578, 11.390317916870117, 12.589149475097656, 13.787981033325195, 14.986812591552734, 16.185644149780273, 17.384475708007812, 18.58330726623535, 19.78213882446289, 20.98097038269043, 22.17980194091797, 23.378633499145508, 24.577465057373047, 25.776296615600586, 26.975128173828125, 28.173959732055664, 29.372791290283203, 30.571622848510742, 31.77045440673828, 32.96928405761719, 34.16811752319336]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 9.0, 14.0, 11.0, 22.0, 29.0, 25.0, 41.0, 45.0, 53.0, 75.0, 84.0, 76.0, 79.0, 70.0, 63.0, 70.0, 57.0, 46.0, 28.0, 23.0, 22.0, 21.0, 8.0, 10.0, 7.0, 4.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.30400276184082, -10.96466064453125, -10.625317573547363, -10.285975456237793, -9.946632385253906, -9.607290267944336, -9.267948150634766, -8.928606033325195, -8.589262962341309, -8.249920845031738, -7.910577774047852, -7.571235656738281, -7.231893062591553, -6.892550468444824, -6.553208351135254, -6.213865756988525, -5.874523162841797, -5.535180568695068, -5.19583797454834, -4.8564958572387695, -4.517153263092041, -4.1778106689453125, -3.838468313217163, -3.4991259574890137, -3.159783363342285, -2.8204407691955566, -2.4810984134674072, -2.141756057739258, -1.8024134635925293, -1.4630709886550903, -1.1237285137176514, -0.784386157989502, -0.44504356384277344, -0.10570108890533447, 0.2336413860321045, 0.5729838609695435, 0.9123263359069824, 1.2516688108444214, 1.5910112857818604, 1.9303536415100098, 2.2696962356567383, 2.609038829803467, 2.948381185531616, 3.2877235412597656, 3.627066135406494, 3.9664087295532227, 4.305750846862793, 4.6450934410095215, 4.98443603515625, 5.3237786293029785, 5.663121223449707, 6.002463340759277, 6.341805934906006, 6.681148529052734, 7.020490646362305, 7.359833240509033, 7.699175834655762, 8.038517951965332, 8.377861022949219, 8.717203140258789, 9.05654525756836, 9.395888328552246, 9.735230445861816, 10.074573516845703, 10.413915634155273]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 6.0, 7.0, 8.0, 11.0, 10.0, 11.0, 16.0, 23.0, 36.0, 41.0, 64.0, 74.0, 142.0, 188.0, 260.0, 391.0, 587.0, 1024.0, 1872.0, 4072.0, 10342.0, 43220.0, 699889.0, 245081.0, 26334.0, 7563.0, 3207.0, 1574.0, 875.0, 487.0, 344.0, 225.0, 144.0, 109.0, 78.0, 49.0, 51.0, 22.0, 30.0, 21.0, 11.0, 12.0, 7.0, 8.0, 5.0, 6.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.04296875, -3.91192626953125, -3.7808837890625, -3.64984130859375, -3.518798828125, -3.38775634765625, -3.2567138671875, -3.12567138671875, -2.99462890625, -2.86358642578125, -2.7325439453125, -2.60150146484375, -2.470458984375, -2.33941650390625, -2.2083740234375, -2.07733154296875, -1.9462890625, -1.81524658203125, -1.6842041015625, -1.55316162109375, -1.422119140625, -1.29107666015625, -1.1600341796875, -1.02899169921875, -0.89794921875, -0.76690673828125, -0.6358642578125, -0.50482177734375, -0.373779296875, -0.24273681640625, -0.1116943359375, 0.01934814453125, 0.150390625, 0.28143310546875, 0.4124755859375, 0.54351806640625, 0.674560546875, 0.80560302734375, 0.9366455078125, 1.06768798828125, 1.19873046875, 1.32977294921875, 1.4608154296875, 1.59185791015625, 1.722900390625, 1.85394287109375, 1.9849853515625, 2.11602783203125, 2.2470703125, 2.37811279296875, 2.5091552734375, 2.64019775390625, 2.771240234375, 2.90228271484375, 3.0333251953125, 3.16436767578125, 3.29541015625, 3.42645263671875, 3.5574951171875, 3.68853759765625, 3.819580078125, 3.95062255859375, 4.0816650390625, 4.21270751953125, 4.34375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 1.0, 5.0, 3.0, 10.0, 8.0, 20.0, 36.0, 73.0, 89.0, 117.0, 149.0, 168.0, 116.0, 84.0, 51.0, 26.0, 11.0, 5.0, 4.0, 2.0, 3.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4140625, -0.40247344970703125, -0.3908843994140625, -0.37929534912109375, -0.367706298828125, -0.35611724853515625, -0.3445281982421875, -0.33293914794921875, -0.32135009765625, -0.30976104736328125, -0.2981719970703125, -0.28658294677734375, -0.274993896484375, -0.26340484619140625, -0.2518157958984375, -0.24022674560546875, -0.2286376953125, -0.21704864501953125, -0.2054595947265625, -0.19387054443359375, -0.182281494140625, -0.17069244384765625, -0.1591033935546875, -0.14751434326171875, -0.13592529296875, -0.12433624267578125, -0.1127471923828125, -0.10115814208984375, -0.089569091796875, -0.07798004150390625, -0.0663909912109375, -0.05480194091796875, -0.043212890625, -0.03162384033203125, -0.0200347900390625, -0.00844573974609375, 0.003143310546875, 0.01473236083984375, 0.0263214111328125, 0.03791046142578125, 0.04949951171875, 0.06108856201171875, 0.0726776123046875, 0.08426666259765625, 0.095855712890625, 0.10744476318359375, 0.1190338134765625, 0.13062286376953125, 0.1422119140625, 0.15380096435546875, 0.1653900146484375, 0.17697906494140625, 0.188568115234375, 0.20015716552734375, 0.2117462158203125, 0.22333526611328125, 0.23492431640625, 0.24651336669921875, 0.2581024169921875, 0.26969146728515625, 0.281280517578125, 0.29286956787109375, 0.3044586181640625, 0.31604766845703125, 0.32763671875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 7.0, 8.0, 14.0, 12.0, 18.0, 21.0, 46.0, 37.0, 69.0, 141.0, 206.0, 332.0, 587.0, 1065.0, 2056.0, 4346.0, 11000.0, 50472.0, 732905.0, 207246.0, 24110.0, 7189.0, 3018.0, 1552.0, 799.0, 502.0, 268.0, 175.0, 112.0, 74.0, 61.0, 27.0, 18.0, 9.0, 11.0, 10.0, 8.0, 5.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3984375, -4.25079345703125, -4.1031494140625, -3.95550537109375, -3.807861328125, -3.66021728515625, -3.5125732421875, -3.36492919921875, -3.21728515625, -3.06964111328125, -2.9219970703125, -2.77435302734375, -2.626708984375, -2.47906494140625, -2.3314208984375, -2.18377685546875, -2.0361328125, -1.88848876953125, -1.7408447265625, -1.59320068359375, -1.445556640625, -1.29791259765625, -1.1502685546875, -1.00262451171875, -0.85498046875, -0.70733642578125, -0.5596923828125, -0.41204833984375, -0.264404296875, -0.11676025390625, 0.0308837890625, 0.17852783203125, 0.326171875, 0.47381591796875, 0.6214599609375, 0.76910400390625, 0.916748046875, 1.06439208984375, 1.2120361328125, 1.35968017578125, 1.50732421875, 1.65496826171875, 1.8026123046875, 1.95025634765625, 2.097900390625, 2.24554443359375, 2.3931884765625, 2.54083251953125, 2.6884765625, 2.83612060546875, 2.9837646484375, 3.13140869140625, 3.279052734375, 3.42669677734375, 3.5743408203125, 3.72198486328125, 3.86962890625, 4.01727294921875, 4.1649169921875, 4.31256103515625, 4.460205078125, 4.60784912109375, 4.7554931640625, 4.90313720703125, 5.05078125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 5.0, 1.0, 9.0, 12.0, 5.0, 14.0, 10.0, 11.0, 23.0, 22.0, 22.0, 25.0, 31.0, 17.0, 26.0, 30.0, 32.0, 43.0, 34.0, 45.0, 35.0, 42.0, 35.0, 36.0, 54.0, 41.0, 30.0, 38.0, 21.0, 33.0, 23.0, 22.0, 23.0, 26.0, 17.0, 10.0, 12.0, 12.0, 14.0, 16.0, 8.0, 6.0, 6.0, 5.0, 2.0, 5.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2412109375, -1.2000732421875, -1.158935546875, -1.1177978515625, -1.07666015625, -1.0355224609375, -0.994384765625, -0.9532470703125, -0.912109375, -0.8709716796875, -0.829833984375, -0.7886962890625, -0.74755859375, -0.7064208984375, -0.665283203125, -0.6241455078125, -0.5830078125, -0.5418701171875, -0.500732421875, -0.4595947265625, -0.41845703125, -0.3773193359375, -0.336181640625, -0.2950439453125, -0.25390625, -0.2127685546875, -0.171630859375, -0.1304931640625, -0.08935546875, -0.0482177734375, -0.007080078125, 0.0340576171875, 0.0751953125, 0.1163330078125, 0.157470703125, 0.1986083984375, 0.23974609375, 0.2808837890625, 0.322021484375, 0.3631591796875, 0.404296875, 0.4454345703125, 0.486572265625, 0.5277099609375, 0.56884765625, 0.6099853515625, 0.651123046875, 0.6922607421875, 0.7333984375, 0.7745361328125, 0.815673828125, 0.8568115234375, 0.89794921875, 0.9390869140625, 0.980224609375, 1.0213623046875, 1.0625, 1.1036376953125, 1.144775390625, 1.1859130859375, 1.22705078125, 1.2681884765625, 1.309326171875, 1.3504638671875, 1.3916015625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 7.0, 13.0, 14.0, 31.0, 43.0, 94.0, 149.0, 241.0, 570.0, 1416.0, 5144.0, 55212.0, 962706.0, 17864.0, 3100.0, 1000.0, 449.0, 192.0, 120.0, 75.0, 42.0, 21.0, 17.0, 11.0, 6.0, 9.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.421875, -8.1529541015625, -7.884033203125, -7.6151123046875, -7.34619140625, -7.0772705078125, -6.808349609375, -6.5394287109375, -6.2705078125, -6.0015869140625, -5.732666015625, -5.4637451171875, -5.19482421875, -4.9259033203125, -4.656982421875, -4.3880615234375, -4.119140625, -3.8502197265625, -3.581298828125, -3.3123779296875, -3.04345703125, -2.7745361328125, -2.505615234375, -2.2366943359375, -1.9677734375, -1.6988525390625, -1.429931640625, -1.1610107421875, -0.89208984375, -0.6231689453125, -0.354248046875, -0.0853271484375, 0.18359375, 0.4525146484375, 0.721435546875, 0.9903564453125, 1.25927734375, 1.5281982421875, 1.797119140625, 2.0660400390625, 2.3349609375, 2.6038818359375, 2.872802734375, 3.1417236328125, 3.41064453125, 3.6795654296875, 3.948486328125, 4.2174072265625, 4.486328125, 4.7552490234375, 5.024169921875, 5.2930908203125, 5.56201171875, 5.8309326171875, 6.099853515625, 6.3687744140625, 6.6376953125, 6.9066162109375, 7.175537109375, 7.4444580078125, 7.71337890625, 7.9822998046875, 8.251220703125, 8.5201416015625, 8.7890625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 5.0, 2.0, 6.0, 9.0, 9.0, 19.0, 29.0, 38.0, 44.0, 70.0, 109.0, 285.0, 121.0, 90.0, 45.0, 34.0, 24.0, 19.0, 13.0, 6.0, 5.0, 8.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034198760986328125, -0.0032617151737213135, -0.0031035542488098145, -0.0029453933238983154, -0.0027872323989868164, -0.0026290714740753174, -0.0024709105491638184, -0.0023127496242523193, -0.0021545886993408203, -0.0019964277744293213, -0.0018382668495178223, -0.0016801059246063232, -0.0015219449996948242, -0.0013637840747833252, -0.0012056231498718262, -0.0010474622249603271, -0.0008893013000488281, -0.0007311403751373291, -0.0005729794502258301, -0.00041481852531433105, -0.00025665760040283203, -9.849667549133301e-05, 5.9664249420166016e-05, 0.00021782517433166504, 0.00037598609924316406, 0.0005341470241546631, 0.0006923079490661621, 0.0008504688739776611, 0.0010086297988891602, 0.0011667907238006592, 0.0013249516487121582, 0.0014831125736236572, 0.0016412734985351562, 0.0017994344234466553, 0.0019575953483581543, 0.0021157562732696533, 0.0022739171981811523, 0.0024320781230926514, 0.0025902390480041504, 0.0027483999729156494, 0.0029065608978271484, 0.0030647218227386475, 0.0032228827476501465, 0.0033810436725616455, 0.0035392045974731445, 0.0036973655223846436, 0.0038555264472961426, 0.004013687372207642, 0.004171848297119141, 0.00433000922203064, 0.004488170146942139, 0.004646331071853638, 0.004804491996765137, 0.004962652921676636, 0.005120813846588135, 0.005278974771499634, 0.005437135696411133, 0.005595296621322632, 0.005753457546234131, 0.00591161847114563, 0.006069779396057129, 0.006227940320968628, 0.006386101245880127, 0.006544262170791626, 0.006702423095703125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 0.0, 4.0, 7.0, 18.0, 20.0, 25.0, 61.0, 124.0, 235.0, 520.0, 1388.0, 4915.0, 48762.0, 961176.0, 25716.0, 3586.0, 1122.0, 437.0, 194.0, 83.0, 61.0, 31.0, 21.0, 13.0, 9.0, 9.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.43359375, -7.18072509765625, -6.9278564453125, -6.67498779296875, -6.422119140625, -6.16925048828125, -5.9163818359375, -5.66351318359375, -5.41064453125, -5.15777587890625, -4.9049072265625, -4.65203857421875, -4.399169921875, -4.14630126953125, -3.8934326171875, -3.64056396484375, -3.3876953125, -3.13482666015625, -2.8819580078125, -2.62908935546875, -2.376220703125, -2.12335205078125, -1.8704833984375, -1.61761474609375, -1.36474609375, -1.11187744140625, -0.8590087890625, -0.60614013671875, -0.353271484375, -0.10040283203125, 0.1524658203125, 0.40533447265625, 0.658203125, 0.91107177734375, 1.1639404296875, 1.41680908203125, 1.669677734375, 1.92254638671875, 2.1754150390625, 2.42828369140625, 2.68115234375, 2.93402099609375, 3.1868896484375, 3.43975830078125, 3.692626953125, 3.94549560546875, 4.1983642578125, 4.45123291015625, 4.7041015625, 4.95697021484375, 5.2098388671875, 5.46270751953125, 5.715576171875, 5.96844482421875, 6.2213134765625, 6.47418212890625, 6.72705078125, 6.97991943359375, 7.2327880859375, 7.48565673828125, 7.738525390625, 7.99139404296875, 8.2442626953125, 8.49713134765625, 8.75]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 9.0, 8.0, 12.0, 23.0, 38.0, 63.0, 135.0, 201.0, 196.0, 132.0, 75.0, 42.0, 26.0, 14.0, 8.0, 4.0, 5.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.35546875, -4.249603271484375, -4.14373779296875, -4.037872314453125, -3.9320068359375, -3.826141357421875, -3.72027587890625, -3.614410400390625, -3.508544921875, -3.402679443359375, -3.29681396484375, -3.190948486328125, -3.0850830078125, -2.979217529296875, -2.87335205078125, -2.767486572265625, -2.66162109375, -2.555755615234375, -2.44989013671875, -2.344024658203125, -2.2381591796875, -2.132293701171875, -2.02642822265625, -1.920562744140625, -1.814697265625, -1.708831787109375, -1.60296630859375, -1.497100830078125, -1.3912353515625, -1.285369873046875, -1.17950439453125, -1.073638916015625, -0.9677734375, -0.861907958984375, -0.75604248046875, -0.650177001953125, -0.5443115234375, -0.438446044921875, -0.33258056640625, -0.226715087890625, -0.120849609375, -0.014984130859375, 0.09088134765625, 0.196746826171875, 0.3026123046875, 0.408477783203125, 0.51434326171875, 0.620208740234375, 0.72607421875, 0.831939697265625, 0.93780517578125, 1.043670654296875, 1.1495361328125, 1.255401611328125, 1.36126708984375, 1.467132568359375, 1.572998046875, 1.678863525390625, 1.78472900390625, 1.890594482421875, 1.9964599609375, 2.102325439453125, 2.20819091796875, 2.314056396484375, 2.419921875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 8.0, 8.0, 11.0, 21.0, 16.0, 62.0, 108.0, 294.0, 345.0, 88.0, 21.0, 7.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-69.28443145751953, -67.81562042236328, -66.3468017578125, -64.87799072265625, -63.4091796875, -61.940364837646484, -60.47154998779297, -59.00273895263672, -57.53392791748047, -56.06511306762695, -54.5963020324707, -53.12748718261719, -51.65867614746094, -50.18986129760742, -48.721046447753906, -47.252235412597656, -45.78342056274414, -44.314605712890625, -42.845794677734375, -41.37697982788086, -39.90816879272461, -38.439353942871094, -36.970542907714844, -35.50172805786133, -34.03291320800781, -32.5640983581543, -31.095287322998047, -29.62647247314453, -28.15766143798828, -26.688846588134766, -25.220033645629883, -23.751220703125, -22.28240966796875, -20.813596725463867, -19.344783782958984, -17.87596893310547, -16.40715789794922, -14.93834400177002, -13.46953010559082, -12.000717163085938, -10.531904220581055, -9.063091278076172, -7.594277858734131, -6.12546443939209, -4.656651496887207, -3.187838554382324, -1.719024658203125, -0.2502117156982422, 1.2186012268066406, 2.6874144077301025, 4.1562275886535645, 5.6250410079956055, 7.093853950500488, 8.562666893005371, 10.03148078918457, 11.500293731689453, 12.969106674194336, 14.437919616699219, 15.906732559204102, 17.375545501708984, 18.8443603515625, 20.31317138671875, 21.781986236572266, 23.25079917907715, 24.71961212158203]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 4.0, 8.0, 6.0, 12.0, 13.0, 8.0, 23.0, 36.0, 52.0, 59.0, 59.0, 105.0, 109.0, 91.0, 89.0, 76.0, 63.0, 45.0, 35.0, 24.0, 22.0, 14.0, 8.0, 10.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.741636276245117, -25.93396759033203, -25.126298904418945, -24.31863021850586, -23.510961532592773, -22.703292846679688, -21.89562225341797, -21.087955474853516, -20.280284881591797, -19.47261619567871, -18.664947509765625, -17.85727882385254, -17.049610137939453, -16.241941452026367, -15.434271812438965, -14.626603126525879, -13.81893539428711, -13.011266708374023, -12.203598022460938, -11.395929336547852, -10.588260650634766, -9.78059196472168, -8.972922325134277, -8.165253639221191, -7.3575849533081055, -6.5499162673950195, -5.742247581481934, -4.9345784187316895, -4.1269097328186035, -3.3192410469055176, -2.5115718841552734, -1.7039031982421875, -0.8962364196777344, -0.08856761455535889, 0.7191011905670166, 1.5267701148986816, 2.3344388008117676, 3.1421074867248535, 3.9497766494750977, 4.757445335388184, 5.5651140213012695, 6.3727827072143555, 7.180451393127441, 7.9881205558776855, 8.79578971862793, 9.603458404541016, 10.411127090454102, 11.218795776367188, 12.026464462280273, 12.83413314819336, 13.641801834106445, 14.449470520019531, 15.257139205932617, 16.064807891845703, 16.872478485107422, 17.680145263671875, 18.487815856933594, 19.29548454284668, 20.103153228759766, 20.91082191467285, 21.718490600585938, 22.526159286499023, 23.33382797241211, 24.141498565673828, 24.94916534423828]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 5.0, 12.0, 8.0, 18.0, 46.0, 149.0, 10802.0, 4182028.0, 935.0, 166.0, 51.0, 29.0, 14.0, 8.0, 5.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.3125, -102.9580078125, -97.603515625, -92.2490234375, -86.89453125, -81.5400390625, -76.185546875, -70.8310546875, -65.4765625, -60.1220703125, -54.767578125, -49.4130859375, -44.05859375, -38.7041015625, -33.349609375, -27.9951171875, -22.640625, -17.2861328125, -11.931640625, -6.5771484375, -1.22265625, 4.1318359375, 9.486328125, 14.8408203125, 20.1953125, 25.5498046875, 30.904296875, 36.2587890625, 41.61328125, 46.9677734375, 52.322265625, 57.6767578125, 63.03125, 68.3857421875, 73.740234375, 79.0947265625, 84.44921875, 89.8037109375, 95.158203125, 100.5126953125, 105.8671875, 111.2216796875, 116.576171875, 121.9306640625, 127.28515625, 132.6396484375, 137.994140625, 143.3486328125, 148.703125, 154.0576171875, 159.412109375, 164.7666015625, 170.12109375, 175.4755859375, 180.830078125, 186.1845703125, 191.5390625, 196.8935546875, 202.248046875, 207.6025390625, 212.95703125, 218.3115234375, 223.666015625, 229.0205078125, 234.375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 10.0, 15.0, 23.0, 37.0, 40.0, 81.0, 83.0, 113.0, 127.0, 119.0, 108.0, 70.0, 58.0, 35.0, 18.0, 11.0, 10.0, 7.0, 4.0, 7.0, 3.0, 2.0, 3.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31787109375, -0.307464599609375, -0.29705810546875, -0.286651611328125, -0.2762451171875, -0.265838623046875, -0.25543212890625, -0.245025634765625, -0.234619140625, -0.224212646484375, -0.21380615234375, -0.203399658203125, -0.1929931640625, -0.182586669921875, -0.17218017578125, -0.161773681640625, -0.1513671875, -0.140960693359375, -0.13055419921875, -0.120147705078125, -0.1097412109375, -0.099334716796875, -0.08892822265625, -0.078521728515625, -0.068115234375, -0.057708740234375, -0.04730224609375, -0.036895751953125, -0.0264892578125, -0.016082763671875, -0.00567626953125, 0.004730224609375, 0.01513671875, 0.025543212890625, 0.03594970703125, 0.046356201171875, 0.0567626953125, 0.067169189453125, 0.07757568359375, 0.087982177734375, 0.098388671875, 0.108795166015625, 0.11920166015625, 0.129608154296875, 0.1400146484375, 0.150421142578125, 0.16082763671875, 0.171234130859375, 0.181640625, 0.192047119140625, 0.20245361328125, 0.212860107421875, 0.2232666015625, 0.233673095703125, 0.24407958984375, 0.254486083984375, 0.264892578125, 0.275299072265625, 0.28570556640625, 0.296112060546875, 0.3065185546875, 0.316925048828125, 0.32733154296875, 0.337738037109375, 0.34814453125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 6.0, 11.0, 20.0, 50.0, 109.0, 164.0, 305.0, 656.0, 34767.0, 4156798.0, 1168.0, 157.0, 55.0, 12.0, 7.0, 2.0, 1.0], "bins": [-101.375, -99.5711669921875, -97.767333984375, -95.9635009765625, -94.15966796875, -92.3558349609375, -90.552001953125, -88.7481689453125, -86.9443359375, -85.1405029296875, -83.336669921875, -81.5328369140625, -79.72900390625, -77.9251708984375, -76.121337890625, -74.3175048828125, -72.513671875, -70.7098388671875, -68.906005859375, -67.1021728515625, -65.29833984375, -63.4945068359375, -61.690673828125, -59.8868408203125, -58.0830078125, -56.2791748046875, -54.475341796875, -52.6715087890625, -50.86767578125, -49.0638427734375, -47.260009765625, -45.4561767578125, -43.65234375, -41.8485107421875, -40.044677734375, -38.2408447265625, -36.43701171875, -34.6331787109375, -32.829345703125, -31.0255126953125, -29.2216796875, -27.4178466796875, -25.614013671875, -23.8101806640625, -22.00634765625, -20.2025146484375, -18.398681640625, -16.5948486328125, -14.791015625, -12.9871826171875, -11.183349609375, -9.3795166015625, -7.57568359375, -5.7718505859375, -3.968017578125, -2.1641845703125, -0.3603515625, 1.4434814453125, 3.247314453125, 5.0511474609375, 6.85498046875, 8.6588134765625, 10.462646484375, 12.2664794921875, 14.0703125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 7.0, 14.0, 13.0, 27.0, 29.0, 43.0, 46.0, 110.0, 217.0, 403.0, 690.0, 1696.0, 383.0, 160.0, 61.0, 48.0, 23.0, 19.0, 17.0, 17.0, 7.0, 5.0, 8.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7783203125, -0.7563247680664062, -0.7343292236328125, -0.7123336791992188, -0.690338134765625, -0.6683425903320312, -0.6463470458984375, -0.6243515014648438, -0.60235595703125, -0.5803604125976562, -0.5583648681640625, -0.5363693237304688, -0.514373779296875, -0.49237823486328125, -0.4703826904296875, -0.44838714599609375, -0.4263916015625, -0.40439605712890625, -0.3824005126953125, -0.36040496826171875, -0.338409423828125, -0.31641387939453125, -0.2944183349609375, -0.27242279052734375, -0.25042724609375, -0.22843170166015625, -0.2064361572265625, -0.18444061279296875, -0.162445068359375, -0.14044952392578125, -0.1184539794921875, -0.09645843505859375, -0.074462890625, -0.05246734619140625, -0.0304718017578125, -0.00847625732421875, 0.013519287109375, 0.03551483154296875, 0.0575103759765625, 0.07950592041015625, 0.10150146484375, 0.12349700927734375, 0.1454925537109375, 0.16748809814453125, 0.189483642578125, 0.21147918701171875, 0.2334747314453125, 0.25547027587890625, 0.2774658203125, 0.29946136474609375, 0.3214569091796875, 0.34345245361328125, 0.365447998046875, 0.38744354248046875, 0.4094390869140625, 0.43143463134765625, 0.45343017578125, 0.47542572021484375, 0.4974212646484375, 0.5194168090820312, 0.541412353515625, 0.5634078979492188, 0.5854034423828125, 0.6073989868164062, 0.62939453125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 21.0, 964.0, 32.0, 1.0], "bins": [-436.2700500488281, -429.2134094238281, -422.15673828125, -415.10009765625, -408.0434265136719, -400.9867858886719, -393.93011474609375, -386.87347412109375, -379.81683349609375, -372.76019287109375, -365.7035217285156, -358.6468811035156, -351.5902099609375, -344.5335693359375, -337.4769287109375, -330.4202575683594, -323.36358642578125, -316.30694580078125, -309.2502746582031, -302.1936340332031, -295.136962890625, -288.080322265625, -281.023681640625, -273.9670104980469, -266.9103698730469, -259.8537292480469, -252.79705810546875, -245.74041748046875, -238.6837615966797, -231.62710571289062, -224.57044982910156, -217.5137939453125, -210.4571533203125, -203.40049743652344, -196.34384155273438, -189.28720092773438, -182.2305450439453, -175.17388916015625, -168.1172332763672, -161.06057739257812, -154.00392150878906, -146.947265625, -139.89060974121094, -132.83395385742188, -125.77730560302734, -118.72065734863281, -111.66400146484375, -104.60734558105469, -97.55069732666016, -90.4940414428711, -83.43739318847656, -76.3807373046875, -69.32408142089844, -62.26742935180664, -55.210777282714844, -48.15412139892578, -41.09746551513672, -34.04081344604492, -26.98415756225586, -19.927505493164062, -12.870851516723633, -5.814197540283203, 1.2424545288085938, 8.299110412597656, 15.355761528015137]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 9.0, 5.0, 26.0, 43.0, 62.0, 110.0, 153.0, 181.0, 146.0, 127.0, 64.0, 40.0, 12.0, 12.0, 11.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-28.041547775268555, -27.49420928955078, -26.94687271118164, -26.399534225463867, -25.852197647094727, -25.304859161376953, -24.757522583007812, -24.21018409729004, -23.662845611572266, -23.115507125854492, -22.56817054748535, -22.020832061767578, -21.473495483398438, -20.926156997680664, -20.378820419311523, -19.83148193359375, -19.28414535522461, -18.736806869506836, -18.189470291137695, -17.642131805419922, -17.09479522705078, -16.547456741333008, -16.000120162963867, -15.452781677246094, -14.905444145202637, -14.35810661315918, -13.810769081115723, -13.263431549072266, -12.716093063354492, -12.168756484985352, -11.621417999267578, -11.074080467224121, -10.526741981506348, -9.97940444946289, -9.432066917419434, -8.884729385375977, -8.337390899658203, -7.790053844451904, -7.242715835571289, -6.695378303527832, -6.148040771484375, -5.600703239440918, -5.053365707397461, -4.506027698516846, -3.9586901664733887, -3.4113526344299316, -2.8640148639678955, -2.3166770935058594, -1.7693395614624023, -1.2220019102096558, -0.6746642589569092, -0.1273266077041626, 0.420011043548584, 0.967348575592041, 1.5146863460540771, 2.0620241165161133, 2.6093616485595703, 3.1566991806030273, 3.7040369510650635, 4.2513747215271, 4.798712253570557, 5.346049785614014, 5.893387794494629, 6.440725326538086, 6.988062858581543]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 0.0, 4.0, 3.0, 15.0, 16.0, 14.0, 15.0, 33.0, 49.0, 57.0, 77.0, 135.0, 177.0, 254.0, 398.0, 634.0, 1010.0, 1684.0, 2984.0, 5829.0, 13450.0, 38337.0, 168122.0, 633292.0, 126040.0, 31572.0, 11897.0, 5486.0, 2809.0, 1542.0, 900.0, 593.0, 342.0, 228.0, 148.0, 110.0, 89.0, 64.0, 38.0, 27.0, 27.0, 17.0, 11.0, 6.0, 6.0, 8.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.22265625, -4.0924072265625, -3.962158203125, -3.8319091796875, -3.70166015625, -3.5714111328125, -3.441162109375, -3.3109130859375, -3.1806640625, -3.0504150390625, -2.920166015625, -2.7899169921875, -2.65966796875, -2.5294189453125, -2.399169921875, -2.2689208984375, -2.138671875, -2.0084228515625, -1.878173828125, -1.7479248046875, -1.61767578125, -1.4874267578125, -1.357177734375, -1.2269287109375, -1.0966796875, -0.9664306640625, -0.836181640625, -0.7059326171875, -0.57568359375, -0.4454345703125, -0.315185546875, -0.1849365234375, -0.0546875, 0.0755615234375, 0.205810546875, 0.3360595703125, 0.46630859375, 0.5965576171875, 0.726806640625, 0.8570556640625, 0.9873046875, 1.1175537109375, 1.247802734375, 1.3780517578125, 1.50830078125, 1.6385498046875, 1.768798828125, 1.8990478515625, 2.029296875, 2.1595458984375, 2.289794921875, 2.4200439453125, 2.55029296875, 2.6805419921875, 2.810791015625, 2.9410400390625, 3.0712890625, 3.2015380859375, 3.331787109375, 3.4620361328125, 3.59228515625, 3.7225341796875, 3.852783203125, 3.9830322265625, 4.11328125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 4.0, 3.0, 5.0, 5.0, 9.0, 4.0, 6.0, 5.0, 7.0, 15.0, 9.0, 39.0, 45.0, 55.0, 59.0, 75.0, 74.0, 69.0, 102.0, 76.0, 79.0, 76.0, 34.0, 39.0, 29.0, 26.0, 13.0, 12.0, 9.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19873046875, -0.19100189208984375, -0.1832733154296875, -0.17554473876953125, -0.167816162109375, -0.16008758544921875, -0.1523590087890625, -0.14463043212890625, -0.13690185546875, -0.12917327880859375, -0.1214447021484375, -0.11371612548828125, -0.105987548828125, -0.09825897216796875, -0.0905303955078125, -0.08280181884765625, -0.0750732421875, -0.06734466552734375, -0.0596160888671875, -0.05188751220703125, -0.044158935546875, -0.03643035888671875, -0.0287017822265625, -0.02097320556640625, -0.01324462890625, -0.00551605224609375, 0.0022125244140625, 0.00994110107421875, 0.017669677734375, 0.02539825439453125, 0.0331268310546875, 0.04085540771484375, 0.048583984375, 0.05631256103515625, 0.0640411376953125, 0.07176971435546875, 0.079498291015625, 0.08722686767578125, 0.0949554443359375, 0.10268402099609375, 0.11041259765625, 0.11814117431640625, 0.1258697509765625, 0.13359832763671875, 0.141326904296875, 0.14905548095703125, 0.1567840576171875, 0.16451263427734375, 0.1722412109375, 0.17996978759765625, 0.1876983642578125, 0.19542694091796875, 0.203155517578125, 0.21088409423828125, 0.2186126708984375, 0.22634124755859375, 0.23406982421875, 0.24179840087890625, 0.2495269775390625, 0.25725555419921875, 0.264984130859375, 0.27271270751953125, 0.2804412841796875, 0.28816986083984375, 0.2958984375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 3.0, 2.0, 4.0, 4.0, 13.0, 11.0, 12.0, 10.0, 11.0, 22.0, 27.0, 30.0, 79.0, 420.0, 4834.0, 908599.0, 131558.0, 2314.0, 306.0, 97.0, 33.0, 31.0, 19.0, 18.0, 8.0, 16.0, 13.0, 10.0, 6.0, 4.0, 11.0, 5.0, 4.0, 2.0, 2.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.171875, -15.630126953125, -15.08837890625, -14.546630859375, -14.0048828125, -13.463134765625, -12.92138671875, -12.379638671875, -11.837890625, -11.296142578125, -10.75439453125, -10.212646484375, -9.6708984375, -9.129150390625, -8.58740234375, -8.045654296875, -7.50390625, -6.962158203125, -6.42041015625, -5.878662109375, -5.3369140625, -4.795166015625, -4.25341796875, -3.711669921875, -3.169921875, -2.628173828125, -2.08642578125, -1.544677734375, -1.0029296875, -0.461181640625, 0.08056640625, 0.622314453125, 1.1640625, 1.705810546875, 2.24755859375, 2.789306640625, 3.3310546875, 3.872802734375, 4.41455078125, 4.956298828125, 5.498046875, 6.039794921875, 6.58154296875, 7.123291015625, 7.6650390625, 8.206787109375, 8.74853515625, 9.290283203125, 9.83203125, 10.373779296875, 10.91552734375, 11.457275390625, 11.9990234375, 12.540771484375, 13.08251953125, 13.624267578125, 14.166015625, 14.707763671875, 15.24951171875, 15.791259765625, 16.3330078125, 16.874755859375, 17.41650390625, 17.958251953125, 18.5]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 11.0, 5.0, 9.0, 12.0, 15.0, 25.0, 21.0, 20.0, 21.0, 38.0, 28.0, 38.0, 47.0, 50.0, 48.0, 47.0, 45.0, 43.0, 53.0, 51.0, 40.0, 50.0, 34.0, 39.0, 43.0, 26.0, 21.0, 22.0, 18.0, 16.0, 15.0, 11.0, 8.0, 9.0, 7.0, 8.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2109375, -1.168792724609375, -1.12664794921875, -1.084503173828125, -1.0423583984375, -1.000213623046875, -0.95806884765625, -0.915924072265625, -0.873779296875, -0.831634521484375, -0.78948974609375, -0.747344970703125, -0.7052001953125, -0.663055419921875, -0.62091064453125, -0.578765869140625, -0.53662109375, -0.494476318359375, -0.45233154296875, -0.410186767578125, -0.3680419921875, -0.325897216796875, -0.28375244140625, -0.241607666015625, -0.199462890625, -0.157318115234375, -0.11517333984375, -0.073028564453125, -0.0308837890625, 0.011260986328125, 0.05340576171875, 0.095550537109375, 0.1376953125, 0.179840087890625, 0.22198486328125, 0.264129638671875, 0.3062744140625, 0.348419189453125, 0.39056396484375, 0.432708740234375, 0.474853515625, 0.516998291015625, 0.55914306640625, 0.601287841796875, 0.6434326171875, 0.685577392578125, 0.72772216796875, 0.769866943359375, 0.81201171875, 0.854156494140625, 0.89630126953125, 0.938446044921875, 0.9805908203125, 1.022735595703125, 1.06488037109375, 1.107025146484375, 1.149169921875, 1.191314697265625, 1.23345947265625, 1.275604248046875, 1.3177490234375, 1.359893798828125, 1.40203857421875, 1.444183349609375, 1.486328125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 4.0, 6.0, 11.0, 14.0, 32.0, 89.0, 361.0, 17892.0, 1028904.0, 1012.0, 131.0, 35.0, 21.0, 10.0, 9.0, 5.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.75, -118.3857421875, -115.021484375, -111.6572265625, -108.29296875, -104.9287109375, -101.564453125, -98.2001953125, -94.8359375, -91.4716796875, -88.107421875, -84.7431640625, -81.37890625, -78.0146484375, -74.650390625, -71.2861328125, -67.921875, -64.5576171875, -61.193359375, -57.8291015625, -54.46484375, -51.1005859375, -47.736328125, -44.3720703125, -41.0078125, -37.6435546875, -34.279296875, -30.9150390625, -27.55078125, -24.1865234375, -20.822265625, -17.4580078125, -14.09375, -10.7294921875, -7.365234375, -4.0009765625, -0.63671875, 2.7275390625, 6.091796875, 9.4560546875, 12.8203125, 16.1845703125, 19.548828125, 22.9130859375, 26.27734375, 29.6416015625, 33.005859375, 36.3701171875, 39.734375, 43.0986328125, 46.462890625, 49.8271484375, 53.19140625, 56.5556640625, 59.919921875, 63.2841796875, 66.6484375, 70.0126953125, 73.376953125, 76.7412109375, 80.10546875, 83.4697265625, 86.833984375, 90.1982421875, 93.5625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 6.0, 1.0, 5.0, 5.0, 2.0, 9.0, 13.0, 17.0, 18.0, 23.0, 20.0, 32.0, 61.0, 230.0, 344.0, 50.0, 49.0, 36.0, 21.0, 18.0, 9.0, 8.0, 8.0, 7.0, 1.0, 7.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00917816162109375, -0.008908629417419434, -0.008639097213745117, -0.0083695650100708, -0.008100032806396484, -0.007830500602722168, -0.0075609683990478516, -0.007291436195373535, -0.007021903991699219, -0.006752371788024902, -0.006482839584350586, -0.0062133073806762695, -0.005943775177001953, -0.005674242973327637, -0.00540471076965332, -0.005135178565979004, -0.0048656463623046875, -0.004596114158630371, -0.004326581954956055, -0.004057049751281738, -0.003787517547607422, -0.0035179853439331055, -0.003248453140258789, -0.0029789209365844727, -0.0027093887329101562, -0.00243985652923584, -0.0021703243255615234, -0.001900792121887207, -0.0016312599182128906, -0.0013617277145385742, -0.0010921955108642578, -0.0008226633071899414, -0.000553131103515625, -0.0002835988998413086, -1.4066696166992188e-05, 0.0002554655075073242, 0.0005249977111816406, 0.000794529914855957, 0.0010640621185302734, 0.0013335943222045898, 0.0016031265258789062, 0.0018726587295532227, 0.002142190933227539, 0.0024117231369018555, 0.002681255340576172, 0.0029507875442504883, 0.0032203197479248047, 0.003489851951599121, 0.0037593841552734375, 0.004028916358947754, 0.00429844856262207, 0.004567980766296387, 0.004837512969970703, 0.0051070451736450195, 0.005376577377319336, 0.005646109580993652, 0.005915641784667969, 0.006185173988342285, 0.0064547061920166016, 0.006724238395690918, 0.006993770599365234, 0.007263302803039551, 0.007532835006713867, 0.007802367210388184, 0.0080718994140625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 12.0, 8.0, 10.0, 27.0, 32.0, 63.0, 78.0, 104.0, 207.0, 331.0, 563.0, 1026.0, 2024.0, 4526.0, 12985.0, 69958.0, 880816.0, 57083.0, 10923.0, 3746.0, 1747.0, 928.0, 536.0, 301.0, 189.0, 90.0, 74.0, 50.0, 32.0, 23.0, 16.0, 11.0, 6.0, 8.0, 7.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.84375, -18.26318359375, -17.6826171875, -17.10205078125, -16.521484375, -15.94091796875, -15.3603515625, -14.77978515625, -14.19921875, -13.61865234375, -13.0380859375, -12.45751953125, -11.876953125, -11.29638671875, -10.7158203125, -10.13525390625, -9.5546875, -8.97412109375, -8.3935546875, -7.81298828125, -7.232421875, -6.65185546875, -6.0712890625, -5.49072265625, -4.91015625, -4.32958984375, -3.7490234375, -3.16845703125, -2.587890625, -2.00732421875, -1.4267578125, -0.84619140625, -0.265625, 0.31494140625, 0.8955078125, 1.47607421875, 2.056640625, 2.63720703125, 3.2177734375, 3.79833984375, 4.37890625, 4.95947265625, 5.5400390625, 6.12060546875, 6.701171875, 7.28173828125, 7.8623046875, 8.44287109375, 9.0234375, 9.60400390625, 10.1845703125, 10.76513671875, 11.345703125, 11.92626953125, 12.5068359375, 13.08740234375, 13.66796875, 14.24853515625, 14.8291015625, 15.40966796875, 15.990234375, 16.57080078125, 17.1513671875, 17.73193359375, 18.3125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 1.0, 4.0, 7.0, 6.0, 9.0, 11.0, 22.0, 34.0, 42.0, 80.0, 230.0, 346.0, 70.0, 44.0, 36.0, 18.0, 14.0, 6.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.2109375, -12.811279296875, -12.41162109375, -12.011962890625, -11.6123046875, -11.212646484375, -10.81298828125, -10.413330078125, -10.013671875, -9.614013671875, -9.21435546875, -8.814697265625, -8.4150390625, -8.015380859375, -7.61572265625, -7.216064453125, -6.81640625, -6.416748046875, -6.01708984375, -5.617431640625, -5.2177734375, -4.818115234375, -4.41845703125, -4.018798828125, -3.619140625, -3.219482421875, -2.81982421875, -2.420166015625, -2.0205078125, -1.620849609375, -1.22119140625, -0.821533203125, -0.421875, -0.022216796875, 0.37744140625, 0.777099609375, 1.1767578125, 1.576416015625, 1.97607421875, 2.375732421875, 2.775390625, 3.175048828125, 3.57470703125, 3.974365234375, 4.3740234375, 4.773681640625, 5.17333984375, 5.572998046875, 5.97265625, 6.372314453125, 6.77197265625, 7.171630859375, 7.5712890625, 7.970947265625, 8.37060546875, 8.770263671875, 9.169921875, 9.569580078125, 9.96923828125, 10.368896484375, 10.7685546875, 11.168212890625, 11.56787109375, 11.967529296875, 12.3671875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 9.0, 17.0, 111.0, 574.0, 235.0, 42.0, 12.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.79825592041016, -79.5240478515625, -75.24983215332031, -70.97562408447266, -66.701416015625, -62.42720413208008, -58.152992248535156, -53.8787841796875, -49.60457229614258, -45.330360412597656, -41.05615234375, -36.78194046020508, -32.507728576660156, -28.2335205078125, -23.959308624267578, -19.68509864807129, -15.410888671875, -11.136678695678711, -6.8624677658081055, -2.5882568359375, 1.685953140258789, 5.960163116455078, 10.234375, 14.508584976196289, 18.782794952392578, 23.057004928588867, 27.331214904785156, 31.605426788330078, 35.879638671875, 40.153846740722656, 44.42805862426758, 48.7022705078125, 52.97648620605469, 57.25069808959961, 61.524906158447266, 65.79911804199219, 70.07332611083984, 74.3475341796875, 78.62174987792969, 82.89595794677734, 87.170166015625, 91.44437408447266, 95.71858978271484, 99.9927978515625, 104.26700592041016, 108.54121398925781, 112.8154296875, 117.08963775634766, 121.36385345458984, 125.6380615234375, 129.9122772216797, 134.18649291992188, 138.460693359375, 142.7349090576172, 147.00912475585938, 151.2833251953125, 155.5575408935547, 159.83175659179688, 164.10595703125, 168.3801727294922, 172.65438842773438, 176.9285888671875, 181.2028045654297, 185.47702026367188, 189.751220703125]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 2.0, 3.0, 7.0, 12.0, 13.0, 19.0, 31.0, 37.0, 46.0, 65.0, 83.0, 95.0, 104.0, 94.0, 81.0, 66.0, 72.0, 44.0, 23.0, 25.0, 18.0, 14.0, 12.0, 11.0, 9.0, 5.0, 0.0, 5.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.120607376098633, -26.324491500854492, -25.52837562561035, -24.73225975036621, -23.936141967773438, -23.140026092529297, -22.343910217285156, -21.547794342041016, -20.751678466796875, -19.955562591552734, -19.159446716308594, -18.363330841064453, -17.567214965820312, -16.77109718322754, -15.974981307983398, -15.178865432739258, -14.382749557495117, -13.586633682250977, -12.790517807006836, -11.994400978088379, -11.198285102844238, -10.402169227600098, -9.60605239868164, -8.8099365234375, -8.01382064819336, -7.217704772949219, -6.42158842086792, -5.625472068786621, -4.8293561935424805, -4.03324031829834, -3.237123966217041, -2.441007614135742, -1.6448936462402344, -0.8487775325775146, -0.05266141891479492, 0.7434546947479248, 1.5395708084106445, 2.3356869220733643, 3.131803035736084, 3.927919387817383, 4.724035263061523, 5.520151138305664, 6.316267490386963, 7.112383842468262, 7.908499717712402, 8.704615592956543, 9.500732421875, 10.29684829711914, 11.092964172363281, 11.889080047607422, 12.685195922851562, 13.48131275177002, 14.27742862701416, 15.0735445022583, 15.869661331176758, 16.6657772064209, 17.46189308166504, 18.25800895690918, 19.05412483215332, 19.85024070739746, 20.646358489990234, 21.442474365234375, 22.238590240478516, 23.034706115722656, 23.830821990966797]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 2.0, 0.0, 2.0, 4.0, 14.0, 10.0, 12.0, 8.0, 6.0, 16.0, 12.0, 18.0, 29.0, 80.0, 215.0, 6780.0, 4184241.0, 2170.0, 266.0, 135.0, 61.0, 54.0, 22.0, 28.0, 28.0, 8.0, 12.0, 8.0, 11.0, 6.0, 8.0, 2.0, 0.0, 2.0, 4.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-84.25, -81.9345703125, -79.619140625, -77.3037109375, -74.98828125, -72.6728515625, -70.357421875, -68.0419921875, -65.7265625, -63.4111328125, -61.095703125, -58.7802734375, -56.46484375, -54.1494140625, -51.833984375, -49.5185546875, -47.203125, -44.8876953125, -42.572265625, -40.2568359375, -37.94140625, -35.6259765625, -33.310546875, -30.9951171875, -28.6796875, -26.3642578125, -24.048828125, -21.7333984375, -19.41796875, -17.1025390625, -14.787109375, -12.4716796875, -10.15625, -7.8408203125, -5.525390625, -3.2099609375, -0.89453125, 1.4208984375, 3.736328125, 6.0517578125, 8.3671875, 10.6826171875, 12.998046875, 15.3134765625, 17.62890625, 19.9443359375, 22.259765625, 24.5751953125, 26.890625, 29.2060546875, 31.521484375, 33.8369140625, 36.15234375, 38.4677734375, 40.783203125, 43.0986328125, 45.4140625, 47.7294921875, 50.044921875, 52.3603515625, 54.67578125, 56.9912109375, 59.306640625, 61.6220703125, 63.9375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 12.0, 27.0, 47.0, 89.0, 133.0, 142.0, 190.0, 155.0, 104.0, 49.0, 22.0, 10.0, 8.0, 8.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.278564453125, -0.2556877136230469, -0.23281097412109375, -0.20993423461914062, -0.1870574951171875, -0.16418075561523438, -0.14130401611328125, -0.11842727661132812, -0.095550537109375, -0.07267379760742188, -0.04979705810546875, -0.026920318603515625, -0.0040435791015625, 0.018833160400390625, 0.04170989990234375, 0.06458663940429688, 0.08746337890625, 0.11034011840820312, 0.13321685791015625, 0.15609359741210938, 0.1789703369140625, 0.20184707641601562, 0.22472381591796875, 0.24760055541992188, 0.270477294921875, 0.2933540344238281, 0.31623077392578125, 0.3391075134277344, 0.3619842529296875, 0.3848609924316406, 0.40773773193359375, 0.4306144714355469, 0.4534912109375, 0.4763679504394531, 0.49924468994140625, 0.5221214294433594, 0.5449981689453125, 0.5678749084472656, 0.5907516479492188, 0.6136283874511719, 0.636505126953125, 0.6593818664550781, 0.6822586059570312, 0.7051353454589844, 0.7280120849609375, 0.7508888244628906, 0.7737655639648438, 0.7966423034667969, 0.81951904296875, 0.8423957824707031, 0.8652725219726562, 0.8881492614746094, 0.9110260009765625, 0.9339027404785156, 0.9567794799804688, 0.9796562194824219, 1.002532958984375, 1.0254096984863281, 1.0482864379882812, 1.0711631774902344, 1.0940399169921875, 1.1169166564941406, 1.1397933959960938, 1.1626701354980469, 1.185546875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 5.0, 59.0, 5925.0, 4187947.0, 327.0, 29.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.453125, -13.297607421875, -9.14208984375, -4.986572265625, -0.8310546875, 3.324462890625, 7.47998046875, 11.635498046875, 15.791015625, 19.946533203125, 24.10205078125, 28.257568359375, 32.4130859375, 36.568603515625, 40.72412109375, 44.879638671875, 49.03515625, 53.190673828125, 57.34619140625, 61.501708984375, 65.6572265625, 69.812744140625, 73.96826171875, 78.123779296875, 82.279296875, 86.434814453125, 90.59033203125, 94.745849609375, 98.9013671875, 103.056884765625, 107.21240234375, 111.367919921875, 115.5234375, 119.678955078125, 123.83447265625, 127.989990234375, 132.1455078125, 136.301025390625, 140.45654296875, 144.612060546875, 148.767578125, 152.923095703125, 157.07861328125, 161.234130859375, 165.3896484375, 169.545166015625, 173.70068359375, 177.856201171875, 182.01171875, 186.167236328125, 190.32275390625, 194.478271484375, 198.6337890625, 202.789306640625, 206.94482421875, 211.100341796875, 215.255859375, 219.411376953125, 223.56689453125, 227.722412109375, 231.8779296875, 236.033447265625, 240.18896484375, 244.344482421875, 248.5]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 15.0, 18.0, 21.0, 36.0, 74.0, 111.0, 231.0, 1758.0, 1288.0, 238.0, 127.0, 52.0, 46.0, 23.0, 9.0, 6.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.3701171875, -1.32586669921875, -1.2816162109375, -1.23736572265625, -1.193115234375, -1.14886474609375, -1.1046142578125, -1.06036376953125, -1.01611328125, -0.97186279296875, -0.9276123046875, -0.88336181640625, -0.839111328125, -0.79486083984375, -0.7506103515625, -0.70635986328125, -0.662109375, -0.61785888671875, -0.5736083984375, -0.52935791015625, -0.485107421875, -0.44085693359375, -0.3966064453125, -0.35235595703125, -0.30810546875, -0.26385498046875, -0.2196044921875, -0.17535400390625, -0.131103515625, -0.08685302734375, -0.0426025390625, 0.00164794921875, 0.0458984375, 0.09014892578125, 0.1343994140625, 0.17864990234375, 0.222900390625, 0.26715087890625, 0.3114013671875, 0.35565185546875, 0.39990234375, 0.44415283203125, 0.4884033203125, 0.53265380859375, 0.576904296875, 0.62115478515625, 0.6654052734375, 0.70965576171875, 0.75390625, 0.79815673828125, 0.8424072265625, 0.88665771484375, 0.930908203125, 0.97515869140625, 1.0194091796875, 1.06365966796875, 1.10791015625, 1.15216064453125, 1.1964111328125, 1.24066162109375, 1.284912109375, 1.32916259765625, 1.3734130859375, 1.41766357421875, 1.4619140625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 15.0, 1004.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.88494873046875, -54.413490295410156, -43.94203186035156, -33.470577239990234, -22.99911880493164, -12.527660369873047, -2.0562057495117188, 8.415252685546875, 18.88671112060547, 29.358169555664062, 39.829627990722656, 50.301082611083984, 60.77254104614258, 71.24400329589844, 81.7154541015625, 92.1869125366211, 102.65837097167969, 113.12982940673828, 123.60128784179688, 134.07273864746094, 144.54420471191406, 155.01565551757812, 165.48712158203125, 175.9585723876953, 186.43002319335938, 196.90147399902344, 207.37294006347656, 217.84439086914062, 228.31585693359375, 238.7873077392578, 249.25875854492188, 259.730224609375, 270.2016906738281, 280.67315673828125, 291.14459228515625, 301.6160583496094, 312.0875244140625, 322.5589904785156, 333.0304260253906, 343.50189208984375, 353.9733581542969, 364.44482421875, 374.916259765625, 385.3877258300781, 395.85919189453125, 406.3306579589844, 416.8020935058594, 427.2735595703125, 437.7449951171875, 448.2164611816406, 458.6878967285156, 469.15936279296875, 479.6308288574219, 490.102294921875, 500.57373046875, 511.0451965332031, 521.5166625976562, 531.9880981445312, 542.4595947265625, 552.9310302734375, 563.4024658203125, 573.8739624023438, 584.3453979492188, 594.81689453125, 605.288330078125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 9.0, 16.0, 19.0, 58.0, 145.0, 230.0, 211.0, 169.0, 89.0, 39.0, 14.0, 11.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.658546447753906, -12.991655349731445, -12.324764251708984, -11.657873153686523, -10.990982055664062, -10.324090957641602, -9.657200813293457, -8.990309715270996, -8.323418617248535, -7.656527519226074, -6.989636421203613, -6.3227458000183105, -5.65585470199585, -4.988963603973389, -4.322072982788086, -3.655181884765625, -2.988290786743164, -2.321399688720703, -1.6545088291168213, -0.9876179695129395, -0.3207268714904785, 0.3461642265319824, 1.0130548477172852, 1.679945945739746, 2.346837043762207, 3.013728141784668, 3.68061900138855, 4.347509860992432, 5.014400959014893, 5.6812920570373535, 6.348182678222656, 7.015073776245117, 7.681964874267578, 8.348855972290039, 9.0157470703125, 9.682638168334961, 10.349529266357422, 11.016420364379883, 11.683310508728027, 12.350201606750488, 13.01709270477295, 13.68398380279541, 14.350874900817871, 15.017765045166016, 15.684656143188477, 16.351547241210938, 17.0184383392334, 17.68532943725586, 18.35222053527832, 19.01911163330078, 19.686002731323242, 20.352893829345703, 21.019784927368164, 21.686676025390625, 22.353565216064453, 23.020458221435547, 23.687347412109375, 24.354238510131836, 25.021129608154297, 25.688020706176758, 26.35491180419922, 27.02180290222168, 27.68869400024414, 28.35558319091797, 29.022476196289062]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 5.0, 6.0, 10.0, 9.0, 5.0, 11.0, 15.0, 18.0, 18.0, 24.0, 30.0, 26.0, 26.0, 45.0, 46.0, 51.0, 86.0, 1168.0, 481359.0, 563856.0, 1275.0, 79.0, 53.0, 43.0, 32.0, 33.0, 35.0, 31.0, 31.0, 17.0, 21.0, 18.0, 7.0, 13.0, 9.0, 8.0, 11.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.046875, -18.451904296875, -17.85693359375, -17.261962890625, -16.6669921875, -16.072021484375, -15.47705078125, -14.882080078125, -14.287109375, -13.692138671875, -13.09716796875, -12.502197265625, -11.9072265625, -11.312255859375, -10.71728515625, -10.122314453125, -9.52734375, -8.932373046875, -8.33740234375, -7.742431640625, -7.1474609375, -6.552490234375, -5.95751953125, -5.362548828125, -4.767578125, -4.172607421875, -3.57763671875, -2.982666015625, -2.3876953125, -1.792724609375, -1.19775390625, -0.602783203125, -0.0078125, 0.587158203125, 1.18212890625, 1.777099609375, 2.3720703125, 2.967041015625, 3.56201171875, 4.156982421875, 4.751953125, 5.346923828125, 5.94189453125, 6.536865234375, 7.1318359375, 7.726806640625, 8.32177734375, 8.916748046875, 9.51171875, 10.106689453125, 10.70166015625, 11.296630859375, 11.8916015625, 12.486572265625, 13.08154296875, 13.676513671875, 14.271484375, 14.866455078125, 15.46142578125, 16.056396484375, 16.6513671875, 17.246337890625, 17.84130859375, 18.436279296875, 19.03125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 7.0, 45.0, 168.0, 345.0, 298.0, 130.0, 21.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.423828125, -0.351959228515625, -0.28009033203125, -0.208221435546875, -0.1363525390625, -0.064483642578125, 0.00738525390625, 0.079254150390625, 0.151123046875, 0.222991943359375, 0.29486083984375, 0.366729736328125, 0.4385986328125, 0.510467529296875, 0.58233642578125, 0.654205322265625, 0.72607421875, 0.797943115234375, 0.86981201171875, 0.941680908203125, 1.0135498046875, 1.085418701171875, 1.15728759765625, 1.229156494140625, 1.301025390625, 1.372894287109375, 1.44476318359375, 1.516632080078125, 1.5885009765625, 1.660369873046875, 1.73223876953125, 1.804107666015625, 1.8759765625, 1.947845458984375, 2.01971435546875, 2.091583251953125, 2.1634521484375, 2.235321044921875, 2.30718994140625, 2.379058837890625, 2.450927734375, 2.522796630859375, 2.59466552734375, 2.666534423828125, 2.7384033203125, 2.810272216796875, 2.88214111328125, 2.954010009765625, 3.02587890625, 3.097747802734375, 3.16961669921875, 3.241485595703125, 3.3133544921875, 3.385223388671875, 3.45709228515625, 3.528961181640625, 3.600830078125, 3.672698974609375, 3.74456787109375, 3.816436767578125, 3.8883056640625, 3.960174560546875, 4.03204345703125, 4.103912353515625, 4.17578125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 5.0, 0.0, 5.0, 13.0, 12.0, 17.0, 18.0, 28.0, 38.0, 54.0, 71.0, 134.0, 266.0, 899.0, 6339.0, 207151.0, 810343.0, 20566.0, 1727.0, 396.0, 168.0, 77.0, 60.0, 44.0, 29.0, 25.0, 17.0, 10.0, 13.0, 6.0, 9.0, 2.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.015625, -15.596435546875, -15.17724609375, -14.758056640625, -14.3388671875, -13.919677734375, -13.50048828125, -13.081298828125, -12.662109375, -12.242919921875, -11.82373046875, -11.404541015625, -10.9853515625, -10.566162109375, -10.14697265625, -9.727783203125, -9.30859375, -8.889404296875, -8.47021484375, -8.051025390625, -7.6318359375, -7.212646484375, -6.79345703125, -6.374267578125, -5.955078125, -5.535888671875, -5.11669921875, -4.697509765625, -4.2783203125, -3.859130859375, -3.43994140625, -3.020751953125, -2.6015625, -2.182373046875, -1.76318359375, -1.343994140625, -0.9248046875, -0.505615234375, -0.08642578125, 0.332763671875, 0.751953125, 1.171142578125, 1.59033203125, 2.009521484375, 2.4287109375, 2.847900390625, 3.26708984375, 3.686279296875, 4.10546875, 4.524658203125, 4.94384765625, 5.363037109375, 5.7822265625, 6.201416015625, 6.62060546875, 7.039794921875, 7.458984375, 7.878173828125, 8.29736328125, 8.716552734375, 9.1357421875, 9.554931640625, 9.97412109375, 10.393310546875, 10.8125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 2.0, 6.0, 10.0, 5.0, 12.0, 7.0, 8.0, 21.0, 29.0, 39.0, 38.0, 34.0, 27.0, 32.0, 52.0, 36.0, 43.0, 48.0, 39.0, 71.0, 55.0, 55.0, 39.0, 36.0, 31.0, 31.0, 29.0, 24.0, 27.0, 15.0, 18.0, 13.0, 17.0, 16.0, 11.0, 4.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-3.61328125, -3.517303466796875, -3.42132568359375, -3.325347900390625, -3.2293701171875, -3.133392333984375, -3.03741455078125, -2.941436767578125, -2.845458984375, -2.749481201171875, -2.65350341796875, -2.557525634765625, -2.4615478515625, -2.365570068359375, -2.26959228515625, -2.173614501953125, -2.07763671875, -1.981658935546875, -1.88568115234375, -1.789703369140625, -1.6937255859375, -1.597747802734375, -1.50177001953125, -1.405792236328125, -1.309814453125, -1.213836669921875, -1.11785888671875, -1.021881103515625, -0.9259033203125, -0.829925537109375, -0.73394775390625, -0.637969970703125, -0.5419921875, -0.446014404296875, -0.35003662109375, -0.254058837890625, -0.1580810546875, -0.062103271484375, 0.03387451171875, 0.129852294921875, 0.225830078125, 0.321807861328125, 0.41778564453125, 0.513763427734375, 0.6097412109375, 0.705718994140625, 0.80169677734375, 0.897674560546875, 0.99365234375, 1.089630126953125, 1.18560791015625, 1.281585693359375, 1.3775634765625, 1.473541259765625, 1.56951904296875, 1.665496826171875, 1.761474609375, 1.857452392578125, 1.95343017578125, 2.049407958984375, 2.1453857421875, 2.241363525390625, 2.33734130859375, 2.433319091796875, 2.529296875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 6.0, 10.0, 4.0, 8.0, 7.0, 16.0, 20.0, 27.0, 35.0, 59.0, 107.0, 435.0, 3263.0, 510412.0, 530175.0, 3178.0, 441.0, 137.0, 57.0, 39.0, 26.0, 20.0, 10.0, 12.0, 9.0, 7.0, 5.0, 7.0, 3.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-26.265625, -25.574462890625, -24.88330078125, -24.192138671875, -23.5009765625, -22.809814453125, -22.11865234375, -21.427490234375, -20.736328125, -20.045166015625, -19.35400390625, -18.662841796875, -17.9716796875, -17.280517578125, -16.58935546875, -15.898193359375, -15.20703125, -14.515869140625, -13.82470703125, -13.133544921875, -12.4423828125, -11.751220703125, -11.06005859375, -10.368896484375, -9.677734375, -8.986572265625, -8.29541015625, -7.604248046875, -6.9130859375, -6.221923828125, -5.53076171875, -4.839599609375, -4.1484375, -3.457275390625, -2.76611328125, -2.074951171875, -1.3837890625, -0.692626953125, -0.00146484375, 0.689697265625, 1.380859375, 2.072021484375, 2.76318359375, 3.454345703125, 4.1455078125, 4.836669921875, 5.52783203125, 6.218994140625, 6.91015625, 7.601318359375, 8.29248046875, 8.983642578125, 9.6748046875, 10.365966796875, 11.05712890625, 11.748291015625, 12.439453125, 13.130615234375, 13.82177734375, 14.512939453125, 15.2041015625, 15.895263671875, 16.58642578125, 17.277587890625, 17.96875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 6.0, 8.0, 7.0, 11.0, 9.0, 14.0, 26.0, 38.0, 80.0, 173.0, 242.0, 161.0, 82.0, 36.0, 24.0, 25.0, 12.0, 8.0, 7.0, 8.0, 5.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0015811920166015625, -0.0015412122011184692, -0.001501232385635376, -0.0014612525701522827, -0.0014212727546691895, -0.0013812929391860962, -0.001341313123703003, -0.0013013333082199097, -0.0012613534927368164, -0.0012213736772537231, -0.0011813938617706299, -0.0011414140462875366, -0.0011014342308044434, -0.00106145441532135, -0.0010214745998382568, -0.0009814947843551636, -0.0009415149688720703, -0.000901535153388977, -0.0008615553379058838, -0.0008215755224227905, -0.0007815957069396973, -0.000741615891456604, -0.0007016360759735107, -0.0006616562604904175, -0.0006216764450073242, -0.000581696629524231, -0.0005417168140411377, -0.0005017369985580444, -0.00046175718307495117, -0.0004217773675918579, -0.00038179755210876465, -0.0003418177366256714, -0.0003018379211425781, -0.00026185810565948486, -0.0002218782901763916, -0.00018189847469329834, -0.00014191865921020508, -0.00010193884372711182, -6.195902824401855e-05, -2.1979212760925293e-05, 1.800060272216797e-05, 5.798041820526123e-05, 9.796023368835449e-05, 0.00013794004917144775, 0.00017791986465454102, 0.00021789968013763428, 0.00025787949562072754, 0.0002978593111038208, 0.00033783912658691406, 0.0003778189420700073, 0.0004177987575531006, 0.00045777857303619385, 0.0004977583885192871, 0.0005377382040023804, 0.0005777180194854736, 0.0006176978349685669, 0.0006576776504516602, 0.0006976574659347534, 0.0007376372814178467, 0.0007776170969009399, 0.0008175969123840332, 0.0008575767278671265, 0.0008975565433502197, 0.000937536358833313, 0.0009775161743164062]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 0.0, 3.0, 8.0, 13.0, 12.0, 19.0, 43.0, 64.0, 198.0, 1125.0, 35239.0, 1000566.0, 10256.0, 714.0, 146.0, 54.0, 28.0, 12.0, 11.0, 7.0, 7.0, 5.0, 4.0, 4.0, 1.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.34375, -16.8238525390625, -16.303955078125, -15.7840576171875, -15.26416015625, -14.7442626953125, -14.224365234375, -13.7044677734375, -13.1845703125, -12.6646728515625, -12.144775390625, -11.6248779296875, -11.10498046875, -10.5850830078125, -10.065185546875, -9.5452880859375, -9.025390625, -8.5054931640625, -7.985595703125, -7.4656982421875, -6.94580078125, -6.4259033203125, -5.906005859375, -5.3861083984375, -4.8662109375, -4.3463134765625, -3.826416015625, -3.3065185546875, -2.78662109375, -2.2667236328125, -1.746826171875, -1.2269287109375, -0.70703125, -0.1871337890625, 0.332763671875, 0.8526611328125, 1.37255859375, 1.8924560546875, 2.412353515625, 2.9322509765625, 3.4521484375, 3.9720458984375, 4.491943359375, 5.0118408203125, 5.53173828125, 6.0516357421875, 6.571533203125, 7.0914306640625, 7.611328125, 8.1312255859375, 8.651123046875, 9.1710205078125, 9.69091796875, 10.2108154296875, 10.730712890625, 11.2506103515625, 11.7705078125, 12.2904052734375, 12.810302734375, 13.3302001953125, 13.85009765625, 14.3699951171875, 14.889892578125, 15.4097900390625, 15.9296875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 2.0, 6.0, 3.0, 8.0, 14.0, 9.0, 21.0, 21.0, 43.0, 66.0, 95.0, 145.0, 146.0, 134.0, 98.0, 54.0, 27.0, 24.0, 21.0, 18.0, 6.0, 7.0, 9.0, 4.0, 1.0, 6.0, 2.0, 1.0, 6.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.98828125, -3.86895751953125, -3.7496337890625, -3.63031005859375, -3.510986328125, -3.39166259765625, -3.2723388671875, -3.15301513671875, -3.03369140625, -2.91436767578125, -2.7950439453125, -2.67572021484375, -2.556396484375, -2.43707275390625, -2.3177490234375, -2.19842529296875, -2.0791015625, -1.95977783203125, -1.8404541015625, -1.72113037109375, -1.601806640625, -1.48248291015625, -1.3631591796875, -1.24383544921875, -1.12451171875, -1.00518798828125, -0.8858642578125, -0.76654052734375, -0.647216796875, -0.52789306640625, -0.4085693359375, -0.28924560546875, -0.169921875, -0.05059814453125, 0.0687255859375, 0.18804931640625, 0.307373046875, 0.42669677734375, 0.5460205078125, 0.66534423828125, 0.78466796875, 0.90399169921875, 1.0233154296875, 1.14263916015625, 1.261962890625, 1.38128662109375, 1.5006103515625, 1.61993408203125, 1.7392578125, 1.85858154296875, 1.9779052734375, 2.09722900390625, 2.216552734375, 2.33587646484375, 2.4552001953125, 2.57452392578125, 2.69384765625, 2.81317138671875, 2.9324951171875, 3.05181884765625, 3.171142578125, 3.29046630859375, 3.4097900390625, 3.52911376953125, 3.6484375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 12.0, 984.0, 19.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.61256408691406, -80.5682601928711, -63.52396011352539, -46.47966003417969, -29.43535614013672, -12.39105224609375, 4.6532440185546875, 21.697547912597656, 38.741851806640625, 55.786155700683594, 72.83045959472656, 89.874755859375, 106.91905975341797, 123.96336364746094, 141.00765991210938, 158.05197143554688, 175.0962677001953, 192.14056396484375, 209.18487548828125, 226.2291717529297, 243.27346801757812, 260.3177795410156, 277.362060546875, 294.4063720703125, 311.45068359375, 328.4949951171875, 345.5392761230469, 362.5835876464844, 379.6278991699219, 396.67218017578125, 413.71649169921875, 430.76080322265625, 447.80511474609375, 464.84942626953125, 481.8937072753906, 498.9380187988281, 515.9822998046875, 533.026611328125, 550.0709228515625, 567.115234375, 584.1595458984375, 601.203857421875, 618.2481689453125, 635.29248046875, 652.3367309570312, 669.3810424804688, 686.4253540039062, 703.4696655273438, 720.513916015625, 737.5582275390625, 754.6025390625, 771.6468505859375, 788.6911010742188, 805.7354125976562, 822.7797241210938, 839.8240356445312, 856.8683471679688, 873.9126586914062, 890.9569702148438, 908.001220703125, 925.0455322265625, 942.08984375, 959.1341552734375, 976.178466796875, 993.2227783203125]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 5.0, 9.0, 17.0, 25.0, 19.0, 29.0, 33.0, 42.0, 67.0, 73.0, 62.0, 60.0, 84.0, 70.0, 74.0, 47.0, 59.0, 62.0, 40.0, 38.0, 22.0, 23.0, 12.0, 10.0, 13.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.333789825439453, -18.358734130859375, -17.38368034362793, -16.40862464904785, -15.433568954467773, -14.458514213562012, -13.48345947265625, -12.508403778076172, -11.533348083496094, -10.558293342590332, -9.583237648010254, -8.608182907104492, -7.633127212524414, -6.658072471618652, -5.683017253875732, -4.7079620361328125, -3.732907295227051, -2.757852077484131, -1.7827969789505005, -0.8077418804168701, 0.1673133373260498, 1.1423683166503906, 2.1174235343933105, 3.0924787521362305, 4.06753396987915, 5.04258918762207, 6.01764440536499, 6.99269962310791, 7.967754364013672, 8.94281005859375, 9.917864799499512, 10.892919540405273, 11.867975234985352, 12.843029975891113, 13.818085670471191, 14.793140411376953, 15.768196105957031, 16.74325180053711, 17.718305587768555, 18.693361282348633, 19.66841697692871, 20.64347267150879, 21.618526458740234, 22.593582153320312, 23.56863784790039, 24.54369354248047, 25.518747329711914, 26.493803024291992, 27.468856811523438, 28.443912506103516, 29.41896629333496, 30.39402198791504, 31.369077682495117, 32.34413146972656, 33.31918716430664, 34.29424285888672, 35.2692985534668, 36.244354248046875, 37.21940994262695, 38.19446563720703, 39.169517517089844, 40.14457321166992, 41.11962890625, 42.09468460083008, 43.069740295410156]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 7.0, 15.0, 49.0, 233.0, 1018.0, 4182894.0, 9171.0, 627.0, 170.0, 61.0, 39.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.296875, -18.536376953125, -15.77587890625, -13.015380859375, -10.2548828125, -7.494384765625, -4.73388671875, -1.973388671875, 0.787109375, 3.547607421875, 6.30810546875, 9.068603515625, 11.8291015625, 14.589599609375, 17.35009765625, 20.110595703125, 22.87109375, 25.631591796875, 28.39208984375, 31.152587890625, 33.9130859375, 36.673583984375, 39.43408203125, 42.194580078125, 44.955078125, 47.715576171875, 50.47607421875, 53.236572265625, 55.9970703125, 58.757568359375, 61.51806640625, 64.278564453125, 67.0390625, 69.799560546875, 72.56005859375, 75.320556640625, 78.0810546875, 80.841552734375, 83.60205078125, 86.362548828125, 89.123046875, 91.883544921875, 94.64404296875, 97.404541015625, 100.1650390625, 102.925537109375, 105.68603515625, 108.446533203125, 111.20703125, 113.967529296875, 116.72802734375, 119.488525390625, 122.2490234375, 125.009521484375, 127.77001953125, 130.530517578125, 133.291015625, 136.051513671875, 138.81201171875, 141.572509765625, 144.3330078125, 147.093505859375, 149.85400390625, 152.614501953125, 155.375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 11.0, 25.0, 90.0, 196.0, 297.0, 242.0, 111.0, 37.0, 9.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.466552734375, -0.3841285705566406, -0.30170440673828125, -0.21928024291992188, -0.1368560791015625, -0.054431915283203125, 0.02799224853515625, 0.11041641235351562, 0.192840576171875, 0.2752647399902344, 0.35768890380859375, 0.4401130676269531, 0.5225372314453125, 0.6049613952636719, 0.6873855590820312, 0.7698097229003906, 0.85223388671875, 0.9346580505371094, 1.0170822143554688, 1.0995063781738281, 1.1819305419921875, 1.2643547058105469, 1.3467788696289062, 1.4292030334472656, 1.511627197265625, 1.5940513610839844, 1.6764755249023438, 1.7588996887207031, 1.8413238525390625, 1.9237480163574219, 2.0061721801757812, 2.0885963439941406, 2.1710205078125, 2.2534446716308594, 2.3358688354492188, 2.418292999267578, 2.5007171630859375, 2.583141326904297, 2.6655654907226562, 2.7479896545410156, 2.830413818359375, 2.9128379821777344, 2.9952621459960938, 3.077686309814453, 3.1601104736328125, 3.242534637451172, 3.3249588012695312, 3.4073829650878906, 3.48980712890625, 3.5722312927246094, 3.6546554565429688, 3.737079620361328, 3.8195037841796875, 3.901927947998047, 3.9843521118164062, 4.066776275634766, 4.149200439453125, 4.231624603271484, 4.314048767089844, 4.396472930908203, 4.4788970947265625, 4.561321258544922, 4.643745422363281, 4.726169586181641, 4.80859375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 13.0, 61.0, 141.0, 372.0, 4189814.0, 3187.0, 400.0, 211.0, 71.0, 18.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-78.25, -71.01953125, -63.7890625, -56.55859375, -49.328125, -42.09765625, -34.8671875, -27.63671875, -20.40625, -13.17578125, -5.9453125, 1.28515625, 8.515625, 15.74609375, 22.9765625, 30.20703125, 37.4375, 44.66796875, 51.8984375, 59.12890625, 66.359375, 73.58984375, 80.8203125, 88.05078125, 95.28125, 102.51171875, 109.7421875, 116.97265625, 124.203125, 131.43359375, 138.6640625, 145.89453125, 153.125, 160.35546875, 167.5859375, 174.81640625, 182.046875, 189.27734375, 196.5078125, 203.73828125, 210.96875, 218.19921875, 225.4296875, 232.66015625, 239.890625, 247.12109375, 254.3515625, 261.58203125, 268.8125, 276.04296875, 283.2734375, 290.50390625, 297.734375, 304.96484375, 312.1953125, 319.42578125, 326.65625, 333.88671875, 341.1171875, 348.34765625, 355.578125, 362.80859375, 370.0390625, 377.26953125, 384.5]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 54.0, 896.0, 3087.0, 41.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.8046875, -4.3282470703125, -3.851806640625, -3.3753662109375, -2.89892578125, -2.4224853515625, -1.946044921875, -1.4696044921875, -0.9931640625, -0.5167236328125, -0.040283203125, 0.4361572265625, 0.91259765625, 1.3890380859375, 1.865478515625, 2.3419189453125, 2.818359375, 3.2947998046875, 3.771240234375, 4.2476806640625, 4.72412109375, 5.2005615234375, 5.677001953125, 6.1534423828125, 6.6298828125, 7.1063232421875, 7.582763671875, 8.0592041015625, 8.53564453125, 9.0120849609375, 9.488525390625, 9.9649658203125, 10.44140625, 10.9178466796875, 11.394287109375, 11.8707275390625, 12.34716796875, 12.8236083984375, 13.300048828125, 13.7764892578125, 14.2529296875, 14.7293701171875, 15.205810546875, 15.6822509765625, 16.15869140625, 16.6351318359375, 17.111572265625, 17.5880126953125, 18.064453125, 18.5408935546875, 19.017333984375, 19.4937744140625, 19.97021484375, 20.4466552734375, 20.923095703125, 21.3995361328125, 21.8759765625, 22.3524169921875, 22.828857421875, 23.3052978515625, 23.78173828125, 24.2581787109375, 24.734619140625, 25.2110595703125, 25.6875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 20.0, 886.0, 99.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.11139678955078, -116.8646240234375, -107.61785888671875, -98.37109375, -89.12432098388672, -79.87754821777344, -70.63078308105469, -61.384010314941406, -52.137245178222656, -42.89047622680664, -33.643707275390625, -24.39693832397461, -15.150169372558594, -5.903400421142578, 3.3433685302734375, 12.590141296386719, 21.83690643310547, 31.083675384521484, 40.3304443359375, 49.577213287353516, 58.82398223876953, 68.07075500488281, 77.31752014160156, 86.56429290771484, 95.8110580444336, 105.05783081054688, 114.30459594726562, 123.55136108398438, 132.79812622070312, 142.04490661621094, 151.2916717529297, 160.5384521484375, 169.78521728515625, 179.031982421875, 188.27874755859375, 197.52552795410156, 206.7722930908203, 216.01905822753906, 225.26583862304688, 234.51260375976562, 243.75936889648438, 253.00613403320312, 262.2528991699219, 271.4996643066406, 280.7464599609375, 289.99322509765625, 299.239990234375, 308.48675537109375, 317.7335205078125, 326.98028564453125, 336.22705078125, 345.47381591796875, 354.7205810546875, 363.9673767089844, 373.2141418457031, 382.4609069824219, 391.7076721191406, 400.9544372558594, 410.2012023925781, 419.4479675292969, 428.69476318359375, 437.9415283203125, 447.18829345703125, 456.43505859375, 465.68182373046875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 10.0, 10.0, 33.0, 56.0, 84.0, 116.0, 154.0, 168.0, 141.0, 110.0, 57.0, 33.0, 19.0, 7.0, 4.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.08953857421875, -86.33087158203125, -83.57220458984375, -80.81353759765625, -78.05487060546875, -75.29619598388672, -72.53752899169922, -69.77886199951172, -67.02019500732422, -64.26152801513672, -61.50286102294922, -58.74419021606445, -55.98552322387695, -53.22685623168945, -50.46818542480469, -47.70951843261719, -44.95085144042969, -42.19218444824219, -39.43351745605469, -36.67484664916992, -33.91617965698242, -31.157512664794922, -28.39884376525879, -25.640174865722656, -22.881507873535156, -20.122840881347656, -17.364171981811523, -14.605504035949707, -11.84683609008789, -9.088168144226074, -6.329500198364258, -3.570831298828125, -0.8121566772460938, 1.9465112686157227, 4.705179214477539, 7.4638471603393555, 10.222515106201172, 12.981183052062988, 15.739850997924805, 18.498519897460938, 21.257186889648438, 24.015853881835938, 26.77452278137207, 29.533191680908203, 32.2918586730957, 35.0505256652832, 37.80919647216797, 40.56786346435547, 43.32653045654297, 46.08519744873047, 48.84386444091797, 51.602535247802734, 54.361202239990234, 57.119869232177734, 59.8785400390625, 62.63720703125, 65.3958740234375, 68.154541015625, 70.9132080078125, 73.671875, 76.4305419921875, 79.18921661376953, 81.94788360595703, 84.70655059814453, 87.46521759033203]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 7.0, 11.0, 15.0, 13.0, 45.0, 63.0, 107.0, 180.0, 539.0, 1854.0, 12163.0, 830102.0, 195637.0, 5826.0, 1201.0, 400.0, 150.0, 82.0, 52.0, 26.0, 27.0, 9.0, 13.0, 8.0, 5.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.375, -35.23291015625, -34.0908203125, -32.94873046875, -31.806640625, -30.66455078125, -29.5224609375, -28.38037109375, -27.23828125, -26.09619140625, -24.9541015625, -23.81201171875, -22.669921875, -21.52783203125, -20.3857421875, -19.24365234375, -18.1015625, -16.95947265625, -15.8173828125, -14.67529296875, -13.533203125, -12.39111328125, -11.2490234375, -10.10693359375, -8.96484375, -7.82275390625, -6.6806640625, -5.53857421875, -4.396484375, -3.25439453125, -2.1123046875, -0.97021484375, 0.171875, 1.31396484375, 2.4560546875, 3.59814453125, 4.740234375, 5.88232421875, 7.0244140625, 8.16650390625, 9.30859375, 10.45068359375, 11.5927734375, 12.73486328125, 13.876953125, 15.01904296875, 16.1611328125, 17.30322265625, 18.4453125, 19.58740234375, 20.7294921875, 21.87158203125, 23.013671875, 24.15576171875, 25.2978515625, 26.43994140625, 27.58203125, 28.72412109375, 29.8662109375, 31.00830078125, 32.150390625, 33.29248046875, 34.4345703125, 35.57666015625, 36.71875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 25.0, 40.0, 85.0, 111.0, 162.0, 179.0, 148.0, 114.0, 62.0, 41.0, 21.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.154296875, -3.000213623046875, -2.84613037109375, -2.692047119140625, -2.5379638671875, -2.383880615234375, -2.22979736328125, -2.075714111328125, -1.921630859375, -1.767547607421875, -1.61346435546875, -1.459381103515625, -1.3052978515625, -1.151214599609375, -0.99713134765625, -0.843048095703125, -0.68896484375, -0.534881591796875, -0.38079833984375, -0.226715087890625, -0.0726318359375, 0.081451416015625, 0.23553466796875, 0.389617919921875, 0.543701171875, 0.697784423828125, 0.85186767578125, 1.005950927734375, 1.1600341796875, 1.314117431640625, 1.46820068359375, 1.622283935546875, 1.7763671875, 1.930450439453125, 2.08453369140625, 2.238616943359375, 2.3927001953125, 2.546783447265625, 2.70086669921875, 2.854949951171875, 3.009033203125, 3.163116455078125, 3.31719970703125, 3.471282958984375, 3.6253662109375, 3.779449462890625, 3.93353271484375, 4.087615966796875, 4.24169921875, 4.395782470703125, 4.54986572265625, 4.703948974609375, 4.8580322265625, 5.012115478515625, 5.16619873046875, 5.320281982421875, 5.474365234375, 5.628448486328125, 5.78253173828125, 5.936614990234375, 6.0906982421875, 6.244781494140625, 6.39886474609375, 6.552947998046875, 6.70703125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 6.0, 7.0, 12.0, 9.0, 19.0, 16.0, 26.0, 23.0, 53.0, 85.0, 150.0, 481.0, 2912.0, 105797.0, 925639.0, 11703.0, 1003.0, 279.0, 105.0, 61.0, 30.0, 24.0, 16.0, 15.0, 19.0, 11.0, 12.0, 5.0, 5.0, 4.0, 3.0, 7.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.328125, -27.449462890625, -26.57080078125, -25.692138671875, -24.8134765625, -23.934814453125, -23.05615234375, -22.177490234375, -21.298828125, -20.420166015625, -19.54150390625, -18.662841796875, -17.7841796875, -16.905517578125, -16.02685546875, -15.148193359375, -14.26953125, -13.390869140625, -12.51220703125, -11.633544921875, -10.7548828125, -9.876220703125, -8.99755859375, -8.118896484375, -7.240234375, -6.361572265625, -5.48291015625, -4.604248046875, -3.7255859375, -2.846923828125, -1.96826171875, -1.089599609375, -0.2109375, 0.667724609375, 1.54638671875, 2.425048828125, 3.3037109375, 4.182373046875, 5.06103515625, 5.939697265625, 6.818359375, 7.697021484375, 8.57568359375, 9.454345703125, 10.3330078125, 11.211669921875, 12.09033203125, 12.968994140625, 13.84765625, 14.726318359375, 15.60498046875, 16.483642578125, 17.3623046875, 18.240966796875, 19.11962890625, 19.998291015625, 20.876953125, 21.755615234375, 22.63427734375, 23.512939453125, 24.3916015625, 25.270263671875, 26.14892578125, 27.027587890625, 27.90625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 6.0, 4.0, 5.0, 5.0, 7.0, 16.0, 15.0, 15.0, 26.0, 27.0, 25.0, 37.0, 32.0, 57.0, 51.0, 52.0, 56.0, 57.0, 62.0, 45.0, 56.0, 63.0, 57.0, 48.0, 39.0, 25.0, 12.0, 18.0, 21.0, 14.0, 12.0, 10.0, 11.0, 3.0, 2.0, 5.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.5546875, -8.29620361328125, -8.0377197265625, -7.77923583984375, -7.520751953125, -7.26226806640625, -7.0037841796875, -6.74530029296875, -6.48681640625, -6.22833251953125, -5.9698486328125, -5.71136474609375, -5.452880859375, -5.19439697265625, -4.9359130859375, -4.67742919921875, -4.4189453125, -4.16046142578125, -3.9019775390625, -3.64349365234375, -3.385009765625, -3.12652587890625, -2.8680419921875, -2.60955810546875, -2.35107421875, -2.09259033203125, -1.8341064453125, -1.57562255859375, -1.317138671875, -1.05865478515625, -0.8001708984375, -0.54168701171875, -0.283203125, -0.02471923828125, 0.2337646484375, 0.49224853515625, 0.750732421875, 1.00921630859375, 1.2677001953125, 1.52618408203125, 1.78466796875, 2.04315185546875, 2.3016357421875, 2.56011962890625, 2.818603515625, 3.07708740234375, 3.3355712890625, 3.59405517578125, 3.8525390625, 4.11102294921875, 4.3695068359375, 4.62799072265625, 4.886474609375, 5.14495849609375, 5.4034423828125, 5.66192626953125, 5.92041015625, 6.17889404296875, 6.4373779296875, 6.69586181640625, 6.954345703125, 7.21282958984375, 7.4713134765625, 7.72979736328125, 7.98828125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 5.0, 6.0, 6.0, 10.0, 8.0, 9.0, 25.0, 37.0, 35.0, 74.0, 129.0, 210.0, 439.0, 834.0, 2295.0, 8633.0, 100084.0, 872520.0, 53165.0, 6558.0, 1861.0, 768.0, 343.0, 189.0, 116.0, 62.0, 40.0, 20.0, 20.0, 17.0, 7.0, 9.0, 3.0, 2.0, 3.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4921875, -8.245361328125, -7.99853515625, -7.751708984375, -7.5048828125, -7.258056640625, -7.01123046875, -6.764404296875, -6.517578125, -6.270751953125, -6.02392578125, -5.777099609375, -5.5302734375, -5.283447265625, -5.03662109375, -4.789794921875, -4.54296875, -4.296142578125, -4.04931640625, -3.802490234375, -3.5556640625, -3.308837890625, -3.06201171875, -2.815185546875, -2.568359375, -2.321533203125, -2.07470703125, -1.827880859375, -1.5810546875, -1.334228515625, -1.08740234375, -0.840576171875, -0.59375, -0.346923828125, -0.10009765625, 0.146728515625, 0.3935546875, 0.640380859375, 0.88720703125, 1.134033203125, 1.380859375, 1.627685546875, 1.87451171875, 2.121337890625, 2.3681640625, 2.614990234375, 2.86181640625, 3.108642578125, 3.35546875, 3.602294921875, 3.84912109375, 4.095947265625, 4.3427734375, 4.589599609375, 4.83642578125, 5.083251953125, 5.330078125, 5.576904296875, 5.82373046875, 6.070556640625, 6.3173828125, 6.564208984375, 6.81103515625, 7.057861328125, 7.3046875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 6.0, 4.0, 7.0, 14.0, 12.0, 22.0, 19.0, 19.0, 25.0, 41.0, 45.0, 72.0, 151.0, 151.0, 111.0, 77.0, 55.0, 38.0, 32.0, 24.0, 20.0, 14.0, 12.0, 7.0, 8.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0011577606201171875, -0.0011267811059951782, -0.001095801591873169, -0.0010648220777511597, -0.0010338425636291504, -0.0010028630495071411, -0.0009718835353851318, -0.0009409040212631226, -0.0009099245071411133, -0.000878944993019104, -0.0008479654788970947, -0.0008169859647750854, -0.0007860064506530762, -0.0007550269365310669, -0.0007240474224090576, -0.0006930679082870483, -0.0006620883941650391, -0.0006311088800430298, -0.0006001293659210205, -0.0005691498517990112, -0.000538170337677002, -0.0005071908235549927, -0.0004762113094329834, -0.0004452317953109741, -0.00041425228118896484, -0.00038327276706695557, -0.0003522932529449463, -0.000321313738822937, -0.00029033422470092773, -0.00025935471057891846, -0.00022837519645690918, -0.0001973956823348999, -0.00016641616821289062, -0.00013543665409088135, -0.00010445713996887207, -7.347762584686279e-05, -4.2498111724853516e-05, -1.1518597602844238e-05, 1.946091651916504e-05, 5.0440430641174316e-05, 8.14199447631836e-05, 0.00011239945888519287, 0.00014337897300720215, 0.00017435848712921143, 0.0002053380012512207, 0.00023631751537322998, 0.00026729702949523926, 0.00029827654361724854, 0.0003292560577392578, 0.0003602355718612671, 0.00039121508598327637, 0.00042219460010528564, 0.0004531741142272949, 0.0004841536283493042, 0.0005151331424713135, 0.0005461126565933228, 0.000577092170715332, 0.0006080716848373413, 0.0006390511989593506, 0.0006700307130813599, 0.0007010102272033691, 0.0007319897413253784, 0.0007629692554473877, 0.000793948769569397, 0.0008249282836914062]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 10.0, 10.0, 15.0, 18.0, 39.0, 60.0, 116.0, 381.0, 1740.0, 44099.0, 990428.0, 10201.0, 940.0, 258.0, 101.0, 45.0, 31.0, 28.0, 13.0, 8.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.96875, -16.459716796875, -15.95068359375, -15.441650390625, -14.9326171875, -14.423583984375, -13.91455078125, -13.405517578125, -12.896484375, -12.387451171875, -11.87841796875, -11.369384765625, -10.8603515625, -10.351318359375, -9.84228515625, -9.333251953125, -8.82421875, -8.315185546875, -7.80615234375, -7.297119140625, -6.7880859375, -6.279052734375, -5.77001953125, -5.260986328125, -4.751953125, -4.242919921875, -3.73388671875, -3.224853515625, -2.7158203125, -2.206787109375, -1.69775390625, -1.188720703125, -0.6796875, -0.170654296875, 0.33837890625, 0.847412109375, 1.3564453125, 1.865478515625, 2.37451171875, 2.883544921875, 3.392578125, 3.901611328125, 4.41064453125, 4.919677734375, 5.4287109375, 5.937744140625, 6.44677734375, 6.955810546875, 7.46484375, 7.973876953125, 8.48291015625, 8.991943359375, 9.5009765625, 10.010009765625, 10.51904296875, 11.028076171875, 11.537109375, 12.046142578125, 12.55517578125, 13.064208984375, 13.5732421875, 14.082275390625, 14.59130859375, 15.100341796875, 15.609375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 14.0, 8.0, 14.0, 23.0, 34.0, 73.0, 89.0, 125.0, 125.0, 132.0, 110.0, 88.0, 60.0, 43.0, 20.0, 18.0, 7.0, 7.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28515625, -5.1077880859375, -4.930419921875, -4.7530517578125, -4.57568359375, -4.3983154296875, -4.220947265625, -4.0435791015625, -3.8662109375, -3.6888427734375, -3.511474609375, -3.3341064453125, -3.15673828125, -2.9793701171875, -2.802001953125, -2.6246337890625, -2.447265625, -2.2698974609375, -2.092529296875, -1.9151611328125, -1.73779296875, -1.5604248046875, -1.383056640625, -1.2056884765625, -1.0283203125, -0.8509521484375, -0.673583984375, -0.4962158203125, -0.31884765625, -0.1414794921875, 0.035888671875, 0.2132568359375, 0.390625, 0.5679931640625, 0.745361328125, 0.9227294921875, 1.10009765625, 1.2774658203125, 1.454833984375, 1.6322021484375, 1.8095703125, 1.9869384765625, 2.164306640625, 2.3416748046875, 2.51904296875, 2.6964111328125, 2.873779296875, 3.0511474609375, 3.228515625, 3.4058837890625, 3.583251953125, 3.7606201171875, 3.93798828125, 4.1153564453125, 4.292724609375, 4.4700927734375, 4.6474609375, 4.8248291015625, 5.002197265625, 5.1795654296875, 5.35693359375, 5.5343017578125, 5.711669921875, 5.8890380859375, 6.06640625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 10.0, 19.0, 77.0, 701.0, 185.0, 13.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-273.79705810546875, -266.55810546875, -259.31915283203125, -252.08021545410156, -244.8412628173828, -237.60232543945312, -230.36337280273438, -223.12442016601562, -215.88546752929688, -208.64651489257812, -201.40757751464844, -194.1686248779297, -186.92967224121094, -179.69073486328125, -172.4517822265625, -165.21282958984375, -157.973876953125, -150.73492431640625, -143.49598693847656, -136.2570343017578, -129.01808166503906, -121.77913665771484, -114.54019165039062, -107.30123901367188, -100.06230163574219, -92.82335662841797, -85.58440399169922, -78.345458984375, -71.10650634765625, -63.86756134033203, -56.62861251831055, -49.38966369628906, -42.15071105957031, -34.91176223754883, -27.672813415527344, -20.433866500854492, -13.194917678833008, -5.955970764160156, 1.2829780578613281, 8.521926879882812, 15.760875701904297, 22.99982452392578, 30.238773345947266, 37.47772216796875, 44.71666717529297, 51.95561599731445, 59.19456481933594, 66.43351745605469, 73.6724624633789, 80.91140747070312, 88.15036010742188, 95.3893051147461, 102.62825775146484, 109.86720275878906, 117.10615539550781, 124.34510040283203, 131.58404541015625, 138.822998046875, 146.0619354248047, 153.30088806152344, 160.5398406982422, 167.77877807617188, 175.01773071289062, 182.25668334960938, 189.49563598632812]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 6.0, 8.0, 2.0, 7.0, 16.0, 23.0, 21.0, 28.0, 41.0, 47.0, 36.0, 55.0, 58.0, 65.0, 64.0, 78.0, 58.0, 72.0, 61.0, 46.0, 49.0, 36.0, 30.0, 20.0, 22.0, 16.0, 8.0, 7.0, 7.0, 2.0, 6.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.408939361572266, -59.443477630615234, -57.4780158996582, -55.512550354003906, -53.547088623046875, -51.581626892089844, -49.61616516113281, -47.65070343017578, -45.68524169921875, -43.71977996826172, -41.75431823730469, -39.788856506347656, -37.82339096069336, -35.85792922973633, -33.8924674987793, -31.927005767822266, -29.96154022216797, -27.996078491210938, -26.030614852905273, -24.065153121948242, -22.099689483642578, -20.134227752685547, -18.168766021728516, -16.203304290771484, -14.23784065246582, -12.272377967834473, -10.306915283203125, -8.341453552246094, -6.375990867614746, -4.410528182983398, -2.445066452026367, -0.47960376739501953, 1.4858627319335938, 3.4513251781463623, 5.416787624359131, 7.38224983215332, 9.347712516784668, 11.313175201416016, 13.278636932373047, 15.244099617004395, 17.209562301635742, 19.175024032592773, 21.140487670898438, 23.10594940185547, 25.0714111328125, 27.036874771118164, 29.002336502075195, 30.96780014038086, 32.93326187133789, 34.89872360229492, 36.86418533325195, 38.82965087890625, 40.79511260986328, 42.76057434082031, 44.726036071777344, 46.691497802734375, 48.656959533691406, 50.62242126464844, 52.58788299560547, 54.5533447265625, 56.5188102722168, 58.48427200317383, 60.44973373413086, 62.41519546508789, 64.38066101074219]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 2.0, 7.0, 15.0, 47.0, 88.0, 276.0, 2120.0, 516301.0, 3670762.0, 3580.0, 597.0, 214.0, 136.0, 57.0, 37.0, 15.0, 9.0, 7.0, 5.0, 3.0, 3.0, 4.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.21875, -20.20751953125, -18.1962890625, -16.18505859375, -14.173828125, -12.16259765625, -10.1513671875, -8.14013671875, -6.12890625, -4.11767578125, -2.1064453125, -0.09521484375, 1.916015625, 3.92724609375, 5.9384765625, 7.94970703125, 9.9609375, 11.97216796875, 13.9833984375, 15.99462890625, 18.005859375, 20.01708984375, 22.0283203125, 24.03955078125, 26.05078125, 28.06201171875, 30.0732421875, 32.08447265625, 34.095703125, 36.10693359375, 38.1181640625, 40.12939453125, 42.140625, 44.15185546875, 46.1630859375, 48.17431640625, 50.185546875, 52.19677734375, 54.2080078125, 56.21923828125, 58.23046875, 60.24169921875, 62.2529296875, 64.26416015625, 66.275390625, 68.28662109375, 70.2978515625, 72.30908203125, 74.3203125, 76.33154296875, 78.3427734375, 80.35400390625, 82.365234375, 84.37646484375, 86.3876953125, 88.39892578125, 90.41015625, 92.42138671875, 94.4326171875, 96.44384765625, 98.455078125, 100.46630859375, 102.4775390625, 104.48876953125, 106.5]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 7.0, 16.0, 36.0, 59.0, 88.0, 121.0, 172.0, 158.0, 129.0, 93.0, 63.0, 30.0, 17.0, 10.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7333984375, -1.5904083251953125, -1.447418212890625, -1.3044281005859375, -1.16143798828125, -1.0184478759765625, -0.875457763671875, -0.7324676513671875, -0.5894775390625, -0.4464874267578125, -0.303497314453125, -0.1605072021484375, -0.01751708984375, 0.1254730224609375, 0.268463134765625, 0.4114532470703125, 0.554443359375, 0.6974334716796875, 0.840423583984375, 0.9834136962890625, 1.12640380859375, 1.2693939208984375, 1.412384033203125, 1.5553741455078125, 1.6983642578125, 1.8413543701171875, 1.984344482421875, 2.1273345947265625, 2.27032470703125, 2.4133148193359375, 2.556304931640625, 2.6992950439453125, 2.84228515625, 2.9852752685546875, 3.128265380859375, 3.2712554931640625, 3.41424560546875, 3.5572357177734375, 3.700225830078125, 3.8432159423828125, 3.9862060546875, 4.1291961669921875, 4.272186279296875, 4.4151763916015625, 4.55816650390625, 4.7011566162109375, 4.844146728515625, 4.9871368408203125, 5.130126953125, 5.2731170654296875, 5.416107177734375, 5.5590972900390625, 5.70208740234375, 5.8450775146484375, 5.988067626953125, 6.1310577392578125, 6.2740478515625, 6.4170379638671875, 6.560028076171875, 6.7030181884765625, 6.84600830078125, 6.9889984130859375, 7.131988525390625, 7.2749786376953125, 7.41796875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 11.0, 41.0, 117.0, 1242.0, 4191247.0, 1330.0, 215.0, 58.0, 16.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.75, -62.14453125, -55.5390625, -48.93359375, -42.328125, -35.72265625, -29.1171875, -22.51171875, -15.90625, -9.30078125, -2.6953125, 3.91015625, 10.515625, 17.12109375, 23.7265625, 30.33203125, 36.9375, 43.54296875, 50.1484375, 56.75390625, 63.359375, 69.96484375, 76.5703125, 83.17578125, 89.78125, 96.38671875, 102.9921875, 109.59765625, 116.203125, 122.80859375, 129.4140625, 136.01953125, 142.625, 149.23046875, 155.8359375, 162.44140625, 169.046875, 175.65234375, 182.2578125, 188.86328125, 195.46875, 202.07421875, 208.6796875, 215.28515625, 221.890625, 228.49609375, 235.1015625, 241.70703125, 248.3125, 254.91796875, 261.5234375, 268.12890625, 274.734375, 281.33984375, 287.9453125, 294.55078125, 301.15625, 307.76171875, 314.3671875, 320.97265625, 327.578125, 334.18359375, 340.7890625, 347.39453125, 354.0]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 7.0, 14.0, 43.0, 228.0, 3479.0, 245.0, 44.0, 16.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.10546875, -3.61944580078125, -3.1334228515625, -2.64739990234375, -2.161376953125, -1.67535400390625, -1.1893310546875, -0.70330810546875, -0.21728515625, 0.26873779296875, 0.7547607421875, 1.24078369140625, 1.726806640625, 2.21282958984375, 2.6988525390625, 3.18487548828125, 3.6708984375, 4.15692138671875, 4.6429443359375, 5.12896728515625, 5.614990234375, 6.10101318359375, 6.5870361328125, 7.07305908203125, 7.55908203125, 8.04510498046875, 8.5311279296875, 9.01715087890625, 9.503173828125, 9.98919677734375, 10.4752197265625, 10.96124267578125, 11.447265625, 11.93328857421875, 12.4193115234375, 12.90533447265625, 13.391357421875, 13.87738037109375, 14.3634033203125, 14.84942626953125, 15.33544921875, 15.82147216796875, 16.3074951171875, 16.79351806640625, 17.279541015625, 17.76556396484375, 18.2515869140625, 18.73760986328125, 19.2236328125, 19.70965576171875, 20.1956787109375, 20.68170166015625, 21.167724609375, 21.65374755859375, 22.1397705078125, 22.62579345703125, 23.11181640625, 23.59783935546875, 24.0838623046875, 24.56988525390625, 25.055908203125, 25.54193115234375, 26.0279541015625, 26.51397705078125, 27.0]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 41.0, 852.0, 91.0, 20.0, 4.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-203.90155029296875, -197.8068389892578, -191.7121124267578, -185.61740112304688, -179.52267456054688, -173.42796325683594, -167.333251953125, -161.238525390625, -155.14381408691406, -149.04910278320312, -142.95437622070312, -136.8596649169922, -130.7649383544922, -124.67022705078125, -118.57550811767578, -112.48078918457031, -106.38607025146484, -100.29135131835938, -94.1966323852539, -88.10191345214844, -82.0072021484375, -75.91248321533203, -69.81776428222656, -63.72304916381836, -57.62833023071289, -51.53361129760742, -45.43889617919922, -39.34417724609375, -33.24945831298828, -27.154743194580078, -21.06002426147461, -14.965309143066406, -8.870590209960938, -2.7758727073669434, 3.318844795227051, 9.413562774658203, 15.508279800415039, 21.602996826171875, 27.697715759277344, 33.79243087768555, 39.887149810791016, 45.981868743896484, 52.07658386230469, 58.171302795410156, 64.26602172851562, 70.36073303222656, 76.45545959472656, 82.5501708984375, 88.64488983154297, 94.73960876464844, 100.8343276977539, 106.92904663085938, 113.02375793457031, 119.11847686767578, 125.21319580078125, 131.3079071044922, 137.4026336669922, 143.49734497070312, 149.59207153320312, 155.68678283691406, 161.78150939941406, 167.876220703125, 173.970947265625, 180.06565856933594, 186.16036987304688]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 9.0, 17.0, 20.0, 34.0, 59.0, 83.0, 83.0, 102.0, 126.0, 101.0, 104.0, 78.0, 65.0, 50.0, 30.0, 16.0, 13.0, 8.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-56.70928192138672, -54.79673385620117, -52.88418960571289, -50.971641540527344, -49.0590934753418, -47.14654541015625, -45.23400115966797, -43.32145309448242, -41.408905029296875, -39.49635696411133, -37.58381271362305, -35.6712646484375, -33.75871658325195, -31.84617042541504, -29.933624267578125, -28.021076202392578, -26.108530044555664, -24.19598388671875, -22.283435821533203, -20.37088966369629, -18.458341598510742, -16.545795440673828, -14.633248329162598, -12.720701217651367, -10.808154106140137, -8.895606994628906, -6.983059883117676, -5.0705132484436035, -3.157966136932373, -1.2454195022583008, 0.6671276092529297, 2.57967472076416, 4.492221832275391, 6.404768943786621, 8.317316055297852, 10.229862213134766, 12.142410278320312, 14.054956436157227, 15.967503547668457, 17.880050659179688, 19.792598724365234, 21.70514488220215, 23.617692947387695, 25.53023910522461, 27.442787170410156, 29.35533332824707, 31.267879486083984, 33.18042755126953, 35.09297180175781, 37.00551986694336, 38.91806411743164, 40.83061218261719, 42.743160247802734, 44.65570831298828, 46.56825256347656, 48.48080062866211, 50.393348693847656, 52.3058967590332, 54.218441009521484, 56.13098907470703, 58.04353713989258, 59.956085205078125, 61.868629455566406, 63.78117752075195, 65.6937255859375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 6.0, 2.0, 7.0, 3.0, 9.0, 15.0, 19.0, 22.0, 24.0, 38.0, 39.0, 69.0, 99.0, 146.0, 177.0, 333.0, 529.0, 1174.0, 2931.0, 9923.0, 44340.0, 385940.0, 527991.0, 56352.0, 11981.0, 3468.0, 1316.0, 610.0, 292.0, 188.0, 140.0, 95.0, 75.0, 48.0, 36.0, 24.0, 21.0, 15.0, 13.0, 16.0, 9.0, 8.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.7734375, -14.312744140625, -13.85205078125, -13.391357421875, -12.9306640625, -12.469970703125, -12.00927734375, -11.548583984375, -11.087890625, -10.627197265625, -10.16650390625, -9.705810546875, -9.2451171875, -8.784423828125, -8.32373046875, -7.863037109375, -7.40234375, -6.941650390625, -6.48095703125, -6.020263671875, -5.5595703125, -5.098876953125, -4.63818359375, -4.177490234375, -3.716796875, -3.256103515625, -2.79541015625, -2.334716796875, -1.8740234375, -1.413330078125, -0.95263671875, -0.491943359375, -0.03125, 0.429443359375, 0.89013671875, 1.350830078125, 1.8115234375, 2.272216796875, 2.73291015625, 3.193603515625, 3.654296875, 4.114990234375, 4.57568359375, 5.036376953125, 5.4970703125, 5.957763671875, 6.41845703125, 6.879150390625, 7.33984375, 7.800537109375, 8.26123046875, 8.721923828125, 9.1826171875, 9.643310546875, 10.10400390625, 10.564697265625, 11.025390625, 11.486083984375, 11.94677734375, 12.407470703125, 12.8681640625, 13.328857421875, 13.78955078125, 14.250244140625, 14.7109375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 10.0, 11.0, 15.0, 38.0, 58.0, 81.0, 87.0, 114.0, 120.0, 111.0, 88.0, 75.0, 66.0, 51.0, 28.0, 20.0, 14.0, 9.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3359375, -3.1763916015625, -3.016845703125, -2.8572998046875, -2.69775390625, -2.5382080078125, -2.378662109375, -2.2191162109375, -2.0595703125, -1.9000244140625, -1.740478515625, -1.5809326171875, -1.42138671875, -1.2618408203125, -1.102294921875, -0.9427490234375, -0.783203125, -0.6236572265625, -0.464111328125, -0.3045654296875, -0.14501953125, 0.0145263671875, 0.174072265625, 0.3336181640625, 0.4931640625, 0.6527099609375, 0.812255859375, 0.9718017578125, 1.13134765625, 1.2908935546875, 1.450439453125, 1.6099853515625, 1.76953125, 1.9290771484375, 2.088623046875, 2.2481689453125, 2.40771484375, 2.5672607421875, 2.726806640625, 2.8863525390625, 3.0458984375, 3.2054443359375, 3.364990234375, 3.5245361328125, 3.68408203125, 3.8436279296875, 4.003173828125, 4.1627197265625, 4.322265625, 4.4818115234375, 4.641357421875, 4.8009033203125, 4.96044921875, 5.1199951171875, 5.279541015625, 5.4390869140625, 5.5986328125, 5.7581787109375, 5.917724609375, 6.0772705078125, 6.23681640625, 6.3963623046875, 6.555908203125, 6.7154541015625, 6.875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 9.0, 9.0, 16.0, 12.0, 11.0, 43.0, 52.0, 69.0, 146.0, 262.0, 864.0, 3599.0, 36671.0, 913472.0, 85722.0, 5641.0, 1191.0, 385.0, 138.0, 75.0, 42.0, 33.0, 19.0, 24.0, 15.0, 10.0, 7.0, 3.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.96875, -25.23974609375, -24.5107421875, -23.78173828125, -23.052734375, -22.32373046875, -21.5947265625, -20.86572265625, -20.13671875, -19.40771484375, -18.6787109375, -17.94970703125, -17.220703125, -16.49169921875, -15.7626953125, -15.03369140625, -14.3046875, -13.57568359375, -12.8466796875, -12.11767578125, -11.388671875, -10.65966796875, -9.9306640625, -9.20166015625, -8.47265625, -7.74365234375, -7.0146484375, -6.28564453125, -5.556640625, -4.82763671875, -4.0986328125, -3.36962890625, -2.640625, -1.91162109375, -1.1826171875, -0.45361328125, 0.275390625, 1.00439453125, 1.7333984375, 2.46240234375, 3.19140625, 3.92041015625, 4.6494140625, 5.37841796875, 6.107421875, 6.83642578125, 7.5654296875, 8.29443359375, 9.0234375, 9.75244140625, 10.4814453125, 11.21044921875, 11.939453125, 12.66845703125, 13.3974609375, 14.12646484375, 14.85546875, 15.58447265625, 16.3134765625, 17.04248046875, 17.771484375, 18.50048828125, 19.2294921875, 19.95849609375, 20.6875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 8.0, 4.0, 11.0, 3.0, 13.0, 11.0, 19.0, 27.0, 45.0, 44.0, 59.0, 52.0, 52.0, 62.0, 65.0, 61.0, 69.0, 69.0, 77.0, 41.0, 43.0, 34.0, 28.0, 24.0, 22.0, 14.0, 18.0, 8.0, 7.0, 1.0, 5.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.9921875, -14.5699462890625, -14.147705078125, -13.7254638671875, -13.30322265625, -12.8809814453125, -12.458740234375, -12.0364990234375, -11.6142578125, -11.1920166015625, -10.769775390625, -10.3475341796875, -9.92529296875, -9.5030517578125, -9.080810546875, -8.6585693359375, -8.236328125, -7.8140869140625, -7.391845703125, -6.9696044921875, -6.54736328125, -6.1251220703125, -5.702880859375, -5.2806396484375, -4.8583984375, -4.4361572265625, -4.013916015625, -3.5916748046875, -3.16943359375, -2.7471923828125, -2.324951171875, -1.9027099609375, -1.48046875, -1.0582275390625, -0.635986328125, -0.2137451171875, 0.20849609375, 0.6307373046875, 1.052978515625, 1.4752197265625, 1.8974609375, 2.3197021484375, 2.741943359375, 3.1641845703125, 3.58642578125, 4.0086669921875, 4.430908203125, 4.8531494140625, 5.275390625, 5.6976318359375, 6.119873046875, 6.5421142578125, 6.96435546875, 7.3865966796875, 7.808837890625, 8.2310791015625, 8.6533203125, 9.0755615234375, 9.497802734375, 9.9200439453125, 10.34228515625, 10.7645263671875, 11.186767578125, 11.6090087890625, 12.03125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 6.0, 10.0, 10.0, 18.0, 12.0, 18.0, 29.0, 41.0, 70.0, 93.0, 146.0, 250.0, 503.0, 1201.0, 3893.0, 21304.0, 432372.0, 555557.0, 25930.0, 4488.0, 1291.0, 578.0, 285.0, 136.0, 92.0, 61.0, 41.0, 23.0, 18.0, 26.0, 13.0, 9.0, 7.0, 3.0, 4.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.65625, -4.48406982421875, -4.3118896484375, -4.13970947265625, -3.967529296875, -3.79534912109375, -3.6231689453125, -3.45098876953125, -3.27880859375, -3.10662841796875, -2.9344482421875, -2.76226806640625, -2.590087890625, -2.41790771484375, -2.2457275390625, -2.07354736328125, -1.9013671875, -1.72918701171875, -1.5570068359375, -1.38482666015625, -1.212646484375, -1.04046630859375, -0.8682861328125, -0.69610595703125, -0.52392578125, -0.35174560546875, -0.1795654296875, -0.00738525390625, 0.164794921875, 0.33697509765625, 0.5091552734375, 0.68133544921875, 0.853515625, 1.02569580078125, 1.1978759765625, 1.37005615234375, 1.542236328125, 1.71441650390625, 1.8865966796875, 2.05877685546875, 2.23095703125, 2.40313720703125, 2.5753173828125, 2.74749755859375, 2.919677734375, 3.09185791015625, 3.2640380859375, 3.43621826171875, 3.6083984375, 3.78057861328125, 3.9527587890625, 4.12493896484375, 4.297119140625, 4.46929931640625, 4.6414794921875, 4.81365966796875, 4.98583984375, 5.15802001953125, 5.3302001953125, 5.50238037109375, 5.674560546875, 5.84674072265625, 6.0189208984375, 6.19110107421875, 6.36328125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 2.0, 3.0, 2.0, 10.0, 12.0, 18.0, 15.0, 22.0, 35.0, 33.0, 42.0, 58.0, 99.0, 109.0, 120.0, 78.0, 89.0, 59.0, 57.0, 32.0, 26.0, 16.0, 9.0, 12.0, 11.0, 11.0, 3.0, 8.0, 1.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005092620849609375, -0.000494837760925293, -0.00048041343688964844, -0.0004659891128540039, -0.0004515647888183594, -0.00043714046478271484, -0.0004227161407470703, -0.0004082918167114258, -0.00039386749267578125, -0.0003794431686401367, -0.0003650188446044922, -0.00035059452056884766, -0.0003361701965332031, -0.0003217458724975586, -0.00030732154846191406, -0.00029289722442626953, -0.000278472900390625, -0.00026404857635498047, -0.00024962425231933594, -0.0002351999282836914, -0.00022077560424804688, -0.00020635128021240234, -0.0001919269561767578, -0.00017750263214111328, -0.00016307830810546875, -0.00014865398406982422, -0.0001342296600341797, -0.00011980533599853516, -0.00010538101196289062, -9.09566879272461e-05, -7.653236389160156e-05, -6.210803985595703e-05, -4.76837158203125e-05, -3.325939178466797e-05, -1.8835067749023438e-05, -4.410743713378906e-06, 1.0013580322265625e-05, 2.4437904357910156e-05, 3.886222839355469e-05, 5.328655242919922e-05, 6.771087646484375e-05, 8.213520050048828e-05, 9.655952453613281e-05, 0.00011098384857177734, 0.00012540817260742188, 0.0001398324966430664, 0.00015425682067871094, 0.00016868114471435547, 0.00018310546875, 0.00019752979278564453, 0.00021195411682128906, 0.0002263784408569336, 0.00024080276489257812, 0.00025522708892822266, 0.0002696514129638672, 0.0002840757369995117, 0.00029850006103515625, 0.0003129243850708008, 0.0003273487091064453, 0.00034177303314208984, 0.0003561973571777344, 0.0003706216812133789, 0.00038504600524902344, 0.00039947032928466797, 0.0004138946533203125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 5.0, 5.0, 2.0, 8.0, 15.0, 12.0, 23.0, 18.0, 29.0, 39.0, 71.0, 126.0, 274.0, 704.0, 2657.0, 17233.0, 469817.0, 534461.0, 18901.0, 2748.0, 724.0, 316.0, 135.0, 67.0, 48.0, 26.0, 19.0, 7.0, 12.0, 11.0, 7.0, 7.0, 10.0, 8.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.44921875, -7.24798583984375, -7.0467529296875, -6.84552001953125, -6.644287109375, -6.44305419921875, -6.2418212890625, -6.04058837890625, -5.83935546875, -5.63812255859375, -5.4368896484375, -5.23565673828125, -5.034423828125, -4.83319091796875, -4.6319580078125, -4.43072509765625, -4.2294921875, -4.02825927734375, -3.8270263671875, -3.62579345703125, -3.424560546875, -3.22332763671875, -3.0220947265625, -2.82086181640625, -2.61962890625, -2.41839599609375, -2.2171630859375, -2.01593017578125, -1.814697265625, -1.61346435546875, -1.4122314453125, -1.21099853515625, -1.009765625, -0.80853271484375, -0.6072998046875, -0.40606689453125, -0.204833984375, -0.00360107421875, 0.1976318359375, 0.39886474609375, 0.60009765625, 0.80133056640625, 1.0025634765625, 1.20379638671875, 1.405029296875, 1.60626220703125, 1.8074951171875, 2.00872802734375, 2.2099609375, 2.41119384765625, 2.6124267578125, 2.81365966796875, 3.014892578125, 3.21612548828125, 3.4173583984375, 3.61859130859375, 3.81982421875, 4.02105712890625, 4.2222900390625, 4.42352294921875, 4.624755859375, 4.82598876953125, 5.0272216796875, 5.22845458984375, 5.4296875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 3.0, 7.0, 5.0, 3.0, 3.0, 6.0, 10.0, 8.0, 5.0, 8.0, 11.0, 11.0, 19.0, 14.0, 26.0, 36.0, 33.0, 56.0, 70.0, 76.0, 88.0, 98.0, 83.0, 72.0, 45.0, 44.0, 36.0, 22.0, 19.0, 13.0, 15.0, 4.0, 7.0, 7.0, 3.0, 6.0, 9.0, 6.0, 0.0, 7.0, 4.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0], "bins": [-3.400390625, -3.3106689453125, -3.220947265625, -3.1312255859375, -3.04150390625, -2.9517822265625, -2.862060546875, -2.7723388671875, -2.6826171875, -2.5928955078125, -2.503173828125, -2.4134521484375, -2.32373046875, -2.2340087890625, -2.144287109375, -2.0545654296875, -1.96484375, -1.8751220703125, -1.785400390625, -1.6956787109375, -1.60595703125, -1.5162353515625, -1.426513671875, -1.3367919921875, -1.2470703125, -1.1573486328125, -1.067626953125, -0.9779052734375, -0.88818359375, -0.7984619140625, -0.708740234375, -0.6190185546875, -0.529296875, -0.4395751953125, -0.349853515625, -0.2601318359375, -0.17041015625, -0.0806884765625, 0.009033203125, 0.0987548828125, 0.1884765625, 0.2781982421875, 0.367919921875, 0.4576416015625, 0.54736328125, 0.6370849609375, 0.726806640625, 0.8165283203125, 0.90625, 0.9959716796875, 1.085693359375, 1.1754150390625, 1.26513671875, 1.3548583984375, 1.444580078125, 1.5343017578125, 1.6240234375, 1.7137451171875, 1.803466796875, 1.8931884765625, 1.98291015625, 2.0726318359375, 2.162353515625, 2.2520751953125, 2.341796875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 1.0, 5.0, 13.0, 52.0, 316.0, 512.0, 95.0, 9.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-231.30599975585938, -225.97024536132812, -220.63449096679688, -215.29873657226562, -209.96298217773438, -204.62722778320312, -199.29147338867188, -193.95571899414062, -188.61996459960938, -183.28421020507812, -177.94845581054688, -172.61270141601562, -167.27694702148438, -161.94119262695312, -156.60543823242188, -151.26968383789062, -145.93392944335938, -140.59817504882812, -135.26242065429688, -129.92666625976562, -124.59091186523438, -119.25515747070312, -113.91940307617188, -108.58364868164062, -103.24789428710938, -97.91213989257812, -92.57638549804688, -87.24063110351562, -81.90487670898438, -76.56912231445312, -71.23336791992188, -65.89761352539062, -60.56184387207031, -55.22608947753906, -49.89033508300781, -44.55458068847656, -39.21882629394531, -33.88307189941406, -28.547317504882812, -23.211563110351562, -17.875808715820312, -12.540054321289062, -7.2042999267578125, -1.8685455322265625, 3.4672088623046875, 8.802963256835938, 14.138717651367188, 19.474472045898438, 24.810226440429688, 30.145980834960938, 35.48173522949219, 40.81748962402344, 46.15324401855469, 51.48899841308594, 56.82475280761719, 62.16050720214844, 67.49626159667969, 72.83201599121094, 78.16777038574219, 83.50352478027344, 88.83927917480469, 94.17503356933594, 99.51078796386719, 104.84654235839844, 110.18229675292969]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 7.0, 9.0, 12.0, 8.0, 21.0, 24.0, 23.0, 22.0, 32.0, 40.0, 48.0, 62.0, 64.0, 59.0, 48.0, 57.0, 54.0, 49.0, 53.0, 49.0, 45.0, 56.0, 27.0, 24.0, 27.0, 17.0, 13.0, 12.0, 5.0, 5.0, 6.0, 5.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-65.06925201416016, -63.02565002441406, -60.98204803466797, -58.938446044921875, -56.89484405517578, -54.85124206542969, -52.80763626098633, -50.764034271240234, -48.72043228149414, -46.67683029174805, -44.63322830200195, -42.58962631225586, -40.5460205078125, -38.502418518066406, -36.45881652832031, -34.41521453857422, -32.371612548828125, -30.32801055908203, -28.284408569335938, -26.24080467224121, -24.197202682495117, -22.153600692749023, -20.109996795654297, -18.066394805908203, -16.02279281616211, -13.979190826416016, -11.935587882995605, -9.891984939575195, -7.848382949829102, -5.804780960083008, -3.7611780166625977, -1.7175750732421875, 0.326019287109375, 2.369621753692627, 4.413224220275879, 6.456826686859131, 8.500429153442383, 10.544031143188477, 12.587634086608887, 14.631237030029297, 16.67483901977539, 18.718441009521484, 20.762042999267578, 22.805646896362305, 24.8492488861084, 26.892850875854492, 28.93645477294922, 30.980056762695312, 33.023658752441406, 35.0672607421875, 37.110862731933594, 39.15446472167969, 41.19806671142578, 43.241668701171875, 45.285274505615234, 47.32887649536133, 49.37247848510742, 51.416080474853516, 53.45968246459961, 55.5032844543457, 57.54689025878906, 59.590492248535156, 61.63409423828125, 63.677696228027344, 65.72129821777344]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 4.0, 10.0, 8.0, 14.0, 41.0, 67.0, 117.0, 239.0, 538.0, 1557.0, 6126.0, 67356.0, 4048589.0, 59529.0, 6538.0, 1893.0, 747.0, 395.0, 192.0, 92.0, 80.0, 32.0, 31.0, 22.0, 19.0, 12.0, 11.0, 4.0, 6.0, 1.0, 1.0, 5.0, 6.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5859375, -12.7618408203125, -11.937744140625, -11.1136474609375, -10.28955078125, -9.4654541015625, -8.641357421875, -7.8172607421875, -6.9931640625, -6.1690673828125, -5.344970703125, -4.5208740234375, -3.69677734375, -2.8726806640625, -2.048583984375, -1.2244873046875, -0.400390625, 0.4237060546875, 1.247802734375, 2.0718994140625, 2.89599609375, 3.7200927734375, 4.544189453125, 5.3682861328125, 6.1923828125, 7.0164794921875, 7.840576171875, 8.6646728515625, 9.48876953125, 10.3128662109375, 11.136962890625, 11.9610595703125, 12.78515625, 13.6092529296875, 14.433349609375, 15.2574462890625, 16.08154296875, 16.9056396484375, 17.729736328125, 18.5538330078125, 19.3779296875, 20.2020263671875, 21.026123046875, 21.8502197265625, 22.67431640625, 23.4984130859375, 24.322509765625, 25.1466064453125, 25.970703125, 26.7947998046875, 27.618896484375, 28.4429931640625, 29.26708984375, 30.0911865234375, 30.915283203125, 31.7393798828125, 32.5634765625, 33.3875732421875, 34.211669921875, 35.0357666015625, 35.85986328125, 36.6839599609375, 37.508056640625, 38.3321533203125, 39.15625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 8.0, 12.0, 17.0, 30.0, 49.0, 63.0, 74.0, 98.0, 106.0, 108.0, 82.0, 98.0, 84.0, 56.0, 49.0, 20.0, 20.0, 9.0, 10.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.66796875, -2.51568603515625, -2.3634033203125, -2.21112060546875, -2.058837890625, -1.90655517578125, -1.7542724609375, -1.60198974609375, -1.44970703125, -1.29742431640625, -1.1451416015625, -0.99285888671875, -0.840576171875, -0.68829345703125, -0.5360107421875, -0.38372802734375, -0.2314453125, -0.07916259765625, 0.0731201171875, 0.22540283203125, 0.377685546875, 0.52996826171875, 0.6822509765625, 0.83453369140625, 0.98681640625, 1.13909912109375, 1.2913818359375, 1.44366455078125, 1.595947265625, 1.74822998046875, 1.9005126953125, 2.05279541015625, 2.205078125, 2.35736083984375, 2.5096435546875, 2.66192626953125, 2.814208984375, 2.96649169921875, 3.1187744140625, 3.27105712890625, 3.42333984375, 3.57562255859375, 3.7279052734375, 3.88018798828125, 4.032470703125, 4.18475341796875, 4.3370361328125, 4.48931884765625, 4.6416015625, 4.79388427734375, 4.9461669921875, 5.09844970703125, 5.250732421875, 5.40301513671875, 5.5552978515625, 5.70758056640625, 5.85986328125, 6.01214599609375, 6.1644287109375, 6.31671142578125, 6.468994140625, 6.62127685546875, 6.7735595703125, 6.92584228515625, 7.078125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 8.0, 20.0, 42.0, 66.0, 109.0, 214.0, 1632.0, 4191722.0, 308.0, 83.0, 52.0, 17.0, 6.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-383.5, -375.86328125, -368.2265625, -360.58984375, -352.953125, -345.31640625, -337.6796875, -330.04296875, -322.40625, -314.76953125, -307.1328125, -299.49609375, -291.859375, -284.22265625, -276.5859375, -268.94921875, -261.3125, -253.67578125, -246.0390625, -238.40234375, -230.765625, -223.12890625, -215.4921875, -207.85546875, -200.21875, -192.58203125, -184.9453125, -177.30859375, -169.671875, -162.03515625, -154.3984375, -146.76171875, -139.125, -131.48828125, -123.8515625, -116.21484375, -108.578125, -100.94140625, -93.3046875, -85.66796875, -78.03125, -70.39453125, -62.7578125, -55.12109375, -47.484375, -39.84765625, -32.2109375, -24.57421875, -16.9375, -9.30078125, -1.6640625, 5.97265625, 13.609375, 21.24609375, 28.8828125, 36.51953125, 44.15625, 51.79296875, 59.4296875, 67.06640625, 74.703125, 82.33984375, 89.9765625, 97.61328125, 105.25]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 24.0, 3706.0, 347.0, 10.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.0, -57.8388671875, -56.677734375, -55.5166015625, -54.35546875, -53.1943359375, -52.033203125, -50.8720703125, -49.7109375, -48.5498046875, -47.388671875, -46.2275390625, -45.06640625, -43.9052734375, -42.744140625, -41.5830078125, -40.421875, -39.2607421875, -38.099609375, -36.9384765625, -35.77734375, -34.6162109375, -33.455078125, -32.2939453125, -31.1328125, -29.9716796875, -28.810546875, -27.6494140625, -26.48828125, -25.3271484375, -24.166015625, -23.0048828125, -21.84375, -20.6826171875, -19.521484375, -18.3603515625, -17.19921875, -16.0380859375, -14.876953125, -13.7158203125, -12.5546875, -11.3935546875, -10.232421875, -9.0712890625, -7.91015625, -6.7490234375, -5.587890625, -4.4267578125, -3.265625, -2.1044921875, -0.943359375, 0.2177734375, 1.37890625, 2.5400390625, 3.701171875, 4.8623046875, 6.0234375, 7.1845703125, 8.345703125, 9.5068359375, 10.66796875, 11.8291015625, 12.990234375, 14.1513671875, 15.3125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 972.0, 36.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-346.61688232421875, -333.13543701171875, -319.65399169921875, -306.17254638671875, -292.69110107421875, -279.20965576171875, -265.72821044921875, -252.24676513671875, -238.76531982421875, -225.28387451171875, -211.80242919921875, -198.32098388671875, -184.83953857421875, -171.35809326171875, -157.87664794921875, -144.39520263671875, -130.91375732421875, -117.43231201171875, -103.95086669921875, -90.46942138671875, -76.98797607421875, -63.50653076171875, -50.02508544921875, -36.54364013671875, -23.06219482421875, -9.58074951171875, 3.90069580078125, 17.38214111328125, 30.86358642578125, 44.34503173828125, 57.82647705078125, 71.30792236328125, 84.78936767578125, 98.27081298828125, 111.75225830078125, 125.23370361328125, 138.71514892578125, 152.19659423828125, 165.67803955078125, 179.15948486328125, 192.64093017578125, 206.12237548828125, 219.60382080078125, 233.08526611328125, 246.56671142578125, 260.04815673828125, 273.52960205078125, 287.01104736328125, 300.49249267578125, 313.97393798828125, 327.45538330078125, 340.93682861328125, 354.41827392578125, 367.89971923828125, 381.38116455078125, 394.86260986328125, 408.34405517578125, 421.82550048828125, 435.30694580078125, 448.78839111328125, 462.26983642578125, 475.75128173828125, 489.23272705078125, 502.71417236328125, 516.1956176757812]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 9.0, 40.0, 81.0, 132.0, 179.0, 181.0, 163.0, 112.0, 63.0, 25.0, 15.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-62.53354263305664, -60.15679931640625, -57.780052185058594, -55.4033088684082, -53.02656555175781, -50.649818420410156, -48.273075103759766, -45.896331787109375, -43.51958465576172, -41.14284133911133, -38.76609420776367, -36.38935089111328, -34.012603759765625, -31.635860443115234, -29.259117126464844, -26.88237190246582, -24.505626678466797, -22.128881454467773, -19.75213623046875, -17.37539291381836, -14.998647689819336, -12.621902465820312, -10.245158195495605, -7.868413925170898, -5.491668701171875, -3.1149239540100098, -0.7381792068481445, 1.6385655403137207, 4.015310287475586, 6.392055511474609, 8.768799781799316, 11.145544052124023, 13.522293090820312, 15.899038314819336, 18.27578353881836, 20.65252685546875, 23.029272079467773, 25.406017303466797, 27.782760620117188, 30.15950584411621, 32.536251068115234, 34.912994384765625, 37.28974151611328, 39.66648483276367, 42.04322814941406, 44.41997528076172, 46.79671859741211, 49.1734619140625, 51.550209045410156, 53.92695236206055, 56.3036994934082, 58.680442810058594, 61.05718994140625, 63.43393325805664, 65.81067657470703, 68.18742370605469, 70.56416320800781, 72.94091033935547, 75.3176498413086, 77.69439697265625, 80.0711441040039, 82.44789123535156, 84.82463073730469, 87.20137786865234, 89.578125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 12.0, 9.0, 14.0, 18.0, 21.0, 30.0, 51.0, 59.0, 98.0, 165.0, 265.0, 476.0, 979.0, 2233.0, 6742.0, 24100.0, 106864.0, 551959.0, 281935.0, 52179.0, 13087.0, 4016.0, 1496.0, 736.0, 372.0, 206.0, 126.0, 74.0, 80.0, 45.0, 34.0, 17.0, 19.0, 9.0, 9.0, 8.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.140625, -7.8365478515625, -7.532470703125, -7.2283935546875, -6.92431640625, -6.6202392578125, -6.316162109375, -6.0120849609375, -5.7080078125, -5.4039306640625, -5.099853515625, -4.7957763671875, -4.49169921875, -4.1876220703125, -3.883544921875, -3.5794677734375, -3.275390625, -2.9713134765625, -2.667236328125, -2.3631591796875, -2.05908203125, -1.7550048828125, -1.450927734375, -1.1468505859375, -0.8427734375, -0.5386962890625, -0.234619140625, 0.0694580078125, 0.37353515625, 0.6776123046875, 0.981689453125, 1.2857666015625, 1.58984375, 1.8939208984375, 2.197998046875, 2.5020751953125, 2.80615234375, 3.1102294921875, 3.414306640625, 3.7183837890625, 4.0224609375, 4.3265380859375, 4.630615234375, 4.9346923828125, 5.23876953125, 5.5428466796875, 5.846923828125, 6.1510009765625, 6.455078125, 6.7591552734375, 7.063232421875, 7.3673095703125, 7.67138671875, 7.9754638671875, 8.279541015625, 8.5836181640625, 8.8876953125, 9.1917724609375, 9.495849609375, 9.7999267578125, 10.10400390625, 10.4080810546875, 10.712158203125, 11.0162353515625, 11.3203125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 10.0, 12.0, 24.0, 19.0, 34.0, 45.0, 54.0, 67.0, 82.0, 73.0, 81.0, 77.0, 86.0, 58.0, 48.0, 62.0, 46.0, 30.0, 28.0, 23.0, 7.0, 16.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.423828125, -2.318939208984375, -2.21405029296875, -2.109161376953125, -2.0042724609375, -1.899383544921875, -1.79449462890625, -1.689605712890625, -1.584716796875, -1.479827880859375, -1.37493896484375, -1.270050048828125, -1.1651611328125, -1.060272216796875, -0.95538330078125, -0.850494384765625, -0.74560546875, -0.640716552734375, -0.53582763671875, -0.430938720703125, -0.3260498046875, -0.221160888671875, -0.11627197265625, -0.011383056640625, 0.093505859375, 0.198394775390625, 0.30328369140625, 0.408172607421875, 0.5130615234375, 0.617950439453125, 0.72283935546875, 0.827728271484375, 0.9326171875, 1.037506103515625, 1.14239501953125, 1.247283935546875, 1.3521728515625, 1.457061767578125, 1.56195068359375, 1.666839599609375, 1.771728515625, 1.876617431640625, 1.98150634765625, 2.086395263671875, 2.1912841796875, 2.296173095703125, 2.40106201171875, 2.505950927734375, 2.61083984375, 2.715728759765625, 2.82061767578125, 2.925506591796875, 3.0303955078125, 3.135284423828125, 3.24017333984375, 3.345062255859375, 3.449951171875, 3.554840087890625, 3.65972900390625, 3.764617919921875, 3.8695068359375, 3.974395751953125, 4.07928466796875, 4.184173583984375, 4.2890625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 5.0, 7.0, 12.0, 14.0, 25.0, 47.0, 57.0, 110.0, 173.0, 354.0, 795.0, 2547.0, 14953.0, 442865.0, 564847.0, 17396.0, 2678.0, 856.0, 346.0, 157.0, 89.0, 70.0, 38.0, 31.0, 21.0, 13.0, 10.0, 8.0, 4.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.359375, -15.754150390625, -15.14892578125, -14.543701171875, -13.9384765625, -13.333251953125, -12.72802734375, -12.122802734375, -11.517578125, -10.912353515625, -10.30712890625, -9.701904296875, -9.0966796875, -8.491455078125, -7.88623046875, -7.281005859375, -6.67578125, -6.070556640625, -5.46533203125, -4.860107421875, -4.2548828125, -3.649658203125, -3.04443359375, -2.439208984375, -1.833984375, -1.228759765625, -0.62353515625, -0.018310546875, 0.5869140625, 1.192138671875, 1.79736328125, 2.402587890625, 3.0078125, 3.613037109375, 4.21826171875, 4.823486328125, 5.4287109375, 6.033935546875, 6.63916015625, 7.244384765625, 7.849609375, 8.454833984375, 9.06005859375, 9.665283203125, 10.2705078125, 10.875732421875, 11.48095703125, 12.086181640625, 12.69140625, 13.296630859375, 13.90185546875, 14.507080078125, 15.1123046875, 15.717529296875, 16.32275390625, 16.927978515625, 17.533203125, 18.138427734375, 18.74365234375, 19.348876953125, 19.9541015625, 20.559326171875, 21.16455078125, 21.769775390625, 22.375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 6.0, 1.0, 3.0, 3.0, 6.0, 3.0, 6.0, 12.0, 16.0, 19.0, 34.0, 45.0, 34.0, 43.0, 47.0, 71.0, 66.0, 89.0, 69.0, 76.0, 83.0, 50.0, 36.0, 36.0, 31.0, 29.0, 18.0, 15.0, 17.0, 12.0, 8.0, 9.0, 6.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.015625, -10.5953369140625, -10.175048828125, -9.7547607421875, -9.33447265625, -8.9141845703125, -8.493896484375, -8.0736083984375, -7.6533203125, -7.2330322265625, -6.812744140625, -6.3924560546875, -5.97216796875, -5.5518798828125, -5.131591796875, -4.7113037109375, -4.291015625, -3.8707275390625, -3.450439453125, -3.0301513671875, -2.60986328125, -2.1895751953125, -1.769287109375, -1.3489990234375, -0.9287109375, -0.5084228515625, -0.088134765625, 0.3321533203125, 0.75244140625, 1.1727294921875, 1.593017578125, 2.0133056640625, 2.43359375, 2.8538818359375, 3.274169921875, 3.6944580078125, 4.11474609375, 4.5350341796875, 4.955322265625, 5.3756103515625, 5.7958984375, 6.2161865234375, 6.636474609375, 7.0567626953125, 7.47705078125, 7.8973388671875, 8.317626953125, 8.7379150390625, 9.158203125, 9.5784912109375, 9.998779296875, 10.4190673828125, 10.83935546875, 11.2596435546875, 11.679931640625, 12.1002197265625, 12.5205078125, 12.9407958984375, 13.361083984375, 13.7813720703125, 14.20166015625, 14.6219482421875, 15.042236328125, 15.4625244140625, 15.8828125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 9.0, 8.0, 19.0, 31.0, 82.0, 129.0, 273.0, 660.0, 1838.0, 7456.0, 102325.0, 898077.0, 31140.0, 4354.0, 1254.0, 453.0, 213.0, 102.0, 49.0, 29.0, 21.0, 13.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3203125, -8.097412109375, -7.87451171875, -7.651611328125, -7.4287109375, -7.205810546875, -6.98291015625, -6.760009765625, -6.537109375, -6.314208984375, -6.09130859375, -5.868408203125, -5.6455078125, -5.422607421875, -5.19970703125, -4.976806640625, -4.75390625, -4.531005859375, -4.30810546875, -4.085205078125, -3.8623046875, -3.639404296875, -3.41650390625, -3.193603515625, -2.970703125, -2.747802734375, -2.52490234375, -2.302001953125, -2.0791015625, -1.856201171875, -1.63330078125, -1.410400390625, -1.1875, -0.964599609375, -0.74169921875, -0.518798828125, -0.2958984375, -0.072998046875, 0.14990234375, 0.372802734375, 0.595703125, 0.818603515625, 1.04150390625, 1.264404296875, 1.4873046875, 1.710205078125, 1.93310546875, 2.156005859375, 2.37890625, 2.601806640625, 2.82470703125, 3.047607421875, 3.2705078125, 3.493408203125, 3.71630859375, 3.939208984375, 4.162109375, 4.385009765625, 4.60791015625, 4.830810546875, 5.0537109375, 5.276611328125, 5.49951171875, 5.722412109375, 5.9453125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 6.0, 10.0, 9.0, 5.0, 16.0, 17.0, 18.0, 21.0, 37.0, 55.0, 53.0, 63.0, 73.0, 81.0, 91.0, 79.0, 61.0, 67.0, 48.0, 40.0, 32.0, 27.0, 22.0, 16.0, 14.0, 13.0, 6.0, 11.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018393993377685547, -0.00017614476382732391, -0.00016834959387779236, -0.0001605544239282608, -0.00015275925397872925, -0.0001449640840291977, -0.00013716891407966614, -0.00012937374413013458, -0.00012157857418060303, -0.00011378340423107147, -0.00010598823428153992, -9.819306433200836e-05, -9.03978943824768e-05, -8.260272443294525e-05, -7.48075544834137e-05, -6.701238453388214e-05, -5.9217214584350586e-05, -5.142204463481903e-05, -4.3626874685287476e-05, -3.583170473575592e-05, -2.8036534786224365e-05, -2.024136483669281e-05, -1.2446194887161255e-05, -4.6510249376297e-06, 3.1441450119018555e-06, 1.093931496143341e-05, 1.8734484910964966e-05, 2.652965486049652e-05, 3.4324824810028076e-05, 4.211999475955963e-05, 4.9915164709091187e-05, 5.771033465862274e-05, 6.55055046081543e-05, 7.330067455768585e-05, 8.109584450721741e-05, 8.889101445674896e-05, 9.668618440628052e-05, 0.00010448135435581207, 0.00011227652430534363, 0.00012007169425487518, 0.00012786686420440674, 0.0001356620341539383, 0.00014345720410346985, 0.0001512523740530014, 0.00015904754400253296, 0.00016684271395206451, 0.00017463788390159607, 0.00018243305385112762, 0.00019022822380065918, 0.00019802339375019073, 0.0002058185636997223, 0.00021361373364925385, 0.0002214089035987854, 0.00022920407354831696, 0.0002369992434978485, 0.00024479441344738007, 0.0002525895833969116, 0.0002603847533464432, 0.00026817992329597473, 0.0002759750932455063, 0.00028377026319503784, 0.0002915654331445694, 0.00029936060309410095, 0.0003071557730436325, 0.00031495094299316406]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 9.0, 12.0, 17.0, 27.0, 26.0, 41.0, 78.0, 184.0, 409.0, 1156.0, 5008.0, 65718.0, 924766.0, 45246.0, 4143.0, 1008.0, 331.0, 161.0, 63.0, 40.0, 26.0, 23.0, 14.0, 7.0, 4.0, 8.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.05078125, -6.85186767578125, -6.6529541015625, -6.45404052734375, -6.255126953125, -6.05621337890625, -5.8572998046875, -5.65838623046875, -5.45947265625, -5.26055908203125, -5.0616455078125, -4.86273193359375, -4.663818359375, -4.46490478515625, -4.2659912109375, -4.06707763671875, -3.8681640625, -3.66925048828125, -3.4703369140625, -3.27142333984375, -3.072509765625, -2.87359619140625, -2.6746826171875, -2.47576904296875, -2.27685546875, -2.07794189453125, -1.8790283203125, -1.68011474609375, -1.481201171875, -1.28228759765625, -1.0833740234375, -0.88446044921875, -0.685546875, -0.48663330078125, -0.2877197265625, -0.08880615234375, 0.110107421875, 0.30902099609375, 0.5079345703125, 0.70684814453125, 0.90576171875, 1.10467529296875, 1.3035888671875, 1.50250244140625, 1.701416015625, 1.90032958984375, 2.0992431640625, 2.29815673828125, 2.4970703125, 2.69598388671875, 2.8948974609375, 3.09381103515625, 3.292724609375, 3.49163818359375, 3.6905517578125, 3.88946533203125, 4.08837890625, 4.28729248046875, 4.4862060546875, 4.68511962890625, 4.884033203125, 5.08294677734375, 5.2818603515625, 5.48077392578125, 5.6796875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 7.0, 7.0, 1.0, 10.0, 8.0, 13.0, 8.0, 24.0, 31.0, 42.0, 69.0, 105.0, 140.0, 147.0, 146.0, 71.0, 65.0, 36.0, 15.0, 13.0, 9.0, 8.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.77734375, -4.645355224609375, -4.51336669921875, -4.381378173828125, -4.2493896484375, -4.117401123046875, -3.98541259765625, -3.853424072265625, -3.721435546875, -3.589447021484375, -3.45745849609375, -3.325469970703125, -3.1934814453125, -3.061492919921875, -2.92950439453125, -2.797515869140625, -2.66552734375, -2.533538818359375, -2.40155029296875, -2.269561767578125, -2.1375732421875, -2.005584716796875, -1.87359619140625, -1.741607666015625, -1.609619140625, -1.477630615234375, -1.34564208984375, -1.213653564453125, -1.0816650390625, -0.949676513671875, -0.81768798828125, -0.685699462890625, -0.5537109375, -0.421722412109375, -0.28973388671875, -0.157745361328125, -0.0257568359375, 0.106231689453125, 0.23822021484375, 0.370208740234375, 0.502197265625, 0.634185791015625, 0.76617431640625, 0.898162841796875, 1.0301513671875, 1.162139892578125, 1.29412841796875, 1.426116943359375, 1.55810546875, 1.690093994140625, 1.82208251953125, 1.954071044921875, 2.0860595703125, 2.218048095703125, 2.35003662109375, 2.482025146484375, 2.614013671875, 2.746002197265625, 2.87799072265625, 3.009979248046875, 3.1419677734375, 3.273956298828125, 3.40594482421875, 3.537933349609375, 3.669921875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 13.0, 53.0, 162.0, 506.0, 196.0, 57.0, 12.0, 10.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.84048461914062, -80.01313781738281, -75.185791015625, -70.35844421386719, -65.53109741210938, -60.70375061035156, -55.876407623291016, -51.0490608215332, -46.22171401977539, -41.39436721801758, -36.567020416259766, -31.739675521850586, -26.912328720092773, -22.08498191833496, -17.25763702392578, -12.430290222167969, -7.602943420410156, -2.775597095489502, 2.0517492294311523, 6.879095077514648, 11.706441879272461, 16.533788681030273, 21.361133575439453, 26.188480377197266, 31.015827178955078, 35.84317398071289, 40.6705207824707, 45.49786376953125, 50.32521057128906, 55.152557373046875, 59.97990417480469, 64.8072509765625, 69.63459777832031, 74.46194458007812, 79.28929138183594, 84.11663818359375, 88.94398498535156, 93.77133178710938, 98.59867858886719, 103.426025390625, 108.25337219238281, 113.08071899414062, 117.90806579589844, 122.73541259765625, 127.56275939941406, 132.39010620117188, 137.2174530029297, 142.0447998046875, 146.87213134765625, 151.69947814941406, 156.52682495117188, 161.3541717529297, 166.1815185546875, 171.0088653564453, 175.83621215820312, 180.66355895996094, 185.49090576171875, 190.31825256347656, 195.14559936523438, 199.9729461669922, 204.80029296875, 209.6276397705078, 214.45498657226562, 219.28233337402344, 224.10968017578125]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 4.0, 2.0, 3.0, 7.0, 7.0, 10.0, 8.0, 11.0, 15.0, 17.0, 9.0, 14.0, 24.0, 32.0, 38.0, 36.0, 43.0, 38.0, 63.0, 55.0, 60.0, 53.0, 55.0, 51.0, 39.0, 49.0, 40.0, 40.0, 31.0, 24.0, 20.0, 21.0, 17.0, 16.0, 16.0, 6.0, 5.0, 13.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-60.48450469970703, -58.53110122680664, -56.57769775390625, -54.624290466308594, -52.6708869934082, -50.71748352050781, -48.76408004760742, -46.81067657470703, -44.85727310180664, -42.90386962890625, -40.95046615600586, -38.99706268310547, -37.04365539550781, -35.09025192260742, -33.13684844970703, -31.18344497680664, -29.230039596557617, -27.276636123657227, -25.323230743408203, -23.369827270507812, -21.416423797607422, -19.46302032470703, -17.509614944458008, -15.556211471557617, -13.60280704498291, -11.649402618408203, -9.695999145507812, -7.7425947189331055, -5.789190769195557, -3.835786819458008, -1.8823823928833008, 0.07102108001708984, 2.024425506591797, 3.9778294563293457, 5.9312334060668945, 7.884637832641602, 9.838041305541992, 11.7914457321167, 13.744850158691406, 15.698253631591797, 17.651657104492188, 19.605060577392578, 21.5584659576416, 23.511869430541992, 25.465272903442383, 27.418678283691406, 29.372081756591797, 31.325485229492188, 33.278892517089844, 35.232295989990234, 37.185699462890625, 39.13910675048828, 41.09251022338867, 43.04591369628906, 44.99931716918945, 46.952720642089844, 48.906124114990234, 50.859527587890625, 52.812931060791016, 54.766334533691406, 56.71974182128906, 58.67314529418945, 60.626548767089844, 62.579952239990234, 64.53335571289062]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 7.0, 13.0, 12.0, 18.0, 28.0, 64.0, 94.0, 149.0, 302.0, 657.0, 1469.0, 3921.0, 15270.0, 135312.0, 3897882.0, 117188.0, 14699.0, 3922.0, 1573.0, 728.0, 392.0, 222.0, 133.0, 71.0, 43.0, 29.0, 27.0, 19.0, 11.0, 8.0, 5.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6171875, -13.9669189453125, -13.316650390625, -12.6663818359375, -12.01611328125, -11.3658447265625, -10.715576171875, -10.0653076171875, -9.4150390625, -8.7647705078125, -8.114501953125, -7.4642333984375, -6.81396484375, -6.1636962890625, -5.513427734375, -4.8631591796875, -4.212890625, -3.5626220703125, -2.912353515625, -2.2620849609375, -1.61181640625, -0.9615478515625, -0.311279296875, 0.3389892578125, 0.9892578125, 1.6395263671875, 2.289794921875, 2.9400634765625, 3.59033203125, 4.2406005859375, 4.890869140625, 5.5411376953125, 6.19140625, 6.8416748046875, 7.491943359375, 8.1422119140625, 8.79248046875, 9.4427490234375, 10.093017578125, 10.7432861328125, 11.3935546875, 12.0438232421875, 12.694091796875, 13.3443603515625, 13.99462890625, 14.6448974609375, 15.295166015625, 15.9454345703125, 16.595703125, 17.2459716796875, 17.896240234375, 18.5465087890625, 19.19677734375, 19.8470458984375, 20.497314453125, 21.1475830078125, 21.7978515625, 22.4481201171875, 23.098388671875, 23.7486572265625, 24.39892578125, 25.0491943359375, 25.699462890625, 26.3497314453125, 27.0]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 8.0, 10.0, 13.0, 32.0, 32.0, 43.0, 50.0, 48.0, 54.0, 60.0, 87.0, 72.0, 69.0, 82.0, 45.0, 63.0, 50.0, 52.0, 28.0, 29.0, 15.0, 13.0, 9.0, 14.0, 9.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.119140625, -2.017730712890625, -1.91632080078125, -1.814910888671875, -1.7135009765625, -1.612091064453125, -1.51068115234375, -1.409271240234375, -1.307861328125, -1.206451416015625, -1.10504150390625, -1.003631591796875, -0.9022216796875, -0.800811767578125, -0.69940185546875, -0.597991943359375, -0.49658203125, -0.395172119140625, -0.29376220703125, -0.192352294921875, -0.0909423828125, 0.010467529296875, 0.11187744140625, 0.213287353515625, 0.314697265625, 0.416107177734375, 0.51751708984375, 0.618927001953125, 0.7203369140625, 0.821746826171875, 0.92315673828125, 1.024566650390625, 1.1259765625, 1.227386474609375, 1.32879638671875, 1.430206298828125, 1.5316162109375, 1.633026123046875, 1.73443603515625, 1.835845947265625, 1.937255859375, 2.038665771484375, 2.14007568359375, 2.241485595703125, 2.3428955078125, 2.444305419921875, 2.54571533203125, 2.647125244140625, 2.74853515625, 2.849945068359375, 2.95135498046875, 3.052764892578125, 3.1541748046875, 3.255584716796875, 3.35699462890625, 3.458404541015625, 3.559814453125, 3.661224365234375, 3.76263427734375, 3.864044189453125, 3.9654541015625, 4.066864013671875, 4.16827392578125, 4.269683837890625, 4.37109375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 2.0, 8.0, 4.0, 11.0, 9.0, 21.0, 16.0, 57.0, 65.0, 114.0, 246.0, 569.0, 1161.0, 3367.0, 14450.0, 617382.0, 3531219.0, 19437.0, 3764.0, 1290.0, 508.0, 252.0, 110.0, 73.0, 49.0, 30.0, 22.0, 11.0, 9.0, 3.0, 3.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-25.484375, -24.832275390625, -24.18017578125, -23.528076171875, -22.8759765625, -22.223876953125, -21.57177734375, -20.919677734375, -20.267578125, -19.615478515625, -18.96337890625, -18.311279296875, -17.6591796875, -17.007080078125, -16.35498046875, -15.702880859375, -15.05078125, -14.398681640625, -13.74658203125, -13.094482421875, -12.4423828125, -11.790283203125, -11.13818359375, -10.486083984375, -9.833984375, -9.181884765625, -8.52978515625, -7.877685546875, -7.2255859375, -6.573486328125, -5.92138671875, -5.269287109375, -4.6171875, -3.965087890625, -3.31298828125, -2.660888671875, -2.0087890625, -1.356689453125, -0.70458984375, -0.052490234375, 0.599609375, 1.251708984375, 1.90380859375, 2.555908203125, 3.2080078125, 3.860107421875, 4.51220703125, 5.164306640625, 5.81640625, 6.468505859375, 7.12060546875, 7.772705078125, 8.4248046875, 9.076904296875, 9.72900390625, 10.381103515625, 11.033203125, 11.685302734375, 12.33740234375, 12.989501953125, 13.6416015625, 14.293701171875, 14.94580078125, 15.597900390625, 16.25]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 6.0, 5.0, 4.0, 10.0, 12.0, 19.0, 31.0, 75.0, 217.0, 1259.0, 1955.0, 255.0, 100.0, 52.0, 22.0, 20.0, 9.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.015625, -8.734619140625, -8.45361328125, -8.172607421875, -7.8916015625, -7.610595703125, -7.32958984375, -7.048583984375, -6.767578125, -6.486572265625, -6.20556640625, -5.924560546875, -5.6435546875, -5.362548828125, -5.08154296875, -4.800537109375, -4.51953125, -4.238525390625, -3.95751953125, -3.676513671875, -3.3955078125, -3.114501953125, -2.83349609375, -2.552490234375, -2.271484375, -1.990478515625, -1.70947265625, -1.428466796875, -1.1474609375, -0.866455078125, -0.58544921875, -0.304443359375, -0.0234375, 0.257568359375, 0.53857421875, 0.819580078125, 1.1005859375, 1.381591796875, 1.66259765625, 1.943603515625, 2.224609375, 2.505615234375, 2.78662109375, 3.067626953125, 3.3486328125, 3.629638671875, 3.91064453125, 4.191650390625, 4.47265625, 4.753662109375, 5.03466796875, 5.315673828125, 5.5966796875, 5.877685546875, 6.15869140625, 6.439697265625, 6.720703125, 7.001708984375, 7.28271484375, 7.563720703125, 7.8447265625, 8.125732421875, 8.40673828125, 8.687744140625, 8.96875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 14.0, 52.0, 460.0, 440.0, 36.0, 9.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.74054718017578, -115.43753051757812, -112.13451385498047, -108.83149719238281, -105.52848815917969, -102.2254638671875, -98.92245483398438, -95.61943817138672, -92.31642150878906, -89.0134048461914, -85.71038818359375, -82.4073715209961, -79.10435485839844, -75.80134582519531, -72.49832916259766, -69.1953125, -65.89229583740234, -62.58927917480469, -59.28626251220703, -55.98324966430664, -52.680233001708984, -49.37721633911133, -46.07420349121094, -42.77118682861328, -39.468170166015625, -36.16515350341797, -32.86213684082031, -29.559123992919922, -26.256107330322266, -22.95309066772461, -19.650075912475586, -16.347061157226562, -13.044036865234375, -9.741021156311035, -6.438005447387695, -3.1349897384643555, 0.16802597045898438, 3.4710426330566406, 6.774057388305664, 10.077072143554688, 13.380088806152344, 16.68310546875, 19.986120223999023, 23.289134979248047, 26.592151641845703, 29.89516830444336, 33.19818115234375, 36.501197814941406, 39.80421447753906, 43.10723114013672, 46.410247802734375, 49.713260650634766, 53.01627731323242, 56.31929397583008, 59.62230682373047, 62.925323486328125, 66.22834014892578, 69.53135681152344, 72.8343734741211, 76.13739013671875, 79.44039916992188, 82.74342346191406, 86.04643249511719, 89.34944915771484, 92.6524658203125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 2.0, 4.0, 1.0, 4.0, 8.0, 13.0, 16.0, 29.0, 35.0, 45.0, 57.0, 46.0, 70.0, 63.0, 84.0, 69.0, 71.0, 71.0, 62.0, 56.0, 30.0, 52.0, 26.0, 22.0, 16.0, 19.0, 15.0, 4.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.586833953857422, -24.681041717529297, -23.775249481201172, -22.869457244873047, -21.963665008544922, -21.057872772216797, -20.152080535888672, -19.246288299560547, -18.340496063232422, -17.434703826904297, -16.528911590576172, -15.623119354248047, -14.717327117919922, -13.811534881591797, -12.905741691589355, -11.99994945526123, -11.094156265258789, -10.188364028930664, -9.282571792602539, -8.376779556274414, -7.470986843109131, -6.565194606781006, -5.659401893615723, -4.753609657287598, -3.8478174209594727, -2.9420251846313477, -2.0362327098846436, -1.1304402351379395, -0.22464799880981445, 0.6811442375183105, 1.5869369506835938, 2.4927291870117188, 3.3985214233398438, 4.304313659667969, 5.210105895996094, 6.115898609161377, 7.021690845489502, 7.927483081817627, 8.83327579498291, 9.739068031311035, 10.64486026763916, 11.550652503967285, 12.45644474029541, 13.362237930297852, 14.268030166625977, 15.173822402954102, 16.079614639282227, 16.98540687561035, 17.891199111938477, 18.7969913482666, 19.702783584594727, 20.60857582092285, 21.514368057250977, 22.4201602935791, 23.32595443725586, 24.231746673583984, 25.13753890991211, 26.043331146240234, 26.94912338256836, 27.854915618896484, 28.76070785522461, 29.666500091552734, 30.57229232788086, 31.478084564208984, 32.38387680053711]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 12.0, 5.0, 4.0, 7.0, 15.0, 34.0, 29.0, 49.0, 76.0, 100.0, 152.0, 230.0, 417.0, 745.0, 1484.0, 3546.0, 9700.0, 30915.0, 117471.0, 508676.0, 282653.0, 62920.0, 18145.0, 6213.0, 2362.0, 1101.0, 574.0, 287.0, 210.0, 113.0, 82.0, 73.0, 34.0, 35.0, 20.0, 24.0, 11.0, 11.0, 7.0, 2.0, 9.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.203125, -8.9306640625, -8.658203125, -8.3857421875, -8.11328125, -7.8408203125, -7.568359375, -7.2958984375, -7.0234375, -6.7509765625, -6.478515625, -6.2060546875, -5.93359375, -5.6611328125, -5.388671875, -5.1162109375, -4.84375, -4.5712890625, -4.298828125, -4.0263671875, -3.75390625, -3.4814453125, -3.208984375, -2.9365234375, -2.6640625, -2.3916015625, -2.119140625, -1.8466796875, -1.57421875, -1.3017578125, -1.029296875, -0.7568359375, -0.484375, -0.2119140625, 0.060546875, 0.3330078125, 0.60546875, 0.8779296875, 1.150390625, 1.4228515625, 1.6953125, 1.9677734375, 2.240234375, 2.5126953125, 2.78515625, 3.0576171875, 3.330078125, 3.6025390625, 3.875, 4.1474609375, 4.419921875, 4.6923828125, 4.96484375, 5.2373046875, 5.509765625, 5.7822265625, 6.0546875, 6.3271484375, 6.599609375, 6.8720703125, 7.14453125, 7.4169921875, 7.689453125, 7.9619140625, 8.234375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 4.0, 3.0, 5.0, 6.0, 11.0, 17.0, 20.0, 34.0, 32.0, 37.0, 54.0, 59.0, 73.0, 66.0, 74.0, 69.0, 71.0, 67.0, 58.0, 51.0, 54.0, 38.0, 29.0, 21.0, 13.0, 11.0, 7.0, 7.0, 4.0, 9.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.47265625, -2.3785400390625, -2.284423828125, -2.1903076171875, -2.09619140625, -2.0020751953125, -1.907958984375, -1.8138427734375, -1.7197265625, -1.6256103515625, -1.531494140625, -1.4373779296875, -1.34326171875, -1.2491455078125, -1.155029296875, -1.0609130859375, -0.966796875, -0.8726806640625, -0.778564453125, -0.6844482421875, -0.59033203125, -0.4962158203125, -0.402099609375, -0.3079833984375, -0.2138671875, -0.1197509765625, -0.025634765625, 0.0684814453125, 0.16259765625, 0.2567138671875, 0.350830078125, 0.4449462890625, 0.5390625, 0.6331787109375, 0.727294921875, 0.8214111328125, 0.91552734375, 1.0096435546875, 1.103759765625, 1.1978759765625, 1.2919921875, 1.3861083984375, 1.480224609375, 1.5743408203125, 1.66845703125, 1.7625732421875, 1.856689453125, 1.9508056640625, 2.044921875, 2.1390380859375, 2.233154296875, 2.3272705078125, 2.42138671875, 2.5155029296875, 2.609619140625, 2.7037353515625, 2.7978515625, 2.8919677734375, 2.986083984375, 3.0802001953125, 3.17431640625, 3.2684326171875, 3.362548828125, 3.4566650390625, 3.55078125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 10.0, 8.0, 10.0, 13.0, 12.0, 14.0, 34.0, 40.0, 46.0, 64.0, 101.0, 158.0, 245.0, 372.0, 661.0, 1185.0, 2466.0, 5843.0, 16892.0, 56187.0, 247151.0, 529241.0, 133951.0, 34609.0, 11159.0, 4077.0, 1717.0, 865.0, 473.0, 292.0, 206.0, 126.0, 83.0, 65.0, 48.0, 28.0, 32.0, 18.0, 16.0, 12.0, 7.0, 2.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.79296875, -6.58270263671875, -6.3724365234375, -6.16217041015625, -5.951904296875, -5.74163818359375, -5.5313720703125, -5.32110595703125, -5.11083984375, -4.90057373046875, -4.6903076171875, -4.48004150390625, -4.269775390625, -4.05950927734375, -3.8492431640625, -3.63897705078125, -3.4287109375, -3.21844482421875, -3.0081787109375, -2.79791259765625, -2.587646484375, -2.37738037109375, -2.1671142578125, -1.95684814453125, -1.74658203125, -1.53631591796875, -1.3260498046875, -1.11578369140625, -0.905517578125, -0.69525146484375, -0.4849853515625, -0.27471923828125, -0.064453125, 0.14581298828125, 0.3560791015625, 0.56634521484375, 0.776611328125, 0.98687744140625, 1.1971435546875, 1.40740966796875, 1.61767578125, 1.82794189453125, 2.0382080078125, 2.24847412109375, 2.458740234375, 2.66900634765625, 2.8792724609375, 3.08953857421875, 3.2998046875, 3.51007080078125, 3.7203369140625, 3.93060302734375, 4.140869140625, 4.35113525390625, 4.5614013671875, 4.77166748046875, 4.98193359375, 5.19219970703125, 5.4024658203125, 5.61273193359375, 5.822998046875, 6.03326416015625, 6.2435302734375, 6.45379638671875, 6.6640625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 7.0, 6.0, 11.0, 15.0, 18.0, 27.0, 28.0, 27.0, 23.0, 38.0, 30.0, 39.0, 57.0, 40.0, 46.0, 39.0, 58.0, 49.0, 48.0, 50.0, 43.0, 44.0, 39.0, 35.0, 24.0, 27.0, 26.0, 12.0, 22.0, 17.0, 10.0, 11.0, 12.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.578125, -7.294921875, -7.01171875, -6.728515625, -6.4453125, -6.162109375, -5.87890625, -5.595703125, -5.3125, -5.029296875, -4.74609375, -4.462890625, -4.1796875, -3.896484375, -3.61328125, -3.330078125, -3.046875, -2.763671875, -2.48046875, -2.197265625, -1.9140625, -1.630859375, -1.34765625, -1.064453125, -0.78125, -0.498046875, -0.21484375, 0.068359375, 0.3515625, 0.634765625, 0.91796875, 1.201171875, 1.484375, 1.767578125, 2.05078125, 2.333984375, 2.6171875, 2.900390625, 3.18359375, 3.466796875, 3.75, 4.033203125, 4.31640625, 4.599609375, 4.8828125, 5.166015625, 5.44921875, 5.732421875, 6.015625, 6.298828125, 6.58203125, 6.865234375, 7.1484375, 7.431640625, 7.71484375, 7.998046875, 8.28125, 8.564453125, 8.84765625, 9.130859375, 9.4140625, 9.697265625, 9.98046875, 10.263671875, 10.546875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 7.0, 3.0, 10.0, 13.0, 18.0, 20.0, 42.0, 51.0, 79.0, 111.0, 184.0, 345.0, 706.0, 1881.0, 5820.0, 26611.0, 777091.0, 214837.0, 14339.0, 3801.0, 1302.0, 557.0, 245.0, 158.0, 101.0, 78.0, 43.0, 25.0, 18.0, 16.0, 19.0, 9.0, 2.0, 4.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.2109375, -7.97515869140625, -7.7393798828125, -7.50360107421875, -7.267822265625, -7.03204345703125, -6.7962646484375, -6.56048583984375, -6.32470703125, -6.08892822265625, -5.8531494140625, -5.61737060546875, -5.381591796875, -5.14581298828125, -4.9100341796875, -4.67425537109375, -4.4384765625, -4.20269775390625, -3.9669189453125, -3.73114013671875, -3.495361328125, -3.25958251953125, -3.0238037109375, -2.78802490234375, -2.55224609375, -2.31646728515625, -2.0806884765625, -1.84490966796875, -1.609130859375, -1.37335205078125, -1.1375732421875, -0.90179443359375, -0.666015625, -0.43023681640625, -0.1944580078125, 0.04132080078125, 0.277099609375, 0.51287841796875, 0.7486572265625, 0.98443603515625, 1.22021484375, 1.45599365234375, 1.6917724609375, 1.92755126953125, 2.163330078125, 2.39910888671875, 2.6348876953125, 2.87066650390625, 3.1064453125, 3.34222412109375, 3.5780029296875, 3.81378173828125, 4.049560546875, 4.28533935546875, 4.5211181640625, 4.75689697265625, 4.99267578125, 5.22845458984375, 5.4642333984375, 5.70001220703125, 5.935791015625, 6.17156982421875, 6.4073486328125, 6.64312744140625, 6.87890625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 5.0, 5.0, 6.0, 19.0, 11.0, 25.0, 29.0, 28.0, 54.0, 61.0, 91.0, 88.0, 111.0, 103.0, 74.0, 70.0, 53.0, 31.0, 27.0, 33.0, 10.0, 12.0, 12.0, 12.0, 6.0, 5.0, 9.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003066062927246094, -0.00029795989394187927, -0.00028931349515914917, -0.00028066709637641907, -0.00027202069759368896, -0.00026337429881095886, -0.00025472790002822876, -0.00024608150124549866, -0.00023743510246276855, -0.00022878870368003845, -0.00022014230489730835, -0.00021149590611457825, -0.00020284950733184814, -0.00019420310854911804, -0.00018555670976638794, -0.00017691031098365784, -0.00016826391220092773, -0.00015961751341819763, -0.00015097111463546753, -0.00014232471585273743, -0.00013367831707000732, -0.00012503191828727722, -0.00011638551950454712, -0.00010773912072181702, -9.909272193908691e-05, -9.044632315635681e-05, -8.179992437362671e-05, -7.31535255908966e-05, -6.45071268081665e-05, -5.58607280254364e-05, -4.72143292427063e-05, -3.8567930459976196e-05, -2.9921531677246094e-05, -2.127513289451599e-05, -1.2628734111785889e-05, -3.982335329055786e-06, 4.664063453674316e-06, 1.3310462236404419e-05, 2.195686101913452e-05, 3.0603259801864624e-05, 3.9249658584594727e-05, 4.789605736732483e-05, 5.654245615005493e-05, 6.518885493278503e-05, 7.383525371551514e-05, 8.248165249824524e-05, 9.112805128097534e-05, 9.977445006370544e-05, 0.00010842084884643555, 0.00011706724762916565, 0.00012571364641189575, 0.00013436004519462585, 0.00014300644397735596, 0.00015165284276008606, 0.00016029924154281616, 0.00016894564032554626, 0.00017759203910827637, 0.00018623843789100647, 0.00019488483667373657, 0.00020353123545646667, 0.00021217763423919678, 0.00022082403302192688, 0.00022947043180465698, 0.00023811683058738708, 0.0002467632293701172]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 3.0, 5.0, 10.0, 16.0, 12.0, 30.0, 34.0, 53.0, 80.0, 164.0, 362.0, 729.0, 1817.0, 5729.0, 29677.0, 844193.0, 149150.0, 11284.0, 3012.0, 1082.0, 482.0, 234.0, 149.0, 91.0, 44.0, 25.0, 25.0, 16.0, 9.0, 10.0, 6.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6015625, -6.3719482421875, -6.142333984375, -5.9127197265625, -5.68310546875, -5.4534912109375, -5.223876953125, -4.9942626953125, -4.7646484375, -4.5350341796875, -4.305419921875, -4.0758056640625, -3.84619140625, -3.6165771484375, -3.386962890625, -3.1573486328125, -2.927734375, -2.6981201171875, -2.468505859375, -2.2388916015625, -2.00927734375, -1.7796630859375, -1.550048828125, -1.3204345703125, -1.0908203125, -0.8612060546875, -0.631591796875, -0.4019775390625, -0.17236328125, 0.0572509765625, 0.286865234375, 0.5164794921875, 0.74609375, 0.9757080078125, 1.205322265625, 1.4349365234375, 1.66455078125, 1.8941650390625, 2.123779296875, 2.3533935546875, 2.5830078125, 2.8126220703125, 3.042236328125, 3.2718505859375, 3.50146484375, 3.7310791015625, 3.960693359375, 4.1903076171875, 4.419921875, 4.6495361328125, 4.879150390625, 5.1087646484375, 5.33837890625, 5.5679931640625, 5.797607421875, 6.0272216796875, 6.2568359375, 6.4864501953125, 6.716064453125, 6.9456787109375, 7.17529296875, 7.4049072265625, 7.634521484375, 7.8641357421875, 8.09375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 1.0, 4.0, 7.0, 16.0, 16.0, 38.0, 85.0, 199.0, 266.0, 199.0, 85.0, 30.0, 13.0, 7.0, 5.0, 9.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.5625, -10.2723388671875, -9.982177734375, -9.6920166015625, -9.40185546875, -9.1116943359375, -8.821533203125, -8.5313720703125, -8.2412109375, -7.9510498046875, -7.660888671875, -7.3707275390625, -7.08056640625, -6.7904052734375, -6.500244140625, -6.2100830078125, -5.919921875, -5.6297607421875, -5.339599609375, -5.0494384765625, -4.75927734375, -4.4691162109375, -4.178955078125, -3.8887939453125, -3.5986328125, -3.3084716796875, -3.018310546875, -2.7281494140625, -2.43798828125, -2.1478271484375, -1.857666015625, -1.5675048828125, -1.27734375, -0.9871826171875, -0.697021484375, -0.4068603515625, -0.11669921875, 0.1734619140625, 0.463623046875, 0.7537841796875, 1.0439453125, 1.3341064453125, 1.624267578125, 1.9144287109375, 2.20458984375, 2.4947509765625, 2.784912109375, 3.0750732421875, 3.365234375, 3.6553955078125, 3.945556640625, 4.2357177734375, 4.52587890625, 4.8160400390625, 5.106201171875, 5.3963623046875, 5.6865234375, 5.9766845703125, 6.266845703125, 6.5570068359375, 6.84716796875, 7.1373291015625, 7.427490234375, 7.7176513671875, 8.0078125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 6.0, 6.0, 9.0, 8.0, 18.0, 26.0, 58.0, 87.0, 165.0, 175.0, 152.0, 116.0, 65.0, 43.0, 19.0, 16.0, 17.0, 7.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-67.87911987304688, -66.31166076660156, -64.74420166015625, -63.1767463684082, -61.60928726196289, -60.04182815551758, -58.47437286376953, -56.90691375732422, -55.339454650878906, -53.771995544433594, -52.20453643798828, -50.637081146240234, -49.06962203979492, -47.50216293334961, -45.93470764160156, -44.36724853515625, -42.79978942871094, -41.232330322265625, -39.66487121582031, -38.097415924072266, -36.52995681762695, -34.96249771118164, -33.395042419433594, -31.82758331298828, -30.26012420654297, -28.692665100097656, -27.125207901000977, -25.557750701904297, -23.990291595458984, -22.422832489013672, -20.855375289916992, -19.287918090820312, -17.720455169677734, -16.152996063232422, -14.585538864135742, -13.018080711364746, -11.45062255859375, -9.883164405822754, -8.315706253051758, -6.748248100280762, -5.180789947509766, -3.6133317947387695, -2.0458736419677734, -0.47841548919677734, 1.0890426635742188, 2.656500816345215, 4.223958969116211, 5.791417121887207, 7.358875274658203, 8.9263334274292, 10.493791580200195, 12.061249732971191, 13.628707885742188, 15.196166038513184, 16.76362419128418, 18.33108139038086, 19.898540496826172, 21.465999603271484, 23.033456802368164, 24.600914001464844, 26.168373107910156, 27.73583221435547, 29.30328941345215, 30.870746612548828, 32.43820571899414]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 3.0, 7.0, 9.0, 10.0, 6.0, 15.0, 29.0, 26.0, 24.0, 23.0, 26.0, 29.0, 32.0, 43.0, 41.0, 50.0, 45.0, 56.0, 46.0, 48.0, 38.0, 41.0, 37.0, 56.0, 50.0, 27.0, 18.0, 34.0, 24.0, 18.0, 23.0, 22.0, 6.0, 11.0, 9.0, 7.0, 4.0, 7.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.83695983886719, -42.1286506652832, -40.42033767700195, -38.71202850341797, -37.00371551513672, -35.295406341552734, -33.58709716796875, -31.878786087036133, -30.170475006103516, -28.4621639251709, -26.75385284423828, -25.045543670654297, -23.33723258972168, -21.628921508789062, -19.920612335205078, -18.21230125427246, -16.503990173339844, -14.795679092407227, -13.087368965148926, -11.379058837890625, -9.670747756958008, -7.962436676025391, -6.25412654876709, -4.545816421508789, -2.837505340576172, -1.129194736480713, 0.5791158676147461, 2.287426471710205, 3.995737075805664, 5.704048156738281, 7.412358283996582, 9.120668411254883, 10.8289794921875, 12.537290573120117, 14.245600700378418, 15.953910827636719, 17.662221908569336, 19.370532989501953, 21.078842163085938, 22.787153244018555, 24.495464324951172, 26.20377540588379, 27.912086486816406, 29.62039566040039, 31.328706741333008, 33.037017822265625, 34.74532699584961, 36.453636169433594, 38.161949157714844, 39.87025833129883, 41.57857131958008, 43.28688049316406, 44.99519348144531, 46.7035026550293, 48.41181182861328, 50.12012481689453, 51.828433990478516, 53.5367431640625, 55.24505615234375, 56.953365325927734, 58.66167449951172, 60.36998748779297, 62.07829666137695, 63.78660583496094, 65.49491882324219]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 7.0, 16.0, 19.0, 30.0, 62.0, 83.0, 150.0, 216.0, 433.0, 958.0, 2395.0, 6931.0, 28631.0, 302057.0, 3751549.0, 79041.0, 14144.0, 4316.0, 1581.0, 715.0, 397.0, 195.0, 126.0, 87.0, 39.0, 28.0, 16.0, 19.0, 13.0, 6.0, 7.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0078125, -9.687744140625, -9.36767578125, -9.047607421875, -8.7275390625, -8.407470703125, -8.08740234375, -7.767333984375, -7.447265625, -7.127197265625, -6.80712890625, -6.487060546875, -6.1669921875, -5.846923828125, -5.52685546875, -5.206787109375, -4.88671875, -4.566650390625, -4.24658203125, -3.926513671875, -3.6064453125, -3.286376953125, -2.96630859375, -2.646240234375, -2.326171875, -2.006103515625, -1.68603515625, -1.365966796875, -1.0458984375, -0.725830078125, -0.40576171875, -0.085693359375, 0.234375, 0.554443359375, 0.87451171875, 1.194580078125, 1.5146484375, 1.834716796875, 2.15478515625, 2.474853515625, 2.794921875, 3.114990234375, 3.43505859375, 3.755126953125, 4.0751953125, 4.395263671875, 4.71533203125, 5.035400390625, 5.35546875, 5.675537109375, 5.99560546875, 6.315673828125, 6.6357421875, 6.955810546875, 7.27587890625, 7.595947265625, 7.916015625, 8.236083984375, 8.55615234375, 8.876220703125, 9.1962890625, 9.516357421875, 9.83642578125, 10.156494140625, 10.4765625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 8.0, 10.0, 14.0, 17.0, 25.0, 26.0, 29.0, 41.0, 48.0, 56.0, 59.0, 68.0, 50.0, 77.0, 63.0, 65.0, 56.0, 58.0, 54.0, 43.0, 34.0, 32.0, 24.0, 13.0, 8.0, 8.0, 7.0, 1.0, 3.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.662109375, -2.566070556640625, -2.47003173828125, -2.373992919921875, -2.2779541015625, -2.181915283203125, -2.08587646484375, -1.989837646484375, -1.893798828125, -1.797760009765625, -1.70172119140625, -1.605682373046875, -1.5096435546875, -1.413604736328125, -1.31756591796875, -1.221527099609375, -1.12548828125, -1.029449462890625, -0.93341064453125, -0.837371826171875, -0.7413330078125, -0.645294189453125, -0.54925537109375, -0.453216552734375, -0.357177734375, -0.261138916015625, -0.16510009765625, -0.069061279296875, 0.0269775390625, 0.123016357421875, 0.21905517578125, 0.315093994140625, 0.4111328125, 0.507171630859375, 0.60321044921875, 0.699249267578125, 0.7952880859375, 0.891326904296875, 0.98736572265625, 1.083404541015625, 1.179443359375, 1.275482177734375, 1.37152099609375, 1.467559814453125, 1.5635986328125, 1.659637451171875, 1.75567626953125, 1.851715087890625, 1.94775390625, 2.043792724609375, 2.13983154296875, 2.235870361328125, 2.3319091796875, 2.427947998046875, 2.52398681640625, 2.620025634765625, 2.716064453125, 2.812103271484375, 2.90814208984375, 3.004180908203125, 3.1002197265625, 3.196258544921875, 3.29229736328125, 3.388336181640625, 3.484375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 12.0, 8.0, 9.0, 11.0, 18.0, 13.0, 30.0, 53.0, 84.0, 113.0, 243.0, 654.0, 2258.0, 13831.0, 452345.0, 3696645.0, 23111.0, 3358.0, 789.0, 307.0, 144.0, 79.0, 46.0, 29.0, 31.0, 16.0, 13.0, 10.0, 8.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.046875, -12.61376953125, -12.1806640625, -11.74755859375, -11.314453125, -10.88134765625, -10.4482421875, -10.01513671875, -9.58203125, -9.14892578125, -8.7158203125, -8.28271484375, -7.849609375, -7.41650390625, -6.9833984375, -6.55029296875, -6.1171875, -5.68408203125, -5.2509765625, -4.81787109375, -4.384765625, -3.95166015625, -3.5185546875, -3.08544921875, -2.65234375, -2.21923828125, -1.7861328125, -1.35302734375, -0.919921875, -0.48681640625, -0.0537109375, 0.37939453125, 0.8125, 1.24560546875, 1.6787109375, 2.11181640625, 2.544921875, 2.97802734375, 3.4111328125, 3.84423828125, 4.27734375, 4.71044921875, 5.1435546875, 5.57666015625, 6.009765625, 6.44287109375, 6.8759765625, 7.30908203125, 7.7421875, 8.17529296875, 8.6083984375, 9.04150390625, 9.474609375, 9.90771484375, 10.3408203125, 10.77392578125, 11.20703125, 11.64013671875, 12.0732421875, 12.50634765625, 12.939453125, 13.37255859375, 13.8056640625, 14.23876953125, 14.671875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 5.0, 4.0, 5.0, 8.0, 13.0, 12.0, 22.0, 34.0, 56.0, 86.0, 188.0, 668.0, 2244.0, 399.0, 151.0, 71.0, 33.0, 20.0, 15.0, 8.0, 7.0, 5.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.65234375, -4.5279541015625, -4.403564453125, -4.2791748046875, -4.15478515625, -4.0303955078125, -3.906005859375, -3.7816162109375, -3.6572265625, -3.5328369140625, -3.408447265625, -3.2840576171875, -3.15966796875, -3.0352783203125, -2.910888671875, -2.7864990234375, -2.662109375, -2.5377197265625, -2.413330078125, -2.2889404296875, -2.16455078125, -2.0401611328125, -1.915771484375, -1.7913818359375, -1.6669921875, -1.5426025390625, -1.418212890625, -1.2938232421875, -1.16943359375, -1.0450439453125, -0.920654296875, -0.7962646484375, -0.671875, -0.5474853515625, -0.423095703125, -0.2987060546875, -0.17431640625, -0.0499267578125, 0.074462890625, 0.1988525390625, 0.3232421875, 0.4476318359375, 0.572021484375, 0.6964111328125, 0.82080078125, 0.9451904296875, 1.069580078125, 1.1939697265625, 1.318359375, 1.4427490234375, 1.567138671875, 1.6915283203125, 1.81591796875, 1.9403076171875, 2.064697265625, 2.1890869140625, 2.3134765625, 2.4378662109375, 2.562255859375, 2.6866455078125, 2.81103515625, 2.9354248046875, 3.059814453125, 3.1842041015625, 3.30859375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 9.0, 21.0, 55.0, 257.0, 487.0, 140.0, 24.0, 11.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.97433090209961, -59.66493606567383, -58.35554122924805, -57.04615020751953, -55.73675537109375, -54.42736053466797, -53.11796569824219, -51.808570861816406, -50.499176025390625, -49.189781188964844, -47.88038635253906, -46.57099533081055, -45.261600494384766, -43.952205657958984, -42.6428108215332, -41.33341598510742, -40.024024963378906, -38.714630126953125, -37.405235290527344, -36.09584426879883, -34.78644943237305, -33.477054595947266, -32.167659759521484, -30.858264923095703, -29.548871994018555, -28.239477157592773, -26.930084228515625, -25.620689392089844, -24.311294555664062, -23.001901626586914, -21.692506790161133, -20.383113861083984, -19.07371711730957, -17.76432228088379, -16.45492935180664, -15.14553451538086, -13.836140632629395, -12.52674674987793, -11.217351913452148, -9.907958030700684, -8.598564147949219, -7.289170265197754, -5.979775905609131, -4.670381546020508, -3.360987663269043, -2.051593780517578, -0.7421994209289551, 0.567194938659668, 1.8765888214111328, 3.1859829425811768, 4.495377063751221, 5.804771423339844, 7.114165306091309, 8.423559188842773, 9.732954025268555, 11.04234790802002, 12.351741790771484, 13.66113567352295, 14.970529556274414, 16.279924392700195, 17.589317321777344, 18.898712158203125, 20.208106994628906, 21.517501831054688, 22.826894760131836]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 3.0, 3.0, 4.0, 5.0, 14.0, 16.0, 12.0, 27.0, 21.0, 28.0, 26.0, 45.0, 55.0, 45.0, 59.0, 60.0, 64.0, 63.0, 62.0, 60.0, 56.0, 53.0, 45.0, 35.0, 33.0, 33.0, 17.0, 17.0, 15.0, 7.0, 9.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.20586395263672, -16.75762367248535, -16.30938148498535, -15.861141204833984, -15.4128999710083, -14.964658737182617, -14.51641845703125, -14.068177223205566, -13.619935989379883, -13.1716947555542, -12.723453521728516, -12.275213241577148, -11.826972007751465, -11.378730773925781, -10.930490493774414, -10.48224925994873, -10.034008026123047, -9.585766792297363, -9.13752555847168, -8.689285278320312, -8.241044044494629, -7.792802810668945, -7.34456205368042, -6.8963212966918945, -6.448080062866211, -5.999838829040527, -5.551598072052002, -5.103357315063477, -4.655116081237793, -4.206874847412109, -3.758634090423584, -3.3103930950164795, -2.8621530532836914, -2.413912057876587, -1.9656710624694824, -1.517430067062378, -1.0691890716552734, -0.620948076248169, -0.17270708084106445, 0.27553391456604004, 0.7237749099731445, 1.172015905380249, 1.6202569007873535, 2.068497896194458, 2.5167388916015625, 2.964979887008667, 3.4132208824157715, 3.861461877822876, 4.3097028732299805, 4.757944107055664, 5.2061848640441895, 5.654425621032715, 6.102666854858398, 6.550908088684082, 6.999148845672607, 7.447389602661133, 7.895630836486816, 8.3438720703125, 8.792112350463867, 9.24035358428955, 9.688594818115234, 10.136836051940918, 10.585077285766602, 11.033317565917969, 11.481558799743652]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 5.0, 17.0, 12.0, 11.0, 19.0, 34.0, 58.0, 84.0, 98.0, 170.0, 245.0, 427.0, 653.0, 1190.0, 2344.0, 4917.0, 10493.0, 24782.0, 63687.0, 178258.0, 392857.0, 230632.0, 81474.0, 31155.0, 12875.0, 5700.0, 2780.0, 1434.0, 820.0, 454.0, 290.0, 174.0, 114.0, 74.0, 57.0, 44.0, 27.0, 22.0, 13.0, 17.0, 8.0, 11.0, 5.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.51953125, -5.33929443359375, -5.1590576171875, -4.97882080078125, -4.798583984375, -4.61834716796875, -4.4381103515625, -4.25787353515625, -4.07763671875, -3.89739990234375, -3.7171630859375, -3.53692626953125, -3.356689453125, -3.17645263671875, -2.9962158203125, -2.81597900390625, -2.6357421875, -2.45550537109375, -2.2752685546875, -2.09503173828125, -1.914794921875, -1.73455810546875, -1.5543212890625, -1.37408447265625, -1.19384765625, -1.01361083984375, -0.8333740234375, -0.65313720703125, -0.472900390625, -0.29266357421875, -0.1124267578125, 0.06781005859375, 0.248046875, 0.42828369140625, 0.6085205078125, 0.78875732421875, 0.968994140625, 1.14923095703125, 1.3294677734375, 1.50970458984375, 1.68994140625, 1.87017822265625, 2.0504150390625, 2.23065185546875, 2.410888671875, 2.59112548828125, 2.7713623046875, 2.95159912109375, 3.1318359375, 3.31207275390625, 3.4923095703125, 3.67254638671875, 3.852783203125, 4.03302001953125, 4.2132568359375, 4.39349365234375, 4.57373046875, 4.75396728515625, 4.9342041015625, 5.11444091796875, 5.294677734375, 5.47491455078125, 5.6551513671875, 5.83538818359375, 6.015625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 5.0, 7.0, 16.0, 22.0, 21.0, 34.0, 28.0, 34.0, 52.0, 48.0, 58.0, 63.0, 66.0, 63.0, 73.0, 60.0, 56.0, 56.0, 50.0, 49.0, 38.0, 31.0, 17.0, 15.0, 13.0, 8.0, 4.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.35546875, -2.26385498046875, -2.1722412109375, -2.08062744140625, -1.989013671875, -1.89739990234375, -1.8057861328125, -1.71417236328125, -1.62255859375, -1.53094482421875, -1.4393310546875, -1.34771728515625, -1.256103515625, -1.16448974609375, -1.0728759765625, -0.98126220703125, -0.8896484375, -0.79803466796875, -0.7064208984375, -0.61480712890625, -0.523193359375, -0.43157958984375, -0.3399658203125, -0.24835205078125, -0.15673828125, -0.06512451171875, 0.0264892578125, 0.11810302734375, 0.209716796875, 0.30133056640625, 0.3929443359375, 0.48455810546875, 0.576171875, 0.66778564453125, 0.7593994140625, 0.85101318359375, 0.942626953125, 1.03424072265625, 1.1258544921875, 1.21746826171875, 1.30908203125, 1.40069580078125, 1.4923095703125, 1.58392333984375, 1.675537109375, 1.76715087890625, 1.8587646484375, 1.95037841796875, 2.0419921875, 2.13360595703125, 2.2252197265625, 2.31683349609375, 2.408447265625, 2.50006103515625, 2.5916748046875, 2.68328857421875, 2.77490234375, 2.86651611328125, 2.9581298828125, 3.04974365234375, 3.141357421875, 3.23297119140625, 3.3245849609375, 3.41619873046875, 3.5078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 8.0, 8.0, 10.0, 18.0, 18.0, 30.0, 33.0, 54.0, 64.0, 94.0, 138.0, 159.0, 209.0, 313.0, 509.0, 885.0, 1892.0, 5020.0, 16732.0, 75730.0, 473247.0, 389646.0, 61335.0, 14146.0, 4270.0, 1656.0, 724.0, 430.0, 291.0, 203.0, 153.0, 122.0, 81.0, 74.0, 48.0, 50.0, 33.0, 16.0, 30.0, 23.0, 20.0, 16.0, 8.0, 3.0, 5.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.96875, -7.711181640625, -7.45361328125, -7.196044921875, -6.9384765625, -6.680908203125, -6.42333984375, -6.165771484375, -5.908203125, -5.650634765625, -5.39306640625, -5.135498046875, -4.8779296875, -4.620361328125, -4.36279296875, -4.105224609375, -3.84765625, -3.590087890625, -3.33251953125, -3.074951171875, -2.8173828125, -2.559814453125, -2.30224609375, -2.044677734375, -1.787109375, -1.529541015625, -1.27197265625, -1.014404296875, -0.7568359375, -0.499267578125, -0.24169921875, 0.015869140625, 0.2734375, 0.531005859375, 0.78857421875, 1.046142578125, 1.3037109375, 1.561279296875, 1.81884765625, 2.076416015625, 2.333984375, 2.591552734375, 2.84912109375, 3.106689453125, 3.3642578125, 3.621826171875, 3.87939453125, 4.136962890625, 4.39453125, 4.652099609375, 4.90966796875, 5.167236328125, 5.4248046875, 5.682373046875, 5.93994140625, 6.197509765625, 6.455078125, 6.712646484375, 6.97021484375, 7.227783203125, 7.4853515625, 7.742919921875, 8.00048828125, 8.258056640625, 8.515625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 8.0, 3.0, 14.0, 5.0, 8.0, 15.0, 16.0, 23.0, 16.0, 25.0, 20.0, 36.0, 27.0, 33.0, 27.0, 54.0, 39.0, 37.0, 54.0, 45.0, 41.0, 43.0, 37.0, 38.0, 33.0, 22.0, 39.0, 27.0, 37.0, 20.0, 21.0, 30.0, 19.0, 16.0, 14.0, 12.0, 11.0, 2.0, 9.0, 4.0, 5.0, 7.0, 4.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-8.578125, -8.30810546875, -8.0380859375, -7.76806640625, -7.498046875, -7.22802734375, -6.9580078125, -6.68798828125, -6.41796875, -6.14794921875, -5.8779296875, -5.60791015625, -5.337890625, -5.06787109375, -4.7978515625, -4.52783203125, -4.2578125, -3.98779296875, -3.7177734375, -3.44775390625, -3.177734375, -2.90771484375, -2.6376953125, -2.36767578125, -2.09765625, -1.82763671875, -1.5576171875, -1.28759765625, -1.017578125, -0.74755859375, -0.4775390625, -0.20751953125, 0.0625, 0.33251953125, 0.6025390625, 0.87255859375, 1.142578125, 1.41259765625, 1.6826171875, 1.95263671875, 2.22265625, 2.49267578125, 2.7626953125, 3.03271484375, 3.302734375, 3.57275390625, 3.8427734375, 4.11279296875, 4.3828125, 4.65283203125, 4.9228515625, 5.19287109375, 5.462890625, 5.73291015625, 6.0029296875, 6.27294921875, 6.54296875, 6.81298828125, 7.0830078125, 7.35302734375, 7.623046875, 7.89306640625, 8.1630859375, 8.43310546875, 8.703125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 4.0, 1.0, 8.0, 18.0, 32.0, 34.0, 58.0, 118.0, 189.0, 361.0, 740.0, 1608.0, 4233.0, 14920.0, 77024.0, 624347.0, 276411.0, 35033.0, 8492.0, 2649.0, 1121.0, 511.0, 246.0, 155.0, 85.0, 51.0, 34.0, 26.0, 16.0, 11.0, 5.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.34375, -4.21124267578125, -4.0787353515625, -3.94622802734375, -3.813720703125, -3.68121337890625, -3.5487060546875, -3.41619873046875, -3.28369140625, -3.15118408203125, -3.0186767578125, -2.88616943359375, -2.753662109375, -2.62115478515625, -2.4886474609375, -2.35614013671875, -2.2236328125, -2.09112548828125, -1.9586181640625, -1.82611083984375, -1.693603515625, -1.56109619140625, -1.4285888671875, -1.29608154296875, -1.16357421875, -1.03106689453125, -0.8985595703125, -0.76605224609375, -0.633544921875, -0.50103759765625, -0.3685302734375, -0.23602294921875, -0.103515625, 0.02899169921875, 0.1614990234375, 0.29400634765625, 0.426513671875, 0.55902099609375, 0.6915283203125, 0.82403564453125, 0.95654296875, 1.08905029296875, 1.2215576171875, 1.35406494140625, 1.486572265625, 1.61907958984375, 1.7515869140625, 1.88409423828125, 2.0166015625, 2.14910888671875, 2.2816162109375, 2.41412353515625, 2.546630859375, 2.67913818359375, 2.8116455078125, 2.94415283203125, 3.07666015625, 3.20916748046875, 3.3416748046875, 3.47418212890625, 3.606689453125, 3.73919677734375, 3.8717041015625, 4.00421142578125, 4.13671875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 4.0, 8.0, 10.0, 5.0, 9.0, 12.0, 18.0, 23.0, 46.0, 60.0, 122.0, 145.0, 169.0, 127.0, 84.0, 45.0, 28.0, 25.0, 14.0, 10.0, 9.0, 8.0, 4.0, 7.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0005931854248046875, -0.0005758777260780334, -0.0005585700273513794, -0.0005412623286247253, -0.0005239546298980713, -0.0005066469311714172, -0.0004893392324447632, -0.00047203153371810913, -0.0004547238349914551, -0.000437416136264801, -0.00042010843753814697, -0.0004028007388114929, -0.00038549304008483887, -0.0003681853413581848, -0.00035087764263153076, -0.0003335699439048767, -0.00031626224517822266, -0.0002989545464515686, -0.00028164684772491455, -0.0002643391489982605, -0.00024703145027160645, -0.0002297237515449524, -0.00021241605281829834, -0.0001951083540916443, -0.00017780065536499023, -0.00016049295663833618, -0.00014318525791168213, -0.00012587755918502808, -0.00010856986045837402, -9.126216173171997e-05, -7.395446300506592e-05, -5.6646764278411865e-05, -3.933906555175781e-05, -2.203136682510376e-05, -4.723668098449707e-06, 1.2584030628204346e-05, 2.98917293548584e-05, 4.719942808151245e-05, 6.45071268081665e-05, 8.181482553482056e-05, 9.912252426147461e-05, 0.00011643022298812866, 0.00013373792171478271, 0.00015104562044143677, 0.00016835331916809082, 0.00018566101789474487, 0.00020296871662139893, 0.00022027641534805298, 0.00023758411407470703, 0.0002548918128013611, 0.00027219951152801514, 0.0002895072102546692, 0.00030681490898132324, 0.0003241226077079773, 0.00034143030643463135, 0.0003587380051612854, 0.00037604570388793945, 0.0003933534026145935, 0.00041066110134124756, 0.0004279688000679016, 0.00044527649879455566, 0.0004625841975212097, 0.00047989189624786377, 0.0004971995949745178, 0.0005145072937011719]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 3.0, 6.0, 6.0, 9.0, 20.0, 13.0, 21.0, 31.0, 52.0, 66.0, 130.0, 211.0, 349.0, 650.0, 1501.0, 4188.0, 14989.0, 83361.0, 653601.0, 245631.0, 31825.0, 7406.0, 2389.0, 958.0, 485.0, 252.0, 152.0, 81.0, 54.0, 39.0, 28.0, 18.0, 8.0, 4.0, 7.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.59765625, -3.47247314453125, -3.3472900390625, -3.22210693359375, -3.096923828125, -2.97174072265625, -2.8465576171875, -2.72137451171875, -2.59619140625, -2.47100830078125, -2.3458251953125, -2.22064208984375, -2.095458984375, -1.97027587890625, -1.8450927734375, -1.71990966796875, -1.5947265625, -1.46954345703125, -1.3443603515625, -1.21917724609375, -1.093994140625, -0.96881103515625, -0.8436279296875, -0.71844482421875, -0.59326171875, -0.46807861328125, -0.3428955078125, -0.21771240234375, -0.092529296875, 0.03265380859375, 0.1578369140625, 0.28302001953125, 0.408203125, 0.53338623046875, 0.6585693359375, 0.78375244140625, 0.908935546875, 1.03411865234375, 1.1593017578125, 1.28448486328125, 1.40966796875, 1.53485107421875, 1.6600341796875, 1.78521728515625, 1.910400390625, 2.03558349609375, 2.1607666015625, 2.28594970703125, 2.4111328125, 2.53631591796875, 2.6614990234375, 2.78668212890625, 2.911865234375, 3.03704833984375, 3.1622314453125, 3.28741455078125, 3.41259765625, 3.53778076171875, 3.6629638671875, 3.78814697265625, 3.913330078125, 4.03851318359375, 4.1636962890625, 4.28887939453125, 4.4140625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 2.0, 3.0, 9.0, 8.0, 15.0, 15.0, 18.0, 17.0, 18.0, 21.0, 48.0, 54.0, 62.0, 79.0, 106.0, 93.0, 100.0, 76.0, 74.0, 51.0, 36.0, 22.0, 10.0, 20.0, 15.0, 6.0, 9.0, 1.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.9609375, -2.852203369140625, -2.74346923828125, -2.634735107421875, -2.5260009765625, -2.417266845703125, -2.30853271484375, -2.199798583984375, -2.091064453125, -1.982330322265625, -1.87359619140625, -1.764862060546875, -1.6561279296875, -1.547393798828125, -1.43865966796875, -1.329925537109375, -1.22119140625, -1.112457275390625, -1.00372314453125, -0.894989013671875, -0.7862548828125, -0.677520751953125, -0.56878662109375, -0.460052490234375, -0.351318359375, -0.242584228515625, -0.13385009765625, -0.025115966796875, 0.0836181640625, 0.192352294921875, 0.30108642578125, 0.409820556640625, 0.5185546875, 0.627288818359375, 0.73602294921875, 0.844757080078125, 0.9534912109375, 1.062225341796875, 1.17095947265625, 1.279693603515625, 1.388427734375, 1.497161865234375, 1.60589599609375, 1.714630126953125, 1.8233642578125, 1.932098388671875, 2.04083251953125, 2.149566650390625, 2.25830078125, 2.367034912109375, 2.47576904296875, 2.584503173828125, 2.6932373046875, 2.801971435546875, 2.91070556640625, 3.019439697265625, 3.128173828125, 3.236907958984375, 3.34564208984375, 3.454376220703125, 3.5631103515625, 3.671844482421875, 3.78057861328125, 3.889312744140625, 3.998046875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 7.0, 15.0, 27.0, 173.0, 495.0, 215.0, 54.0, 17.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.52156066894531, -94.69498443603516, -89.86840057373047, -85.04182434082031, -80.21524047851562, -75.38866424560547, -70.56208801269531, -65.73550415039062, -60.9089241027832, -56.08234405517578, -51.25576400756836, -46.42918395996094, -41.60260772705078, -36.776023864746094, -31.949447631835938, -27.122867584228516, -22.296287536621094, -17.469707489013672, -12.643128395080566, -7.816549301147461, -2.989969253540039, 1.8366107940673828, 6.663188934326172, 11.489768981933594, 16.316349029541016, 21.142929077148438, 25.96950912475586, 30.79608726501465, 35.62266540527344, 40.449249267578125, 45.27582550048828, 50.1024055480957, 54.928985595703125, 59.75556564331055, 64.58214569091797, 69.40872192382812, 74.23530578613281, 79.06188201904297, 83.88845825195312, 88.71504211425781, 93.5416259765625, 98.36820220947266, 103.19478607177734, 108.0213623046875, 112.84794616699219, 117.67452239990234, 122.5010986328125, 127.32768249511719, 132.15426635742188, 136.98085021972656, 141.8074188232422, 146.63400268554688, 151.46058654785156, 156.28717041015625, 161.11373901367188, 165.94032287597656, 170.7668914794922, 175.59347534179688, 180.4200439453125, 185.2466278076172, 190.07321166992188, 194.89979553222656, 199.7263641357422, 204.55294799804688, 209.37953186035156]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 3.0, 10.0, 4.0, 2.0, 9.0, 10.0, 21.0, 9.0, 12.0, 14.0, 24.0, 15.0, 25.0, 27.0, 33.0, 36.0, 35.0, 32.0, 34.0, 37.0, 42.0, 30.0, 47.0, 43.0, 46.0, 40.0, 37.0, 35.0, 34.0, 28.0, 29.0, 24.0, 17.0, 22.0, 17.0, 21.0, 20.0, 13.0, 10.0, 7.0, 9.0, 11.0, 6.0, 7.0, 3.0, 2.0, 5.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-48.0368766784668, -46.487491607666016, -44.9381103515625, -43.38872528076172, -41.83934020996094, -40.289955139160156, -38.74057388305664, -37.19118881225586, -35.641807556152344, -34.09242248535156, -32.54304122924805, -30.993656158447266, -29.444271087646484, -27.894887924194336, -26.345504760742188, -24.796119689941406, -23.246734619140625, -21.697351455688477, -20.147966384887695, -18.598583221435547, -17.049198150634766, -15.499814987182617, -13.950431823730469, -12.401047706604004, -10.851663589477539, -9.302279472351074, -7.752895832061768, -6.203512191772461, -4.654128074645996, -3.1047439575195312, -1.5553607940673828, -0.005976676940917969, 1.5434036254882812, 3.092787504196167, 4.642171382904053, 6.191555023193359, 7.740939140319824, 9.290323257446289, 10.839706420898438, 12.389090538024902, 13.938474655151367, 15.487858772277832, 17.037242889404297, 18.586626052856445, 20.136009216308594, 21.685394287109375, 23.234777450561523, 24.784160614013672, 26.333545684814453, 27.8829288482666, 29.432313919067383, 30.98169708251953, 32.53108215332031, 34.080467224121094, 35.62984848022461, 37.17923355102539, 38.728614807128906, 40.27799987792969, 41.8273811340332, 43.376766204833984, 44.926151275634766, 46.47553253173828, 48.02491760253906, 49.574302673339844, 51.123687744140625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 12.0, 12.0, 18.0, 18.0, 33.0, 50.0, 82.0, 116.0, 168.0, 226.0, 337.0, 553.0, 959.0, 1745.0, 3138.0, 5809.0, 12250.0, 31274.0, 118920.0, 3006045.0, 883331.0, 82168.0, 24875.0, 10412.0, 5093.0, 2711.0, 1532.0, 893.0, 504.0, 342.0, 196.0, 156.0, 95.0, 63.0, 38.0, 30.0, 22.0, 21.0, 14.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.484375, -6.281005859375, -6.07763671875, -5.874267578125, -5.6708984375, -5.467529296875, -5.26416015625, -5.060791015625, -4.857421875, -4.654052734375, -4.45068359375, -4.247314453125, -4.0439453125, -3.840576171875, -3.63720703125, -3.433837890625, -3.23046875, -3.027099609375, -2.82373046875, -2.620361328125, -2.4169921875, -2.213623046875, -2.01025390625, -1.806884765625, -1.603515625, -1.400146484375, -1.19677734375, -0.993408203125, -0.7900390625, -0.586669921875, -0.38330078125, -0.179931640625, 0.0234375, 0.226806640625, 0.43017578125, 0.633544921875, 0.8369140625, 1.040283203125, 1.24365234375, 1.447021484375, 1.650390625, 1.853759765625, 2.05712890625, 2.260498046875, 2.4638671875, 2.667236328125, 2.87060546875, 3.073974609375, 3.27734375, 3.480712890625, 3.68408203125, 3.887451171875, 4.0908203125, 4.294189453125, 4.49755859375, 4.700927734375, 4.904296875, 5.107666015625, 5.31103515625, 5.514404296875, 5.7177734375, 5.921142578125, 6.12451171875, 6.327880859375, 6.53125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 7.0, 2.0, 2.0, 5.0, 8.0, 9.0, 16.0, 15.0, 21.0, 20.0, 26.0, 29.0, 23.0, 37.0, 54.0, 47.0, 47.0, 50.0, 50.0, 62.0, 53.0, 49.0, 46.0, 55.0, 49.0, 35.0, 37.0, 33.0, 17.0, 20.0, 13.0, 18.0, 15.0, 12.0, 5.0, 8.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.75, -2.660247802734375, -2.57049560546875, -2.480743408203125, -2.3909912109375, -2.301239013671875, -2.21148681640625, -2.121734619140625, -2.031982421875, -1.942230224609375, -1.85247802734375, -1.762725830078125, -1.6729736328125, -1.583221435546875, -1.49346923828125, -1.403717041015625, -1.31396484375, -1.224212646484375, -1.13446044921875, -1.044708251953125, -0.9549560546875, -0.865203857421875, -0.77545166015625, -0.685699462890625, -0.595947265625, -0.506195068359375, -0.41644287109375, -0.326690673828125, -0.2369384765625, -0.147186279296875, -0.05743408203125, 0.032318115234375, 0.1220703125, 0.211822509765625, 0.30157470703125, 0.391326904296875, 0.4810791015625, 0.570831298828125, 0.66058349609375, 0.750335693359375, 0.840087890625, 0.929840087890625, 1.01959228515625, 1.109344482421875, 1.1990966796875, 1.288848876953125, 1.37860107421875, 1.468353271484375, 1.55810546875, 1.647857666015625, 1.73760986328125, 1.827362060546875, 1.9171142578125, 2.006866455078125, 2.09661865234375, 2.186370849609375, 2.276123046875, 2.365875244140625, 2.45562744140625, 2.545379638671875, 2.6351318359375, 2.724884033203125, 2.81463623046875, 2.904388427734375, 2.994140625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 1.0, 5.0, 7.0, 13.0, 18.0, 32.0, 75.0, 163.0, 444.0, 1045.0, 3177.0, 15378.0, 251124.0, 3857419.0, 55716.0, 6790.0, 1790.0, 627.0, 245.0, 101.0, 53.0, 27.0, 6.0, 9.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.2265625, -11.8477783203125, -11.468994140625, -11.0902099609375, -10.71142578125, -10.3326416015625, -9.953857421875, -9.5750732421875, -9.1962890625, -8.8175048828125, -8.438720703125, -8.0599365234375, -7.68115234375, -7.3023681640625, -6.923583984375, -6.5447998046875, -6.166015625, -5.7872314453125, -5.408447265625, -5.0296630859375, -4.65087890625, -4.2720947265625, -3.893310546875, -3.5145263671875, -3.1357421875, -2.7569580078125, -2.378173828125, -1.9993896484375, -1.62060546875, -1.2418212890625, -0.863037109375, -0.4842529296875, -0.10546875, 0.2733154296875, 0.652099609375, 1.0308837890625, 1.40966796875, 1.7884521484375, 2.167236328125, 2.5460205078125, 2.9248046875, 3.3035888671875, 3.682373046875, 4.0611572265625, 4.43994140625, 4.8187255859375, 5.197509765625, 5.5762939453125, 5.955078125, 6.3338623046875, 6.712646484375, 7.0914306640625, 7.47021484375, 7.8489990234375, 8.227783203125, 8.6065673828125, 8.9853515625, 9.3641357421875, 9.742919921875, 10.1217041015625, 10.50048828125, 10.8792724609375, 11.258056640625, 11.6368408203125, 12.015625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 13.0, 19.0, 30.0, 53.0, 55.0, 115.0, 348.0, 1637.0, 1181.0, 292.0, 123.0, 63.0, 46.0, 29.0, 19.0, 7.0, 8.0, 8.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3984375, -5.23944091796875, -5.0804443359375, -4.92144775390625, -4.762451171875, -4.60345458984375, -4.4444580078125, -4.28546142578125, -4.12646484375, -3.96746826171875, -3.8084716796875, -3.64947509765625, -3.490478515625, -3.33148193359375, -3.1724853515625, -3.01348876953125, -2.8544921875, -2.69549560546875, -2.5364990234375, -2.37750244140625, -2.218505859375, -2.05950927734375, -1.9005126953125, -1.74151611328125, -1.58251953125, -1.42352294921875, -1.2645263671875, -1.10552978515625, -0.946533203125, -0.78753662109375, -0.6285400390625, -0.46954345703125, -0.310546875, -0.15155029296875, 0.0074462890625, 0.16644287109375, 0.325439453125, 0.48443603515625, 0.6434326171875, 0.80242919921875, 0.96142578125, 1.12042236328125, 1.2794189453125, 1.43841552734375, 1.597412109375, 1.75640869140625, 1.9154052734375, 2.07440185546875, 2.2333984375, 2.39239501953125, 2.5513916015625, 2.71038818359375, 2.869384765625, 3.02838134765625, 3.1873779296875, 3.34637451171875, 3.50537109375, 3.66436767578125, 3.8233642578125, 3.98236083984375, 4.141357421875, 4.30035400390625, 4.4593505859375, 4.61834716796875, 4.77734375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 10.0, 34.0, 76.0, 199.0, 302.0, 204.0, 118.0, 23.0, 19.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-47.6229248046875, -46.64616775512695, -45.66941452026367, -44.692657470703125, -43.71590042114258, -42.73914337158203, -41.76239013671875, -40.7856330871582, -39.808876037597656, -38.83211898803711, -37.85536575317383, -36.87860870361328, -35.901851654052734, -34.92509460449219, -33.948341369628906, -32.97158432006836, -31.994831085205078, -31.018075942993164, -30.041318893432617, -29.064563751220703, -28.087806701660156, -27.111051559448242, -26.134296417236328, -25.15753936767578, -24.180784225463867, -23.204029083251953, -22.227272033691406, -21.250516891479492, -20.273761749267578, -19.29700469970703, -18.320249557495117, -17.343494415283203, -16.366735458374023, -15.389979362487793, -14.413223266601562, -13.436468124389648, -12.459712028503418, -11.482955932617188, -10.506200790405273, -9.529444694519043, -8.552688598632812, -7.575932502746582, -6.59917688369751, -5.6224212646484375, -4.645665168762207, -3.6689090728759766, -2.6921534538269043, -1.715397834777832, -0.7386417388916016, 0.2381141185760498, 1.2148699760437012, 2.1916258335113525, 3.168381690979004, 4.145137786865234, 5.121893405914307, 6.098649024963379, 7.075405120849609, 8.05216121673584, 9.02891731262207, 10.005672454833984, 10.982428550720215, 11.959184646606445, 12.93593978881836, 13.91269588470459, 14.88945198059082]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 4.0, 8.0, 6.0, 9.0, 8.0, 13.0, 15.0, 22.0, 23.0, 28.0, 31.0, 32.0, 42.0, 50.0, 37.0, 61.0, 66.0, 48.0, 57.0, 45.0, 55.0, 58.0, 39.0, 62.0, 43.0, 28.0, 23.0, 28.0, 11.0, 14.0, 15.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.598751068115234, -17.104717254638672, -16.61068344116211, -16.11665153503418, -15.622617721557617, -15.128583908081055, -14.634551048278809, -14.140518188476562, -13.646484375, -13.152450561523438, -12.658417701721191, -12.164384841918945, -11.670351028442383, -11.17631721496582, -10.682284355163574, -10.188251495361328, -9.694217681884766, -9.200183868408203, -8.706151008605957, -8.212118148803711, -7.718084335327148, -7.224050998687744, -6.73001766204834, -6.2359843254089355, -5.741950988769531, -5.247917652130127, -4.753884315490723, -4.259850978851318, -3.765817642211914, -3.2717843055725098, -2.7777509689331055, -2.283717632293701, -1.7896842956542969, -1.2956509590148926, -0.8016176223754883, -0.307584285736084, 0.1864490509033203, 0.6804823875427246, 1.174515724182129, 1.6685490608215332, 2.1625823974609375, 2.656615734100342, 3.150649070739746, 3.6446824073791504, 4.138715744018555, 4.632749080657959, 5.126782417297363, 5.620815753936768, 6.114849090576172, 6.608882427215576, 7.1029157638549805, 7.596949100494385, 8.090982437133789, 8.585016250610352, 9.079049110412598, 9.573081970214844, 10.067115783691406, 10.561149597167969, 11.055182456970215, 11.549215316772461, 12.043249130249023, 12.537282943725586, 13.031315803527832, 13.525348663330078, 14.01938247680664]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 8.0, 11.0, 22.0, 15.0, 24.0, 41.0, 71.0, 86.0, 123.0, 182.0, 279.0, 443.0, 654.0, 1079.0, 2002.0, 3608.0, 6452.0, 13137.0, 28890.0, 71913.0, 208802.0, 443690.0, 160999.0, 57253.0, 24436.0, 11150.0, 5675.0, 3001.0, 1766.0, 978.0, 614.0, 377.0, 263.0, 143.0, 122.0, 63.0, 70.0, 36.0, 26.0, 12.0, 12.0, 8.0, 6.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.62890625, -5.44366455078125, -5.2584228515625, -5.07318115234375, -4.887939453125, -4.70269775390625, -4.5174560546875, -4.33221435546875, -4.14697265625, -3.96173095703125, -3.7764892578125, -3.59124755859375, -3.406005859375, -3.22076416015625, -3.0355224609375, -2.85028076171875, -2.6650390625, -2.47979736328125, -2.2945556640625, -2.10931396484375, -1.924072265625, -1.73883056640625, -1.5535888671875, -1.36834716796875, -1.18310546875, -0.99786376953125, -0.8126220703125, -0.62738037109375, -0.442138671875, -0.25689697265625, -0.0716552734375, 0.11358642578125, 0.298828125, 0.48406982421875, 0.6693115234375, 0.85455322265625, 1.039794921875, 1.22503662109375, 1.4102783203125, 1.59552001953125, 1.78076171875, 1.96600341796875, 2.1512451171875, 2.33648681640625, 2.521728515625, 2.70697021484375, 2.8922119140625, 3.07745361328125, 3.2626953125, 3.44793701171875, 3.6331787109375, 3.81842041015625, 4.003662109375, 4.18890380859375, 4.3741455078125, 4.55938720703125, 4.74462890625, 4.92987060546875, 5.1151123046875, 5.30035400390625, 5.485595703125, 5.67083740234375, 5.8560791015625, 6.04132080078125, 6.2265625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 5.0, 9.0, 10.0, 14.0, 23.0, 18.0, 18.0, 15.0, 28.0, 22.0, 39.0, 43.0, 42.0, 49.0, 45.0, 57.0, 40.0, 67.0, 51.0, 48.0, 41.0, 44.0, 51.0, 43.0, 32.0, 29.0, 23.0, 16.0, 16.0, 9.0, 11.0, 12.0, 9.0, 10.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.59765625, -2.5115966796875, -2.425537109375, -2.3394775390625, -2.25341796875, -2.1673583984375, -2.081298828125, -1.9952392578125, -1.9091796875, -1.8231201171875, -1.737060546875, -1.6510009765625, -1.56494140625, -1.4788818359375, -1.392822265625, -1.3067626953125, -1.220703125, -1.1346435546875, -1.048583984375, -0.9625244140625, -0.87646484375, -0.7904052734375, -0.704345703125, -0.6182861328125, -0.5322265625, -0.4461669921875, -0.360107421875, -0.2740478515625, -0.18798828125, -0.1019287109375, -0.015869140625, 0.0701904296875, 0.15625, 0.2423095703125, 0.328369140625, 0.4144287109375, 0.50048828125, 0.5865478515625, 0.672607421875, 0.7586669921875, 0.8447265625, 0.9307861328125, 1.016845703125, 1.1029052734375, 1.18896484375, 1.2750244140625, 1.361083984375, 1.4471435546875, 1.533203125, 1.6192626953125, 1.705322265625, 1.7913818359375, 1.87744140625, 1.9635009765625, 2.049560546875, 2.1356201171875, 2.2216796875, 2.3077392578125, 2.393798828125, 2.4798583984375, 2.56591796875, 2.6519775390625, 2.738037109375, 2.8240966796875, 2.91015625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 7.0, 9.0, 12.0, 19.0, 28.0, 38.0, 31.0, 54.0, 85.0, 108.0, 178.0, 242.0, 373.0, 639.0, 1502.0, 4514.0, 21177.0, 157673.0, 735986.0, 104045.0, 15315.0, 3649.0, 1201.0, 620.0, 321.0, 199.0, 147.0, 124.0, 73.0, 41.0, 44.0, 27.0, 15.0, 17.0, 8.0, 5.0, 7.0, 6.0, 4.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.90625, -10.547607421875, -10.18896484375, -9.830322265625, -9.4716796875, -9.113037109375, -8.75439453125, -8.395751953125, -8.037109375, -7.678466796875, -7.31982421875, -6.961181640625, -6.6025390625, -6.243896484375, -5.88525390625, -5.526611328125, -5.16796875, -4.809326171875, -4.45068359375, -4.092041015625, -3.7333984375, -3.374755859375, -3.01611328125, -2.657470703125, -2.298828125, -1.940185546875, -1.58154296875, -1.222900390625, -0.8642578125, -0.505615234375, -0.14697265625, 0.211669921875, 0.5703125, 0.928955078125, 1.28759765625, 1.646240234375, 2.0048828125, 2.363525390625, 2.72216796875, 3.080810546875, 3.439453125, 3.798095703125, 4.15673828125, 4.515380859375, 4.8740234375, 5.232666015625, 5.59130859375, 5.949951171875, 6.30859375, 6.667236328125, 7.02587890625, 7.384521484375, 7.7431640625, 8.101806640625, 8.46044921875, 8.819091796875, 9.177734375, 9.536376953125, 9.89501953125, 10.253662109375, 10.6123046875, 10.970947265625, 11.32958984375, 11.688232421875, 12.046875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 4.0, 0.0, 7.0, 5.0, 7.0, 10.0, 9.0, 17.0, 29.0, 31.0, 27.0, 46.0, 44.0, 48.0, 47.0, 52.0, 77.0, 51.0, 66.0, 57.0, 58.0, 47.0, 39.0, 46.0, 39.0, 26.0, 31.0, 26.0, 16.0, 11.0, 10.0, 7.0, 9.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.3828125, -13.9493408203125, -13.515869140625, -13.0823974609375, -12.64892578125, -12.2154541015625, -11.781982421875, -11.3485107421875, -10.9150390625, -10.4815673828125, -10.048095703125, -9.6146240234375, -9.18115234375, -8.7476806640625, -8.314208984375, -7.8807373046875, -7.447265625, -7.0137939453125, -6.580322265625, -6.1468505859375, -5.71337890625, -5.2799072265625, -4.846435546875, -4.4129638671875, -3.9794921875, -3.5460205078125, -3.112548828125, -2.6790771484375, -2.24560546875, -1.8121337890625, -1.378662109375, -0.9451904296875, -0.51171875, -0.0782470703125, 0.355224609375, 0.7886962890625, 1.22216796875, 1.6556396484375, 2.089111328125, 2.5225830078125, 2.9560546875, 3.3895263671875, 3.822998046875, 4.2564697265625, 4.68994140625, 5.1234130859375, 5.556884765625, 5.9903564453125, 6.423828125, 6.8572998046875, 7.290771484375, 7.7242431640625, 8.15771484375, 8.5911865234375, 9.024658203125, 9.4581298828125, 9.8916015625, 10.3250732421875, 10.758544921875, 11.1920166015625, 11.62548828125, 12.0589599609375, 12.492431640625, 12.9259033203125, 13.359375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 11.0, 29.0, 64.0, 182.0, 602.0, 7499.0, 1024339.0, 14772.0, 715.0, 213.0, 71.0, 29.0, 10.0, 3.0, 2.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.578125, -19.9462890625, -19.314453125, -18.6826171875, -18.05078125, -17.4189453125, -16.787109375, -16.1552734375, -15.5234375, -14.8916015625, -14.259765625, -13.6279296875, -12.99609375, -12.3642578125, -11.732421875, -11.1005859375, -10.46875, -9.8369140625, -9.205078125, -8.5732421875, -7.94140625, -7.3095703125, -6.677734375, -6.0458984375, -5.4140625, -4.7822265625, -4.150390625, -3.5185546875, -2.88671875, -2.2548828125, -1.623046875, -0.9912109375, -0.359375, 0.2724609375, 0.904296875, 1.5361328125, 2.16796875, 2.7998046875, 3.431640625, 4.0634765625, 4.6953125, 5.3271484375, 5.958984375, 6.5908203125, 7.22265625, 7.8544921875, 8.486328125, 9.1181640625, 9.75, 10.3818359375, 11.013671875, 11.6455078125, 12.27734375, 12.9091796875, 13.541015625, 14.1728515625, 14.8046875, 15.4365234375, 16.068359375, 16.7001953125, 17.33203125, 17.9638671875, 18.595703125, 19.2275390625, 19.859375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 9.0, 3.0, 2.0, 5.0, 9.0, 7.0, 9.0, 12.0, 17.0, 32.0, 48.0, 68.0, 137.0, 231.0, 152.0, 73.0, 45.0, 35.0, 24.0, 20.0, 13.0, 19.0, 8.0, 3.0, 3.0, 8.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00046253204345703125, -0.0004498586058616638, -0.0004371851682662964, -0.00042451173067092896, -0.0004118382930755615, -0.0003991648554801941, -0.00038649141788482666, -0.00037381798028945923, -0.0003611445426940918, -0.00034847110509872437, -0.00033579766750335693, -0.0003231242299079895, -0.00031045079231262207, -0.00029777735471725464, -0.0002851039171218872, -0.0002724304795265198, -0.00025975704193115234, -0.0002470836043357849, -0.00023441016674041748, -0.00022173672914505005, -0.00020906329154968262, -0.00019638985395431519, -0.00018371641635894775, -0.00017104297876358032, -0.0001583695411682129, -0.00014569610357284546, -0.00013302266597747803, -0.0001203492283821106, -0.00010767579078674316, -9.500235319137573e-05, -8.23289155960083e-05, -6.965547800064087e-05, -5.698204040527344e-05, -4.4308602809906006e-05, -3.1635165214538574e-05, -1.8961727619171143e-05, -6.288290023803711e-06, 6.385147571563721e-06, 1.9058585166931152e-05, 3.1732022762298584e-05, 4.4405460357666016e-05, 5.707889795303345e-05, 6.975233554840088e-05, 8.242577314376831e-05, 9.509921073913574e-05, 0.00010777264833450317, 0.0001204460859298706, 0.00013311952352523804, 0.00014579296112060547, 0.0001584663987159729, 0.00017113983631134033, 0.00018381327390670776, 0.0001964867115020752, 0.00020916014909744263, 0.00022183358669281006, 0.0002345070242881775, 0.0002471804618835449, 0.00025985389947891235, 0.0002725273370742798, 0.0002852007746696472, 0.00029787421226501465, 0.0003105476498603821, 0.0003232210874557495, 0.00033589452505111694, 0.0003485679626464844]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 12.0, 24.0, 62.0, 134.0, 283.0, 858.0, 33331.0, 1009637.0, 3349.0, 483.0, 195.0, 87.0, 47.0, 21.0, 14.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.0, -20.38720703125, -19.7744140625, -19.16162109375, -18.548828125, -17.93603515625, -17.3232421875, -16.71044921875, -16.09765625, -15.48486328125, -14.8720703125, -14.25927734375, -13.646484375, -13.03369140625, -12.4208984375, -11.80810546875, -11.1953125, -10.58251953125, -9.9697265625, -9.35693359375, -8.744140625, -8.13134765625, -7.5185546875, -6.90576171875, -6.29296875, -5.68017578125, -5.0673828125, -4.45458984375, -3.841796875, -3.22900390625, -2.6162109375, -2.00341796875, -1.390625, -0.77783203125, -0.1650390625, 0.44775390625, 1.060546875, 1.67333984375, 2.2861328125, 2.89892578125, 3.51171875, 4.12451171875, 4.7373046875, 5.35009765625, 5.962890625, 6.57568359375, 7.1884765625, 7.80126953125, 8.4140625, 9.02685546875, 9.6396484375, 10.25244140625, 10.865234375, 11.47802734375, 12.0908203125, 12.70361328125, 13.31640625, 13.92919921875, 14.5419921875, 15.15478515625, 15.767578125, 16.38037109375, 16.9931640625, 17.60595703125, 18.21875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 10.0, 21.0, 66.0, 264.0, 461.0, 130.0, 41.0, 15.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.703125, -19.111328125, -18.51953125, -17.927734375, -17.3359375, -16.744140625, -16.15234375, -15.560546875, -14.96875, -14.376953125, -13.78515625, -13.193359375, -12.6015625, -12.009765625, -11.41796875, -10.826171875, -10.234375, -9.642578125, -9.05078125, -8.458984375, -7.8671875, -7.275390625, -6.68359375, -6.091796875, -5.5, -4.908203125, -4.31640625, -3.724609375, -3.1328125, -2.541015625, -1.94921875, -1.357421875, -0.765625, -0.173828125, 0.41796875, 1.009765625, 1.6015625, 2.193359375, 2.78515625, 3.376953125, 3.96875, 4.560546875, 5.15234375, 5.744140625, 6.3359375, 6.927734375, 7.51953125, 8.111328125, 8.703125, 9.294921875, 9.88671875, 10.478515625, 11.0703125, 11.662109375, 12.25390625, 12.845703125, 13.4375, 14.029296875, 14.62109375, 15.212890625, 15.8046875, 16.396484375, 16.98828125, 17.580078125, 18.171875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 4.0, 13.0, 30.0, 72.0, 342.0, 382.0, 114.0, 38.0, 9.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.01408004760742, -45.555320739746094, -41.0965576171875, -36.63779830932617, -32.179039001464844, -27.72027587890625, -23.261516571044922, -18.80275535583496, -14.343994140625, -9.885232925415039, -5.4264726638793945, -0.96771240234375, 3.491048812866211, 7.949810028076172, 12.4085693359375, 16.86733055114746, 21.326091766357422, 25.784852981567383, 30.243614196777344, 34.70237350463867, 39.1611328125, 43.619895935058594, 48.07865524291992, 52.53741455078125, 56.996177673339844, 61.45493698120117, 65.9136962890625, 70.3724594116211, 74.83122253417969, 79.28997802734375, 83.74874114990234, 88.20750427246094, 92.66627502441406, 97.12503814697266, 101.58379364013672, 106.04255676269531, 110.5013198852539, 114.9600830078125, 119.41883850097656, 123.87760162353516, 128.33636474609375, 132.7951202392578, 137.25389099121094, 141.712646484375, 146.17140197753906, 150.6301727294922, 155.08892822265625, 159.5476837158203, 164.00643920898438, 168.46519470214844, 172.92396545410156, 177.38272094726562, 181.8414764404297, 186.3002471923828, 190.75900268554688, 195.21775817871094, 199.67652893066406, 204.13528442382812, 208.59405517578125, 213.0528106689453, 217.51156616210938, 221.9703369140625, 226.42909240722656, 230.88784790039062, 235.34661865234375]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 10.0, 9.0, 6.0, 8.0, 9.0, 13.0, 7.0, 19.0, 26.0, 26.0, 23.0, 26.0, 29.0, 38.0, 39.0, 21.0, 38.0, 48.0, 38.0, 36.0, 48.0, 51.0, 43.0, 34.0, 33.0, 41.0, 47.0, 27.0, 30.0, 23.0, 21.0, 17.0, 21.0, 15.0, 12.0, 10.0, 10.0, 9.0, 11.0, 4.0, 8.0, 6.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-51.105201721191406, -49.53765106201172, -47.970096588134766, -46.40254592895508, -44.83499526977539, -43.26744079589844, -41.69989013671875, -40.13233947753906, -38.564788818359375, -36.99723815917969, -35.429683685302734, -33.86213302612305, -32.29458236694336, -30.72702980041504, -29.15947723388672, -27.59192657470703, -26.024372100830078, -24.456819534301758, -22.88926887512207, -21.32171630859375, -19.754165649414062, -18.186613082885742, -16.619060516357422, -15.051508903503418, -13.483957290649414, -11.91640567779541, -10.348854064941406, -8.781301498413086, -7.213749885559082, -5.646198272705078, -4.078645706176758, -2.511094093322754, -0.9435386657714844, 0.6240131855010986, 2.1915650367736816, 3.7591171264648438, 5.326668739318848, 6.894220352172852, 8.461772918701172, 10.029324531555176, 11.59687614440918, 13.164427757263184, 14.731979370117188, 16.299531936645508, 17.867084503173828, 19.434635162353516, 21.002187728881836, 22.569740295410156, 24.137290954589844, 25.704843521118164, 27.27239418029785, 28.839946746826172, 30.40749740600586, 31.97504997253418, 33.5426025390625, 35.11015319824219, 36.677703857421875, 38.24525451660156, 39.812808990478516, 41.3803596496582, 42.94791030883789, 44.515464782714844, 46.08301544189453, 47.65056610107422, 49.21812057495117]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 8.0, 10.0, 11.0, 12.0, 27.0, 30.0, 47.0, 51.0, 116.0, 172.0, 263.0, 465.0, 756.0, 1441.0, 2751.0, 5728.0, 14526.0, 49763.0, 524693.0, 3463197.0, 92414.0, 21616.0, 8170.0, 3682.0, 1919.0, 993.0, 548.0, 331.0, 186.0, 112.0, 80.0, 48.0, 40.0, 21.0, 18.0, 9.0, 8.0, 11.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1171875, -7.87255859375, -7.6279296875, -7.38330078125, -7.138671875, -6.89404296875, -6.6494140625, -6.40478515625, -6.16015625, -5.91552734375, -5.6708984375, -5.42626953125, -5.181640625, -4.93701171875, -4.6923828125, -4.44775390625, -4.203125, -3.95849609375, -3.7138671875, -3.46923828125, -3.224609375, -2.97998046875, -2.7353515625, -2.49072265625, -2.24609375, -2.00146484375, -1.7568359375, -1.51220703125, -1.267578125, -1.02294921875, -0.7783203125, -0.53369140625, -0.2890625, -0.04443359375, 0.2001953125, 0.44482421875, 0.689453125, 0.93408203125, 1.1787109375, 1.42333984375, 1.66796875, 1.91259765625, 2.1572265625, 2.40185546875, 2.646484375, 2.89111328125, 3.1357421875, 3.38037109375, 3.625, 3.86962890625, 4.1142578125, 4.35888671875, 4.603515625, 4.84814453125, 5.0927734375, 5.33740234375, 5.58203125, 5.82666015625, 6.0712890625, 6.31591796875, 6.560546875, 6.80517578125, 7.0498046875, 7.29443359375, 7.5390625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 7.0, 5.0, 4.0, 11.0, 10.0, 11.0, 17.0, 24.0, 19.0, 29.0, 21.0, 22.0, 44.0, 43.0, 45.0, 54.0, 49.0, 43.0, 47.0, 59.0, 48.0, 43.0, 41.0, 35.0, 37.0, 27.0, 24.0, 38.0, 23.0, 14.0, 24.0, 9.0, 14.0, 16.0, 7.0, 9.0, 6.0, 5.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.65234375, -2.56903076171875, -2.4857177734375, -2.40240478515625, -2.319091796875, -2.23577880859375, -2.1524658203125, -2.06915283203125, -1.98583984375, -1.90252685546875, -1.8192138671875, -1.73590087890625, -1.652587890625, -1.56927490234375, -1.4859619140625, -1.40264892578125, -1.3193359375, -1.23602294921875, -1.1527099609375, -1.06939697265625, -0.986083984375, -0.90277099609375, -0.8194580078125, -0.73614501953125, -0.65283203125, -0.56951904296875, -0.4862060546875, -0.40289306640625, -0.319580078125, -0.23626708984375, -0.1529541015625, -0.06964111328125, 0.013671875, 0.09698486328125, 0.1802978515625, 0.26361083984375, 0.346923828125, 0.43023681640625, 0.5135498046875, 0.59686279296875, 0.68017578125, 0.76348876953125, 0.8468017578125, 0.93011474609375, 1.013427734375, 1.09674072265625, 1.1800537109375, 1.26336669921875, 1.3466796875, 1.42999267578125, 1.5133056640625, 1.59661865234375, 1.679931640625, 1.76324462890625, 1.8465576171875, 1.92987060546875, 2.01318359375, 2.09649658203125, 2.1798095703125, 2.26312255859375, 2.346435546875, 2.42974853515625, 2.5130615234375, 2.59637451171875, 2.6796875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 6.0, 3.0, 7.0, 17.0, 22.0, 31.0, 41.0, 61.0, 109.0, 252.0, 485.0, 1377.0, 4557.0, 20848.0, 330619.0, 3777520.0, 46607.0, 8265.0, 2097.0, 721.0, 306.0, 151.0, 64.0, 34.0, 30.0, 19.0, 16.0, 9.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.359375, -11.0172119140625, -10.675048828125, -10.3328857421875, -9.99072265625, -9.6485595703125, -9.306396484375, -8.9642333984375, -8.6220703125, -8.2799072265625, -7.937744140625, -7.5955810546875, -7.25341796875, -6.9112548828125, -6.569091796875, -6.2269287109375, -5.884765625, -5.5426025390625, -5.200439453125, -4.8582763671875, -4.51611328125, -4.1739501953125, -3.831787109375, -3.4896240234375, -3.1474609375, -2.8052978515625, -2.463134765625, -2.1209716796875, -1.77880859375, -1.4366455078125, -1.094482421875, -0.7523193359375, -0.41015625, -0.0679931640625, 0.274169921875, 0.6163330078125, 0.95849609375, 1.3006591796875, 1.642822265625, 1.9849853515625, 2.3271484375, 2.6693115234375, 3.011474609375, 3.3536376953125, 3.69580078125, 4.0379638671875, 4.380126953125, 4.7222900390625, 5.064453125, 5.4066162109375, 5.748779296875, 6.0909423828125, 6.43310546875, 6.7752685546875, 7.117431640625, 7.4595947265625, 7.8017578125, 8.1439208984375, 8.486083984375, 8.8282470703125, 9.17041015625, 9.5125732421875, 9.854736328125, 10.1968994140625, 10.5390625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 9.0, 9.0, 8.0, 12.0, 29.0, 49.0, 135.0, 506.0, 2667.0, 376.0, 100.0, 64.0, 34.0, 26.0, 13.0, 9.0, 6.0, 7.0, 1.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.21484375, -7.044677734375, -6.87451171875, -6.704345703125, -6.5341796875, -6.364013671875, -6.19384765625, -6.023681640625, -5.853515625, -5.683349609375, -5.51318359375, -5.343017578125, -5.1728515625, -5.002685546875, -4.83251953125, -4.662353515625, -4.4921875, -4.322021484375, -4.15185546875, -3.981689453125, -3.8115234375, -3.641357421875, -3.47119140625, -3.301025390625, -3.130859375, -2.960693359375, -2.79052734375, -2.620361328125, -2.4501953125, -2.280029296875, -2.10986328125, -1.939697265625, -1.76953125, -1.599365234375, -1.42919921875, -1.259033203125, -1.0888671875, -0.918701171875, -0.74853515625, -0.578369140625, -0.408203125, -0.238037109375, -0.06787109375, 0.102294921875, 0.2724609375, 0.442626953125, 0.61279296875, 0.782958984375, 0.953125, 1.123291015625, 1.29345703125, 1.463623046875, 1.6337890625, 1.803955078125, 1.97412109375, 2.144287109375, 2.314453125, 2.484619140625, 2.65478515625, 2.824951171875, 2.9951171875, 3.165283203125, 3.33544921875, 3.505615234375, 3.67578125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 6.0, 8.0, 21.0, 63.0, 136.0, 282.0, 244.0, 150.0, 50.0, 11.0, 14.0, 6.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-38.245201110839844, -37.407958984375, -36.57072067260742, -35.733482360839844, -34.896240234375, -34.058998107910156, -33.22175979614258, -32.384521484375, -31.547279357910156, -30.710039138793945, -29.872798919677734, -29.035558700561523, -28.198318481445312, -27.3610782623291, -26.52383804321289, -25.68659782409668, -24.84935760498047, -24.012117385864258, -23.174877166748047, -22.337636947631836, -21.500396728515625, -20.663156509399414, -19.825916290283203, -18.988676071166992, -18.15143585205078, -17.31419563293457, -16.47695541381836, -15.639715194702148, -14.802474975585938, -13.965234756469727, -13.127994537353516, -12.290754318237305, -11.453516006469727, -10.616275787353516, -9.779035568237305, -8.941795349121094, -8.104555130004883, -7.267314910888672, -6.430074691772461, -5.59283447265625, -4.755594253540039, -3.918354034423828, -3.081113815307617, -2.2438735961914062, -1.4066333770751953, -0.5693931579589844, 0.26784706115722656, 1.1050872802734375, 1.9423274993896484, 2.7795677185058594, 3.6168079376220703, 4.454048156738281, 5.291288375854492, 6.128528594970703, 6.965768814086914, 7.803009033203125, 8.640249252319336, 9.477489471435547, 10.314729690551758, 11.151969909667969, 11.98921012878418, 12.82645034790039, 13.663690567016602, 14.500930786132812, 15.338171005249023]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 6.0, 6.0, 10.0, 24.0, 26.0, 28.0, 38.0, 33.0, 34.0, 27.0, 34.0, 52.0, 55.0, 81.0, 65.0, 59.0, 49.0, 56.0, 44.0, 43.0, 41.0, 29.0, 34.0, 24.0, 23.0, 20.0, 16.0, 9.0, 10.0, 4.0, 6.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.380352020263672, -14.929425239562988, -14.478498458862305, -14.027570724487305, -13.576643943786621, -13.125717163085938, -12.674789428710938, -12.223862648010254, -11.77293586730957, -11.322009086608887, -10.871082305908203, -10.420154571533203, -9.96922779083252, -9.518301010131836, -9.067373275756836, -8.616446495056152, -8.165519714355469, -7.714592933654785, -7.263665676116943, -6.812738418579102, -6.361811637878418, -5.910884857177734, -5.459957599639893, -5.009030342102051, -4.558103561401367, -4.107176780700684, -3.656249523162842, -3.205322504043579, -2.7543954849243164, -2.3034684658050537, -1.852541446685791, -1.4016144275665283, -0.950688362121582, -0.49976134300231934, -0.04883432388305664, 0.40209269523620605, 0.8530197143554688, 1.3039467334747314, 1.7548737525939941, 2.205800771713257, 2.6567277908325195, 3.1076548099517822, 3.558581829071045, 4.009509086608887, 4.46043586730957, 4.911362648010254, 5.362289905548096, 5.8132171630859375, 6.264143943786621, 6.715070724487305, 7.1659979820251465, 7.616925239562988, 8.067852020263672, 8.518778800964355, 8.969705581665039, 9.420633316040039, 9.871560096740723, 10.322486877441406, 10.773414611816406, 11.22434139251709, 11.675268173217773, 12.126194953918457, 12.57712173461914, 13.02804946899414, 13.478976249694824]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 7.0, 7.0, 8.0, 11.0, 15.0, 23.0, 23.0, 28.0, 54.0, 95.0, 175.0, 276.0, 660.0, 1342.0, 3411.0, 9373.0, 31379.0, 125420.0, 550964.0, 245901.0, 55040.0, 15419.0, 5061.0, 2034.0, 854.0, 394.0, 233.0, 106.0, 59.0, 51.0, 31.0, 26.0, 20.0, 18.0, 7.0, 7.0, 4.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-8.96875, -8.71038818359375, -8.4520263671875, -8.19366455078125, -7.935302734375, -7.67694091796875, -7.4185791015625, -7.16021728515625, -6.90185546875, -6.64349365234375, -6.3851318359375, -6.12677001953125, -5.868408203125, -5.61004638671875, -5.3516845703125, -5.09332275390625, -4.8349609375, -4.57659912109375, -4.3182373046875, -4.05987548828125, -3.801513671875, -3.54315185546875, -3.2847900390625, -3.02642822265625, -2.76806640625, -2.50970458984375, -2.2513427734375, -1.99298095703125, -1.734619140625, -1.47625732421875, -1.2178955078125, -0.95953369140625, -0.701171875, -0.44281005859375, -0.1844482421875, 0.07391357421875, 0.332275390625, 0.59063720703125, 0.8489990234375, 1.10736083984375, 1.36572265625, 1.62408447265625, 1.8824462890625, 2.14080810546875, 2.399169921875, 2.65753173828125, 2.9158935546875, 3.17425537109375, 3.4326171875, 3.69097900390625, 3.9493408203125, 4.20770263671875, 4.466064453125, 4.72442626953125, 4.9827880859375, 5.24114990234375, 5.49951171875, 5.75787353515625, 6.0162353515625, 6.27459716796875, 6.532958984375, 6.79132080078125, 7.0496826171875, 7.30804443359375, 7.56640625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 9.0, 2.0, 7.0, 4.0, 13.0, 16.0, 14.0, 12.0, 19.0, 22.0, 22.0, 32.0, 40.0, 36.0, 39.0, 39.0, 55.0, 62.0, 41.0, 55.0, 36.0, 50.0, 43.0, 47.0, 38.0, 33.0, 28.0, 27.0, 31.0, 19.0, 23.0, 9.0, 17.0, 8.0, 12.0, 9.0, 14.0, 9.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.59765625, -2.515167236328125, -2.43267822265625, -2.350189208984375, -2.2677001953125, -2.185211181640625, -2.10272216796875, -2.020233154296875, -1.937744140625, -1.855255126953125, -1.77276611328125, -1.690277099609375, -1.6077880859375, -1.525299072265625, -1.44281005859375, -1.360321044921875, -1.27783203125, -1.195343017578125, -1.11285400390625, -1.030364990234375, -0.9478759765625, -0.865386962890625, -0.78289794921875, -0.700408935546875, -0.617919921875, -0.535430908203125, -0.45294189453125, -0.370452880859375, -0.2879638671875, -0.205474853515625, -0.12298583984375, -0.040496826171875, 0.0419921875, 0.124481201171875, 0.20697021484375, 0.289459228515625, 0.3719482421875, 0.454437255859375, 0.53692626953125, 0.619415283203125, 0.701904296875, 0.784393310546875, 0.86688232421875, 0.949371337890625, 1.0318603515625, 1.114349365234375, 1.19683837890625, 1.279327392578125, 1.36181640625, 1.444305419921875, 1.52679443359375, 1.609283447265625, 1.6917724609375, 1.774261474609375, 1.85675048828125, 1.939239501953125, 2.021728515625, 2.104217529296875, 2.18670654296875, 2.269195556640625, 2.3516845703125, 2.434173583984375, 2.51666259765625, 2.599151611328125, 2.681640625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 3.0, 8.0, 17.0, 12.0, 19.0, 27.0, 38.0, 62.0, 90.0, 131.0, 208.0, 326.0, 565.0, 1553.0, 4992.0, 20829.0, 137066.0, 708287.0, 144187.0, 21921.0, 4994.0, 1675.0, 642.0, 326.0, 180.0, 113.0, 70.0, 41.0, 47.0, 35.0, 26.0, 17.0, 11.0, 5.0, 4.0, 5.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5703125, -9.2666015625, -8.962890625, -8.6591796875, -8.35546875, -8.0517578125, -7.748046875, -7.4443359375, -7.140625, -6.8369140625, -6.533203125, -6.2294921875, -5.92578125, -5.6220703125, -5.318359375, -5.0146484375, -4.7109375, -4.4072265625, -4.103515625, -3.7998046875, -3.49609375, -3.1923828125, -2.888671875, -2.5849609375, -2.28125, -1.9775390625, -1.673828125, -1.3701171875, -1.06640625, -0.7626953125, -0.458984375, -0.1552734375, 0.1484375, 0.4521484375, 0.755859375, 1.0595703125, 1.36328125, 1.6669921875, 1.970703125, 2.2744140625, 2.578125, 2.8818359375, 3.185546875, 3.4892578125, 3.79296875, 4.0966796875, 4.400390625, 4.7041015625, 5.0078125, 5.3115234375, 5.615234375, 5.9189453125, 6.22265625, 6.5263671875, 6.830078125, 7.1337890625, 7.4375, 7.7412109375, 8.044921875, 8.3486328125, 8.65234375, 8.9560546875, 9.259765625, 9.5634765625, 9.8671875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 5.0, 6.0, 11.0, 5.0, 13.0, 15.0, 22.0, 23.0, 24.0, 37.0, 31.0, 41.0, 50.0, 48.0, 45.0, 48.0, 50.0, 57.0, 52.0, 41.0, 53.0, 47.0, 42.0, 34.0, 35.0, 32.0, 31.0, 23.0, 17.0, 16.0, 7.0, 9.0, 6.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.1796875, -11.8167724609375, -11.453857421875, -11.0909423828125, -10.72802734375, -10.3651123046875, -10.002197265625, -9.6392822265625, -9.2763671875, -8.9134521484375, -8.550537109375, -8.1876220703125, -7.82470703125, -7.4617919921875, -7.098876953125, -6.7359619140625, -6.373046875, -6.0101318359375, -5.647216796875, -5.2843017578125, -4.92138671875, -4.5584716796875, -4.195556640625, -3.8326416015625, -3.4697265625, -3.1068115234375, -2.743896484375, -2.3809814453125, -2.01806640625, -1.6551513671875, -1.292236328125, -0.9293212890625, -0.56640625, -0.2034912109375, 0.159423828125, 0.5223388671875, 0.88525390625, 1.2481689453125, 1.611083984375, 1.9739990234375, 2.3369140625, 2.6998291015625, 3.062744140625, 3.4256591796875, 3.78857421875, 4.1514892578125, 4.514404296875, 4.8773193359375, 5.240234375, 5.6031494140625, 5.966064453125, 6.3289794921875, 6.69189453125, 7.0548095703125, 7.417724609375, 7.7806396484375, 8.1435546875, 8.5064697265625, 8.869384765625, 9.2322998046875, 9.59521484375, 9.9581298828125, 10.321044921875, 10.6839599609375, 11.046875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 6.0, 10.0, 17.0, 28.0, 76.0, 261.0, 779.0, 4027.0, 66876.0, 927319.0, 44712.0, 3377.0, 675.0, 225.0, 83.0, 31.0, 18.0, 13.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.51171875, -6.3280029296875, -6.144287109375, -5.9605712890625, -5.77685546875, -5.5931396484375, -5.409423828125, -5.2257080078125, -5.0419921875, -4.8582763671875, -4.674560546875, -4.4908447265625, -4.30712890625, -4.1234130859375, -3.939697265625, -3.7559814453125, -3.572265625, -3.3885498046875, -3.204833984375, -3.0211181640625, -2.83740234375, -2.6536865234375, -2.469970703125, -2.2862548828125, -2.1025390625, -1.9188232421875, -1.735107421875, -1.5513916015625, -1.36767578125, -1.1839599609375, -1.000244140625, -0.8165283203125, -0.6328125, -0.4490966796875, -0.265380859375, -0.0816650390625, 0.10205078125, 0.2857666015625, 0.469482421875, 0.6531982421875, 0.8369140625, 1.0206298828125, 1.204345703125, 1.3880615234375, 1.57177734375, 1.7554931640625, 1.939208984375, 2.1229248046875, 2.306640625, 2.4903564453125, 2.674072265625, 2.8577880859375, 3.04150390625, 3.2252197265625, 3.408935546875, 3.5926513671875, 3.7763671875, 3.9600830078125, 4.143798828125, 4.3275146484375, 4.51123046875, 4.6949462890625, 4.878662109375, 5.0623779296875, 5.24609375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 8.0, 8.0, 6.0, 10.0, 11.0, 25.0, 22.0, 28.0, 72.0, 133.0, 240.0, 197.0, 87.0, 31.0, 32.0, 23.0, 15.0, 9.0, 4.0, 5.0, 9.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003993511199951172, -0.0003854222595691681, -0.000371493399143219, -0.0003575645387172699, -0.0003436356782913208, -0.0003297068178653717, -0.0003157779574394226, -0.0003018490970134735, -0.0002879202365875244, -0.0002739913761615753, -0.0002600625157356262, -0.0002461336553096771, -0.00023220479488372803, -0.00021827593445777893, -0.00020434707403182983, -0.00019041821360588074, -0.00017648935317993164, -0.00016256049275398254, -0.00014863163232803345, -0.00013470277190208435, -0.00012077391147613525, -0.00010684505105018616, -9.291619062423706e-05, -7.898733019828796e-05, -6.505846977233887e-05, -5.112960934638977e-05, -3.7200748920440674e-05, -2.3271888494491577e-05, -9.34302806854248e-06, 4.585832357406616e-06, 1.8514692783355713e-05, 3.244355320930481e-05, 4.6372413635253906e-05, 6.0301274061203e-05, 7.42301344871521e-05, 8.81589949131012e-05, 0.00010208785533905029, 0.00011601671576499939, 0.00012994557619094849, 0.00014387443661689758, 0.00015780329704284668, 0.00017173215746879578, 0.00018566101789474487, 0.00019958987832069397, 0.00021351873874664307, 0.00022744759917259216, 0.00024137645959854126, 0.00025530532002449036, 0.00026923418045043945, 0.00028316304087638855, 0.00029709190130233765, 0.00031102076172828674, 0.00032494962215423584, 0.00033887848258018494, 0.00035280734300613403, 0.00036673620343208313, 0.0003806650638580322, 0.0003945939242839813, 0.0004085227847099304, 0.0004224516451358795, 0.0004363805055618286, 0.0004503093659877777, 0.0004642382264137268, 0.0004781670868396759, 0.000492095947265625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 4.0, 3.0, 4.0, 9.0, 5.0, 16.0, 25.0, 36.0, 49.0, 72.0, 135.0, 221.0, 406.0, 833.0, 2378.0, 11311.0, 102324.0, 818245.0, 97340.0, 11007.0, 2323.0, 845.0, 398.0, 206.0, 130.0, 83.0, 45.0, 32.0, 21.0, 12.0, 11.0, 7.0, 8.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.943359375, -3.835296630859375, -3.72723388671875, -3.619171142578125, -3.5111083984375, -3.403045654296875, -3.29498291015625, -3.186920166015625, -3.078857421875, -2.970794677734375, -2.86273193359375, -2.754669189453125, -2.6466064453125, -2.538543701171875, -2.43048095703125, -2.322418212890625, -2.21435546875, -2.106292724609375, -1.99822998046875, -1.890167236328125, -1.7821044921875, -1.674041748046875, -1.56597900390625, -1.457916259765625, -1.349853515625, -1.241790771484375, -1.13372802734375, -1.025665283203125, -0.9176025390625, -0.809539794921875, -0.70147705078125, -0.593414306640625, -0.4853515625, -0.377288818359375, -0.26922607421875, -0.161163330078125, -0.0531005859375, 0.054962158203125, 0.16302490234375, 0.271087646484375, 0.379150390625, 0.487213134765625, 0.59527587890625, 0.703338623046875, 0.8114013671875, 0.919464111328125, 1.02752685546875, 1.135589599609375, 1.24365234375, 1.351715087890625, 1.45977783203125, 1.567840576171875, 1.6759033203125, 1.783966064453125, 1.89202880859375, 2.000091552734375, 2.108154296875, 2.216217041015625, 2.32427978515625, 2.432342529296875, 2.5404052734375, 2.648468017578125, 2.75653076171875, 2.864593505859375, 2.97265625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 5.0, 4.0, 9.0, 17.0, 16.0, 31.0, 32.0, 59.0, 86.0, 90.0, 147.0, 143.0, 107.0, 80.0, 66.0, 33.0, 27.0, 20.0, 14.0, 6.0, 7.0, 6.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-5.76953125, -5.6493988037109375, -5.529266357421875, -5.4091339111328125, -5.28900146484375, -5.1688690185546875, -5.048736572265625, -4.9286041259765625, -4.8084716796875, -4.6883392333984375, -4.568206787109375, -4.4480743408203125, -4.32794189453125, -4.2078094482421875, -4.087677001953125, -3.9675445556640625, -3.847412109375, -3.7272796630859375, -3.607147216796875, -3.4870147705078125, -3.36688232421875, -3.2467498779296875, -3.126617431640625, -3.0064849853515625, -2.8863525390625, -2.7662200927734375, -2.646087646484375, -2.5259552001953125, -2.40582275390625, -2.2856903076171875, -2.165557861328125, -2.0454254150390625, -1.92529296875, -1.8051605224609375, -1.685028076171875, -1.5648956298828125, -1.44476318359375, -1.3246307373046875, -1.204498291015625, -1.0843658447265625, -0.9642333984375, -0.8441009521484375, -0.723968505859375, -0.6038360595703125, -0.48370361328125, -0.3635711669921875, -0.243438720703125, -0.1233062744140625, -0.003173828125, 0.1169586181640625, 0.237091064453125, 0.3572235107421875, 0.47735595703125, 0.5974884033203125, 0.717620849609375, 0.8377532958984375, 0.9578857421875, 1.0780181884765625, 1.198150634765625, 1.3182830810546875, 1.43841552734375, 1.5585479736328125, 1.678680419921875, 1.7988128662109375, 1.9189453125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 8.0, 18.0, 47.0, 148.0, 318.0, 303.0, 101.0, 41.0, 9.0, 9.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-162.3708038330078, -159.29904174804688, -156.227294921875, -153.15553283691406, -150.08377075195312, -147.01202392578125, -143.9402618408203, -140.86851501464844, -137.7967529296875, -134.72499084472656, -131.6532440185547, -128.58148193359375, -125.50972747802734, -122.43797302246094, -119.3662109375, -116.2944564819336, -113.22270202636719, -110.15094757080078, -107.07919311523438, -104.00743103027344, -100.93567657470703, -97.86392211914062, -94.79216003417969, -91.72040557861328, -88.64865112304688, -85.57689666748047, -82.50514221191406, -79.43338012695312, -76.36162567138672, -73.28987121582031, -70.21810913085938, -67.14635467529297, -64.07460021972656, -61.002845764160156, -57.931087493896484, -54.85932922363281, -51.787574768066406, -48.7158203125, -45.64406204223633, -42.572303771972656, -39.500545501708984, -36.42878723144531, -33.357032775878906, -30.285276412963867, -27.213520050048828, -24.14176368713379, -21.07000732421875, -17.99825096130371, -14.926494598388672, -11.854738235473633, -8.782981872558594, -5.711225509643555, -2.6394691467285156, 0.43228721618652344, 3.5040435791015625, 6.575799942016602, 9.64755630493164, 12.71931266784668, 15.791069030761719, 18.862825393676758, 21.934581756591797, 25.006338119506836, 28.078094482421875, 31.149850845336914, 34.22160720825195]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 4.0, 3.0, 2.0, 7.0, 7.0, 7.0, 12.0, 9.0, 13.0, 16.0, 19.0, 23.0, 15.0, 23.0, 38.0, 32.0, 26.0, 36.0, 39.0, 38.0, 44.0, 41.0, 42.0, 36.0, 34.0, 38.0, 39.0, 50.0, 30.0, 43.0, 28.0, 36.0, 26.0, 25.0, 19.0, 14.0, 14.0, 10.0, 13.0, 10.0, 8.0, 11.0, 7.0, 8.0, 4.0, 1.0, 3.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-44.97000503540039, -43.55244445800781, -42.1348876953125, -40.71732711791992, -39.299766540527344, -37.88220977783203, -36.46464920043945, -35.047088623046875, -33.62953186035156, -32.211971282958984, -30.794414520263672, -29.376853942871094, -27.95929527282715, -26.541736602783203, -25.124176025390625, -23.70661735534668, -22.289058685302734, -20.87150001525879, -19.453941345214844, -18.036380767822266, -16.61882209777832, -15.201263427734375, -13.783703804016113, -12.366144180297852, -10.948585510253906, -9.531026840209961, -8.1134672164917, -6.695908069610596, -5.278348922729492, -3.8607897758483887, -2.443230628967285, -1.0256710052490234, 0.39188385009765625, 1.8094429969787598, 3.2270021438598633, 4.644561290740967, 6.06212043762207, 7.479679584503174, 8.897238731384277, 10.314798355102539, 11.732357025146484, 13.14991569519043, 14.567475318908691, 15.985034942626953, 17.4025936126709, 18.820152282714844, 20.237712860107422, 21.655271530151367, 23.072830200195312, 24.490388870239258, 25.907947540283203, 27.32550811767578, 28.743066787719727, 30.160625457763672, 31.57818603515625, 32.99574279785156, 34.41330337524414, 35.83086395263672, 37.24842071533203, 38.66598129272461, 40.08354187011719, 41.5010986328125, 42.91865921020508, 44.336219787597656, 45.75377655029297]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 7.0, 9.0, 4.0, 8.0, 18.0, 13.0, 19.0, 32.0, 42.0, 76.0, 110.0, 175.0, 258.0, 357.0, 563.0, 934.0, 1635.0, 2657.0, 4899.0, 9572.0, 21286.0, 71206.0, 3469229.0, 526666.0, 48958.0, 17200.0, 7939.0, 4150.0, 2423.0, 1388.0, 870.0, 513.0, 377.0, 241.0, 148.0, 110.0, 63.0, 41.0, 29.0, 19.0, 11.0, 9.0, 7.0, 3.0, 3.0, 1.0, 8.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4140625, -9.109130859375, -8.80419921875, -8.499267578125, -8.1943359375, -7.889404296875, -7.58447265625, -7.279541015625, -6.974609375, -6.669677734375, -6.36474609375, -6.059814453125, -5.7548828125, -5.449951171875, -5.14501953125, -4.840087890625, -4.53515625, -4.230224609375, -3.92529296875, -3.620361328125, -3.3154296875, -3.010498046875, -2.70556640625, -2.400634765625, -2.095703125, -1.790771484375, -1.48583984375, -1.180908203125, -0.8759765625, -0.571044921875, -0.26611328125, 0.038818359375, 0.34375, 0.648681640625, 0.95361328125, 1.258544921875, 1.5634765625, 1.868408203125, 2.17333984375, 2.478271484375, 2.783203125, 3.088134765625, 3.39306640625, 3.697998046875, 4.0029296875, 4.307861328125, 4.61279296875, 4.917724609375, 5.22265625, 5.527587890625, 5.83251953125, 6.137451171875, 6.4423828125, 6.747314453125, 7.05224609375, 7.357177734375, 7.662109375, 7.967041015625, 8.27197265625, 8.576904296875, 8.8818359375, 9.186767578125, 9.49169921875, 9.796630859375, 10.1015625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 9.0, 6.0, 7.0, 13.0, 13.0, 9.0, 15.0, 19.0, 29.0, 21.0, 30.0, 38.0, 29.0, 41.0, 29.0, 51.0, 41.0, 49.0, 51.0, 59.0, 51.0, 42.0, 44.0, 36.0, 35.0, 40.0, 24.0, 26.0, 18.0, 14.0, 23.0, 14.0, 16.0, 14.0, 10.0, 9.0, 9.0, 4.0, 3.0, 2.0, 2.0, 0.0, 6.0, 3.0, 0.0, 0.0, 2.0], "bins": [-3.021484375, -2.937103271484375, -2.85272216796875, -2.768341064453125, -2.6839599609375, -2.599578857421875, -2.51519775390625, -2.430816650390625, -2.346435546875, -2.262054443359375, -2.17767333984375, -2.093292236328125, -2.0089111328125, -1.924530029296875, -1.84014892578125, -1.755767822265625, -1.67138671875, -1.587005615234375, -1.50262451171875, -1.418243408203125, -1.3338623046875, -1.249481201171875, -1.16510009765625, -1.080718994140625, -0.996337890625, -0.911956787109375, -0.82757568359375, -0.743194580078125, -0.6588134765625, -0.574432373046875, -0.49005126953125, -0.405670166015625, -0.3212890625, -0.236907958984375, -0.15252685546875, -0.068145751953125, 0.0162353515625, 0.100616455078125, 0.18499755859375, 0.269378662109375, 0.353759765625, 0.438140869140625, 0.52252197265625, 0.606903076171875, 0.6912841796875, 0.775665283203125, 0.86004638671875, 0.944427490234375, 1.02880859375, 1.113189697265625, 1.19757080078125, 1.281951904296875, 1.3663330078125, 1.450714111328125, 1.53509521484375, 1.619476318359375, 1.703857421875, 1.788238525390625, 1.87261962890625, 1.957000732421875, 2.0413818359375, 2.125762939453125, 2.21014404296875, 2.294525146484375, 2.37890625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 8.0, 7.0, 20.0, 30.0, 59.0, 102.0, 212.0, 495.0, 1125.0, 3323.0, 12373.0, 100512.0, 3976593.0, 83313.0, 11237.0, 3065.0, 1033.0, 387.0, 167.0, 89.0, 59.0, 24.0, 22.0, 10.0, 8.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.828125, -17.398193359375, -16.96826171875, -16.538330078125, -16.1083984375, -15.678466796875, -15.24853515625, -14.818603515625, -14.388671875, -13.958740234375, -13.52880859375, -13.098876953125, -12.6689453125, -12.239013671875, -11.80908203125, -11.379150390625, -10.94921875, -10.519287109375, -10.08935546875, -9.659423828125, -9.2294921875, -8.799560546875, -8.36962890625, -7.939697265625, -7.509765625, -7.079833984375, -6.64990234375, -6.219970703125, -5.7900390625, -5.360107421875, -4.93017578125, -4.500244140625, -4.0703125, -3.640380859375, -3.21044921875, -2.780517578125, -2.3505859375, -1.920654296875, -1.49072265625, -1.060791015625, -0.630859375, -0.200927734375, 0.22900390625, 0.658935546875, 1.0888671875, 1.518798828125, 1.94873046875, 2.378662109375, 2.80859375, 3.238525390625, 3.66845703125, 4.098388671875, 4.5283203125, 4.958251953125, 5.38818359375, 5.818115234375, 6.248046875, 6.677978515625, 7.10791015625, 7.537841796875, 7.9677734375, 8.397705078125, 8.82763671875, 9.257568359375, 9.6875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 5.0, 7.0, 13.0, 21.0, 31.0, 40.0, 74.0, 173.0, 843.0, 2369.0, 217.0, 88.0, 62.0, 20.0, 20.0, 15.0, 11.0, 9.0, 10.0, 6.0, 10.0, 4.0, 2.0, 1.0, 0.0, 4.0, 3.0, 0.0, 1.0], "bins": [-6.45703125, -6.310821533203125, -6.16461181640625, -6.018402099609375, -5.8721923828125, -5.725982666015625, -5.57977294921875, -5.433563232421875, -5.287353515625, -5.141143798828125, -4.99493408203125, -4.848724365234375, -4.7025146484375, -4.556304931640625, -4.41009521484375, -4.263885498046875, -4.11767578125, -3.971466064453125, -3.82525634765625, -3.679046630859375, -3.5328369140625, -3.386627197265625, -3.24041748046875, -3.094207763671875, -2.947998046875, -2.801788330078125, -2.65557861328125, -2.509368896484375, -2.3631591796875, -2.216949462890625, -2.07073974609375, -1.924530029296875, -1.7783203125, -1.632110595703125, -1.48590087890625, -1.339691162109375, -1.1934814453125, -1.047271728515625, -0.90106201171875, -0.754852294921875, -0.608642578125, -0.462432861328125, -0.31622314453125, -0.170013427734375, -0.0238037109375, 0.122406005859375, 0.26861572265625, 0.414825439453125, 0.56103515625, 0.707244873046875, 0.85345458984375, 0.999664306640625, 1.1458740234375, 1.292083740234375, 1.43829345703125, 1.584503173828125, 1.730712890625, 1.876922607421875, 2.02313232421875, 2.169342041015625, 2.3155517578125, 2.461761474609375, 2.60797119140625, 2.754180908203125, 2.900390625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 6.0, 2.0, 8.0, 14.0, 31.0, 97.0, 263.0, 365.0, 154.0, 42.0, 10.0, 9.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-55.36806106567383, -54.311378479003906, -53.254695892333984, -52.19801330566406, -51.141334533691406, -50.084651947021484, -49.02796936035156, -47.97128677368164, -46.91460418701172, -45.8579216003418, -44.801239013671875, -43.74455642700195, -42.68787384033203, -41.631195068359375, -40.57451248168945, -39.51782989501953, -38.46114730834961, -37.40446472167969, -36.347782135009766, -35.291099548339844, -34.23442077636719, -33.177738189697266, -32.121055603027344, -31.064373016357422, -30.0076904296875, -28.951007843017578, -27.894325256347656, -26.837644577026367, -25.780961990356445, -24.724279403686523, -23.667598724365234, -22.610916137695312, -21.55423355102539, -20.49755096435547, -19.440868377685547, -18.384187698364258, -17.327505111694336, -16.270822525024414, -15.214140892028809, -14.157459259033203, -13.100776672363281, -12.04409408569336, -10.987412452697754, -9.930730819702148, -8.874048233032227, -7.817366123199463, -6.760684013366699, -5.7040019035339355, -4.647319793701172, -3.590637683868408, -2.5339555740356445, -1.4772734642028809, -0.4205913543701172, 0.6360907554626465, 1.6927728652954102, 2.749454975128174, 3.8061370849609375, 4.862819194793701, 5.919501304626465, 6.9761834144592285, 8.032865524291992, 9.089548110961914, 10.14622974395752, 11.202911376953125, 12.259593963623047]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 4.0, 3.0, 10.0, 6.0, 15.0, 11.0, 9.0, 25.0, 24.0, 22.0, 40.0, 39.0, 40.0, 47.0, 28.0, 58.0, 48.0, 54.0, 59.0, 52.0, 45.0, 47.0, 48.0, 32.0, 40.0, 32.0, 36.0, 28.0, 21.0, 18.0, 19.0, 11.0, 5.0, 8.0, 4.0, 4.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.551115036010742, -14.161030769348145, -13.770947456359863, -13.380863189697266, -12.990779876708984, -12.600695610046387, -12.210612297058105, -11.820528030395508, -11.430444717407227, -11.040360450744629, -10.650277137756348, -10.26019287109375, -9.870109558105469, -9.480025291442871, -9.08994197845459, -8.699857711791992, -8.309774398803711, -7.9196906089782715, -7.529606819152832, -7.139523029327393, -6.749439239501953, -6.359355449676514, -5.969271659851074, -5.579187393188477, -5.189103126525879, -4.7990193367004395, -4.408935546875, -4.0188517570495605, -3.628767967224121, -3.2386841773986816, -2.848600149154663, -2.4585163593292236, -2.0684328079223633, -1.6783490180969238, -1.2882652282714844, -0.8981813192367554, -0.5080975294113159, -0.11801373958587646, 0.27207016944885254, 0.662153959274292, 1.0522377490997314, 1.442321538925171, 1.8324053287506104, 2.222489356994629, 2.6125731468200684, 3.002656936645508, 3.3927407264709473, 3.7828245162963867, 4.172908306121826, 4.562992095947266, 4.953075885772705, 5.3431596755981445, 5.733243465423584, 6.123327255249023, 6.513411521911621, 6.903494834899902, 7.2935791015625, 7.6836628913879395, 8.073746681213379, 8.463830947875977, 8.853914260864258, 9.243998527526855, 9.634081840515137, 10.024166107177734, 10.414249420166016]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 6.0, 9.0, 7.0, 18.0, 15.0, 35.0, 32.0, 49.0, 86.0, 114.0, 158.0, 251.0, 413.0, 572.0, 942.0, 1474.0, 2598.0, 4556.0, 8723.0, 16896.0, 35006.0, 83003.0, 213295.0, 378097.0, 172621.0, 67811.0, 29722.0, 14442.0, 7413.0, 4053.0, 2336.0, 1391.0, 861.0, 555.0, 329.0, 210.0, 148.0, 89.0, 50.0, 54.0, 33.0, 31.0, 16.0, 9.0, 14.0, 1.0, 6.0, 1.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.38671875, -5.20343017578125, -5.0201416015625, -4.83685302734375, -4.653564453125, -4.47027587890625, -4.2869873046875, -4.10369873046875, -3.92041015625, -3.73712158203125, -3.5538330078125, -3.37054443359375, -3.187255859375, -3.00396728515625, -2.8206787109375, -2.63739013671875, -2.4541015625, -2.27081298828125, -2.0875244140625, -1.90423583984375, -1.720947265625, -1.53765869140625, -1.3543701171875, -1.17108154296875, -0.98779296875, -0.80450439453125, -0.6212158203125, -0.43792724609375, -0.254638671875, -0.07135009765625, 0.1119384765625, 0.29522705078125, 0.478515625, 0.66180419921875, 0.8450927734375, 1.02838134765625, 1.211669921875, 1.39495849609375, 1.5782470703125, 1.76153564453125, 1.94482421875, 2.12811279296875, 2.3114013671875, 2.49468994140625, 2.677978515625, 2.86126708984375, 3.0445556640625, 3.22784423828125, 3.4111328125, 3.59442138671875, 3.7777099609375, 3.96099853515625, 4.144287109375, 4.32757568359375, 4.5108642578125, 4.69415283203125, 4.87744140625, 5.06072998046875, 5.2440185546875, 5.42730712890625, 5.610595703125, 5.79388427734375, 5.9771728515625, 6.16046142578125, 6.34375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 8.0, 5.0, 8.0, 16.0, 10.0, 20.0, 24.0, 17.0, 23.0, 29.0, 24.0, 26.0, 41.0, 35.0, 40.0, 48.0, 50.0, 45.0, 52.0, 43.0, 42.0, 49.0, 23.0, 58.0, 28.0, 42.0, 32.0, 24.0, 15.0, 14.0, 12.0, 21.0, 17.0, 16.0, 16.0, 5.0, 5.0, 10.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.77734375, -2.69464111328125, -2.6119384765625, -2.52923583984375, -2.446533203125, -2.36383056640625, -2.2811279296875, -2.19842529296875, -2.11572265625, -2.03302001953125, -1.9503173828125, -1.86761474609375, -1.784912109375, -1.70220947265625, -1.6195068359375, -1.53680419921875, -1.4541015625, -1.37139892578125, -1.2886962890625, -1.20599365234375, -1.123291015625, -1.04058837890625, -0.9578857421875, -0.87518310546875, -0.79248046875, -0.70977783203125, -0.6270751953125, -0.54437255859375, -0.461669921875, -0.37896728515625, -0.2962646484375, -0.21356201171875, -0.130859375, -0.04815673828125, 0.0345458984375, 0.11724853515625, 0.199951171875, 0.28265380859375, 0.3653564453125, 0.44805908203125, 0.53076171875, 0.61346435546875, 0.6961669921875, 0.77886962890625, 0.861572265625, 0.94427490234375, 1.0269775390625, 1.10968017578125, 1.1923828125, 1.27508544921875, 1.3577880859375, 1.44049072265625, 1.523193359375, 1.60589599609375, 1.6885986328125, 1.77130126953125, 1.85400390625, 1.93670654296875, 2.0194091796875, 2.10211181640625, 2.184814453125, 2.26751708984375, 2.3502197265625, 2.43292236328125, 2.515625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 2.0, 4.0, 4.0, 3.0, 11.0, 3.0, 13.0, 17.0, 26.0, 29.0, 46.0, 63.0, 98.0, 132.0, 219.0, 328.0, 686.0, 1394.0, 4937.0, 35607.0, 663369.0, 316307.0, 19378.0, 3384.0, 1123.0, 544.0, 279.0, 166.0, 110.0, 66.0, 49.0, 44.0, 24.0, 29.0, 14.0, 10.0, 5.0, 8.0, 10.0, 3.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.8359375, -15.3057861328125, -14.775634765625, -14.2454833984375, -13.71533203125, -13.1851806640625, -12.655029296875, -12.1248779296875, -11.5947265625, -11.0645751953125, -10.534423828125, -10.0042724609375, -9.47412109375, -8.9439697265625, -8.413818359375, -7.8836669921875, -7.353515625, -6.8233642578125, -6.293212890625, -5.7630615234375, -5.23291015625, -4.7027587890625, -4.172607421875, -3.6424560546875, -3.1123046875, -2.5821533203125, -2.052001953125, -1.5218505859375, -0.99169921875, -0.4615478515625, 0.068603515625, 0.5987548828125, 1.12890625, 1.6590576171875, 2.189208984375, 2.7193603515625, 3.24951171875, 3.7796630859375, 4.309814453125, 4.8399658203125, 5.3701171875, 5.9002685546875, 6.430419921875, 6.9605712890625, 7.49072265625, 8.0208740234375, 8.551025390625, 9.0811767578125, 9.611328125, 10.1414794921875, 10.671630859375, 11.2017822265625, 11.73193359375, 12.2620849609375, 12.792236328125, 13.3223876953125, 13.8525390625, 14.3826904296875, 14.912841796875, 15.4429931640625, 15.97314453125, 16.5032958984375, 17.033447265625, 17.5635986328125, 18.09375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 8.0, 11.0, 23.0, 19.0, 22.0, 36.0, 36.0, 39.0, 54.0, 51.0, 62.0, 74.0, 69.0, 46.0, 63.0, 65.0, 51.0, 54.0, 47.0, 34.0, 25.0, 24.0, 18.0, 13.0, 10.0, 9.0, 9.0, 3.0, 2.0, 10.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.359375, -16.82177734375, -16.2841796875, -15.74658203125, -15.208984375, -14.67138671875, -14.1337890625, -13.59619140625, -13.05859375, -12.52099609375, -11.9833984375, -11.44580078125, -10.908203125, -10.37060546875, -9.8330078125, -9.29541015625, -8.7578125, -8.22021484375, -7.6826171875, -7.14501953125, -6.607421875, -6.06982421875, -5.5322265625, -4.99462890625, -4.45703125, -3.91943359375, -3.3818359375, -2.84423828125, -2.306640625, -1.76904296875, -1.2314453125, -0.69384765625, -0.15625, 0.38134765625, 0.9189453125, 1.45654296875, 1.994140625, 2.53173828125, 3.0693359375, 3.60693359375, 4.14453125, 4.68212890625, 5.2197265625, 5.75732421875, 6.294921875, 6.83251953125, 7.3701171875, 7.90771484375, 8.4453125, 8.98291015625, 9.5205078125, 10.05810546875, 10.595703125, 11.13330078125, 11.6708984375, 12.20849609375, 12.74609375, 13.28369140625, 13.8212890625, 14.35888671875, 14.896484375, 15.43408203125, 15.9716796875, 16.50927734375, 17.046875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 8.0, 8.0, 12.0, 16.0, 11.0, 21.0, 27.0, 36.0, 55.0, 78.0, 109.0, 154.0, 222.0, 327.0, 479.0, 773.0, 1245.0, 2421.0, 5155.0, 15474.0, 95494.0, 802301.0, 97223.0, 15644.0, 5186.0, 2467.0, 1278.0, 781.0, 459.0, 345.0, 211.0, 154.0, 97.0, 82.0, 52.0, 44.0, 26.0, 17.0, 14.0, 18.0, 16.0, 6.0, 3.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.6484375, -6.45574951171875, -6.2630615234375, -6.07037353515625, -5.877685546875, -5.68499755859375, -5.4923095703125, -5.29962158203125, -5.10693359375, -4.91424560546875, -4.7215576171875, -4.52886962890625, -4.336181640625, -4.14349365234375, -3.9508056640625, -3.75811767578125, -3.5654296875, -3.37274169921875, -3.1800537109375, -2.98736572265625, -2.794677734375, -2.60198974609375, -2.4093017578125, -2.21661376953125, -2.02392578125, -1.83123779296875, -1.6385498046875, -1.44586181640625, -1.253173828125, -1.06048583984375, -0.8677978515625, -0.67510986328125, -0.482421875, -0.28973388671875, -0.0970458984375, 0.09564208984375, 0.288330078125, 0.48101806640625, 0.6737060546875, 0.86639404296875, 1.05908203125, 1.25177001953125, 1.4444580078125, 1.63714599609375, 1.829833984375, 2.02252197265625, 2.2152099609375, 2.40789794921875, 2.6005859375, 2.79327392578125, 2.9859619140625, 3.17864990234375, 3.371337890625, 3.56402587890625, 3.7567138671875, 3.94940185546875, 4.14208984375, 4.33477783203125, 4.5274658203125, 4.72015380859375, 4.912841796875, 5.10552978515625, 5.2982177734375, 5.49090576171875, 5.68359375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 10.0, 17.0, 34.0, 68.0, 121.0, 310.0, 213.0, 106.0, 62.0, 25.0, 13.0, 10.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006785392761230469, -0.0006488487124443054, -0.000619158148765564, -0.0005894675850868225, -0.0005597770214080811, -0.0005300864577293396, -0.0005003958940505981, -0.0004707053303718567, -0.00044101476669311523, -0.0004113242030143738, -0.0003816336393356323, -0.00035194307565689087, -0.0003222525119781494, -0.00029256194829940796, -0.0002628713846206665, -0.00023318082094192505, -0.0002034902572631836, -0.00017379969358444214, -0.00014410912990570068, -0.00011441856622695923, -8.472800254821777e-05, -5.503743886947632e-05, -2.5346875190734863e-05, 4.343688488006592e-06, 3.403425216674805e-05, 6.37248158454895e-05, 9.341537952423096e-05, 0.0001231059432029724, 0.00015279650688171387, 0.00018248707056045532, 0.00021217763423919678, 0.00024186819791793823, 0.0002715587615966797, 0.00030124932527542114, 0.0003309398889541626, 0.00036063045263290405, 0.0003903210163116455, 0.00042001157999038696, 0.0004497021436691284, 0.0004793927073478699, 0.0005090832710266113, 0.0005387738347053528, 0.0005684643983840942, 0.0005981549620628357, 0.0006278455257415771, 0.0006575360894203186, 0.0006872266530990601, 0.0007169172167778015, 0.000746607780456543, 0.0007762983441352844, 0.0008059889078140259, 0.0008356794714927673, 0.0008653700351715088, 0.0008950605988502502, 0.0009247511625289917, 0.0009544417262077332, 0.0009841322898864746, 0.001013822853565216, 0.0010435134172439575, 0.001073203980922699, 0.0011028945446014404, 0.0011325851082801819, 0.0011622756719589233, 0.0011919662356376648, 0.0012216567993164062]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 6.0, 9.0, 16.0, 26.0, 59.0, 103.0, 222.0, 637.0, 2879.0, 74553.0, 960243.0, 7950.0, 1200.0, 380.0, 126.0, 48.0, 31.0, 22.0, 15.0, 8.0, 6.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.625, -16.014404296875, -15.40380859375, -14.793212890625, -14.1826171875, -13.572021484375, -12.96142578125, -12.350830078125, -11.740234375, -11.129638671875, -10.51904296875, -9.908447265625, -9.2978515625, -8.687255859375, -8.07666015625, -7.466064453125, -6.85546875, -6.244873046875, -5.63427734375, -5.023681640625, -4.4130859375, -3.802490234375, -3.19189453125, -2.581298828125, -1.970703125, -1.360107421875, -0.74951171875, -0.138916015625, 0.4716796875, 1.082275390625, 1.69287109375, 2.303466796875, 2.9140625, 3.524658203125, 4.13525390625, 4.745849609375, 5.3564453125, 5.967041015625, 6.57763671875, 7.188232421875, 7.798828125, 8.409423828125, 9.02001953125, 9.630615234375, 10.2412109375, 10.851806640625, 11.46240234375, 12.072998046875, 12.68359375, 13.294189453125, 13.90478515625, 14.515380859375, 15.1259765625, 15.736572265625, 16.34716796875, 16.957763671875, 17.568359375, 18.178955078125, 18.78955078125, 19.400146484375, 20.0107421875, 20.621337890625, 21.23193359375, 21.842529296875, 22.453125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 4.0, 5.0, 5.0, 4.0, 9.0, 10.0, 6.0, 16.0, 30.0, 50.0, 104.0, 218.0, 273.0, 121.0, 54.0, 38.0, 20.0, 7.0, 9.0, 4.0, 8.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-12.984375, -12.5399169921875, -12.095458984375, -11.6510009765625, -11.20654296875, -10.7620849609375, -10.317626953125, -9.8731689453125, -9.4287109375, -8.9842529296875, -8.539794921875, -8.0953369140625, -7.65087890625, -7.2064208984375, -6.761962890625, -6.3175048828125, -5.873046875, -5.4285888671875, -4.984130859375, -4.5396728515625, -4.09521484375, -3.6507568359375, -3.206298828125, -2.7618408203125, -2.3173828125, -1.8729248046875, -1.428466796875, -0.9840087890625, -0.53955078125, -0.0950927734375, 0.349365234375, 0.7938232421875, 1.23828125, 1.6827392578125, 2.127197265625, 2.5716552734375, 3.01611328125, 3.4605712890625, 3.905029296875, 4.3494873046875, 4.7939453125, 5.2384033203125, 5.682861328125, 6.1273193359375, 6.57177734375, 7.0162353515625, 7.460693359375, 7.9051513671875, 8.349609375, 8.7940673828125, 9.238525390625, 9.6829833984375, 10.12744140625, 10.5718994140625, 11.016357421875, 11.4608154296875, 11.9052734375, 12.3497314453125, 12.794189453125, 13.2386474609375, 13.68310546875, 14.1275634765625, 14.572021484375, 15.0164794921875, 15.4609375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 7.0, 13.0, 39.0, 81.0, 201.0, 280.0, 211.0, 73.0, 46.0, 22.0, 13.0, 6.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-224.6123809814453, -220.06549072265625, -215.5186004638672, -210.97171020507812, -206.42481994628906, -201.8779296875, -197.33103942871094, -192.78414916992188, -188.2372589111328, -183.69036865234375, -179.1434783935547, -174.59658813476562, -170.04969787597656, -165.5028076171875, -160.95591735839844, -156.40902709960938, -151.8621368408203, -147.31524658203125, -142.7683563232422, -138.22146606445312, -133.67457580566406, -129.127685546875, -124.58079528808594, -120.03390502929688, -115.48701477050781, -110.94012451171875, -106.39323425292969, -101.84634399414062, -97.29945373535156, -92.7525634765625, -88.20567321777344, -83.65878295898438, -79.11188507080078, -74.56499481201172, -70.01810455322266, -65.4712142944336, -60.92432403564453, -56.37743377685547, -51.830543518066406, -47.283653259277344, -42.73676300048828, -38.18987274169922, -33.642982482910156, -29.096092224121094, -24.54920196533203, -20.00231170654297, -15.455421447753906, -10.908531188964844, -6.361640930175781, -1.8147506713867188, 2.7321395874023438, 7.279029846191406, 11.825920104980469, 16.37281036376953, 20.919700622558594, 25.466590881347656, 30.01348114013672, 34.56037139892578, 39.107261657714844, 43.654151916503906, 48.20104217529297, 52.74793243408203, 57.294822692871094, 61.841712951660156, 66.38860321044922]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 6.0, 4.0, 8.0, 8.0, 11.0, 7.0, 14.0, 19.0, 25.0, 23.0, 27.0, 26.0, 36.0, 31.0, 52.0, 52.0, 38.0, 43.0, 48.0, 57.0, 62.0, 41.0, 49.0, 46.0, 29.0, 30.0, 28.0, 27.0, 30.0, 27.0, 24.0, 12.0, 11.0, 16.0, 15.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-89.87799835205078, -86.97004699707031, -84.06209564208984, -81.15414428710938, -78.24618530273438, -75.3382339477539, -72.43028259277344, -69.52233123779297, -66.6143798828125, -63.70642852783203, -60.7984733581543, -57.89052200317383, -54.982566833496094, -52.074615478515625, -49.166664123535156, -46.25871276855469, -43.35075378417969, -40.44280242919922, -37.534847259521484, -34.626895904541016, -31.718942642211914, -28.810989379882812, -25.903038024902344, -22.995084762573242, -20.08713150024414, -17.17917823791504, -14.271225929260254, -11.363273620605469, -8.455320358276367, -5.547367095947266, -2.639415740966797, 0.2685375213623047, 3.1764984130859375, 6.084451198577881, 8.992403984069824, 11.90035629272461, 14.808309555053711, 17.716262817382812, 20.62421417236328, 23.532167434692383, 26.440120697021484, 29.348073959350586, 32.25602722167969, 35.163978576660156, 38.071929931640625, 40.97988510131836, 43.88783645629883, 46.79579162597656, 49.70374298095703, 52.6116943359375, 55.519649505615234, 58.4276008605957, 61.33555603027344, 64.2435073852539, 67.15145874023438, 70.05941009521484, 72.96736145019531, 75.87531280517578, 78.78326416015625, 81.69122314453125, 84.59917449951172, 87.50712585449219, 90.41507720947266, 93.32302856445312, 96.23098754882812]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 5.0, 3.0, 6.0, 7.0, 12.0, 21.0, 15.0, 30.0, 41.0, 74.0, 127.0, 197.0, 421.0, 879.0, 2121.0, 5339.0, 16560.0, 80337.0, 3843477.0, 205344.0, 26553.0, 7613.0, 2767.0, 1115.0, 540.0, 262.0, 168.0, 76.0, 56.0, 32.0, 24.0, 22.0, 15.0, 6.0, 8.0, 4.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.2734375, -14.791259765625, -14.30908203125, -13.826904296875, -13.3447265625, -12.862548828125, -12.38037109375, -11.898193359375, -11.416015625, -10.933837890625, -10.45166015625, -9.969482421875, -9.4873046875, -9.005126953125, -8.52294921875, -8.040771484375, -7.55859375, -7.076416015625, -6.59423828125, -6.112060546875, -5.6298828125, -5.147705078125, -4.66552734375, -4.183349609375, -3.701171875, -3.218994140625, -2.73681640625, -2.254638671875, -1.7724609375, -1.290283203125, -0.80810546875, -0.325927734375, 0.15625, 0.638427734375, 1.12060546875, 1.602783203125, 2.0849609375, 2.567138671875, 3.04931640625, 3.531494140625, 4.013671875, 4.495849609375, 4.97802734375, 5.460205078125, 5.9423828125, 6.424560546875, 6.90673828125, 7.388916015625, 7.87109375, 8.353271484375, 8.83544921875, 9.317626953125, 9.7998046875, 10.281982421875, 10.76416015625, 11.246337890625, 11.728515625, 12.210693359375, 12.69287109375, 13.175048828125, 13.6572265625, 14.139404296875, 14.62158203125, 15.103759765625, 15.5859375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 9.0, 3.0, 8.0, 11.0, 6.0, 15.0, 20.0, 20.0, 23.0, 32.0, 24.0, 35.0, 40.0, 44.0, 49.0, 36.0, 60.0, 54.0, 46.0, 43.0, 61.0, 61.0, 43.0, 39.0, 39.0, 36.0, 31.0, 24.0, 25.0, 14.0, 13.0, 12.0, 9.0, 6.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.33984375, -3.2119140625, -3.083984375, -2.9560546875, -2.828125, -2.7001953125, -2.572265625, -2.4443359375, -2.31640625, -2.1884765625, -2.060546875, -1.9326171875, -1.8046875, -1.6767578125, -1.548828125, -1.4208984375, -1.29296875, -1.1650390625, -1.037109375, -0.9091796875, -0.78125, -0.6533203125, -0.525390625, -0.3974609375, -0.26953125, -0.1416015625, -0.013671875, 0.1142578125, 0.2421875, 0.3701171875, 0.498046875, 0.6259765625, 0.75390625, 0.8818359375, 1.009765625, 1.1376953125, 1.265625, 1.3935546875, 1.521484375, 1.6494140625, 1.77734375, 1.9052734375, 2.033203125, 2.1611328125, 2.2890625, 2.4169921875, 2.544921875, 2.6728515625, 2.80078125, 2.9287109375, 3.056640625, 3.1845703125, 3.3125, 3.4404296875, 3.568359375, 3.6962890625, 3.82421875, 3.9521484375, 4.080078125, 4.2080078125, 4.3359375, 4.4638671875, 4.591796875, 4.7197265625, 4.84765625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 8.0, 21.0, 40.0, 45.0, 100.0, 200.0, 400.0, 926.0, 2838.0, 12160.0, 156313.0, 3969666.0, 42349.0, 6257.0, 1677.0, 640.0, 312.0, 136.0, 80.0, 48.0, 24.0, 18.0, 13.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.796875, -17.09326171875, -16.3896484375, -15.68603515625, -14.982421875, -14.27880859375, -13.5751953125, -12.87158203125, -12.16796875, -11.46435546875, -10.7607421875, -10.05712890625, -9.353515625, -8.64990234375, -7.9462890625, -7.24267578125, -6.5390625, -5.83544921875, -5.1318359375, -4.42822265625, -3.724609375, -3.02099609375, -2.3173828125, -1.61376953125, -0.91015625, -0.20654296875, 0.4970703125, 1.20068359375, 1.904296875, 2.60791015625, 3.3115234375, 4.01513671875, 4.71875, 5.42236328125, 6.1259765625, 6.82958984375, 7.533203125, 8.23681640625, 8.9404296875, 9.64404296875, 10.34765625, 11.05126953125, 11.7548828125, 12.45849609375, 13.162109375, 13.86572265625, 14.5693359375, 15.27294921875, 15.9765625, 16.68017578125, 17.3837890625, 18.08740234375, 18.791015625, 19.49462890625, 20.1982421875, 20.90185546875, 21.60546875, 22.30908203125, 23.0126953125, 23.71630859375, 24.419921875, 25.12353515625, 25.8271484375, 26.53076171875, 27.234375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 0.0, 1.0, 4.0, 8.0, 8.0, 12.0, 20.0, 32.0, 50.0, 102.0, 282.0, 2881.0, 408.0, 99.0, 54.0, 38.0, 23.0, 14.0, 12.0, 4.0, 4.0, 5.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.703125, -11.3546142578125, -11.006103515625, -10.6575927734375, -10.30908203125, -9.9605712890625, -9.612060546875, -9.2635498046875, -8.9150390625, -8.5665283203125, -8.218017578125, -7.8695068359375, -7.52099609375, -7.1724853515625, -6.823974609375, -6.4754638671875, -6.126953125, -5.7784423828125, -5.429931640625, -5.0814208984375, -4.73291015625, -4.3843994140625, -4.035888671875, -3.6873779296875, -3.3388671875, -2.9903564453125, -2.641845703125, -2.2933349609375, -1.94482421875, -1.5963134765625, -1.247802734375, -0.8992919921875, -0.55078125, -0.2022705078125, 0.146240234375, 0.4947509765625, 0.84326171875, 1.1917724609375, 1.540283203125, 1.8887939453125, 2.2373046875, 2.5858154296875, 2.934326171875, 3.2828369140625, 3.63134765625, 3.9798583984375, 4.328369140625, 4.6768798828125, 5.025390625, 5.3739013671875, 5.722412109375, 6.0709228515625, 6.41943359375, 6.7679443359375, 7.116455078125, 7.4649658203125, 7.8134765625, 8.1619873046875, 8.510498046875, 8.8590087890625, 9.20751953125, 9.5560302734375, 9.904541015625, 10.2530517578125, 10.6015625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 0.0, 3.0, 3.0, 8.0, 27.0, 39.0, 128.0, 309.0, 287.0, 113.0, 45.0, 19.0, 10.0, 9.0, 5.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.68382263183594, -64.70262908935547, -62.721431732177734, -60.740234375, -58.759037017822266, -56.77783966064453, -54.79664611816406, -52.81544876098633, -50.834251403808594, -48.85305404663086, -46.87186050415039, -44.890663146972656, -42.90946578979492, -40.92826843261719, -38.94707489013672, -36.965877532958984, -34.984683990478516, -33.00348663330078, -31.02229118347168, -29.041095733642578, -27.059898376464844, -25.078702926635742, -23.09750747680664, -21.116310119628906, -19.135114669799805, -17.153919219970703, -15.172721862792969, -13.191526412963867, -11.21033000946045, -9.229133605957031, -7.24793815612793, -5.266741752624512, -3.2855491638183594, -1.3043529987335205, 0.6768431663513184, 2.658039093017578, 4.639235496520996, 6.620431900024414, 8.601627349853516, 10.582823753356934, 12.564020156860352, 14.54521656036377, 16.526412963867188, 18.50760841369629, 20.48880386352539, 22.470001220703125, 24.451196670532227, 26.432392120361328, 28.413589477539062, 30.394784927368164, 32.375980377197266, 34.357177734375, 36.338375091552734, 38.31957244873047, 40.30076599121094, 42.28196334838867, 44.263160705566406, 46.24435806274414, 48.22555160522461, 50.206748962402344, 52.18794631958008, 54.16914367675781, 56.15033721923828, 58.131534576416016, 60.112728118896484]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 4.0, 11.0, 20.0, 24.0, 27.0, 30.0, 26.0, 39.0, 39.0, 51.0, 46.0, 62.0, 72.0, 51.0, 55.0, 54.0, 64.0, 48.0, 42.0, 39.0, 35.0, 36.0, 40.0, 22.0, 8.0, 13.0, 12.0, 13.0, 7.0, 3.0, 4.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.63614273071289, -25.617835998535156, -24.599529266357422, -23.581222534179688, -22.562915802001953, -21.54460906982422, -20.526302337646484, -19.50799560546875, -18.489688873291016, -17.47138214111328, -16.453075408935547, -15.434768676757812, -14.416461944580078, -13.398155212402344, -12.37984848022461, -11.361541748046875, -10.34323501586914, -9.324928283691406, -8.306621551513672, -7.2883148193359375, -6.270008087158203, -5.251701354980469, -4.233394622802734, -3.215087890625, -2.1967811584472656, -1.1784744262695312, -0.16016769409179688, 0.8581390380859375, 1.8764457702636719, 2.8947525024414062, 3.9130592346191406, 4.931365966796875, 5.949676513671875, 6.967983245849609, 7.986289978027344, 9.004596710205078, 10.022903442382812, 11.041210174560547, 12.059516906738281, 13.077823638916016, 14.09613037109375, 15.114437103271484, 16.13274383544922, 17.151050567626953, 18.169357299804688, 19.187664031982422, 20.205970764160156, 21.22427749633789, 22.242584228515625, 23.26089096069336, 24.279197692871094, 25.297504425048828, 26.315811157226562, 27.334117889404297, 28.35242462158203, 29.370731353759766, 30.3890380859375, 31.407344818115234, 32.42565155029297, 33.4439582824707, 34.46226501464844, 35.48057174682617, 36.498878479003906, 37.51718521118164, 38.535491943359375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 5.0, 9.0, 11.0, 15.0, 21.0, 36.0, 43.0, 64.0, 113.0, 167.0, 288.0, 472.0, 819.0, 1461.0, 2700.0, 5369.0, 10657.0, 23202.0, 55178.0, 146787.0, 349735.0, 274231.0, 102258.0, 40056.0, 17494.0, 8120.0, 4130.0, 2182.0, 1220.0, 640.0, 398.0, 242.0, 152.0, 95.0, 59.0, 42.0, 18.0, 24.0, 12.0, 10.0, 10.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.046875, -6.8023681640625, -6.557861328125, -6.3133544921875, -6.06884765625, -5.8243408203125, -5.579833984375, -5.3353271484375, -5.0908203125, -4.8463134765625, -4.601806640625, -4.3572998046875, -4.11279296875, -3.8682861328125, -3.623779296875, -3.3792724609375, -3.134765625, -2.8902587890625, -2.645751953125, -2.4012451171875, -2.15673828125, -1.9122314453125, -1.667724609375, -1.4232177734375, -1.1787109375, -0.9342041015625, -0.689697265625, -0.4451904296875, -0.20068359375, 0.0438232421875, 0.288330078125, 0.5328369140625, 0.77734375, 1.0218505859375, 1.266357421875, 1.5108642578125, 1.75537109375, 1.9998779296875, 2.244384765625, 2.4888916015625, 2.7333984375, 2.9779052734375, 3.222412109375, 3.4669189453125, 3.71142578125, 3.9559326171875, 4.200439453125, 4.4449462890625, 4.689453125, 4.9339599609375, 5.178466796875, 5.4229736328125, 5.66748046875, 5.9119873046875, 6.156494140625, 6.4010009765625, 6.6455078125, 6.8900146484375, 7.134521484375, 7.3790283203125, 7.62353515625, 7.8680419921875, 8.112548828125, 8.3570556640625, 8.6015625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 3.0, 7.0, 5.0, 6.0, 7.0, 10.0, 19.0, 21.0, 16.0, 19.0, 23.0, 25.0, 41.0, 40.0, 44.0, 39.0, 47.0, 54.0, 43.0, 48.0, 50.0, 51.0, 48.0, 50.0, 45.0, 28.0, 45.0, 31.0, 21.0, 18.0, 13.0, 23.0, 15.0, 10.0, 8.0, 7.0, 7.0, 3.0, 5.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.265625, -3.1422119140625, -3.018798828125, -2.8953857421875, -2.77197265625, -2.6485595703125, -2.525146484375, -2.4017333984375, -2.2783203125, -2.1549072265625, -2.031494140625, -1.9080810546875, -1.78466796875, -1.6612548828125, -1.537841796875, -1.4144287109375, -1.291015625, -1.1676025390625, -1.044189453125, -0.9207763671875, -0.79736328125, -0.6739501953125, -0.550537109375, -0.4271240234375, -0.3037109375, -0.1802978515625, -0.056884765625, 0.0665283203125, 0.18994140625, 0.3133544921875, 0.436767578125, 0.5601806640625, 0.68359375, 0.8070068359375, 0.930419921875, 1.0538330078125, 1.17724609375, 1.3006591796875, 1.424072265625, 1.5474853515625, 1.6708984375, 1.7943115234375, 1.917724609375, 2.0411376953125, 2.16455078125, 2.2879638671875, 2.411376953125, 2.5347900390625, 2.658203125, 2.7816162109375, 2.905029296875, 3.0284423828125, 3.15185546875, 3.2752685546875, 3.398681640625, 3.5220947265625, 3.6455078125, 3.7689208984375, 3.892333984375, 4.0157470703125, 4.13916015625, 4.2625732421875, 4.385986328125, 4.5093994140625, 4.6328125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 7.0, 5.0, 11.0, 18.0, 21.0, 23.0, 36.0, 45.0, 76.0, 108.0, 162.0, 243.0, 356.0, 635.0, 1313.0, 4431.0, 21516.0, 181453.0, 719941.0, 98648.0, 13779.0, 3193.0, 1097.0, 483.0, 287.0, 195.0, 126.0, 92.0, 73.0, 39.0, 43.0, 17.0, 14.0, 20.0, 13.0, 13.0, 5.0, 3.0, 2.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.828125, -16.21337890625, -15.5986328125, -14.98388671875, -14.369140625, -13.75439453125, -13.1396484375, -12.52490234375, -11.91015625, -11.29541015625, -10.6806640625, -10.06591796875, -9.451171875, -8.83642578125, -8.2216796875, -7.60693359375, -6.9921875, -6.37744140625, -5.7626953125, -5.14794921875, -4.533203125, -3.91845703125, -3.3037109375, -2.68896484375, -2.07421875, -1.45947265625, -0.8447265625, -0.22998046875, 0.384765625, 0.99951171875, 1.6142578125, 2.22900390625, 2.84375, 3.45849609375, 4.0732421875, 4.68798828125, 5.302734375, 5.91748046875, 6.5322265625, 7.14697265625, 7.76171875, 8.37646484375, 8.9912109375, 9.60595703125, 10.220703125, 10.83544921875, 11.4501953125, 12.06494140625, 12.6796875, 13.29443359375, 13.9091796875, 14.52392578125, 15.138671875, 15.75341796875, 16.3681640625, 16.98291015625, 17.59765625, 18.21240234375, 18.8271484375, 19.44189453125, 20.056640625, 20.67138671875, 21.2861328125, 21.90087890625, 22.515625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 7.0, 5.0, 12.0, 11.0, 11.0, 4.0, 16.0, 17.0, 27.0, 33.0, 32.0, 49.0, 35.0, 48.0, 36.0, 42.0, 39.0, 49.0, 56.0, 40.0, 48.0, 49.0, 39.0, 37.0, 36.0, 26.0, 35.0, 18.0, 19.0, 27.0, 19.0, 13.0, 16.0, 12.0, 12.0, 4.0, 4.0, 5.0, 5.0, 3.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.703125, -20.998779296875, -20.29443359375, -19.590087890625, -18.8857421875, -18.181396484375, -17.47705078125, -16.772705078125, -16.068359375, -15.364013671875, -14.65966796875, -13.955322265625, -13.2509765625, -12.546630859375, -11.84228515625, -11.137939453125, -10.43359375, -9.729248046875, -9.02490234375, -8.320556640625, -7.6162109375, -6.911865234375, -6.20751953125, -5.503173828125, -4.798828125, -4.094482421875, -3.39013671875, -2.685791015625, -1.9814453125, -1.277099609375, -0.57275390625, 0.131591796875, 0.8359375, 1.540283203125, 2.24462890625, 2.948974609375, 3.6533203125, 4.357666015625, 5.06201171875, 5.766357421875, 6.470703125, 7.175048828125, 7.87939453125, 8.583740234375, 9.2880859375, 9.992431640625, 10.69677734375, 11.401123046875, 12.10546875, 12.809814453125, 13.51416015625, 14.218505859375, 14.9228515625, 15.627197265625, 16.33154296875, 17.035888671875, 17.740234375, 18.444580078125, 19.14892578125, 19.853271484375, 20.5576171875, 21.261962890625, 21.96630859375, 22.670654296875, 23.375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 8.0, 18.0, 10.0, 17.0, 24.0, 36.0, 53.0, 78.0, 148.0, 251.0, 515.0, 1141.0, 3327.0, 14451.0, 169018.0, 787019.0, 60153.0, 8121.0, 2255.0, 893.0, 430.0, 218.0, 130.0, 85.0, 58.0, 21.0, 14.0, 18.0, 7.0, 11.0, 3.0, 6.0, 6.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.1953125, -10.8953857421875, -10.595458984375, -10.2955322265625, -9.99560546875, -9.6956787109375, -9.395751953125, -9.0958251953125, -8.7958984375, -8.4959716796875, -8.196044921875, -7.8961181640625, -7.59619140625, -7.2962646484375, -6.996337890625, -6.6964111328125, -6.396484375, -6.0965576171875, -5.796630859375, -5.4967041015625, -5.19677734375, -4.8968505859375, -4.596923828125, -4.2969970703125, -3.9970703125, -3.6971435546875, -3.397216796875, -3.0972900390625, -2.79736328125, -2.4974365234375, -2.197509765625, -1.8975830078125, -1.59765625, -1.2977294921875, -0.997802734375, -0.6978759765625, -0.39794921875, -0.0980224609375, 0.201904296875, 0.5018310546875, 0.8017578125, 1.1016845703125, 1.401611328125, 1.7015380859375, 2.00146484375, 2.3013916015625, 2.601318359375, 2.9012451171875, 3.201171875, 3.5010986328125, 3.801025390625, 4.1009521484375, 4.40087890625, 4.7008056640625, 5.000732421875, 5.3006591796875, 5.6005859375, 5.9005126953125, 6.200439453125, 6.5003662109375, 6.80029296875, 7.1002197265625, 7.400146484375, 7.7000732421875, 8.0]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 8.0, 16.0, 8.0, 26.0, 24.0, 53.0, 51.0, 78.0, 105.0, 116.0, 118.0, 124.0, 76.0, 58.0, 51.0, 21.0, 23.0, 16.0, 9.0, 7.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000606536865234375, -0.0005881339311599731, -0.0005697309970855713, -0.0005513280630111694, -0.0005329251289367676, -0.0005145221948623657, -0.0004961192607879639, -0.000477716326713562, -0.00045931339263916016, -0.0004409104585647583, -0.00042250752449035645, -0.0004041045904159546, -0.00038570165634155273, -0.0003672987222671509, -0.000348895788192749, -0.00033049285411834717, -0.0003120899200439453, -0.00029368698596954346, -0.0002752840518951416, -0.00025688111782073975, -0.0002384781837463379, -0.00022007524967193604, -0.00020167231559753418, -0.00018326938152313232, -0.00016486644744873047, -0.0001464635133743286, -0.00012806057929992676, -0.0001096576452255249, -9.125471115112305e-05, -7.285177707672119e-05, -5.4448843002319336e-05, -3.604590892791748e-05, -1.7642974853515625e-05, 7.599592208862305e-07, 1.9162893295288086e-05, 3.756582736968994e-05, 5.59687614440918e-05, 7.437169551849365e-05, 9.277462959289551e-05, 0.00011117756366729736, 0.00012958049774169922, 0.00014798343181610107, 0.00016638636589050293, 0.00018478929996490479, 0.00020319223403930664, 0.0002215951681137085, 0.00023999810218811035, 0.0002584010362625122, 0.00027680397033691406, 0.0002952069044113159, 0.0003136098384857178, 0.00033201277256011963, 0.0003504157066345215, 0.00036881864070892334, 0.0003872215747833252, 0.00040562450885772705, 0.0004240274429321289, 0.00044243037700653076, 0.0004608333110809326, 0.00047923624515533447, 0.0004976391792297363, 0.0005160421133041382, 0.00053444504737854, 0.0005528479814529419, 0.0005712509155273438]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 8.0, 7.0, 15.0, 13.0, 27.0, 45.0, 85.0, 133.0, 257.0, 597.0, 1684.0, 8046.0, 108104.0, 863805.0, 57547.0, 5727.0, 1353.0, 523.0, 221.0, 113.0, 62.0, 55.0, 30.0, 22.0, 14.0, 7.0, 8.0, 8.0, 6.0, 4.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8125, -12.4605712890625, -12.108642578125, -11.7567138671875, -11.40478515625, -11.0528564453125, -10.700927734375, -10.3489990234375, -9.9970703125, -9.6451416015625, -9.293212890625, -8.9412841796875, -8.58935546875, -8.2374267578125, -7.885498046875, -7.5335693359375, -7.181640625, -6.8297119140625, -6.477783203125, -6.1258544921875, -5.77392578125, -5.4219970703125, -5.070068359375, -4.7181396484375, -4.3662109375, -4.0142822265625, -3.662353515625, -3.3104248046875, -2.95849609375, -2.6065673828125, -2.254638671875, -1.9027099609375, -1.55078125, -1.1988525390625, -0.846923828125, -0.4949951171875, -0.14306640625, 0.2088623046875, 0.560791015625, 0.9127197265625, 1.2646484375, 1.6165771484375, 1.968505859375, 2.3204345703125, 2.67236328125, 3.0242919921875, 3.376220703125, 3.7281494140625, 4.080078125, 4.4320068359375, 4.783935546875, 5.1358642578125, 5.48779296875, 5.8397216796875, 6.191650390625, 6.5435791015625, 6.8955078125, 7.2474365234375, 7.599365234375, 7.9512939453125, 8.30322265625, 8.6551513671875, 9.007080078125, 9.3590087890625, 9.7109375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 2.0, 1.0, 9.0, 7.0, 12.0, 18.0, 32.0, 52.0, 71.0, 139.0, 154.0, 167.0, 105.0, 74.0, 57.0, 38.0, 25.0, 13.0, 8.0, 6.0, 9.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.828125, -17.3709716796875, -16.913818359375, -16.4566650390625, -15.99951171875, -15.5423583984375, -15.085205078125, -14.6280517578125, -14.1708984375, -13.7137451171875, -13.256591796875, -12.7994384765625, -12.34228515625, -11.8851318359375, -11.427978515625, -10.9708251953125, -10.513671875, -10.0565185546875, -9.599365234375, -9.1422119140625, -8.68505859375, -8.2279052734375, -7.770751953125, -7.3135986328125, -6.8564453125, -6.3992919921875, -5.942138671875, -5.4849853515625, -5.02783203125, -4.5706787109375, -4.113525390625, -3.6563720703125, -3.19921875, -2.7420654296875, -2.284912109375, -1.8277587890625, -1.37060546875, -0.9134521484375, -0.456298828125, 0.0008544921875, 0.4580078125, 0.9151611328125, 1.372314453125, 1.8294677734375, 2.28662109375, 2.7437744140625, 3.200927734375, 3.6580810546875, 4.115234375, 4.5723876953125, 5.029541015625, 5.4866943359375, 5.94384765625, 6.4010009765625, 6.858154296875, 7.3153076171875, 7.7724609375, 8.2296142578125, 8.686767578125, 9.1439208984375, 9.60107421875, 10.0582275390625, 10.515380859375, 10.9725341796875, 11.4296875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 10.0, 120.0, 651.0, 189.0, 29.0, 11.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-782.9471435546875, -767.1223754882812, -751.297607421875, -735.4728393554688, -719.6480712890625, -703.8233032226562, -687.99853515625, -672.1737060546875, -656.3489379882812, -640.524169921875, -624.6994018554688, -608.8746337890625, -593.0498657226562, -577.22509765625, -561.4002685546875, -545.5755615234375, -529.7507934570312, -513.926025390625, -498.10125732421875, -482.2764892578125, -466.4516906738281, -450.6269226074219, -434.8021545410156, -418.9773864746094, -403.152587890625, -387.32781982421875, -371.5030517578125, -355.67828369140625, -339.8534851074219, -324.0287170410156, -308.2039489746094, -292.3791809082031, -276.554443359375, -260.72967529296875, -244.90489196777344, -229.0801239013672, -213.25535583496094, -197.43057250976562, -181.60580444335938, -165.78103637695312, -149.95623779296875, -134.1314697265625, -118.30669403076172, -102.48191833496094, -86.65715026855469, -70.8323745727539, -55.007598876953125, -39.182830810546875, -23.358062744140625, -7.533289909362793, 8.291482925415039, 24.116256713867188, 39.9410285949707, 55.76580047607422, 71.590576171875, 87.41534423828125, 103.24011993408203, 119.06489562988281, 134.88966369628906, 150.71444702148438, 166.53921508789062, 182.36398315429688, 198.18875122070312, 214.01351928710938, 229.8383026123047]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 3.0, 3.0, 13.0, 8.0, 5.0, 10.0, 17.0, 13.0, 15.0, 22.0, 32.0, 28.0, 35.0, 32.0, 40.0, 52.0, 51.0, 41.0, 41.0, 47.0, 70.0, 41.0, 41.0, 41.0, 34.0, 39.0, 32.0, 26.0, 29.0, 26.0, 16.0, 11.0, 11.0, 18.0, 11.0, 11.0, 5.0, 8.0, 2.0, 7.0, 4.0, 3.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-122.55804443359375, -118.80497741699219, -115.05191040039062, -111.29884338378906, -107.5457763671875, -103.79270935058594, -100.03964233398438, -96.28657531738281, -92.53350830078125, -88.78044128417969, -85.02737426757812, -81.27430725097656, -77.521240234375, -73.76817321777344, -70.01510620117188, -66.26203918457031, -62.50897979736328, -58.75591278076172, -55.002845764160156, -51.249778747558594, -47.49671173095703, -43.74364471435547, -39.99058151245117, -36.23751449584961, -32.48444747924805, -28.731380462646484, -24.978313446044922, -21.225248336791992, -17.47218132019043, -13.719114303588867, -9.966049194335938, -6.212982177734375, -2.4599151611328125, 1.2931513786315918, 5.046217918395996, 8.799283981323242, 12.552350997924805, 16.305418014526367, 20.058483123779297, 23.81155014038086, 27.564617156982422, 31.317684173583984, 35.07075119018555, 38.823814392089844, 42.576881408691406, 46.32994842529297, 50.08301544189453, 53.836082458496094, 57.589149475097656, 61.34221649169922, 65.09528350830078, 68.84835052490234, 72.6014175415039, 76.35448455810547, 80.1075439453125, 83.86061096191406, 87.61367797851562, 91.36674499511719, 95.11981201171875, 98.87287902832031, 102.62594604492188, 106.37901306152344, 110.132080078125, 113.88514709472656, 117.63821411132812]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 7.0, 2.0, 6.0, 8.0, 10.0, 14.0, 18.0, 45.0, 70.0, 161.0, 264.0, 528.0, 1166.0, 3634.0, 30722.0, 4127958.0, 24026.0, 3431.0, 1122.0, 488.0, 259.0, 143.0, 83.0, 45.0, 25.0, 21.0, 12.0, 8.0, 5.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.0, -26.279296875, -25.55859375, -24.837890625, -24.1171875, -23.396484375, -22.67578125, -21.955078125, -21.234375, -20.513671875, -19.79296875, -19.072265625, -18.3515625, -17.630859375, -16.91015625, -16.189453125, -15.46875, -14.748046875, -14.02734375, -13.306640625, -12.5859375, -11.865234375, -11.14453125, -10.423828125, -9.703125, -8.982421875, -8.26171875, -7.541015625, -6.8203125, -6.099609375, -5.37890625, -4.658203125, -3.9375, -3.216796875, -2.49609375, -1.775390625, -1.0546875, -0.333984375, 0.38671875, 1.107421875, 1.828125, 2.548828125, 3.26953125, 3.990234375, 4.7109375, 5.431640625, 6.15234375, 6.873046875, 7.59375, 8.314453125, 9.03515625, 9.755859375, 10.4765625, 11.197265625, 11.91796875, 12.638671875, 13.359375, 14.080078125, 14.80078125, 15.521484375, 16.2421875, 16.962890625, 17.68359375, 18.404296875, 19.125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 7.0, 6.0, 9.0, 8.0, 16.0, 22.0, 27.0, 27.0, 46.0, 36.0, 54.0, 55.0, 51.0, 57.0, 71.0, 74.0, 70.0, 76.0, 35.0, 45.0, 40.0, 37.0, 30.0, 18.0, 18.0, 18.0, 13.0, 11.0, 7.0, 7.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.703125, -6.4869384765625, -6.270751953125, -6.0545654296875, -5.83837890625, -5.6221923828125, -5.406005859375, -5.1898193359375, -4.9736328125, -4.7574462890625, -4.541259765625, -4.3250732421875, -4.10888671875, -3.8927001953125, -3.676513671875, -3.4603271484375, -3.244140625, -3.0279541015625, -2.811767578125, -2.5955810546875, -2.37939453125, -2.1632080078125, -1.947021484375, -1.7308349609375, -1.5146484375, -1.2984619140625, -1.082275390625, -0.8660888671875, -0.64990234375, -0.4337158203125, -0.217529296875, -0.0013427734375, 0.21484375, 0.4310302734375, 0.647216796875, 0.8634033203125, 1.07958984375, 1.2957763671875, 1.511962890625, 1.7281494140625, 1.9443359375, 2.1605224609375, 2.376708984375, 2.5928955078125, 2.80908203125, 3.0252685546875, 3.241455078125, 3.4576416015625, 3.673828125, 3.8900146484375, 4.106201171875, 4.3223876953125, 4.53857421875, 4.7547607421875, 4.970947265625, 5.1871337890625, 5.4033203125, 5.6195068359375, 5.835693359375, 6.0518798828125, 6.26806640625, 6.4842529296875, 6.700439453125, 6.9166259765625, 7.1328125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 1.0, 2.0, 4.0, 6.0, 4.0, 12.0, 16.0, 16.0, 23.0, 39.0, 47.0, 46.0, 92.0, 155.0, 204.0, 291.0, 468.0, 856.0, 1517.0, 3097.0, 8186.0, 39167.0, 3973079.0, 141854.0, 15548.0, 4704.0, 1974.0, 1070.0, 595.0, 387.0, 227.0, 154.0, 120.0, 77.0, 61.0, 42.0, 37.0, 33.0, 17.0, 10.0, 12.0, 9.0, 4.0, 5.0, 7.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0], "bins": [-12.6875, -12.3323974609375, -11.977294921875, -11.6221923828125, -11.26708984375, -10.9119873046875, -10.556884765625, -10.2017822265625, -9.8466796875, -9.4915771484375, -9.136474609375, -8.7813720703125, -8.42626953125, -8.0711669921875, -7.716064453125, -7.3609619140625, -7.005859375, -6.6507568359375, -6.295654296875, -5.9405517578125, -5.58544921875, -5.2303466796875, -4.875244140625, -4.5201416015625, -4.1650390625, -3.8099365234375, -3.454833984375, -3.0997314453125, -2.74462890625, -2.3895263671875, -2.034423828125, -1.6793212890625, -1.32421875, -0.9691162109375, -0.614013671875, -0.2589111328125, 0.09619140625, 0.4512939453125, 0.806396484375, 1.1614990234375, 1.5166015625, 1.8717041015625, 2.226806640625, 2.5819091796875, 2.93701171875, 3.2921142578125, 3.647216796875, 4.0023193359375, 4.357421875, 4.7125244140625, 5.067626953125, 5.4227294921875, 5.77783203125, 6.1329345703125, 6.488037109375, 6.8431396484375, 7.1982421875, 7.5533447265625, 7.908447265625, 8.2635498046875, 8.61865234375, 8.9737548828125, 9.328857421875, 9.6839599609375, 10.0390625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 11.0, 19.0, 71.0, 3317.0, 513.0, 64.0, 28.0, 18.0, 7.0, 2.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0703125, -2.9234619140625, -2.776611328125, -2.6297607421875, -2.48291015625, -2.3360595703125, -2.189208984375, -2.0423583984375, -1.8955078125, -1.7486572265625, -1.601806640625, -1.4549560546875, -1.30810546875, -1.1612548828125, -1.014404296875, -0.8675537109375, -0.720703125, -0.5738525390625, -0.427001953125, -0.2801513671875, -0.13330078125, 0.0135498046875, 0.160400390625, 0.3072509765625, 0.4541015625, 0.6009521484375, 0.747802734375, 0.8946533203125, 1.04150390625, 1.1883544921875, 1.335205078125, 1.4820556640625, 1.62890625, 1.7757568359375, 1.922607421875, 2.0694580078125, 2.21630859375, 2.3631591796875, 2.510009765625, 2.6568603515625, 2.8037109375, 2.9505615234375, 3.097412109375, 3.2442626953125, 3.39111328125, 3.5379638671875, 3.684814453125, 3.8316650390625, 3.978515625, 4.1253662109375, 4.272216796875, 4.4190673828125, 4.56591796875, 4.7127685546875, 4.859619140625, 5.0064697265625, 5.1533203125, 5.3001708984375, 5.447021484375, 5.5938720703125, 5.74072265625, 5.8875732421875, 6.034423828125, 6.1812744140625, 6.328125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 22.0, 49.0, 152.0, 223.0, 196.0, 166.0, 101.0, 43.0, 17.0, 12.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5971360206604, -5.188908576965332, -4.7806806564331055, -4.372452735900879, -3.9642252922058105, -3.555997610092163, -3.1477699279785156, -2.739542245864868, -2.3313145637512207, -1.9230868816375732, -1.5148591995239258, -1.1066315174102783, -0.6984038352966309, -0.2901761531829834, 0.11805152893066406, 0.5262792110443115, 0.934506893157959, 1.3427345752716064, 1.750962257385254, 2.1591899394989014, 2.567417621612549, 2.9756453037261963, 3.3838729858398438, 3.792100667953491, 4.200328350067139, 4.608555793762207, 5.016783714294434, 5.42501163482666, 5.8332390785217285, 6.241466522216797, 6.649694442749023, 7.05792236328125, 7.466150283813477, 7.874378204345703, 8.28260612487793, 8.69083309173584, 9.099061012268066, 9.507288932800293, 9.915515899658203, 10.32374382019043, 10.731971740722656, 11.140199661254883, 11.54842758178711, 11.95665454864502, 12.364882469177246, 12.773110389709473, 13.181337356567383, 13.58956527709961, 13.997793197631836, 14.406021118164062, 14.814249038696289, 15.2224760055542, 15.630703926086426, 16.038930892944336, 16.447158813476562, 16.85538673400879, 17.263614654541016, 17.671842575073242, 18.08007049560547, 18.488298416137695, 18.896526336669922, 19.304752349853516, 19.712980270385742, 20.12120819091797, 20.529436111450195]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 7.0, 6.0, 7.0, 6.0, 14.0, 10.0, 19.0, 20.0, 24.0, 19.0, 28.0, 24.0, 35.0, 26.0, 33.0, 31.0, 57.0, 61.0, 54.0, 35.0, 51.0, 37.0, 41.0, 35.0, 47.0, 33.0, 32.0, 36.0, 24.0, 26.0, 26.0, 16.0, 19.0, 12.0, 11.0, 10.0, 9.0, 5.0, 3.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.280094146728516, -6.0917253494262695, -5.903356075286865, -5.714987277984619, -5.526618003845215, -5.338249206542969, -5.1498799324035645, -4.961511135101318, -4.773141860961914, -4.584773063659668, -4.396403789520264, -4.208034992218018, -4.019665718078613, -3.831296682357788, -3.642927646636963, -3.454558849334717, -3.2661898136138916, -3.0778207778930664, -2.889451742172241, -2.701082706451416, -2.512713670730591, -2.3243446350097656, -2.1359758377075195, -1.9476066827774048, -1.7592376470565796, -1.5708686113357544, -1.3824995756149292, -1.1941306591033936, -1.0057616233825684, -0.8173925280570984, -0.629023551940918, -0.4406545162200928, -0.2522854804992676, -0.06391645967960358, 0.12445256114006042, 0.31282156705856323, 0.5011906027793884, 0.6895596385002136, 0.877928614616394, 1.0662976503372192, 1.2546666860580444, 1.4430357217788696, 1.6314047574996948, 1.8197736740112305, 2.0081427097320557, 2.196511745452881, 2.384880781173706, 2.5732498168945312, 2.7616188526153564, 2.9499878883361816, 3.138356924057007, 3.326725959777832, 3.5150949954986572, 3.7034640312194824, 3.8918328285217285, 4.080202102661133, 4.268570899963379, 4.456939697265625, 4.645308971405029, 4.833677768707275, 5.02204704284668, 5.210415840148926, 5.39878511428833, 5.587153911590576, 5.7755231857299805]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 12.0, 9.0, 15.0, 19.0, 26.0, 48.0, 63.0, 112.0, 203.0, 397.0, 960.0, 2716.0, 8900.0, 36104.0, 205277.0, 614076.0, 141821.0, 27000.0, 6929.0, 2200.0, 816.0, 386.0, 182.0, 98.0, 66.0, 34.0, 19.0, 21.0, 18.0, 6.0, 9.0, 4.0, 5.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.03125, -14.536865234375, -14.04248046875, -13.548095703125, -13.0537109375, -12.559326171875, -12.06494140625, -11.570556640625, -11.076171875, -10.581787109375, -10.08740234375, -9.593017578125, -9.0986328125, -8.604248046875, -8.10986328125, -7.615478515625, -7.12109375, -6.626708984375, -6.13232421875, -5.637939453125, -5.1435546875, -4.649169921875, -4.15478515625, -3.660400390625, -3.166015625, -2.671630859375, -2.17724609375, -1.682861328125, -1.1884765625, -0.694091796875, -0.19970703125, 0.294677734375, 0.7890625, 1.283447265625, 1.77783203125, 2.272216796875, 2.7666015625, 3.260986328125, 3.75537109375, 4.249755859375, 4.744140625, 5.238525390625, 5.73291015625, 6.227294921875, 6.7216796875, 7.216064453125, 7.71044921875, 8.204833984375, 8.69921875, 9.193603515625, 9.68798828125, 10.182373046875, 10.6767578125, 11.171142578125, 11.66552734375, 12.159912109375, 12.654296875, 13.148681640625, 13.64306640625, 14.137451171875, 14.6318359375, 15.126220703125, 15.62060546875, 16.114990234375, 16.609375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 6.0, 8.0, 11.0, 12.0, 16.0, 28.0, 27.0, 33.0, 41.0, 51.0, 62.0, 52.0, 59.0, 67.0, 76.0, 67.0, 73.0, 52.0, 44.0, 37.0, 40.0, 34.0, 27.0, 25.0, 9.0, 9.0, 10.0, 8.0, 2.0, 5.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.87890625, -6.651611328125, -6.42431640625, -6.197021484375, -5.9697265625, -5.742431640625, -5.51513671875, -5.287841796875, -5.060546875, -4.833251953125, -4.60595703125, -4.378662109375, -4.1513671875, -3.924072265625, -3.69677734375, -3.469482421875, -3.2421875, -3.014892578125, -2.78759765625, -2.560302734375, -2.3330078125, -2.105712890625, -1.87841796875, -1.651123046875, -1.423828125, -1.196533203125, -0.96923828125, -0.741943359375, -0.5146484375, -0.287353515625, -0.06005859375, 0.167236328125, 0.39453125, 0.621826171875, 0.84912109375, 1.076416015625, 1.3037109375, 1.531005859375, 1.75830078125, 1.985595703125, 2.212890625, 2.440185546875, 2.66748046875, 2.894775390625, 3.1220703125, 3.349365234375, 3.57666015625, 3.803955078125, 4.03125, 4.258544921875, 4.48583984375, 4.713134765625, 4.9404296875, 5.167724609375, 5.39501953125, 5.622314453125, 5.849609375, 6.076904296875, 6.30419921875, 6.531494140625, 6.7587890625, 6.986083984375, 7.21337890625, 7.440673828125, 7.66796875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 4.0, 5.0, 3.0, 7.0, 9.0, 11.0, 14.0, 27.0, 36.0, 48.0, 48.0, 74.0, 82.0, 119.0, 170.0, 243.0, 381.0, 786.0, 1776.0, 6111.0, 33108.0, 379192.0, 567902.0, 46281.0, 7701.0, 2090.0, 920.0, 455.0, 252.0, 196.0, 109.0, 90.0, 78.0, 47.0, 38.0, 31.0, 29.0, 24.0, 16.0, 13.0, 7.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0], "bins": [-25.421875, -24.71728515625, -24.0126953125, -23.30810546875, -22.603515625, -21.89892578125, -21.1943359375, -20.48974609375, -19.78515625, -19.08056640625, -18.3759765625, -17.67138671875, -16.966796875, -16.26220703125, -15.5576171875, -14.85302734375, -14.1484375, -13.44384765625, -12.7392578125, -12.03466796875, -11.330078125, -10.62548828125, -9.9208984375, -9.21630859375, -8.51171875, -7.80712890625, -7.1025390625, -6.39794921875, -5.693359375, -4.98876953125, -4.2841796875, -3.57958984375, -2.875, -2.17041015625, -1.4658203125, -0.76123046875, -0.056640625, 0.64794921875, 1.3525390625, 2.05712890625, 2.76171875, 3.46630859375, 4.1708984375, 4.87548828125, 5.580078125, 6.28466796875, 6.9892578125, 7.69384765625, 8.3984375, 9.10302734375, 9.8076171875, 10.51220703125, 11.216796875, 11.92138671875, 12.6259765625, 13.33056640625, 14.03515625, 14.73974609375, 15.4443359375, 16.14892578125, 16.853515625, 17.55810546875, 18.2626953125, 18.96728515625, 19.671875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 7.0, 5.0, 11.0, 10.0, 7.0, 16.0, 25.0, 14.0, 20.0, 18.0, 32.0, 28.0, 34.0, 42.0, 42.0, 40.0, 49.0, 43.0, 48.0, 47.0, 43.0, 41.0, 44.0, 45.0, 34.0, 23.0, 34.0, 31.0, 30.0, 20.0, 23.0, 14.0, 17.0, 12.0, 11.0, 6.0, 9.0, 6.0, 4.0, 5.0, 6.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-31.53125, -30.63232421875, -29.7333984375, -28.83447265625, -27.935546875, -27.03662109375, -26.1376953125, -25.23876953125, -24.33984375, -23.44091796875, -22.5419921875, -21.64306640625, -20.744140625, -19.84521484375, -18.9462890625, -18.04736328125, -17.1484375, -16.24951171875, -15.3505859375, -14.45166015625, -13.552734375, -12.65380859375, -11.7548828125, -10.85595703125, -9.95703125, -9.05810546875, -8.1591796875, -7.26025390625, -6.361328125, -5.46240234375, -4.5634765625, -3.66455078125, -2.765625, -1.86669921875, -0.9677734375, -0.06884765625, 0.830078125, 1.72900390625, 2.6279296875, 3.52685546875, 4.42578125, 5.32470703125, 6.2236328125, 7.12255859375, 8.021484375, 8.92041015625, 9.8193359375, 10.71826171875, 11.6171875, 12.51611328125, 13.4150390625, 14.31396484375, 15.212890625, 16.11181640625, 17.0107421875, 17.90966796875, 18.80859375, 19.70751953125, 20.6064453125, 21.50537109375, 22.404296875, 23.30322265625, 24.2021484375, 25.10107421875, 26.0]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 6.0, 4.0, 7.0, 6.0, 11.0, 14.0, 25.0, 32.0, 46.0, 65.0, 104.0, 157.0, 323.0, 549.0, 1302.0, 3788.0, 21022.0, 428616.0, 560160.0, 25260.0, 4305.0, 1339.0, 585.0, 291.0, 180.0, 119.0, 63.0, 49.0, 40.0, 20.0, 12.0, 13.0, 14.0, 10.0, 8.0, 7.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.09375, -9.7972412109375, -9.500732421875, -9.2042236328125, -8.90771484375, -8.6112060546875, -8.314697265625, -8.0181884765625, -7.7216796875, -7.4251708984375, -7.128662109375, -6.8321533203125, -6.53564453125, -6.2391357421875, -5.942626953125, -5.6461181640625, -5.349609375, -5.0531005859375, -4.756591796875, -4.4600830078125, -4.16357421875, -3.8670654296875, -3.570556640625, -3.2740478515625, -2.9775390625, -2.6810302734375, -2.384521484375, -2.0880126953125, -1.79150390625, -1.4949951171875, -1.198486328125, -0.9019775390625, -0.60546875, -0.3089599609375, -0.012451171875, 0.2840576171875, 0.58056640625, 0.8770751953125, 1.173583984375, 1.4700927734375, 1.7666015625, 2.0631103515625, 2.359619140625, 2.6561279296875, 2.95263671875, 3.2491455078125, 3.545654296875, 3.8421630859375, 4.138671875, 4.4351806640625, 4.731689453125, 5.0281982421875, 5.32470703125, 5.6212158203125, 5.917724609375, 6.2142333984375, 6.5107421875, 6.8072509765625, 7.103759765625, 7.4002685546875, 7.69677734375, 7.9932861328125, 8.289794921875, 8.5863037109375, 8.8828125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 7.0, 9.0, 7.0, 4.0, 9.0, 12.0, 25.0, 20.0, 27.0, 43.0, 48.0, 53.0, 75.0, 79.0, 84.0, 76.0, 88.0, 61.0, 65.0, 54.0, 39.0, 42.0, 25.0, 13.0, 12.0, 4.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00043487548828125, -0.00042092055082321167, -0.00040696561336517334, -0.000393010675907135, -0.0003790557384490967, -0.00036510080099105835, -0.00035114586353302, -0.0003371909260749817, -0.00032323598861694336, -0.00030928105115890503, -0.0002953261137008667, -0.00028137117624282837, -0.00026741623878479004, -0.0002534613013267517, -0.00023950636386871338, -0.00022555142641067505, -0.00021159648895263672, -0.0001976415514945984, -0.00018368661403656006, -0.00016973167657852173, -0.0001557767391204834, -0.00014182180166244507, -0.00012786686420440674, -0.00011391192674636841, -9.995698928833008e-05, -8.600205183029175e-05, -7.204711437225342e-05, -5.809217691421509e-05, -4.413723945617676e-05, -3.0182301998138428e-05, -1.6227364540100098e-05, -2.2724270820617676e-06, 1.1682510375976562e-05, 2.5637447834014893e-05, 3.959238529205322e-05, 5.354732275009155e-05, 6.750226020812988e-05, 8.145719766616821e-05, 9.541213512420654e-05, 0.00010936707258224487, 0.0001233220100402832, 0.00013727694749832153, 0.00015123188495635986, 0.0001651868224143982, 0.00017914175987243652, 0.00019309669733047485, 0.00020705163478851318, 0.00022100657224655151, 0.00023496150970458984, 0.0002489164471626282, 0.0002628713846206665, 0.00027682632207870483, 0.00029078125953674316, 0.0003047361969947815, 0.0003186911344528198, 0.00033264607191085815, 0.0003466010093688965, 0.0003605559468269348, 0.00037451088428497314, 0.0003884658217430115, 0.0004024207592010498, 0.00041637569665908813, 0.00043033063411712646, 0.0004442855715751648, 0.0004582405090332031]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 1.0, 7.0, 2.0, 7.0, 7.0, 11.0, 30.0, 40.0, 85.0, 188.0, 647.0, 2479.0, 32093.0, 986733.0, 23284.0, 2060.0, 526.0, 153.0, 87.0, 39.0, 20.0, 20.0, 10.0, 5.0, 9.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-19.859375, -19.29931640625, -18.7392578125, -18.17919921875, -17.619140625, -17.05908203125, -16.4990234375, -15.93896484375, -15.37890625, -14.81884765625, -14.2587890625, -13.69873046875, -13.138671875, -12.57861328125, -12.0185546875, -11.45849609375, -10.8984375, -10.33837890625, -9.7783203125, -9.21826171875, -8.658203125, -8.09814453125, -7.5380859375, -6.97802734375, -6.41796875, -5.85791015625, -5.2978515625, -4.73779296875, -4.177734375, -3.61767578125, -3.0576171875, -2.49755859375, -1.9375, -1.37744140625, -0.8173828125, -0.25732421875, 0.302734375, 0.86279296875, 1.4228515625, 1.98291015625, 2.54296875, 3.10302734375, 3.6630859375, 4.22314453125, 4.783203125, 5.34326171875, 5.9033203125, 6.46337890625, 7.0234375, 7.58349609375, 8.1435546875, 8.70361328125, 9.263671875, 9.82373046875, 10.3837890625, 10.94384765625, 11.50390625, 12.06396484375, 12.6240234375, 13.18408203125, 13.744140625, 14.30419921875, 14.8642578125, 15.42431640625, 15.984375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 5.0, 15.0, 23.0, 33.0, 72.0, 136.0, 199.0, 208.0, 137.0, 65.0, 43.0, 22.0, 9.0, 9.0, 4.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.859375, -19.310546875, -18.76171875, -18.212890625, -17.6640625, -17.115234375, -16.56640625, -16.017578125, -15.46875, -14.919921875, -14.37109375, -13.822265625, -13.2734375, -12.724609375, -12.17578125, -11.626953125, -11.078125, -10.529296875, -9.98046875, -9.431640625, -8.8828125, -8.333984375, -7.78515625, -7.236328125, -6.6875, -6.138671875, -5.58984375, -5.041015625, -4.4921875, -3.943359375, -3.39453125, -2.845703125, -2.296875, -1.748046875, -1.19921875, -0.650390625, -0.1015625, 0.447265625, 0.99609375, 1.544921875, 2.09375, 2.642578125, 3.19140625, 3.740234375, 4.2890625, 4.837890625, 5.38671875, 5.935546875, 6.484375, 7.033203125, 7.58203125, 8.130859375, 8.6796875, 9.228515625, 9.77734375, 10.326171875, 10.875, 11.423828125, 11.97265625, 12.521484375, 13.0703125, 13.619140625, 14.16796875, 14.716796875, 15.265625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 5.0, 17.0, 55.0, 128.0, 249.0, 247.0, 168.0, 54.0, 30.0, 20.0, 11.0, 11.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0], "bins": [-318.14764404296875, -311.9079284667969, -305.6681823730469, -299.428466796875, -293.1887512207031, -286.9490051269531, -280.70928955078125, -274.46954345703125, -268.2298278808594, -261.9901123046875, -255.75038146972656, -249.51065063476562, -243.2709197998047, -237.03118896484375, -230.79147338867188, -224.55174255371094, -218.31201171875, -212.07228088378906, -205.8325653076172, -199.59283447265625, -193.3531036376953, -187.11337280273438, -180.8736572265625, -174.63392639160156, -168.3942108154297, -162.15447998046875, -155.91476440429688, -149.67503356933594, -143.435302734375, -137.19557189941406, -130.9558563232422, -124.71612548828125, -118.47639465332031, -112.2366714477539, -105.99694061279297, -99.75721740722656, -93.51748657226562, -87.27776336669922, -81.03804016113281, -74.79830932617188, -68.55857849121094, -62.318851470947266, -56.079124450683594, -49.83940124511719, -43.59967041015625, -37.359947204589844, -31.120220184326172, -24.8804931640625, -18.640769958496094, -12.401042938232422, -6.161316871643066, 0.07840919494628906, 6.318136215209961, 12.557863235473633, 18.797588348388672, 25.037315368652344, 31.277042388916016, 37.51676940917969, 43.75649642944336, 49.99622344970703, 56.23594665527344, 62.475677490234375, 68.71540069580078, 74.95512390136719, 81.19485473632812]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 10.0, 10.0, 6.0, 12.0, 14.0, 16.0, 13.0, 16.0, 27.0, 27.0, 26.0, 34.0, 44.0, 47.0, 44.0, 63.0, 50.0, 63.0, 49.0, 49.0, 56.0, 43.0, 40.0, 37.0, 34.0, 26.0, 26.0, 17.0, 11.0, 22.0, 17.0, 11.0, 10.0, 8.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-144.09609985351562, -139.6763153076172, -135.2565460205078, -130.83676147460938, -126.41698455810547, -121.99720764160156, -117.57742309570312, -113.15764617919922, -108.73786926269531, -104.3180923461914, -99.8983154296875, -95.47853088378906, -91.05875396728516, -86.63897705078125, -82.21919250488281, -77.7994155883789, -73.379638671875, -68.9598617553711, -64.54008483886719, -60.12030029296875, -55.700523376464844, -51.28074645996094, -46.860965728759766, -42.441184997558594, -38.02140808105469, -33.60163116455078, -29.18185043334961, -24.76207160949707, -20.34229278564453, -15.922513961791992, -11.502735137939453, -7.082956314086914, -2.663177490234375, 1.756601333618164, 6.176380157470703, 10.596158981323242, 15.015937805175781, 19.43571662902832, 23.85549545288086, 28.2752742767334, 32.69505310058594, 37.114830017089844, 41.534610748291016, 45.95439147949219, 50.374168395996094, 54.7939453125, 59.21372604370117, 63.633506774902344, 68.05328369140625, 72.47306060791016, 76.89283752441406, 81.3126220703125, 85.7323989868164, 90.15217590332031, 94.57196044921875, 98.99173736572266, 103.41151428222656, 107.83129119873047, 112.25106811523438, 116.67085266113281, 121.09062957763672, 125.51040649414062, 129.93019104003906, 134.34996032714844, 138.76974487304688]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 6.0, 10.0, 7.0, 26.0, 47.0, 42.0, 92.0, 165.0, 383.0, 902.0, 2494.0, 12937.0, 4074896.0, 93749.0, 5785.0, 1534.0, 583.0, 278.0, 142.0, 81.0, 44.0, 23.0, 20.0, 7.0, 5.0, 7.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.640625, -15.0341796875, -14.427734375, -13.8212890625, -13.21484375, -12.6083984375, -12.001953125, -11.3955078125, -10.7890625, -10.1826171875, -9.576171875, -8.9697265625, -8.36328125, -7.7568359375, -7.150390625, -6.5439453125, -5.9375, -5.3310546875, -4.724609375, -4.1181640625, -3.51171875, -2.9052734375, -2.298828125, -1.6923828125, -1.0859375, -0.4794921875, 0.126953125, 0.7333984375, 1.33984375, 1.9462890625, 2.552734375, 3.1591796875, 3.765625, 4.3720703125, 4.978515625, 5.5849609375, 6.19140625, 6.7978515625, 7.404296875, 8.0107421875, 8.6171875, 9.2236328125, 9.830078125, 10.4365234375, 11.04296875, 11.6494140625, 12.255859375, 12.8623046875, 13.46875, 14.0751953125, 14.681640625, 15.2880859375, 15.89453125, 16.5009765625, 17.107421875, 17.7138671875, 18.3203125, 18.9267578125, 19.533203125, 20.1396484375, 20.74609375, 21.3525390625, 21.958984375, 22.5654296875, 23.171875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 3.0, 8.0, 8.0, 6.0, 10.0, 9.0, 14.0, 17.0, 30.0, 19.0, 49.0, 30.0, 47.0, 49.0, 64.0, 51.0, 62.0, 58.0, 64.0, 56.0, 54.0, 42.0, 43.0, 27.0, 36.0, 21.0, 24.0, 21.0, 20.0, 10.0, 13.0, 10.0, 6.0, 4.0, 5.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.4609375, -7.24981689453125, -7.0386962890625, -6.82757568359375, -6.616455078125, -6.40533447265625, -6.1942138671875, -5.98309326171875, -5.77197265625, -5.56085205078125, -5.3497314453125, -5.13861083984375, -4.927490234375, -4.71636962890625, -4.5052490234375, -4.29412841796875, -4.0830078125, -3.87188720703125, -3.6607666015625, -3.44964599609375, -3.238525390625, -3.02740478515625, -2.8162841796875, -2.60516357421875, -2.39404296875, -2.18292236328125, -1.9718017578125, -1.76068115234375, -1.549560546875, -1.33843994140625, -1.1273193359375, -0.91619873046875, -0.705078125, -0.49395751953125, -0.2828369140625, -0.07171630859375, 0.139404296875, 0.35052490234375, 0.5616455078125, 0.77276611328125, 0.98388671875, 1.19500732421875, 1.4061279296875, 1.61724853515625, 1.828369140625, 2.03948974609375, 2.2506103515625, 2.46173095703125, 2.6728515625, 2.88397216796875, 3.0950927734375, 3.30621337890625, 3.517333984375, 3.72845458984375, 3.9395751953125, 4.15069580078125, 4.36181640625, 4.57293701171875, 4.7840576171875, 4.99517822265625, 5.206298828125, 5.41741943359375, 5.6285400390625, 5.83966064453125, 6.05078125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 6.0, 7.0, 5.0, 25.0, 28.0, 36.0, 56.0, 82.0, 86.0, 126.0, 163.0, 197.0, 329.0, 470.0, 670.0, 1064.0, 1902.0, 3506.0, 8796.0, 32317.0, 3475117.0, 624617.0, 28088.0, 8031.0, 3490.0, 1792.0, 990.0, 661.0, 447.0, 306.0, 214.0, 161.0, 140.0, 96.0, 73.0, 53.0, 31.0, 30.0, 16.0, 12.0, 11.0, 14.0, 9.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.4765625, -9.197509765625, -8.91845703125, -8.639404296875, -8.3603515625, -8.081298828125, -7.80224609375, -7.523193359375, -7.244140625, -6.965087890625, -6.68603515625, -6.406982421875, -6.1279296875, -5.848876953125, -5.56982421875, -5.290771484375, -5.01171875, -4.732666015625, -4.45361328125, -4.174560546875, -3.8955078125, -3.616455078125, -3.33740234375, -3.058349609375, -2.779296875, -2.500244140625, -2.22119140625, -1.942138671875, -1.6630859375, -1.384033203125, -1.10498046875, -0.825927734375, -0.546875, -0.267822265625, 0.01123046875, 0.290283203125, 0.5693359375, 0.848388671875, 1.12744140625, 1.406494140625, 1.685546875, 1.964599609375, 2.24365234375, 2.522705078125, 2.8017578125, 3.080810546875, 3.35986328125, 3.638916015625, 3.91796875, 4.197021484375, 4.47607421875, 4.755126953125, 5.0341796875, 5.313232421875, 5.59228515625, 5.871337890625, 6.150390625, 6.429443359375, 6.70849609375, 6.987548828125, 7.2666015625, 7.545654296875, 7.82470703125, 8.103759765625, 8.3828125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 13.0, 19.0, 30.0, 98.0, 3272.0, 484.0, 82.0, 27.0, 14.0, 12.0, 4.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.873046875, -3.743377685546875, -3.61370849609375, -3.484039306640625, -3.3543701171875, -3.224700927734375, -3.09503173828125, -2.965362548828125, -2.835693359375, -2.706024169921875, -2.57635498046875, -2.446685791015625, -2.3170166015625, -2.187347412109375, -2.05767822265625, -1.928009033203125, -1.79833984375, -1.668670654296875, -1.53900146484375, -1.409332275390625, -1.2796630859375, -1.149993896484375, -1.02032470703125, -0.890655517578125, -0.760986328125, -0.631317138671875, -0.50164794921875, -0.371978759765625, -0.2423095703125, -0.112640380859375, 0.01702880859375, 0.146697998046875, 0.2763671875, 0.406036376953125, 0.53570556640625, 0.665374755859375, 0.7950439453125, 0.924713134765625, 1.05438232421875, 1.184051513671875, 1.313720703125, 1.443389892578125, 1.57305908203125, 1.702728271484375, 1.8323974609375, 1.962066650390625, 2.09173583984375, 2.221405029296875, 2.35107421875, 2.480743408203125, 2.61041259765625, 2.740081787109375, 2.8697509765625, 2.999420166015625, 3.12908935546875, 3.258758544921875, 3.388427734375, 3.518096923828125, 3.64776611328125, 3.777435302734375, 3.9071044921875, 4.036773681640625, 4.16644287109375, 4.296112060546875, 4.42578125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 6.0, 10.0, 47.0, 126.0, 208.0, 257.0, 182.0, 79.0, 46.0, 21.0, 10.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.009910583496094, -20.459884643554688, -19.90985679626465, -19.359830856323242, -18.809804916381836, -18.25977897644043, -17.70975112915039, -17.159725189208984, -16.609699249267578, -16.059673309326172, -15.50964641571045, -14.959619522094727, -14.40959358215332, -13.859566688537598, -13.309539794921875, -12.759513854980469, -12.209486961364746, -11.659460067749023, -11.109434127807617, -10.559407234191895, -10.009381294250488, -9.459354400634766, -8.90932846069336, -8.359301567077637, -7.809275150299072, -7.259248733520508, -6.709222316741943, -6.159195899963379, -5.609169006347656, -5.05914306640625, -4.509116172790527, -3.959089756011963, -3.4090633392333984, -2.859036922454834, -2.3090105056762695, -1.758983850479126, -1.2089574337005615, -0.6589310169219971, -0.10890436172485352, 0.44112205505371094, 0.9911484718322754, 1.5411748886108398, 2.0912013053894043, 2.641227960586548, 3.1912543773651123, 3.7412807941436768, 4.29130744934082, 4.841333866119385, 5.391360282897949, 5.941386699676514, 6.491413116455078, 7.041440010070801, 7.591465950012207, 8.14149284362793, 8.691518783569336, 9.241545677185059, 9.791572570800781, 10.341599464416504, 10.89162540435791, 11.441652297973633, 11.991678237915039, 12.541705131530762, 13.091732025146484, 13.64175796508789, 14.191783905029297]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 9.0, 5.0, 7.0, 5.0, 12.0, 16.0, 11.0, 18.0, 15.0, 20.0, 28.0, 26.0, 42.0, 28.0, 37.0, 34.0, 51.0, 36.0, 51.0, 52.0, 41.0, 46.0, 47.0, 35.0, 48.0, 19.0, 32.0, 30.0, 45.0, 19.0, 29.0, 21.0, 15.0, 18.0, 13.0, 10.0, 4.0, 3.0, 6.0, 3.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.840854644775391, -5.650702953338623, -5.460550785064697, -5.27039909362793, -5.080246925354004, -4.890095233917236, -4.6999430656433105, -4.509791374206543, -4.319639205932617, -4.12948751449585, -3.939335346221924, -3.749183416366577, -3.5590314865112305, -3.368879556655884, -3.178727626800537, -2.9885759353637695, -2.798424005508423, -2.608272075653076, -2.4181201457977295, -2.227968215942383, -2.037816286087036, -1.8476643562316895, -1.6575125455856323, -1.4673606157302856, -1.277208685874939, -1.0870567560195923, -0.8969048261642456, -0.7067529559135437, -0.516601026058197, -0.32644909620285034, -0.13629722595214844, 0.05385470390319824, 0.24400663375854492, 0.4341585636138916, 0.6243104934692383, 0.8144623637199402, 1.0046143531799316, 1.1947662830352783, 1.3849180936813354, 1.5750700235366821, 1.7652219533920288, 1.9553738832473755, 2.1455256938934326, 2.3356776237487793, 2.525829553604126, 2.7159814834594727, 2.9061334133148193, 3.096285343170166, 3.2864372730255127, 3.4765892028808594, 3.666741132736206, 3.8568930625915527, 4.04704475402832, 4.237196922302246, 4.427348613739014, 4.6175007820129395, 4.807652473449707, 4.997804164886475, 5.1879563331604, 5.378108024597168, 5.568260192871094, 5.758411884307861, 5.948564052581787, 6.138715744018555, 6.3288679122924805]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 10.0, 25.0, 26.0, 35.0, 70.0, 103.0, 221.0, 438.0, 951.0, 2233.0, 5713.0, 16830.0, 60720.0, 286664.0, 500336.0, 127391.0, 30883.0, 9743.0, 3492.0, 1410.0, 646.0, 265.0, 153.0, 63.0, 50.0, 37.0, 15.0, 7.0, 8.0, 8.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.515625, -11.1470947265625, -10.778564453125, -10.4100341796875, -10.04150390625, -9.6729736328125, -9.304443359375, -8.9359130859375, -8.5673828125, -8.1988525390625, -7.830322265625, -7.4617919921875, -7.09326171875, -6.7247314453125, -6.356201171875, -5.9876708984375, -5.619140625, -5.2506103515625, -4.882080078125, -4.5135498046875, -4.14501953125, -3.7764892578125, -3.407958984375, -3.0394287109375, -2.6708984375, -2.3023681640625, -1.933837890625, -1.5653076171875, -1.19677734375, -0.8282470703125, -0.459716796875, -0.0911865234375, 0.27734375, 0.6458740234375, 1.014404296875, 1.3829345703125, 1.75146484375, 2.1199951171875, 2.488525390625, 2.8570556640625, 3.2255859375, 3.5941162109375, 3.962646484375, 4.3311767578125, 4.69970703125, 5.0682373046875, 5.436767578125, 5.8052978515625, 6.173828125, 6.5423583984375, 6.910888671875, 7.2794189453125, 7.64794921875, 8.0164794921875, 8.385009765625, 8.7535400390625, 9.1220703125, 9.4906005859375, 9.859130859375, 10.2276611328125, 10.59619140625, 10.9647216796875, 11.333251953125, 11.7017822265625, 12.0703125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 7.0, 1.0, 5.0, 8.0, 3.0, 8.0, 7.0, 7.0, 18.0, 23.0, 16.0, 13.0, 21.0, 38.0, 36.0, 42.0, 48.0, 46.0, 45.0, 51.0, 62.0, 52.0, 55.0, 52.0, 38.0, 41.0, 32.0, 39.0, 27.0, 21.0, 17.0, 24.0, 25.0, 13.0, 11.0, 14.0, 8.0, 9.0, 3.0, 6.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.56640625, -6.3839111328125, -6.201416015625, -6.0189208984375, -5.83642578125, -5.6539306640625, -5.471435546875, -5.2889404296875, -5.1064453125, -4.9239501953125, -4.741455078125, -4.5589599609375, -4.37646484375, -4.1939697265625, -4.011474609375, -3.8289794921875, -3.646484375, -3.4639892578125, -3.281494140625, -3.0989990234375, -2.91650390625, -2.7340087890625, -2.551513671875, -2.3690185546875, -2.1865234375, -2.0040283203125, -1.821533203125, -1.6390380859375, -1.45654296875, -1.2740478515625, -1.091552734375, -0.9090576171875, -0.7265625, -0.5440673828125, -0.361572265625, -0.1790771484375, 0.00341796875, 0.1859130859375, 0.368408203125, 0.5509033203125, 0.7333984375, 0.9158935546875, 1.098388671875, 1.2808837890625, 1.46337890625, 1.6458740234375, 1.828369140625, 2.0108642578125, 2.193359375, 2.3758544921875, 2.558349609375, 2.7408447265625, 2.92333984375, 3.1058349609375, 3.288330078125, 3.4708251953125, 3.6533203125, 3.8358154296875, 4.018310546875, 4.2008056640625, 4.38330078125, 4.5657958984375, 4.748291015625, 4.9307861328125, 5.11328125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 6.0, 8.0, 13.0, 14.0, 18.0, 28.0, 21.0, 36.0, 62.0, 84.0, 154.0, 227.0, 361.0, 686.0, 1457.0, 4310.0, 18897.0, 172614.0, 736031.0, 94922.0, 12784.0, 3145.0, 1186.0, 577.0, 340.0, 197.0, 114.0, 75.0, 55.0, 28.0, 33.0, 17.0, 8.0, 10.0, 10.0, 8.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-19.234375, -18.640380859375, -18.04638671875, -17.452392578125, -16.8583984375, -16.264404296875, -15.67041015625, -15.076416015625, -14.482421875, -13.888427734375, -13.29443359375, -12.700439453125, -12.1064453125, -11.512451171875, -10.91845703125, -10.324462890625, -9.73046875, -9.136474609375, -8.54248046875, -7.948486328125, -7.3544921875, -6.760498046875, -6.16650390625, -5.572509765625, -4.978515625, -4.384521484375, -3.79052734375, -3.196533203125, -2.6025390625, -2.008544921875, -1.41455078125, -0.820556640625, -0.2265625, 0.367431640625, 0.96142578125, 1.555419921875, 2.1494140625, 2.743408203125, 3.33740234375, 3.931396484375, 4.525390625, 5.119384765625, 5.71337890625, 6.307373046875, 6.9013671875, 7.495361328125, 8.08935546875, 8.683349609375, 9.27734375, 9.871337890625, 10.46533203125, 11.059326171875, 11.6533203125, 12.247314453125, 12.84130859375, 13.435302734375, 14.029296875, 14.623291015625, 15.21728515625, 15.811279296875, 16.4052734375, 16.999267578125, 17.59326171875, 18.187255859375, 18.78125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 8.0, 6.0, 4.0, 13.0, 12.0, 11.0, 14.0, 14.0, 18.0, 37.0, 31.0, 33.0, 52.0, 56.0, 44.0, 57.0, 49.0, 65.0, 48.0, 30.0, 43.0, 39.0, 49.0, 44.0, 40.0, 29.0, 33.0, 32.0, 20.0, 12.0, 15.0, 7.0, 10.0, 6.0, 3.0, 4.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0], "bins": [-35.15625, -34.2109375, -33.265625, -32.3203125, -31.375, -30.4296875, -29.484375, -28.5390625, -27.59375, -26.6484375, -25.703125, -24.7578125, -23.8125, -22.8671875, -21.921875, -20.9765625, -20.03125, -19.0859375, -18.140625, -17.1953125, -16.25, -15.3046875, -14.359375, -13.4140625, -12.46875, -11.5234375, -10.578125, -9.6328125, -8.6875, -7.7421875, -6.796875, -5.8515625, -4.90625, -3.9609375, -3.015625, -2.0703125, -1.125, -0.1796875, 0.765625, 1.7109375, 2.65625, 3.6015625, 4.546875, 5.4921875, 6.4375, 7.3828125, 8.328125, 9.2734375, 10.21875, 11.1640625, 12.109375, 13.0546875, 14.0, 14.9453125, 15.890625, 16.8359375, 17.78125, 18.7265625, 19.671875, 20.6171875, 21.5625, 22.5078125, 23.453125, 24.3984375, 25.34375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 4.0, 2.0, 10.0, 9.0, 6.0, 16.0, 24.0, 28.0, 42.0, 66.0, 100.0, 155.0, 275.0, 533.0, 1172.0, 3493.0, 16857.0, 208475.0, 752817.0, 53253.0, 7417.0, 2012.0, 806.0, 399.0, 195.0, 125.0, 65.0, 44.0, 42.0, 17.0, 25.0, 12.0, 8.0, 12.0, 13.0, 4.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6015625, -8.326416015625, -8.05126953125, -7.776123046875, -7.5009765625, -7.225830078125, -6.95068359375, -6.675537109375, -6.400390625, -6.125244140625, -5.85009765625, -5.574951171875, -5.2998046875, -5.024658203125, -4.74951171875, -4.474365234375, -4.19921875, -3.924072265625, -3.64892578125, -3.373779296875, -3.0986328125, -2.823486328125, -2.54833984375, -2.273193359375, -1.998046875, -1.722900390625, -1.44775390625, -1.172607421875, -0.8974609375, -0.622314453125, -0.34716796875, -0.072021484375, 0.203125, 0.478271484375, 0.75341796875, 1.028564453125, 1.3037109375, 1.578857421875, 1.85400390625, 2.129150390625, 2.404296875, 2.679443359375, 2.95458984375, 3.229736328125, 3.5048828125, 3.780029296875, 4.05517578125, 4.330322265625, 4.60546875, 4.880615234375, 5.15576171875, 5.430908203125, 5.7060546875, 5.981201171875, 6.25634765625, 6.531494140625, 6.806640625, 7.081787109375, 7.35693359375, 7.632080078125, 7.9072265625, 8.182373046875, 8.45751953125, 8.732666015625, 9.0078125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 4.0, 6.0, 13.0, 14.0, 21.0, 33.0, 56.0, 78.0, 115.0, 162.0, 147.0, 99.0, 104.0, 49.0, 31.0, 18.0, 22.0, 9.0, 10.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0010309219360351562, -0.0010031312704086304, -0.0009753406047821045, -0.0009475499391555786, -0.0009197592735290527, -0.0008919686079025269, -0.000864177942276001, -0.0008363872766494751, -0.0008085966110229492, -0.0007808059453964233, -0.0007530152797698975, -0.0007252246141433716, -0.0006974339485168457, -0.0006696432828903198, -0.0006418526172637939, -0.0006140619516372681, -0.0005862712860107422, -0.0005584806203842163, -0.0005306899547576904, -0.0005028992891311646, -0.00047510862350463867, -0.0004473179578781128, -0.0004195272922515869, -0.00039173662662506104, -0.00036394596099853516, -0.0003361552953720093, -0.0003083646297454834, -0.0002805739641189575, -0.00025278329849243164, -0.00022499263286590576, -0.00019720196723937988, -0.000169411301612854, -0.00014162063598632812, -0.00011382997035980225, -8.603930473327637e-05, -5.824863910675049e-05, -3.045797348022461e-05, -2.6673078536987305e-06, 2.512335777282715e-05, 5.291402339935303e-05, 8.07046890258789e-05, 0.00010849535465240479, 0.00013628602027893066, 0.00016407668590545654, 0.00019186735153198242, 0.0002196580171585083, 0.0002474486827850342, 0.00027523934841156006, 0.00030303001403808594, 0.0003308206796646118, 0.0003586113452911377, 0.0003864020109176636, 0.00041419267654418945, 0.00044198334217071533, 0.0004697740077972412, 0.0004975646734237671, 0.000525355339050293, 0.0005531460046768188, 0.0005809366703033447, 0.0006087273359298706, 0.0006365180015563965, 0.0006643086671829224, 0.0006920993328094482, 0.0007198899984359741, 0.0007476806640625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 3.0, 5.0, 7.0, 14.0, 14.0, 27.0, 35.0, 72.0, 144.0, 207.0, 455.0, 922.0, 2386.0, 9779.0, 87448.0, 834901.0, 97420.0, 10103.0, 2613.0, 1016.0, 453.0, 210.0, 115.0, 78.0, 34.0, 29.0, 17.0, 11.0, 8.0, 12.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-10.671875, -10.379638671875, -10.08740234375, -9.795166015625, -9.5029296875, -9.210693359375, -8.91845703125, -8.626220703125, -8.333984375, -8.041748046875, -7.74951171875, -7.457275390625, -7.1650390625, -6.872802734375, -6.58056640625, -6.288330078125, -5.99609375, -5.703857421875, -5.41162109375, -5.119384765625, -4.8271484375, -4.534912109375, -4.24267578125, -3.950439453125, -3.658203125, -3.365966796875, -3.07373046875, -2.781494140625, -2.4892578125, -2.197021484375, -1.90478515625, -1.612548828125, -1.3203125, -1.028076171875, -0.73583984375, -0.443603515625, -0.1513671875, 0.140869140625, 0.43310546875, 0.725341796875, 1.017578125, 1.309814453125, 1.60205078125, 1.894287109375, 2.1865234375, 2.478759765625, 2.77099609375, 3.063232421875, 3.35546875, 3.647705078125, 3.93994140625, 4.232177734375, 4.5244140625, 4.816650390625, 5.10888671875, 5.401123046875, 5.693359375, 5.985595703125, 6.27783203125, 6.570068359375, 6.8623046875, 7.154541015625, 7.44677734375, 7.739013671875, 8.03125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 8.0, 15.0, 16.0, 29.0, 25.0, 39.0, 59.0, 71.0, 98.0, 133.0, 106.0, 116.0, 85.0, 63.0, 34.0, 32.0, 22.0, 19.0, 8.0, 3.0, 7.0, 7.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8046875, -8.466064453125, -8.12744140625, -7.788818359375, -7.4501953125, -7.111572265625, -6.77294921875, -6.434326171875, -6.095703125, -5.757080078125, -5.41845703125, -5.079833984375, -4.7412109375, -4.402587890625, -4.06396484375, -3.725341796875, -3.38671875, -3.048095703125, -2.70947265625, -2.370849609375, -2.0322265625, -1.693603515625, -1.35498046875, -1.016357421875, -0.677734375, -0.339111328125, -0.00048828125, 0.338134765625, 0.6767578125, 1.015380859375, 1.35400390625, 1.692626953125, 2.03125, 2.369873046875, 2.70849609375, 3.047119140625, 3.3857421875, 3.724365234375, 4.06298828125, 4.401611328125, 4.740234375, 5.078857421875, 5.41748046875, 5.756103515625, 6.0947265625, 6.433349609375, 6.77197265625, 7.110595703125, 7.44921875, 7.787841796875, 8.12646484375, 8.465087890625, 8.8037109375, 9.142333984375, 9.48095703125, 9.819580078125, 10.158203125, 10.496826171875, 10.83544921875, 11.174072265625, 11.5126953125, 11.851318359375, 12.18994140625, 12.528564453125, 12.8671875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 9.0, 28.0, 34.0, 107.0, 195.0, 278.0, 180.0, 101.0, 36.0, 21.0, 5.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.75042724609375, -127.83199310302734, -121.9135513305664, -115.9951171875, -110.0766830444336, -104.15824890136719, -98.23980712890625, -92.32137298583984, -86.40293884277344, -80.48450469970703, -74.5660629272461, -68.64762878417969, -62.72919464111328, -56.81075668334961, -50.89231872558594, -44.97388458251953, -39.055442810058594, -33.13700485229492, -27.218570709228516, -21.300132751464844, -15.381696701049805, -9.463260650634766, -3.5448226928710938, 2.3736114501953125, 8.292049407958984, 14.210485458374023, 20.128921508789062, 26.047359466552734, 31.965795516967773, 37.88423156738281, 43.802669525146484, 49.72110366821289, 55.63954162597656, 61.557979583740234, 67.4764175415039, 73.39485168457031, 79.31328582763672, 85.23171997070312, 91.15016174316406, 97.06859588623047, 102.98703002929688, 108.90546417236328, 114.82390594482422, 120.74234008789062, 126.66077423095703, 132.57920837402344, 138.49765014648438, 144.41607666015625, 150.33453369140625, 156.2529754638672, 162.17140197753906, 168.08984375, 174.00828552246094, 179.9267120361328, 185.84515380859375, 191.76358032226562, 197.68202209472656, 203.6004638671875, 209.51889038085938, 215.4373321533203, 221.35577392578125, 227.27420043945312, 233.19264221191406, 239.111083984375, 245.02951049804688]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 4.0, 3.0, 3.0, 6.0, 3.0, 10.0, 7.0, 12.0, 11.0, 7.0, 16.0, 16.0, 11.0, 25.0, 37.0, 26.0, 32.0, 46.0, 42.0, 35.0, 57.0, 47.0, 56.0, 53.0, 54.0, 52.0, 48.0, 35.0, 25.0, 36.0, 29.0, 24.0, 22.0, 16.0, 21.0, 21.0, 11.0, 12.0, 16.0, 5.0, 3.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-142.06503295898438, -137.973876953125, -133.88270568847656, -129.7915496826172, -125.70039367675781, -121.6092300415039, -117.51806640625, -113.42691040039062, -109.33574676513672, -105.24458312988281, -101.15342712402344, -97.06226348876953, -92.97109985351562, -88.87994384765625, -84.78878021240234, -80.69761657714844, -76.60646057128906, -72.51529693603516, -68.42414093017578, -64.33297729492188, -60.241817474365234, -56.150657653808594, -52.05949401855469, -47.96833419799805, -43.877174377441406, -39.786014556884766, -35.694854736328125, -31.60369110107422, -27.512531280517578, -23.421371459960938, -19.330209732055664, -15.23904800415039, -11.14788818359375, -7.056727409362793, -2.965566635131836, 1.125594139099121, 5.216754913330078, 9.307914733886719, 13.399076461791992, 17.490238189697266, 21.581398010253906, 25.672557830810547, 29.76371955871582, 33.854881286621094, 37.946041107177734, 42.037200927734375, 46.12836456298828, 50.21952438354492, 54.31068420410156, 58.4018440246582, 62.493003845214844, 66.58416748046875, 70.67532348632812, 74.76648712158203, 78.85765075683594, 82.94880676269531, 87.03997039794922, 91.13113403320312, 95.2222900390625, 99.3134536743164, 103.40461730957031, 107.49577331542969, 111.5869369506836, 115.6781005859375, 119.76925659179688]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 5.0, 11.0, 8.0, 13.0, 25.0, 35.0, 65.0, 83.0, 145.0, 265.0, 536.0, 1140.0, 2936.0, 11625.0, 613204.0, 3547312.0, 11855.0, 2807.0, 1011.0, 521.0, 276.0, 148.0, 91.0, 60.0, 39.0, 22.0, 13.0, 6.0, 6.0, 8.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3828125, -13.8297119140625, -13.276611328125, -12.7235107421875, -12.17041015625, -11.6173095703125, -11.064208984375, -10.5111083984375, -9.9580078125, -9.4049072265625, -8.851806640625, -8.2987060546875, -7.74560546875, -7.1925048828125, -6.639404296875, -6.0863037109375, -5.533203125, -4.9801025390625, -4.427001953125, -3.8739013671875, -3.32080078125, -2.7677001953125, -2.214599609375, -1.6614990234375, -1.1083984375, -0.5552978515625, -0.002197265625, 0.5509033203125, 1.10400390625, 1.6571044921875, 2.210205078125, 2.7633056640625, 3.31640625, 3.8695068359375, 4.422607421875, 4.9757080078125, 5.52880859375, 6.0819091796875, 6.635009765625, 7.1881103515625, 7.7412109375, 8.2943115234375, 8.847412109375, 9.4005126953125, 9.95361328125, 10.5067138671875, 11.059814453125, 11.6129150390625, 12.166015625, 12.7191162109375, 13.272216796875, 13.8253173828125, 14.37841796875, 14.9315185546875, 15.484619140625, 16.0377197265625, 16.5908203125, 17.1439208984375, 17.697021484375, 18.2501220703125, 18.80322265625, 19.3563232421875, 19.909423828125, 20.4625244140625, 21.015625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 10.0, 0.0, 9.0, 11.0, 14.0, 23.0, 18.0, 26.0, 30.0, 46.0, 41.0, 52.0, 61.0, 58.0, 69.0, 83.0, 78.0, 68.0, 53.0, 50.0, 45.0, 41.0, 32.0, 22.0, 17.0, 20.0, 11.0, 4.0, 3.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.046875, -9.80224609375, -9.5576171875, -9.31298828125, -9.068359375, -8.82373046875, -8.5791015625, -8.33447265625, -8.08984375, -7.84521484375, -7.6005859375, -7.35595703125, -7.111328125, -6.86669921875, -6.6220703125, -6.37744140625, -6.1328125, -5.88818359375, -5.6435546875, -5.39892578125, -5.154296875, -4.90966796875, -4.6650390625, -4.42041015625, -4.17578125, -3.93115234375, -3.6865234375, -3.44189453125, -3.197265625, -2.95263671875, -2.7080078125, -2.46337890625, -2.21875, -1.97412109375, -1.7294921875, -1.48486328125, -1.240234375, -0.99560546875, -0.7509765625, -0.50634765625, -0.26171875, -0.01708984375, 0.2275390625, 0.47216796875, 0.716796875, 0.96142578125, 1.2060546875, 1.45068359375, 1.6953125, 1.93994140625, 2.1845703125, 2.42919921875, 2.673828125, 2.91845703125, 3.1630859375, 3.40771484375, 3.65234375, 3.89697265625, 4.1416015625, 4.38623046875, 4.630859375, 4.87548828125, 5.1201171875, 5.36474609375, 5.609375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 12.0, 14.0, 9.0, 22.0, 20.0, 42.0, 33.0, 49.0, 56.0, 104.0, 116.0, 148.0, 216.0, 449.0, 970.0, 2654.0, 9344.0, 90782.0, 4055336.0, 25226.0, 5206.0, 1703.0, 686.0, 366.0, 200.0, 124.0, 98.0, 67.0, 50.0, 36.0, 31.0, 27.0, 19.0, 22.0, 7.0, 6.0, 5.0, 9.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.8125, -13.3709716796875, -12.929443359375, -12.4879150390625, -12.04638671875, -11.6048583984375, -11.163330078125, -10.7218017578125, -10.2802734375, -9.8387451171875, -9.397216796875, -8.9556884765625, -8.51416015625, -8.0726318359375, -7.631103515625, -7.1895751953125, -6.748046875, -6.3065185546875, -5.864990234375, -5.4234619140625, -4.98193359375, -4.5404052734375, -4.098876953125, -3.6573486328125, -3.2158203125, -2.7742919921875, -2.332763671875, -1.8912353515625, -1.44970703125, -1.0081787109375, -0.566650390625, -0.1251220703125, 0.31640625, 0.7579345703125, 1.199462890625, 1.6409912109375, 2.08251953125, 2.5240478515625, 2.965576171875, 3.4071044921875, 3.8486328125, 4.2901611328125, 4.731689453125, 5.1732177734375, 5.61474609375, 6.0562744140625, 6.497802734375, 6.9393310546875, 7.380859375, 7.8223876953125, 8.263916015625, 8.7054443359375, 9.14697265625, 9.5885009765625, 10.030029296875, 10.4715576171875, 10.9130859375, 11.3546142578125, 11.796142578125, 12.2376708984375, 12.67919921875, 13.1207275390625, 13.562255859375, 14.0037841796875, 14.4453125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 7.0, 19.0, 54.0, 561.0, 3310.0, 72.0, 18.0, 10.0, 4.0, 6.0, 6.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.55078125, -7.39691162109375, -7.2430419921875, -7.08917236328125, -6.935302734375, -6.78143310546875, -6.6275634765625, -6.47369384765625, -6.31982421875, -6.16595458984375, -6.0120849609375, -5.85821533203125, -5.704345703125, -5.55047607421875, -5.3966064453125, -5.24273681640625, -5.0888671875, -4.93499755859375, -4.7811279296875, -4.62725830078125, -4.473388671875, -4.31951904296875, -4.1656494140625, -4.01177978515625, -3.85791015625, -3.70404052734375, -3.5501708984375, -3.39630126953125, -3.242431640625, -3.08856201171875, -2.9346923828125, -2.78082275390625, -2.626953125, -2.47308349609375, -2.3192138671875, -2.16534423828125, -2.011474609375, -1.85760498046875, -1.7037353515625, -1.54986572265625, -1.39599609375, -1.24212646484375, -1.0882568359375, -0.93438720703125, -0.780517578125, -0.62664794921875, -0.4727783203125, -0.31890869140625, -0.1650390625, -0.01116943359375, 0.1427001953125, 0.29656982421875, 0.450439453125, 0.60430908203125, 0.7581787109375, 0.91204833984375, 1.06591796875, 1.21978759765625, 1.3736572265625, 1.52752685546875, 1.681396484375, 1.83526611328125, 1.9891357421875, 2.14300537109375, 2.296875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 7.0, 6.0, 10.0, 28.0, 24.0, 38.0, 93.0, 123.0, 142.0, 136.0, 141.0, 92.0, 71.0, 40.0, 19.0, 10.0, 3.0, 3.0, 6.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.887872695922852, -10.605107307434082, -10.322342872619629, -10.03957748413086, -9.75681209564209, -9.47404670715332, -9.191282272338867, -8.908516883850098, -8.625751495361328, -8.342986106872559, -8.060221672058105, -7.777456283569336, -7.494690895080566, -7.211925983428955, -6.929161071777344, -6.646395683288574, -6.363631248474121, -6.08086633682251, -5.79810094833374, -5.515336036682129, -5.232570648193359, -4.949805736541748, -4.667040824890137, -4.384275436401367, -4.101510524749756, -3.8187453746795654, -3.535980224609375, -3.2532153129577637, -2.9704501628875732, -2.687685012817383, -2.4049201011657715, -2.122154951095581, -1.8393888473510742, -1.5566236972808838, -1.273858666419983, -0.9910935759544373, -0.7083284854888916, -0.42556333541870117, -0.1427983045578003, 0.13996672630310059, 0.422731876373291, 0.7054969668388367, 0.9882620573043823, 1.2710270881652832, 1.5537922382354736, 1.836557388305664, 2.1193222999572754, 2.402087450027466, 2.6848526000976562, 2.9676177501678467, 3.250382900238037, 3.5331478118896484, 3.815912961959839, 4.098678112030029, 4.381443023681641, 4.66420841217041, 4.9469733238220215, 5.229738235473633, 5.512503623962402, 5.795268535614014, 6.078033447265625, 6.3607988357543945, 6.643563747406006, 6.926328659057617, 7.209094047546387]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 7.0, 4.0, 7.0, 0.0, 7.0, 8.0, 13.0, 19.0, 16.0, 28.0, 18.0, 21.0, 34.0, 34.0, 32.0, 38.0, 28.0, 39.0, 38.0, 49.0, 44.0, 43.0, 48.0, 41.0, 42.0, 29.0, 38.0, 23.0, 29.0, 27.0, 22.0, 25.0, 25.0, 15.0, 9.0, 19.0, 16.0, 9.0, 12.0, 8.0, 9.0, 10.0, 3.0, 1.0, 2.0, 5.0, 3.0, 1.0, 1.0, 3.0], "bins": [-4.951026916503906, -4.811740875244141, -4.672454357147217, -4.533167839050293, -4.393881797790527, -4.254595756530762, -4.115309238433838, -3.976022958755493, -3.8367366790771484, -3.6974503993988037, -3.558164119720459, -3.4188778400421143, -3.2795915603637695, -3.140305280685425, -3.00101900100708, -2.8617327213287354, -2.7224464416503906, -2.583160161972046, -2.443873882293701, -2.3045876026153564, -2.1653013229370117, -2.026015043258667, -1.8867287635803223, -1.7474424839019775, -1.6081562042236328, -1.468869924545288, -1.3295836448669434, -1.1902973651885986, -1.051011085510254, -0.9117248058319092, -0.7724385261535645, -0.6331522464752197, -0.493865966796875, -0.3545796871185303, -0.21529340744018555, -0.07600712776184082, 0.0632791519165039, 0.20256543159484863, 0.34185171127319336, 0.4811379909515381, 0.6204242706298828, 0.7597105503082275, 0.8989968299865723, 1.038283109664917, 1.1775693893432617, 1.3168556690216064, 1.4561419486999512, 1.595428228378296, 1.7347145080566406, 1.8740007877349854, 2.01328706741333, 2.152573347091675, 2.2918596267700195, 2.4311459064483643, 2.570432186126709, 2.7097184658050537, 2.8490047454833984, 2.988291025161743, 3.127577304840088, 3.2668635845184326, 3.4061498641967773, 3.545436143875122, 3.684722423553467, 3.8240087032318115, 3.9632949829101562]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 9.0, 5.0, 10.0, 24.0, 29.0, 45.0, 59.0, 79.0, 126.0, 255.0, 480.0, 944.0, 1921.0, 4354.0, 10660.0, 30391.0, 101166.0, 352054.0, 379874.0, 112079.0, 33331.0, 11658.0, 4757.0, 2088.0, 944.0, 481.0, 275.0, 177.0, 90.0, 64.0, 39.0, 25.0, 18.0, 19.0, 5.0, 5.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.5625, -7.2828369140625, -7.003173828125, -6.7235107421875, -6.44384765625, -6.1641845703125, -5.884521484375, -5.6048583984375, -5.3251953125, -5.0455322265625, -4.765869140625, -4.4862060546875, -4.20654296875, -3.9268798828125, -3.647216796875, -3.3675537109375, -3.087890625, -2.8082275390625, -2.528564453125, -2.2489013671875, -1.96923828125, -1.6895751953125, -1.409912109375, -1.1302490234375, -0.8505859375, -0.5709228515625, -0.291259765625, -0.0115966796875, 0.26806640625, 0.5477294921875, 0.827392578125, 1.1070556640625, 1.38671875, 1.6663818359375, 1.946044921875, 2.2257080078125, 2.50537109375, 2.7850341796875, 3.064697265625, 3.3443603515625, 3.6240234375, 3.9036865234375, 4.183349609375, 4.4630126953125, 4.74267578125, 5.0223388671875, 5.302001953125, 5.5816650390625, 5.861328125, 6.1409912109375, 6.420654296875, 6.7003173828125, 6.97998046875, 7.2596435546875, 7.539306640625, 7.8189697265625, 8.0986328125, 8.3782958984375, 8.657958984375, 8.9376220703125, 9.21728515625, 9.4969482421875, 9.776611328125, 10.0562744140625, 10.3359375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 4.0, 13.0, 11.0, 22.0, 19.0, 15.0, 21.0, 42.0, 51.0, 42.0, 63.0, 69.0, 64.0, 73.0, 82.0, 67.0, 55.0, 62.0, 36.0, 52.0, 38.0, 23.0, 25.0, 19.0, 7.0, 11.0, 3.0, 1.0, 7.0, 2.0, 2.0, 0.0, 3.0, 1.0], "bins": [-10.7890625, -10.54144287109375, -10.2938232421875, -10.04620361328125, -9.798583984375, -9.55096435546875, -9.3033447265625, -9.05572509765625, -8.80810546875, -8.56048583984375, -8.3128662109375, -8.06524658203125, -7.817626953125, -7.57000732421875, -7.3223876953125, -7.07476806640625, -6.8271484375, -6.57952880859375, -6.3319091796875, -6.08428955078125, -5.836669921875, -5.58905029296875, -5.3414306640625, -5.09381103515625, -4.84619140625, -4.59857177734375, -4.3509521484375, -4.10333251953125, -3.855712890625, -3.60809326171875, -3.3604736328125, -3.11285400390625, -2.865234375, -2.61761474609375, -2.3699951171875, -2.12237548828125, -1.874755859375, -1.62713623046875, -1.3795166015625, -1.13189697265625, -0.88427734375, -0.63665771484375, -0.3890380859375, -0.14141845703125, 0.106201171875, 0.35382080078125, 0.6014404296875, 0.84906005859375, 1.0966796875, 1.34429931640625, 1.5919189453125, 1.83953857421875, 2.087158203125, 2.33477783203125, 2.5823974609375, 2.83001708984375, 3.07763671875, 3.32525634765625, 3.5728759765625, 3.82049560546875, 4.068115234375, 4.31573486328125, 4.5633544921875, 4.81097412109375, 5.05859375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 7.0, 5.0, 8.0, 7.0, 12.0, 12.0, 15.0, 16.0, 39.0, 48.0, 78.0, 91.0, 133.0, 218.0, 383.0, 773.0, 1844.0, 6111.0, 26075.0, 175660.0, 687800.0, 120769.0, 20190.0, 4998.0, 1567.0, 695.0, 370.0, 195.0, 123.0, 84.0, 53.0, 46.0, 30.0, 22.0, 23.0, 17.0, 15.0, 8.0, 3.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.859375, -13.38818359375, -12.9169921875, -12.44580078125, -11.974609375, -11.50341796875, -11.0322265625, -10.56103515625, -10.08984375, -9.61865234375, -9.1474609375, -8.67626953125, -8.205078125, -7.73388671875, -7.2626953125, -6.79150390625, -6.3203125, -5.84912109375, -5.3779296875, -4.90673828125, -4.435546875, -3.96435546875, -3.4931640625, -3.02197265625, -2.55078125, -2.07958984375, -1.6083984375, -1.13720703125, -0.666015625, -0.19482421875, 0.2763671875, 0.74755859375, 1.21875, 1.68994140625, 2.1611328125, 2.63232421875, 3.103515625, 3.57470703125, 4.0458984375, 4.51708984375, 4.98828125, 5.45947265625, 5.9306640625, 6.40185546875, 6.873046875, 7.34423828125, 7.8154296875, 8.28662109375, 8.7578125, 9.22900390625, 9.7001953125, 10.17138671875, 10.642578125, 11.11376953125, 11.5849609375, 12.05615234375, 12.52734375, 12.99853515625, 13.4697265625, 13.94091796875, 14.412109375, 14.88330078125, 15.3544921875, 15.82568359375, 16.296875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 10.0, 6.0, 5.0, 7.0, 8.0, 13.0, 22.0, 12.0, 22.0, 19.0, 27.0, 26.0, 27.0, 33.0, 37.0, 42.0, 40.0, 35.0, 45.0, 39.0, 52.0, 50.0, 42.0, 34.0, 52.0, 43.0, 40.0, 35.0, 28.0, 23.0, 19.0, 22.0, 15.0, 11.0, 10.0, 14.0, 6.0, 9.0, 8.0, 4.0, 6.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.0, -23.1494140625, -22.298828125, -21.4482421875, -20.59765625, -19.7470703125, -18.896484375, -18.0458984375, -17.1953125, -16.3447265625, -15.494140625, -14.6435546875, -13.79296875, -12.9423828125, -12.091796875, -11.2412109375, -10.390625, -9.5400390625, -8.689453125, -7.8388671875, -6.98828125, -6.1376953125, -5.287109375, -4.4365234375, -3.5859375, -2.7353515625, -1.884765625, -1.0341796875, -0.18359375, 0.6669921875, 1.517578125, 2.3681640625, 3.21875, 4.0693359375, 4.919921875, 5.7705078125, 6.62109375, 7.4716796875, 8.322265625, 9.1728515625, 10.0234375, 10.8740234375, 11.724609375, 12.5751953125, 13.42578125, 14.2763671875, 15.126953125, 15.9775390625, 16.828125, 17.6787109375, 18.529296875, 19.3798828125, 20.23046875, 21.0810546875, 21.931640625, 22.7822265625, 23.6328125, 24.4833984375, 25.333984375, 26.1845703125, 27.03515625, 27.8857421875, 28.736328125, 29.5869140625, 30.4375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 4.0, 5.0, 4.0, 3.0, 11.0, 8.0, 9.0, 20.0, 24.0, 30.0, 54.0, 70.0, 150.0, 200.0, 371.0, 747.0, 1885.0, 7469.0, 92777.0, 896268.0, 40559.0, 4989.0, 1421.0, 623.0, 312.0, 178.0, 117.0, 73.0, 47.0, 46.0, 19.0, 16.0, 17.0, 8.0, 9.0, 4.0, 2.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-12.6875, -12.3387451171875, -11.989990234375, -11.6412353515625, -11.29248046875, -10.9437255859375, -10.594970703125, -10.2462158203125, -9.8974609375, -9.5487060546875, -9.199951171875, -8.8511962890625, -8.50244140625, -8.1536865234375, -7.804931640625, -7.4561767578125, -7.107421875, -6.7586669921875, -6.409912109375, -6.0611572265625, -5.71240234375, -5.3636474609375, -5.014892578125, -4.6661376953125, -4.3173828125, -3.9686279296875, -3.619873046875, -3.2711181640625, -2.92236328125, -2.5736083984375, -2.224853515625, -1.8760986328125, -1.52734375, -1.1785888671875, -0.829833984375, -0.4810791015625, -0.13232421875, 0.2164306640625, 0.565185546875, 0.9139404296875, 1.2626953125, 1.6114501953125, 1.960205078125, 2.3089599609375, 2.65771484375, 3.0064697265625, 3.355224609375, 3.7039794921875, 4.052734375, 4.4014892578125, 4.750244140625, 5.0989990234375, 5.44775390625, 5.7965087890625, 6.145263671875, 6.4940185546875, 6.8427734375, 7.1915283203125, 7.540283203125, 7.8890380859375, 8.23779296875, 8.5865478515625, 8.935302734375, 9.2840576171875, 9.6328125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 4.0, 6.0, 7.0, 14.0, 23.0, 30.0, 54.0, 110.0, 185.0, 199.0, 141.0, 93.0, 52.0, 41.0, 20.0, 8.0, 7.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011425018310546875, -0.0011081695556640625, -0.0010738372802734375, -0.0010395050048828125, -0.0010051727294921875, -0.0009708404541015625, -0.0009365081787109375, -0.0009021759033203125, -0.0008678436279296875, -0.0008335113525390625, -0.0007991790771484375, -0.0007648468017578125, -0.0007305145263671875, -0.0006961822509765625, -0.0006618499755859375, -0.0006275177001953125, -0.0005931854248046875, -0.0005588531494140625, -0.0005245208740234375, -0.0004901885986328125, -0.0004558563232421875, -0.0004215240478515625, -0.0003871917724609375, -0.0003528594970703125, -0.0003185272216796875, -0.0002841949462890625, -0.0002498626708984375, -0.0002155303955078125, -0.0001811981201171875, -0.0001468658447265625, -0.0001125335693359375, -7.82012939453125e-05, -4.38690185546875e-05, -9.5367431640625e-06, 2.47955322265625e-05, 5.91278076171875e-05, 9.34600830078125e-05, 0.0001277923583984375, 0.0001621246337890625, 0.0001964569091796875, 0.0002307891845703125, 0.0002651214599609375, 0.0002994537353515625, 0.0003337860107421875, 0.0003681182861328125, 0.0004024505615234375, 0.0004367828369140625, 0.0004711151123046875, 0.0005054473876953125, 0.0005397796630859375, 0.0005741119384765625, 0.0006084442138671875, 0.0006427764892578125, 0.0006771087646484375, 0.0007114410400390625, 0.0007457733154296875, 0.0007801055908203125, 0.0008144378662109375, 0.0008487701416015625, 0.0008831024169921875, 0.0009174346923828125, 0.0009517669677734375, 0.0009860992431640625, 0.0010204315185546875, 0.0010547637939453125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 3.0, 6.0, 8.0, 6.0, 12.0, 14.0, 32.0, 54.0, 88.0, 178.0, 463.0, 1121.0, 4793.0, 49440.0, 923211.0, 61463.0, 5505.0, 1274.0, 443.0, 174.0, 111.0, 69.0, 30.0, 12.0, 19.0, 9.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-17.453125, -17.06121826171875, -16.6693115234375, -16.27740478515625, -15.885498046875, -15.49359130859375, -15.1016845703125, -14.70977783203125, -14.31787109375, -13.92596435546875, -13.5340576171875, -13.14215087890625, -12.750244140625, -12.35833740234375, -11.9664306640625, -11.57452392578125, -11.1826171875, -10.79071044921875, -10.3988037109375, -10.00689697265625, -9.614990234375, -9.22308349609375, -8.8311767578125, -8.43927001953125, -8.04736328125, -7.65545654296875, -7.2635498046875, -6.87164306640625, -6.479736328125, -6.08782958984375, -5.6959228515625, -5.30401611328125, -4.912109375, -4.52020263671875, -4.1282958984375, -3.73638916015625, -3.344482421875, -2.95257568359375, -2.5606689453125, -2.16876220703125, -1.77685546875, -1.38494873046875, -0.9930419921875, -0.60113525390625, -0.209228515625, 0.18267822265625, 0.5745849609375, 0.96649169921875, 1.3583984375, 1.75030517578125, 2.1422119140625, 2.53411865234375, 2.926025390625, 3.31793212890625, 3.7098388671875, 4.10174560546875, 4.49365234375, 4.88555908203125, 5.2774658203125, 5.66937255859375, 6.061279296875, 6.45318603515625, 6.8450927734375, 7.23699951171875, 7.62890625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 6.0, 11.0, 10.0, 24.0, 32.0, 81.0, 144.0, 191.0, 177.0, 131.0, 75.0, 43.0, 19.0, 14.0, 7.0, 8.0, 5.0, 5.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-21.921875, -21.4122314453125, -20.902587890625, -20.3929443359375, -19.88330078125, -19.3736572265625, -18.864013671875, -18.3543701171875, -17.8447265625, -17.3350830078125, -16.825439453125, -16.3157958984375, -15.80615234375, -15.2965087890625, -14.786865234375, -14.2772216796875, -13.767578125, -13.2579345703125, -12.748291015625, -12.2386474609375, -11.72900390625, -11.2193603515625, -10.709716796875, -10.2000732421875, -9.6904296875, -9.1807861328125, -8.671142578125, -8.1614990234375, -7.65185546875, -7.1422119140625, -6.632568359375, -6.1229248046875, -5.61328125, -5.1036376953125, -4.593994140625, -4.0843505859375, -3.57470703125, -3.0650634765625, -2.555419921875, -2.0457763671875, -1.5361328125, -1.0264892578125, -0.516845703125, -0.0072021484375, 0.50244140625, 1.0120849609375, 1.521728515625, 2.0313720703125, 2.541015625, 3.0506591796875, 3.560302734375, 4.0699462890625, 4.57958984375, 5.0892333984375, 5.598876953125, 6.1085205078125, 6.6181640625, 7.1278076171875, 7.637451171875, 8.1470947265625, 8.65673828125, 9.1663818359375, 9.676025390625, 10.1856689453125, 10.6953125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 9.0, 20.0, 56.0, 156.0, 279.0, 253.0, 141.0, 41.0, 27.0, 11.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-166.8299560546875, -160.41094970703125, -153.991943359375, -147.57293701171875, -141.1539306640625, -134.73492431640625, -128.31590270996094, -121.89689636230469, -115.47789001464844, -109.05888366699219, -102.63987731933594, -96.22086334228516, -89.8018569946289, -83.38285064697266, -76.96383666992188, -70.54483032226562, -64.12582397460938, -57.706817626953125, -51.28780746459961, -44.868797302246094, -38.449790954589844, -32.030784606933594, -25.611774444580078, -19.192764282226562, -12.773757934570312, -6.35474967956543, 0.06425857543945312, 6.483266830444336, 12.902275085449219, 19.32128143310547, 25.740291595458984, 32.1593017578125, 38.57830810546875, 44.997314453125, 51.416324615478516, 57.83533477783203, 64.25434112548828, 70.67334747314453, 77.09236145019531, 83.51136779785156, 89.93037414550781, 96.34938049316406, 102.76838684082031, 109.1874008178711, 115.60640716552734, 122.0254135131836, 128.44442749023438, 134.86343383789062, 141.28244018554688, 147.70144653320312, 154.12045288085938, 160.53945922851562, 166.95846557617188, 173.37747192382812, 179.79649353027344, 186.2154998779297, 192.63450622558594, 199.0535125732422, 205.47251892089844, 211.8915252685547, 218.310546875, 224.72955322265625, 231.1485595703125, 237.56756591796875, 243.986572265625]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 5.0, 8.0, 5.0, 12.0, 9.0, 11.0, 17.0, 18.0, 32.0, 32.0, 28.0, 37.0, 42.0, 40.0, 34.0, 51.0, 50.0, 54.0, 52.0, 58.0, 37.0, 60.0, 39.0, 42.0, 47.0, 22.0, 22.0, 27.0, 22.0, 11.0, 13.0, 11.0, 9.0, 8.0, 13.0, 3.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-112.0233154296875, -107.8429183959961, -103.66252136230469, -99.48213195800781, -95.3017349243164, -91.121337890625, -86.9409408569336, -82.76054382324219, -78.58015441894531, -74.3997573852539, -70.2193603515625, -66.03897094726562, -61.85857391357422, -57.67817687988281, -53.497779846191406, -49.3173828125, -45.136985778808594, -40.95658874511719, -36.77619552612305, -32.59579849243164, -28.415403366088867, -24.235008239746094, -20.054611206054688, -15.874216079711914, -11.69382095336914, -7.513425350189209, -3.3330297470092773, 0.8473663330078125, 5.027761459350586, 9.20815658569336, 13.388553619384766, 17.56894874572754, 21.749343872070312, 25.929738998413086, 30.11013412475586, 34.290531158447266, 38.470924377441406, 42.65132141113281, 46.83171844482422, 51.012115478515625, 55.192508697509766, 59.37290573120117, 63.55329895019531, 67.73369598388672, 71.91409301757812, 76.094482421875, 80.27488708496094, 84.45527648925781, 88.63567352294922, 92.81607055664062, 96.99646759033203, 101.17686462402344, 105.35725402832031, 109.53765106201172, 113.71804809570312, 117.89844512939453, 122.07884216308594, 126.25923919677734, 130.43963623046875, 134.62002563476562, 138.80043029785156, 142.98081970214844, 147.16122436523438, 151.34161376953125, 155.52200317382812]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 6.0, 17.0, 13.0, 41.0, 54.0, 124.0, 211.0, 418.0, 909.0, 2298.0, 6350.0, 27523.0, 3882704.0, 249810.0, 16212.0, 4478.0, 1665.0, 698.0, 318.0, 176.0, 99.0, 56.0, 27.0, 21.0, 14.0, 7.0, 5.0, 3.0, 3.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.71875, -9.29345703125, -8.8681640625, -8.44287109375, -8.017578125, -7.59228515625, -7.1669921875, -6.74169921875, -6.31640625, -5.89111328125, -5.4658203125, -5.04052734375, -4.615234375, -4.18994140625, -3.7646484375, -3.33935546875, -2.9140625, -2.48876953125, -2.0634765625, -1.63818359375, -1.212890625, -0.78759765625, -0.3623046875, 0.06298828125, 0.48828125, 0.91357421875, 1.3388671875, 1.76416015625, 2.189453125, 2.61474609375, 3.0400390625, 3.46533203125, 3.890625, 4.31591796875, 4.7412109375, 5.16650390625, 5.591796875, 6.01708984375, 6.4423828125, 6.86767578125, 7.29296875, 7.71826171875, 8.1435546875, 8.56884765625, 8.994140625, 9.41943359375, 9.8447265625, 10.27001953125, 10.6953125, 11.12060546875, 11.5458984375, 11.97119140625, 12.396484375, 12.82177734375, 13.2470703125, 13.67236328125, 14.09765625, 14.52294921875, 14.9482421875, 15.37353515625, 15.798828125, 16.22412109375, 16.6494140625, 17.07470703125, 17.5]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 2.0, 5.0, 1.0, 5.0, 5.0, 8.0, 19.0, 23.0, 24.0, 22.0, 27.0, 52.0, 56.0, 69.0, 67.0, 78.0, 74.0, 85.0, 74.0, 55.0, 56.0, 45.0, 32.0, 37.0, 24.0, 17.0, 8.0, 7.0, 5.0, 9.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.53515625, -7.28753662109375, -7.0399169921875, -6.79229736328125, -6.544677734375, -6.29705810546875, -6.0494384765625, -5.80181884765625, -5.55419921875, -5.30657958984375, -5.0589599609375, -4.81134033203125, -4.563720703125, -4.31610107421875, -4.0684814453125, -3.82086181640625, -3.5732421875, -3.32562255859375, -3.0780029296875, -2.83038330078125, -2.582763671875, -2.33514404296875, -2.0875244140625, -1.83990478515625, -1.59228515625, -1.34466552734375, -1.0970458984375, -0.84942626953125, -0.601806640625, -0.35418701171875, -0.1065673828125, 0.14105224609375, 0.388671875, 0.63629150390625, 0.8839111328125, 1.13153076171875, 1.379150390625, 1.62677001953125, 1.8743896484375, 2.12200927734375, 2.36962890625, 2.61724853515625, 2.8648681640625, 3.11248779296875, 3.360107421875, 3.60772705078125, 3.8553466796875, 4.10296630859375, 4.3505859375, 4.59820556640625, 4.8458251953125, 5.09344482421875, 5.341064453125, 5.58868408203125, 5.8363037109375, 6.08392333984375, 6.33154296875, 6.57916259765625, 6.8267822265625, 7.07440185546875, 7.322021484375, 7.56964111328125, 7.8172607421875, 8.06488037109375, 8.3125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 8.0, 7.0, 10.0, 7.0, 12.0, 21.0, 35.0, 30.0, 64.0, 95.0, 112.0, 145.0, 265.0, 378.0, 722.0, 1347.0, 3268.0, 9919.0, 57552.0, 3984939.0, 113706.0, 13674.0, 4167.0, 1659.0, 842.0, 431.0, 267.0, 158.0, 113.0, 84.0, 71.0, 54.0, 37.0, 25.0, 17.0, 11.0, 10.0, 10.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1015625, -12.7532958984375, -12.405029296875, -12.0567626953125, -11.70849609375, -11.3602294921875, -11.011962890625, -10.6636962890625, -10.3154296875, -9.9671630859375, -9.618896484375, -9.2706298828125, -8.92236328125, -8.5740966796875, -8.225830078125, -7.8775634765625, -7.529296875, -7.1810302734375, -6.832763671875, -6.4844970703125, -6.13623046875, -5.7879638671875, -5.439697265625, -5.0914306640625, -4.7431640625, -4.3948974609375, -4.046630859375, -3.6983642578125, -3.35009765625, -3.0018310546875, -2.653564453125, -2.3052978515625, -1.95703125, -1.6087646484375, -1.260498046875, -0.9122314453125, -0.56396484375, -0.2156982421875, 0.132568359375, 0.4808349609375, 0.8291015625, 1.1773681640625, 1.525634765625, 1.8739013671875, 2.22216796875, 2.5704345703125, 2.918701171875, 3.2669677734375, 3.615234375, 3.9635009765625, 4.311767578125, 4.6600341796875, 5.00830078125, 5.3565673828125, 5.704833984375, 6.0531005859375, 6.4013671875, 6.7496337890625, 7.097900390625, 7.4461669921875, 7.79443359375, 8.1427001953125, 8.490966796875, 8.8392333984375, 9.1875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 4.0, 9.0, 11.0, 36.0, 111.0, 710.0, 2930.0, 141.0, 43.0, 21.0, 16.0, 7.0, 8.0, 3.0, 2.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3671875, -5.16168212890625, -4.9561767578125, -4.75067138671875, -4.545166015625, -4.33966064453125, -4.1341552734375, -3.92864990234375, -3.72314453125, -3.51763916015625, -3.3121337890625, -3.10662841796875, -2.901123046875, -2.69561767578125, -2.4901123046875, -2.28460693359375, -2.0791015625, -1.87359619140625, -1.6680908203125, -1.46258544921875, -1.257080078125, -1.05157470703125, -0.8460693359375, -0.64056396484375, -0.43505859375, -0.22955322265625, -0.0240478515625, 0.18145751953125, 0.386962890625, 0.59246826171875, 0.7979736328125, 1.00347900390625, 1.208984375, 1.41448974609375, 1.6199951171875, 1.82550048828125, 2.031005859375, 2.23651123046875, 2.4420166015625, 2.64752197265625, 2.85302734375, 3.05853271484375, 3.2640380859375, 3.46954345703125, 3.675048828125, 3.88055419921875, 4.0860595703125, 4.29156494140625, 4.4970703125, 4.70257568359375, 4.9080810546875, 5.11358642578125, 5.319091796875, 5.52459716796875, 5.7301025390625, 5.93560791015625, 6.14111328125, 6.34661865234375, 6.5521240234375, 6.75762939453125, 6.963134765625, 7.16864013671875, 7.3741455078125, 7.57965087890625, 7.78515625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 11.0, 16.0, 32.0, 102.0, 270.0, 309.0, 173.0, 58.0, 21.0, 7.0, 2.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.649616241455078, -27.34982681274414, -26.050037384033203, -24.750247955322266, -23.450458526611328, -22.15066909790039, -20.850879669189453, -19.551090240478516, -18.251300811767578, -16.95151138305664, -15.651721954345703, -14.351932525634766, -13.052143096923828, -11.75235366821289, -10.452564239501953, -9.152774810791016, -7.852985382080078, -6.553195953369141, -5.253406524658203, -3.9536170959472656, -2.653827667236328, -1.3540382385253906, -0.054248809814453125, 1.2455406188964844, 2.545330047607422, 3.8451194763183594, 5.144908905029297, 6.444698333740234, 7.744487762451172, 9.04427719116211, 10.344066619873047, 11.643856048583984, 12.943641662597656, 14.243431091308594, 15.543220520019531, 16.84300994873047, 18.142799377441406, 19.442588806152344, 20.74237823486328, 22.04216766357422, 23.341957092285156, 24.641746520996094, 25.94153594970703, 27.24132537841797, 28.541114807128906, 29.840904235839844, 31.14069366455078, 32.44048309326172, 33.740272521972656, 35.040061950683594, 36.33985137939453, 37.63964080810547, 38.939430236816406, 40.239219665527344, 41.53900909423828, 42.83879852294922, 44.138587951660156, 45.438377380371094, 46.73816680908203, 48.03795623779297, 49.337745666503906, 50.637535095214844, 51.93732452392578, 53.23711395263672, 54.536903381347656]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 7.0, 4.0, 10.0, 6.0, 7.0, 9.0, 10.0, 12.0, 16.0, 17.0, 19.0, 18.0, 26.0, 36.0, 37.0, 51.0, 47.0, 50.0, 46.0, 41.0, 59.0, 52.0, 58.0, 42.0, 41.0, 28.0, 39.0, 30.0, 26.0, 27.0, 18.0, 25.0, 28.0, 16.0, 14.0, 10.0, 11.0, 5.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.955860137939453, -11.585131645202637, -11.21440315246582, -10.84367561340332, -10.472947120666504, -10.102218627929688, -9.731490135192871, -9.360761642456055, -8.990034103393555, -8.619305610656738, -8.248577117919922, -7.877849102020264, -7.5071210861206055, -7.136392593383789, -6.765664100646973, -6.394935607910156, -6.02420711517334, -5.653478622436523, -5.282750606536865, -4.912022113800049, -4.541294097900391, -4.170565605163574, -3.799837112426758, -3.4291088581085205, -3.058380603790283, -2.687652349472046, -2.3169240951538086, -1.9461956024169922, -1.5754673480987549, -1.2047390937805176, -0.8340106010437012, -0.46328234672546387, -0.09255313873291016, 0.2781751751899719, 0.648903489112854, 1.0196318626403809, 1.3903601169586182, 1.7610883712768555, 2.131816864013672, 2.502545118331909, 2.8732733726501465, 3.244001626968384, 3.614729881286621, 3.9854583740234375, 4.356186866760254, 4.726914882659912, 5.0976433753967285, 5.468371391296387, 5.839099884033203, 6.2098283767700195, 6.580556392669678, 6.951284885406494, 7.322012901306152, 7.692741394042969, 8.063469886779785, 8.434198379516602, 8.804925918579102, 9.175654411315918, 9.546382904052734, 9.917110443115234, 10.28783893585205, 10.658567428588867, 11.029295921325684, 11.4000244140625, 11.770752906799316]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 14.0, 10.0, 15.0, 18.0, 32.0, 48.0, 69.0, 107.0, 178.0, 319.0, 542.0, 959.0, 1780.0, 3952.0, 9216.0, 26334.0, 95861.0, 405307.0, 376694.0, 86452.0, 24173.0, 8751.0, 3760.0, 1736.0, 961.0, 519.0, 255.0, 169.0, 114.0, 76.0, 29.0, 29.0, 22.0, 14.0, 10.0, 6.0, 6.0, 4.0, 7.0, 2.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8046875, -8.5108642578125, -8.217041015625, -7.9232177734375, -7.62939453125, -7.3355712890625, -7.041748046875, -6.7479248046875, -6.4541015625, -6.1602783203125, -5.866455078125, -5.5726318359375, -5.27880859375, -4.9849853515625, -4.691162109375, -4.3973388671875, -4.103515625, -3.8096923828125, -3.515869140625, -3.2220458984375, -2.92822265625, -2.6343994140625, -2.340576171875, -2.0467529296875, -1.7529296875, -1.4591064453125, -1.165283203125, -0.8714599609375, -0.57763671875, -0.2838134765625, 0.010009765625, 0.3038330078125, 0.59765625, 0.8914794921875, 1.185302734375, 1.4791259765625, 1.77294921875, 2.0667724609375, 2.360595703125, 2.6544189453125, 2.9482421875, 3.2420654296875, 3.535888671875, 3.8297119140625, 4.12353515625, 4.4173583984375, 4.711181640625, 5.0050048828125, 5.298828125, 5.5926513671875, 5.886474609375, 6.1802978515625, 6.47412109375, 6.7679443359375, 7.061767578125, 7.3555908203125, 7.6494140625, 7.9432373046875, 8.237060546875, 8.5308837890625, 8.82470703125, 9.1185302734375, 9.412353515625, 9.7061767578125, 10.0]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 5.0, 1.0, 2.0, 2.0, 4.0, 8.0, 18.0, 14.0, 24.0, 26.0, 29.0, 46.0, 46.0, 51.0, 69.0, 75.0, 68.0, 94.0, 74.0, 57.0, 50.0, 53.0, 47.0, 36.0, 33.0, 17.0, 16.0, 9.0, 8.0, 3.0, 5.0, 2.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.0, -7.75750732421875, -7.5150146484375, -7.27252197265625, -7.030029296875, -6.78753662109375, -6.5450439453125, -6.30255126953125, -6.06005859375, -5.81756591796875, -5.5750732421875, -5.33258056640625, -5.090087890625, -4.84759521484375, -4.6051025390625, -4.36260986328125, -4.1201171875, -3.87762451171875, -3.6351318359375, -3.39263916015625, -3.150146484375, -2.90765380859375, -2.6651611328125, -2.42266845703125, -2.18017578125, -1.93768310546875, -1.6951904296875, -1.45269775390625, -1.210205078125, -0.96771240234375, -0.7252197265625, -0.48272705078125, -0.240234375, 0.00225830078125, 0.2447509765625, 0.48724365234375, 0.729736328125, 0.97222900390625, 1.2147216796875, 1.45721435546875, 1.69970703125, 1.94219970703125, 2.1846923828125, 2.42718505859375, 2.669677734375, 2.91217041015625, 3.1546630859375, 3.39715576171875, 3.6396484375, 3.88214111328125, 4.1246337890625, 4.36712646484375, 4.609619140625, 4.85211181640625, 5.0946044921875, 5.33709716796875, 5.57958984375, 5.82208251953125, 6.0645751953125, 6.30706787109375, 6.549560546875, 6.79205322265625, 7.0345458984375, 7.27703857421875, 7.51953125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 5.0, 7.0, 10.0, 15.0, 32.0, 37.0, 74.0, 104.0, 256.0, 503.0, 1400.0, 6350.0, 78991.0, 891359.0, 61949.0, 5223.0, 1266.0, 460.0, 216.0, 95.0, 75.0, 46.0, 31.0, 15.0, 11.0, 8.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.125, -16.3271484375, -15.529296875, -14.7314453125, -13.93359375, -13.1357421875, -12.337890625, -11.5400390625, -10.7421875, -9.9443359375, -9.146484375, -8.3486328125, -7.55078125, -6.7529296875, -5.955078125, -5.1572265625, -4.359375, -3.5615234375, -2.763671875, -1.9658203125, -1.16796875, -0.3701171875, 0.427734375, 1.2255859375, 2.0234375, 2.8212890625, 3.619140625, 4.4169921875, 5.21484375, 6.0126953125, 6.810546875, 7.6083984375, 8.40625, 9.2041015625, 10.001953125, 10.7998046875, 11.59765625, 12.3955078125, 13.193359375, 13.9912109375, 14.7890625, 15.5869140625, 16.384765625, 17.1826171875, 17.98046875, 18.7783203125, 19.576171875, 20.3740234375, 21.171875, 21.9697265625, 22.767578125, 23.5654296875, 24.36328125, 25.1611328125, 25.958984375, 26.7568359375, 27.5546875, 28.3525390625, 29.150390625, 29.9482421875, 30.74609375, 31.5439453125, 32.341796875, 33.1396484375, 33.9375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 6.0, 6.0, 9.0, 6.0, 9.0, 16.0, 11.0, 22.0, 26.0, 25.0, 23.0, 48.0, 44.0, 43.0, 41.0, 64.0, 63.0, 56.0, 66.0, 69.0, 65.0, 48.0, 47.0, 34.0, 38.0, 24.0, 18.0, 9.0, 13.0, 18.0, 11.0, 11.0, 8.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.75, -26.871826171875, -25.99365234375, -25.115478515625, -24.2373046875, -23.359130859375, -22.48095703125, -21.602783203125, -20.724609375, -19.846435546875, -18.96826171875, -18.090087890625, -17.2119140625, -16.333740234375, -15.45556640625, -14.577392578125, -13.69921875, -12.821044921875, -11.94287109375, -11.064697265625, -10.1865234375, -9.308349609375, -8.43017578125, -7.552001953125, -6.673828125, -5.795654296875, -4.91748046875, -4.039306640625, -3.1611328125, -2.282958984375, -1.40478515625, -0.526611328125, 0.3515625, 1.229736328125, 2.10791015625, 2.986083984375, 3.8642578125, 4.742431640625, 5.62060546875, 6.498779296875, 7.376953125, 8.255126953125, 9.13330078125, 10.011474609375, 10.8896484375, 11.767822265625, 12.64599609375, 13.524169921875, 14.40234375, 15.280517578125, 16.15869140625, 17.036865234375, 17.9150390625, 18.793212890625, 19.67138671875, 20.549560546875, 21.427734375, 22.305908203125, 23.18408203125, 24.062255859375, 24.9404296875, 25.818603515625, 26.69677734375, 27.574951171875, 28.453125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 1.0, 3.0, 7.0, 13.0, 12.0, 12.0, 27.0, 34.0, 48.0, 89.0, 148.0, 219.0, 490.0, 1081.0, 3899.0, 28250.0, 719224.0, 276958.0, 13791.0, 2467.0, 842.0, 389.0, 202.0, 128.0, 68.0, 54.0, 32.0, 25.0, 10.0, 7.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.4765625, -6.28521728515625, -6.0938720703125, -5.90252685546875, -5.711181640625, -5.51983642578125, -5.3284912109375, -5.13714599609375, -4.94580078125, -4.75445556640625, -4.5631103515625, -4.37176513671875, -4.180419921875, -3.98907470703125, -3.7977294921875, -3.60638427734375, -3.4150390625, -3.22369384765625, -3.0323486328125, -2.84100341796875, -2.649658203125, -2.45831298828125, -2.2669677734375, -2.07562255859375, -1.88427734375, -1.69293212890625, -1.5015869140625, -1.31024169921875, -1.118896484375, -0.92755126953125, -0.7362060546875, -0.54486083984375, -0.353515625, -0.16217041015625, 0.0291748046875, 0.22052001953125, 0.411865234375, 0.60321044921875, 0.7945556640625, 0.98590087890625, 1.17724609375, 1.36859130859375, 1.5599365234375, 1.75128173828125, 1.942626953125, 2.13397216796875, 2.3253173828125, 2.51666259765625, 2.7080078125, 2.89935302734375, 3.0906982421875, 3.28204345703125, 3.473388671875, 3.66473388671875, 3.8560791015625, 4.04742431640625, 4.23876953125, 4.43011474609375, 4.6214599609375, 4.81280517578125, 5.004150390625, 5.19549560546875, 5.3868408203125, 5.57818603515625, 5.76953125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 9.0, 4.0, 8.0, 12.0, 14.0, 30.0, 25.0, 45.0, 51.0, 59.0, 79.0, 92.0, 117.0, 103.0, 80.0, 64.0, 52.0, 40.0, 23.0, 30.0, 19.0, 13.0, 7.0, 5.0, 5.0, 4.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004506111145019531, -0.00043521076440811157, -0.00041981041431427, -0.00040441006422042847, -0.0003890097141265869, -0.00037360936403274536, -0.0003582090139389038, -0.00034280866384506226, -0.0003274083137512207, -0.00031200796365737915, -0.0002966076135635376, -0.00028120726346969604, -0.0002658069133758545, -0.00025040656328201294, -0.0002350062131881714, -0.00021960586309432983, -0.00020420551300048828, -0.00018880516290664673, -0.00017340481281280518, -0.00015800446271896362, -0.00014260411262512207, -0.00012720376253128052, -0.00011180341243743896, -9.640306234359741e-05, -8.100271224975586e-05, -6.56023621559143e-05, -5.0202012062072754e-05, -3.48016619682312e-05, -1.940131187438965e-05, -4.000961780548096e-06, 1.1399388313293457e-05, 2.679973840713501e-05, 4.220008850097656e-05, 5.7600438594818115e-05, 7.300078868865967e-05, 8.840113878250122e-05, 0.00010380148887634277, 0.00011920183897018433, 0.00013460218906402588, 0.00015000253915786743, 0.00016540288925170898, 0.00018080323934555054, 0.0001962035894393921, 0.00021160393953323364, 0.0002270042896270752, 0.00024240463972091675, 0.0002578049898147583, 0.00027320533990859985, 0.0002886056900024414, 0.00030400604009628296, 0.0003194063901901245, 0.00033480674028396606, 0.0003502070903778076, 0.00036560744047164917, 0.0003810077905654907, 0.0003964081406593323, 0.00041180849075317383, 0.0004272088408470154, 0.00044260919094085693, 0.0004580095410346985, 0.00047340989112854004, 0.0004888102412223816, 0.0005042105913162231, 0.0005196109414100647, 0.0005350112915039062]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 9.0, 8.0, 8.0, 14.0, 20.0, 27.0, 43.0, 67.0, 107.0, 280.0, 503.0, 1246.0, 4750.0, 39145.0, 846269.0, 143286.0, 9237.0, 2023.0, 800.0, 317.0, 141.0, 85.0, 56.0, 39.0, 23.0, 18.0, 11.0, 9.0, 7.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.3671875, -6.15972900390625, -5.9522705078125, -5.74481201171875, -5.537353515625, -5.32989501953125, -5.1224365234375, -4.91497802734375, -4.70751953125, -4.50006103515625, -4.2926025390625, -4.08514404296875, -3.877685546875, -3.67022705078125, -3.4627685546875, -3.25531005859375, -3.0478515625, -2.84039306640625, -2.6329345703125, -2.42547607421875, -2.218017578125, -2.01055908203125, -1.8031005859375, -1.59564208984375, -1.38818359375, -1.18072509765625, -0.9732666015625, -0.76580810546875, -0.558349609375, -0.35089111328125, -0.1434326171875, 0.06402587890625, 0.271484375, 0.47894287109375, 0.6864013671875, 0.89385986328125, 1.101318359375, 1.30877685546875, 1.5162353515625, 1.72369384765625, 1.93115234375, 2.13861083984375, 2.3460693359375, 2.55352783203125, 2.760986328125, 2.96844482421875, 3.1759033203125, 3.38336181640625, 3.5908203125, 3.79827880859375, 4.0057373046875, 4.21319580078125, 4.420654296875, 4.62811279296875, 4.8355712890625, 5.04302978515625, 5.25048828125, 5.45794677734375, 5.6654052734375, 5.87286376953125, 6.080322265625, 6.28778076171875, 6.4952392578125, 6.70269775390625, 6.91015625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 4.0, 5.0, 14.0, 30.0, 38.0, 76.0, 123.0, 151.0, 153.0, 119.0, 108.0, 63.0, 42.0, 24.0, 17.0, 8.0, 7.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.30859375, -6.07635498046875, -5.8441162109375, -5.61187744140625, -5.379638671875, -5.14739990234375, -4.9151611328125, -4.68292236328125, -4.45068359375, -4.21844482421875, -3.9862060546875, -3.75396728515625, -3.521728515625, -3.28948974609375, -3.0572509765625, -2.82501220703125, -2.5927734375, -2.36053466796875, -2.1282958984375, -1.89605712890625, -1.663818359375, -1.43157958984375, -1.1993408203125, -0.96710205078125, -0.73486328125, -0.50262451171875, -0.2703857421875, -0.03814697265625, 0.194091796875, 0.42633056640625, 0.6585693359375, 0.89080810546875, 1.123046875, 1.35528564453125, 1.5875244140625, 1.81976318359375, 2.052001953125, 2.28424072265625, 2.5164794921875, 2.74871826171875, 2.98095703125, 3.21319580078125, 3.4454345703125, 3.67767333984375, 3.909912109375, 4.14215087890625, 4.3743896484375, 4.60662841796875, 4.8388671875, 5.07110595703125, 5.3033447265625, 5.53558349609375, 5.767822265625, 6.00006103515625, 6.2322998046875, 6.46453857421875, 6.69677734375, 6.92901611328125, 7.1612548828125, 7.39349365234375, 7.625732421875, 7.85797119140625, 8.0902099609375, 8.32244873046875, 8.5546875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 14.0, 14.0, 27.0, 57.0, 131.0, 194.0, 228.0, 150.0, 96.0, 38.0, 23.0, 12.0, 9.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.00369262695312, -84.20802307128906, -80.412353515625, -76.6166763305664, -72.82100677490234, -69.02533721923828, -65.22966003417969, -61.433990478515625, -57.63832092285156, -53.8426513671875, -50.04697799682617, -46.251304626464844, -42.45563507080078, -38.65996551513672, -34.86429214477539, -31.068620681762695, -27.27294921875, -23.477277755737305, -19.68160629272461, -15.885934829711914, -12.090263366699219, -8.294591903686523, -4.498920440673828, -0.7032489776611328, 3.0924224853515625, 6.888093948364258, 10.683765411376953, 14.479436874389648, 18.275108337402344, 22.07077980041504, 25.866451263427734, 29.66212272644043, 33.457794189453125, 37.25346374511719, 41.049137115478516, 44.844810485839844, 48.640480041503906, 52.43614959716797, 56.2318229675293, 60.027496337890625, 63.82316589355469, 67.61883544921875, 71.41450500488281, 75.2101821899414, 79.00585174560547, 82.80152130126953, 86.59719848632812, 90.39286804199219, 94.18853759765625, 97.98420715332031, 101.77987670898438, 105.57555389404297, 109.37122344970703, 113.1668930053711, 116.96257019042969, 120.75823974609375, 124.55390930175781, 128.34957885742188, 132.14524841308594, 135.94091796875, 139.73660278320312, 143.5322723388672, 147.32794189453125, 151.1236114501953, 154.91928100585938]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 9.0, 7.0, 11.0, 14.0, 13.0, 25.0, 17.0, 28.0, 30.0, 25.0, 43.0, 31.0, 40.0, 42.0, 50.0, 52.0, 53.0, 63.0, 56.0, 41.0, 47.0, 37.0, 37.0, 37.0, 31.0, 29.0, 24.0, 18.0, 20.0, 8.0, 4.0, 12.0, 9.0, 6.0, 7.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-115.11519622802734, -111.97420501708984, -108.83322143554688, -105.69223022460938, -102.55123901367188, -99.41024780273438, -96.2692642211914, -93.1282730102539, -89.98728942871094, -86.84629821777344, -83.70531463623047, -80.56432342529297, -77.42333221435547, -74.2823486328125, -71.141357421875, -68.0003662109375, -64.859375, -61.718387603759766, -58.577396392822266, -55.43640899658203, -52.29541778564453, -49.1544303894043, -46.01344299316406, -42.87245178222656, -39.73146438598633, -36.590476989746094, -33.449485778808594, -30.30849838256836, -27.167509078979492, -24.026519775390625, -20.88553237915039, -17.744543075561523, -14.603546142578125, -11.462556838989258, -8.321568489074707, -5.180580139160156, -2.039590835571289, 1.1013984680175781, 4.2423858642578125, 7.38337516784668, 10.524364471435547, 13.665353775024414, 16.80634307861328, 19.947330474853516, 23.088319778442383, 26.22930908203125, 29.370296478271484, 32.51128387451172, 35.65227508544922, 38.79326248168945, 41.93425369262695, 45.07524108886719, 48.21623229980469, 51.35721969604492, 54.498207092285156, 57.639198303222656, 60.78018569946289, 63.921173095703125, 67.06216430664062, 70.20315551757812, 73.3441390991211, 76.4851303100586, 79.62611389160156, 82.76710510253906, 85.90809631347656]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 7.0, 16.0, 13.0, 27.0, 31.0, 83.0, 99.0, 216.0, 374.0, 752.0, 1666.0, 4162.0, 13392.0, 99061.0, 3881554.0, 169052.0, 16353.0, 4461.0, 1637.0, 674.0, 308.0, 165.0, 75.0, 40.0, 26.0, 16.0, 11.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.125, -11.7525634765625, -11.380126953125, -11.0076904296875, -10.63525390625, -10.2628173828125, -9.890380859375, -9.5179443359375, -9.1455078125, -8.7730712890625, -8.400634765625, -8.0281982421875, -7.65576171875, -7.2833251953125, -6.910888671875, -6.5384521484375, -6.166015625, -5.7935791015625, -5.421142578125, -5.0487060546875, -4.67626953125, -4.3038330078125, -3.931396484375, -3.5589599609375, -3.1865234375, -2.8140869140625, -2.441650390625, -2.0692138671875, -1.69677734375, -1.3243408203125, -0.951904296875, -0.5794677734375, -0.20703125, 0.1654052734375, 0.537841796875, 0.9102783203125, 1.28271484375, 1.6551513671875, 2.027587890625, 2.4000244140625, 2.7724609375, 3.1448974609375, 3.517333984375, 3.8897705078125, 4.26220703125, 4.6346435546875, 5.007080078125, 5.3795166015625, 5.751953125, 6.1243896484375, 6.496826171875, 6.8692626953125, 7.24169921875, 7.6141357421875, 7.986572265625, 8.3590087890625, 8.7314453125, 9.1038818359375, 9.476318359375, 9.8487548828125, 10.22119140625, 10.5936279296875, 10.966064453125, 11.3385009765625, 11.7109375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 6.0, 4.0, 4.0, 9.0, 8.0, 5.0, 9.0, 13.0, 10.0, 9.0, 8.0, 9.0, 19.0, 24.0, 16.0, 32.0, 26.0, 22.0, 34.0, 28.0, 43.0, 45.0, 49.0, 48.0, 50.0, 45.0, 45.0, 44.0, 41.0, 36.0, 36.0, 25.0, 27.0, 28.0, 27.0, 15.0, 20.0, 20.0, 15.0, 6.0, 6.0, 10.0, 8.0, 7.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0], "bins": [-4.5859375, -4.45880126953125, -4.3316650390625, -4.20452880859375, -4.077392578125, -3.95025634765625, -3.8231201171875, -3.69598388671875, -3.56884765625, -3.44171142578125, -3.3145751953125, -3.18743896484375, -3.060302734375, -2.93316650390625, -2.8060302734375, -2.67889404296875, -2.5517578125, -2.42462158203125, -2.2974853515625, -2.17034912109375, -2.043212890625, -1.91607666015625, -1.7889404296875, -1.66180419921875, -1.53466796875, -1.40753173828125, -1.2803955078125, -1.15325927734375, -1.026123046875, -0.89898681640625, -0.7718505859375, -0.64471435546875, -0.517578125, -0.39044189453125, -0.2633056640625, -0.13616943359375, -0.009033203125, 0.11810302734375, 0.2452392578125, 0.37237548828125, 0.49951171875, 0.62664794921875, 0.7537841796875, 0.88092041015625, 1.008056640625, 1.13519287109375, 1.2623291015625, 1.38946533203125, 1.5166015625, 1.64373779296875, 1.7708740234375, 1.89801025390625, 2.025146484375, 2.15228271484375, 2.2794189453125, 2.40655517578125, 2.53369140625, 2.66082763671875, 2.7879638671875, 2.91510009765625, 3.042236328125, 3.16937255859375, 3.2965087890625, 3.42364501953125, 3.55078125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 2.0, 7.0, 6.0, 7.0, 5.0, 8.0, 14.0, 13.0, 21.0, 37.0, 58.0, 111.0, 189.0, 560.0, 1413.0, 5636.0, 30579.0, 922674.0, 3179245.0, 42923.0, 7537.0, 1924.0, 640.0, 287.0, 146.0, 75.0, 40.0, 29.0, 28.0, 17.0, 6.0, 13.0, 7.0, 5.0, 6.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-12.3671875, -11.9560546875, -11.544921875, -11.1337890625, -10.72265625, -10.3115234375, -9.900390625, -9.4892578125, -9.078125, -8.6669921875, -8.255859375, -7.8447265625, -7.43359375, -7.0224609375, -6.611328125, -6.2001953125, -5.7890625, -5.3779296875, -4.966796875, -4.5556640625, -4.14453125, -3.7333984375, -3.322265625, -2.9111328125, -2.5, -2.0888671875, -1.677734375, -1.2666015625, -0.85546875, -0.4443359375, -0.033203125, 0.3779296875, 0.7890625, 1.2001953125, 1.611328125, 2.0224609375, 2.43359375, 2.8447265625, 3.255859375, 3.6669921875, 4.078125, 4.4892578125, 4.900390625, 5.3115234375, 5.72265625, 6.1337890625, 6.544921875, 6.9560546875, 7.3671875, 7.7783203125, 8.189453125, 8.6005859375, 9.01171875, 9.4228515625, 9.833984375, 10.2451171875, 10.65625, 11.0673828125, 11.478515625, 11.8896484375, 12.30078125, 12.7119140625, 13.123046875, 13.5341796875, 13.9453125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 4.0, 6.0, 3.0, 2.0, 7.0, 6.0, 12.0, 20.0, 18.0, 14.0, 33.0, 50.0, 92.0, 207.0, 702.0, 1596.0, 783.0, 215.0, 102.0, 50.0, 32.0, 21.0, 12.0, 15.0, 15.0, 6.0, 14.0, 10.0, 7.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-10.1796875, -9.8350830078125, -9.490478515625, -9.1458740234375, -8.80126953125, -8.4566650390625, -8.112060546875, -7.7674560546875, -7.4228515625, -7.0782470703125, -6.733642578125, -6.3890380859375, -6.04443359375, -5.6998291015625, -5.355224609375, -5.0106201171875, -4.666015625, -4.3214111328125, -3.976806640625, -3.6322021484375, -3.28759765625, -2.9429931640625, -2.598388671875, -2.2537841796875, -1.9091796875, -1.5645751953125, -1.219970703125, -0.8753662109375, -0.53076171875, -0.1861572265625, 0.158447265625, 0.5030517578125, 0.84765625, 1.1922607421875, 1.536865234375, 1.8814697265625, 2.22607421875, 2.5706787109375, 2.915283203125, 3.2598876953125, 3.6044921875, 3.9490966796875, 4.293701171875, 4.6383056640625, 4.98291015625, 5.3275146484375, 5.672119140625, 6.0167236328125, 6.361328125, 6.7059326171875, 7.050537109375, 7.3951416015625, 7.73974609375, 8.0843505859375, 8.428955078125, 8.7735595703125, 9.1181640625, 9.4627685546875, 9.807373046875, 10.1519775390625, 10.49658203125, 10.8411865234375, 11.185791015625, 11.5303955078125, 11.875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 9.0, 9.0, 36.0, 97.0, 223.0, 300.0, 173.0, 99.0, 26.0, 17.0, 6.0, 7.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.9659423828125, -102.79053497314453, -99.61512756347656, -96.43972778320312, -93.26432037353516, -90.08891296386719, -86.91350555419922, -83.73809814453125, -80.56269073486328, -77.38728332519531, -74.21187591552734, -71.03646850585938, -67.86106872558594, -64.68566131591797, -61.51025390625, -58.33484649658203, -55.15944290161133, -51.98403549194336, -48.808631896972656, -45.63322448730469, -42.45781707763672, -39.28240966796875, -36.10700607299805, -32.93159866333008, -29.756193161010742, -26.580787658691406, -23.405380249023438, -20.2299747467041, -17.054569244384766, -13.879161834716797, -10.703756332397461, -7.528348922729492, -4.352943420410156, -1.177537202835083, 1.9978690147399902, 5.173274993896484, 8.348681449890137, 11.524087905883789, 14.699493408203125, 17.874900817871094, 21.05030632019043, 24.225711822509766, 27.401119232177734, 30.57652473449707, 33.751930236816406, 36.927337646484375, 40.102745056152344, 43.27815246582031, 46.453556060791016, 49.628963470458984, 52.80436706542969, 55.979774475097656, 59.155181884765625, 62.330589294433594, 65.50599670410156, 68.681396484375, 71.85680389404297, 75.03221130371094, 78.2076187133789, 81.38302612304688, 84.55842590332031, 87.73383331298828, 90.90924072265625, 94.08464813232422, 97.26005554199219]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 7.0, 7.0, 8.0, 8.0, 16.0, 28.0, 29.0, 37.0, 30.0, 40.0, 48.0, 56.0, 54.0, 69.0, 88.0, 59.0, 50.0, 56.0, 58.0, 44.0, 38.0, 31.0, 37.0, 19.0, 20.0, 12.0, 12.0, 12.0, 9.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.268062591552734, -53.69483184814453, -52.12160110473633, -50.548370361328125, -48.975135803222656, -47.40190505981445, -45.82867431640625, -44.25544357299805, -42.682212829589844, -41.10898208618164, -39.53575134277344, -37.96251678466797, -36.389286041259766, -34.81605529785156, -33.24282455444336, -31.669593811035156, -30.096359252929688, -28.523128509521484, -26.94989585876465, -25.376665115356445, -23.80343246459961, -22.230201721191406, -20.656970977783203, -19.083740234375, -17.510507583618164, -15.937275886535645, -14.364044189453125, -12.790813446044922, -11.217581748962402, -9.644350051879883, -8.07111930847168, -6.49788761138916, -4.924659729003906, -3.351428270339966, -1.7781968116760254, -0.20496559143066406, 1.3682661056518555, 2.941497802734375, 4.514728546142578, 6.087960243225098, 7.661191940307617, 9.234423637390137, 10.807655334472656, 12.38088607788086, 13.954117774963379, 15.527349472045898, 17.1005802154541, 18.673812866210938, 20.24704360961914, 21.820274353027344, 23.39350700378418, 24.966737747192383, 26.53997039794922, 28.113201141357422, 29.686431884765625, 31.259662628173828, 32.83289337158203, 34.406124114990234, 35.97935485839844, 37.552589416503906, 39.12582015991211, 40.69905090332031, 42.272281646728516, 43.84551239013672, 45.41874694824219]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 3.0, 9.0, 24.0, 40.0, 36.0, 49.0, 72.0, 112.0, 188.0, 339.0, 522.0, 837.0, 1456.0, 2687.0, 4811.0, 9017.0, 18175.0, 38786.0, 85651.0, 198274.0, 327836.0, 197097.0, 85976.0, 38303.0, 18161.0, 9063.0, 4722.0, 2586.0, 1534.0, 835.0, 505.0, 309.0, 175.0, 118.0, 75.0, 55.0, 36.0, 29.0, 12.0, 19.0, 5.0, 4.0, 0.0, 8.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.2421875, -5.08087158203125, -4.9195556640625, -4.75823974609375, -4.596923828125, -4.43560791015625, -4.2742919921875, -4.11297607421875, -3.95166015625, -3.79034423828125, -3.6290283203125, -3.46771240234375, -3.306396484375, -3.14508056640625, -2.9837646484375, -2.82244873046875, -2.6611328125, -2.49981689453125, -2.3385009765625, -2.17718505859375, -2.015869140625, -1.85455322265625, -1.6932373046875, -1.53192138671875, -1.37060546875, -1.20928955078125, -1.0479736328125, -0.88665771484375, -0.725341796875, -0.56402587890625, -0.4027099609375, -0.24139404296875, -0.080078125, 0.08123779296875, 0.2425537109375, 0.40386962890625, 0.565185546875, 0.72650146484375, 0.8878173828125, 1.04913330078125, 1.21044921875, 1.37176513671875, 1.5330810546875, 1.69439697265625, 1.855712890625, 2.01702880859375, 2.1783447265625, 2.33966064453125, 2.5009765625, 2.66229248046875, 2.8236083984375, 2.98492431640625, 3.146240234375, 3.30755615234375, 3.4688720703125, 3.63018798828125, 3.79150390625, 3.95281982421875, 4.1141357421875, 4.27545166015625, 4.436767578125, 4.59808349609375, 4.7593994140625, 4.92071533203125, 5.08203125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 8.0, 5.0, 6.0, 5.0, 5.0, 12.0, 9.0, 7.0, 9.0, 13.0, 17.0, 17.0, 13.0, 14.0, 18.0, 19.0, 33.0, 24.0, 30.0, 38.0, 37.0, 34.0, 50.0, 42.0, 39.0, 43.0, 45.0, 41.0, 42.0, 46.0, 30.0, 29.0, 35.0, 17.0, 19.0, 19.0, 21.0, 19.0, 12.0, 13.0, 13.0, 11.0, 5.0, 5.0, 8.0, 7.0, 4.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.63671875, -3.5244140625, -3.412109375, -3.2998046875, -3.1875, -3.0751953125, -2.962890625, -2.8505859375, -2.73828125, -2.6259765625, -2.513671875, -2.4013671875, -2.2890625, -2.1767578125, -2.064453125, -1.9521484375, -1.83984375, -1.7275390625, -1.615234375, -1.5029296875, -1.390625, -1.2783203125, -1.166015625, -1.0537109375, -0.94140625, -0.8291015625, -0.716796875, -0.6044921875, -0.4921875, -0.3798828125, -0.267578125, -0.1552734375, -0.04296875, 0.0693359375, 0.181640625, 0.2939453125, 0.40625, 0.5185546875, 0.630859375, 0.7431640625, 0.85546875, 0.9677734375, 1.080078125, 1.1923828125, 1.3046875, 1.4169921875, 1.529296875, 1.6416015625, 1.75390625, 1.8662109375, 1.978515625, 2.0908203125, 2.203125, 2.3154296875, 2.427734375, 2.5400390625, 2.65234375, 2.7646484375, 2.876953125, 2.9892578125, 3.1015625, 3.2138671875, 3.326171875, 3.4384765625, 3.55078125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 6.0, 5.0, 9.0, 5.0, 13.0, 23.0, 36.0, 41.0, 49.0, 60.0, 107.0, 224.0, 408.0, 819.0, 1960.0, 6692.0, 44986.0, 731032.0, 237207.0, 18316.0, 3822.0, 1303.0, 618.0, 313.0, 165.0, 91.0, 53.0, 46.0, 36.0, 32.0, 19.0, 11.0, 13.0, 11.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.125, -14.580810546875, -14.03662109375, -13.492431640625, -12.9482421875, -12.404052734375, -11.85986328125, -11.315673828125, -10.771484375, -10.227294921875, -9.68310546875, -9.138916015625, -8.5947265625, -8.050537109375, -7.50634765625, -6.962158203125, -6.41796875, -5.873779296875, -5.32958984375, -4.785400390625, -4.2412109375, -3.697021484375, -3.15283203125, -2.608642578125, -2.064453125, -1.520263671875, -0.97607421875, -0.431884765625, 0.1123046875, 0.656494140625, 1.20068359375, 1.744873046875, 2.2890625, 2.833251953125, 3.37744140625, 3.921630859375, 4.4658203125, 5.010009765625, 5.55419921875, 6.098388671875, 6.642578125, 7.186767578125, 7.73095703125, 8.275146484375, 8.8193359375, 9.363525390625, 9.90771484375, 10.451904296875, 10.99609375, 11.540283203125, 12.08447265625, 12.628662109375, 13.1728515625, 13.717041015625, 14.26123046875, 14.805419921875, 15.349609375, 15.893798828125, 16.43798828125, 16.982177734375, 17.5263671875, 18.070556640625, 18.61474609375, 19.158935546875, 19.703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 6.0, 2.0, 4.0, 4.0, 3.0, 12.0, 13.0, 19.0, 14.0, 15.0, 21.0, 19.0, 19.0, 38.0, 26.0, 30.0, 59.0, 50.0, 41.0, 49.0, 47.0, 53.0, 42.0, 48.0, 46.0, 39.0, 43.0, 35.0, 31.0, 35.0, 27.0, 17.0, 26.0, 17.0, 14.0, 6.0, 8.0, 1.0, 6.0, 9.0, 8.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.09375, -16.540771484375, -15.98779296875, -15.434814453125, -14.8818359375, -14.328857421875, -13.77587890625, -13.222900390625, -12.669921875, -12.116943359375, -11.56396484375, -11.010986328125, -10.4580078125, -9.905029296875, -9.35205078125, -8.799072265625, -8.24609375, -7.693115234375, -7.14013671875, -6.587158203125, -6.0341796875, -5.481201171875, -4.92822265625, -4.375244140625, -3.822265625, -3.269287109375, -2.71630859375, -2.163330078125, -1.6103515625, -1.057373046875, -0.50439453125, 0.048583984375, 0.6015625, 1.154541015625, 1.70751953125, 2.260498046875, 2.8134765625, 3.366455078125, 3.91943359375, 4.472412109375, 5.025390625, 5.578369140625, 6.13134765625, 6.684326171875, 7.2373046875, 7.790283203125, 8.34326171875, 8.896240234375, 9.44921875, 10.002197265625, 10.55517578125, 11.108154296875, 11.6611328125, 12.214111328125, 12.76708984375, 13.320068359375, 13.873046875, 14.426025390625, 14.97900390625, 15.531982421875, 16.0849609375, 16.637939453125, 17.19091796875, 17.743896484375, 18.296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 3.0, 6.0, 12.0, 9.0, 12.0, 12.0, 24.0, 35.0, 40.0, 71.0, 98.0, 198.0, 312.0, 579.0, 1228.0, 3535.0, 19187.0, 399370.0, 594202.0, 22779.0, 4109.0, 1308.0, 584.0, 275.0, 186.0, 132.0, 70.0, 44.0, 30.0, 26.0, 22.0, 17.0, 13.0, 9.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.58203125, -6.3828125, -6.18359375, -5.984375, -5.78515625, -5.5859375, -5.38671875, -5.1875, -4.98828125, -4.7890625, -4.58984375, -4.390625, -4.19140625, -3.9921875, -3.79296875, -3.59375, -3.39453125, -3.1953125, -2.99609375, -2.796875, -2.59765625, -2.3984375, -2.19921875, -2.0, -1.80078125, -1.6015625, -1.40234375, -1.203125, -1.00390625, -0.8046875, -0.60546875, -0.40625, -0.20703125, -0.0078125, 0.19140625, 0.390625, 0.58984375, 0.7890625, 0.98828125, 1.1875, 1.38671875, 1.5859375, 1.78515625, 1.984375, 2.18359375, 2.3828125, 2.58203125, 2.78125, 2.98046875, 3.1796875, 3.37890625, 3.578125, 3.77734375, 3.9765625, 4.17578125, 4.375, 4.57421875, 4.7734375, 4.97265625, 5.171875, 5.37109375, 5.5703125, 5.76953125, 5.96875, 6.16796875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 3.0, 2.0, 5.0, 13.0, 27.0, 31.0, 47.0, 58.0, 101.0, 179.0, 169.0, 111.0, 84.0, 56.0, 33.0, 27.0, 17.0, 18.0, 11.0, 3.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007548332214355469, -0.0007280781865119934, -0.0007013231515884399, -0.0006745681166648865, -0.000647813081741333, -0.0006210580468177795, -0.0005943030118942261, -0.0005675479769706726, -0.0005407929420471191, -0.0005140379071235657, -0.0004872828722000122, -0.00046052783727645874, -0.0004337728023529053, -0.0004070177674293518, -0.00038026273250579834, -0.0003535076975822449, -0.0003267526626586914, -0.00029999762773513794, -0.00027324259281158447, -0.000246487557888031, -0.00021973252296447754, -0.00019297748804092407, -0.0001662224531173706, -0.00013946741819381714, -0.00011271238327026367, -8.59573483467102e-05, -5.920231342315674e-05, -3.244727849960327e-05, -5.692243576049805e-06, 2.1062791347503662e-05, 4.781782627105713e-05, 7.45728611946106e-05, 0.00010132789611816406, 0.00012808293104171753, 0.000154837965965271, 0.00018159300088882446, 0.00020834803581237793, 0.0002351030707359314, 0.00026185810565948486, 0.00028861314058303833, 0.0003153681755065918, 0.00034212321043014526, 0.00036887824535369873, 0.0003956332802772522, 0.00042238831520080566, 0.00044914335012435913, 0.0004758983850479126, 0.0005026534199714661, 0.0005294084548950195, 0.000556163489818573, 0.0005829185247421265, 0.0006096735596656799, 0.0006364285945892334, 0.0006631836295127869, 0.0006899386644363403, 0.0007166936993598938, 0.0007434487342834473, 0.0007702037692070007, 0.0007969588041305542, 0.0008237138390541077, 0.0008504688739776611, 0.0008772239089012146, 0.0009039789438247681, 0.0009307339787483215, 0.000957489013671875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 8.0, 8.0, 9.0, 13.0, 18.0, 26.0, 42.0, 69.0, 108.0, 236.0, 494.0, 1177.0, 4046.0, 22989.0, 618495.0, 377384.0, 18034.0, 3346.0, 1031.0, 454.0, 232.0, 129.0, 61.0, 39.0, 32.0, 18.0, 11.0, 14.0, 9.0, 3.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.703125, -7.48883056640625, -7.2745361328125, -7.06024169921875, -6.845947265625, -6.63165283203125, -6.4173583984375, -6.20306396484375, -5.98876953125, -5.77447509765625, -5.5601806640625, -5.34588623046875, -5.131591796875, -4.91729736328125, -4.7030029296875, -4.48870849609375, -4.2744140625, -4.06011962890625, -3.8458251953125, -3.63153076171875, -3.417236328125, -3.20294189453125, -2.9886474609375, -2.77435302734375, -2.56005859375, -2.34576416015625, -2.1314697265625, -1.91717529296875, -1.702880859375, -1.48858642578125, -1.2742919921875, -1.05999755859375, -0.845703125, -0.63140869140625, -0.4171142578125, -0.20281982421875, 0.011474609375, 0.22576904296875, 0.4400634765625, 0.65435791015625, 0.86865234375, 1.08294677734375, 1.2972412109375, 1.51153564453125, 1.725830078125, 1.94012451171875, 2.1544189453125, 2.36871337890625, 2.5830078125, 2.79730224609375, 3.0115966796875, 3.22589111328125, 3.440185546875, 3.65447998046875, 3.8687744140625, 4.08306884765625, 4.29736328125, 4.51165771484375, 4.7259521484375, 4.94024658203125, 5.154541015625, 5.36883544921875, 5.5831298828125, 5.79742431640625, 6.01171875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 4.0, 0.0, 5.0, 4.0, 3.0, 6.0, 3.0, 4.0, 8.0, 6.0, 11.0, 19.0, 22.0, 17.0, 40.0, 34.0, 46.0, 68.0, 70.0, 81.0, 94.0, 98.0, 78.0, 58.0, 48.0, 35.0, 31.0, 24.0, 17.0, 17.0, 9.0, 10.0, 10.0, 6.0, 5.0, 5.0, 7.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.615234375, -3.467681884765625, -3.32012939453125, -3.172576904296875, -3.0250244140625, -2.877471923828125, -2.72991943359375, -2.582366943359375, -2.434814453125, -2.287261962890625, -2.13970947265625, -1.992156982421875, -1.8446044921875, -1.697052001953125, -1.54949951171875, -1.401947021484375, -1.25439453125, -1.106842041015625, -0.95928955078125, -0.811737060546875, -0.6641845703125, -0.516632080078125, -0.36907958984375, -0.221527099609375, -0.073974609375, 0.073577880859375, 0.22113037109375, 0.368682861328125, 0.5162353515625, 0.663787841796875, 0.81134033203125, 0.958892822265625, 1.1064453125, 1.253997802734375, 1.40155029296875, 1.549102783203125, 1.6966552734375, 1.844207763671875, 1.99176025390625, 2.139312744140625, 2.286865234375, 2.434417724609375, 2.58197021484375, 2.729522705078125, 2.8770751953125, 3.024627685546875, 3.17218017578125, 3.319732666015625, 3.46728515625, 3.614837646484375, 3.76239013671875, 3.909942626953125, 4.0574951171875, 4.205047607421875, 4.35260009765625, 4.500152587890625, 4.647705078125, 4.795257568359375, 4.94281005859375, 5.090362548828125, 5.2379150390625, 5.385467529296875, 5.53302001953125, 5.680572509765625, 5.828125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 12.0, 51.0, 198.0, 437.0, 222.0, 43.0, 23.0, 7.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-328.909423828125, -322.1370544433594, -315.36468505859375, -308.59234619140625, -301.8199768066406, -295.047607421875, -288.2752380371094, -281.5028991699219, -274.73052978515625, -267.9581604003906, -261.185791015625, -254.41343688964844, -247.64108276367188, -240.86871337890625, -234.0963592529297, -227.32398986816406, -220.5516357421875, -213.77926635742188, -207.0069122314453, -200.2345428466797, -193.46218872070312, -186.6898193359375, -179.91746520996094, -173.1450958251953, -166.3727264404297, -159.60035705566406, -152.8280029296875, -146.05563354492188, -139.2832794189453, -132.5109100341797, -125.73855590820312, -118.9661865234375, -112.19383239746094, -105.42147064208984, -98.64910888671875, -91.87674713134766, -85.10438537597656, -78.33201599121094, -71.55966186523438, -64.78729248046875, -58.01493453979492, -51.24257278442383, -44.470211029052734, -37.697845458984375, -30.925485610961914, -24.153121948242188, -17.380760192871094, -10.6083984375, -3.8360366821289062, 2.9363255500793457, 9.708687782287598, 16.481050491333008, 23.2534122467041, 30.025775909423828, 36.79813766479492, 43.570499420166016, 50.34286117553711, 57.1152229309082, 63.8875846862793, 70.65995025634766, 77.43231201171875, 84.20467376708984, 90.97703552246094, 97.74939727783203, 104.52175903320312]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 5.0, 7.0, 9.0, 8.0, 16.0, 19.0, 18.0, 25.0, 30.0, 28.0, 28.0, 45.0, 36.0, 45.0, 56.0, 60.0, 63.0, 67.0, 50.0, 47.0, 52.0, 32.0, 42.0, 37.0, 26.0, 29.0, 30.0, 17.0, 16.0, 8.0, 12.0, 9.0, 7.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-72.53846740722656, -69.8415298461914, -67.14458465576172, -64.44764709472656, -61.75070571899414, -59.05376434326172, -56.35682678222656, -53.65988540649414, -50.96294403076172, -48.2660026550293, -45.56906509399414, -42.87212371826172, -40.1751823425293, -37.478240966796875, -34.78130340576172, -32.0843620300293, -29.38742446899414, -26.69048500061035, -23.99354362487793, -21.29660415649414, -18.59966278076172, -15.90272331237793, -13.20578384399414, -10.508842468261719, -7.81190299987793, -5.114962577819824, -2.418022632598877, 0.2789173126220703, 2.975857734680176, 5.672798156738281, 8.36973762512207, 11.066679000854492, 13.763618469238281, 16.46055793762207, 19.157499313354492, 21.85443878173828, 24.551380157470703, 27.248319625854492, 29.94525909423828, 32.6422004699707, 35.339141845703125, 38.03608322143555, 40.7330207824707, 43.429962158203125, 46.12690353393555, 48.82384490966797, 51.520782470703125, 54.21772384643555, 56.9146614074707, 59.611602783203125, 62.30854034423828, 65.00547790527344, 67.70242309570312, 70.39936065673828, 73.09629821777344, 75.79324340820312, 78.49018096923828, 81.18711853027344, 83.88406372070312, 86.58100128173828, 89.27793884277344, 91.97488403320312, 94.67182159423828, 97.36875915527344, 100.06570434570312]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 7.0, 8.0, 9.0, 22.0, 24.0, 32.0, 51.0, 78.0, 97.0, 159.0, 284.0, 1443.0, 226993.0, 3961359.0, 2651.0, 436.0, 223.0, 131.0, 84.0, 53.0, 41.0, 31.0, 15.0, 12.0, 9.0, 5.0, 11.0, 4.0, 1.0, 1.0, 5.0, 0.0, 0.0, 3.0], "bins": [-48.6875, -47.558349609375, -46.42919921875, -45.300048828125, -44.1708984375, -43.041748046875, -41.91259765625, -40.783447265625, -39.654296875, -38.525146484375, -37.39599609375, -36.266845703125, -35.1376953125, -34.008544921875, -32.87939453125, -31.750244140625, -30.62109375, -29.491943359375, -28.36279296875, -27.233642578125, -26.1044921875, -24.975341796875, -23.84619140625, -22.717041015625, -21.587890625, -20.458740234375, -19.32958984375, -18.200439453125, -17.0712890625, -15.942138671875, -14.81298828125, -13.683837890625, -12.5546875, -11.425537109375, -10.29638671875, -9.167236328125, -8.0380859375, -6.908935546875, -5.77978515625, -4.650634765625, -3.521484375, -2.392333984375, -1.26318359375, -0.134033203125, 0.9951171875, 2.124267578125, 3.25341796875, 4.382568359375, 5.51171875, 6.640869140625, 7.77001953125, 8.899169921875, 10.0283203125, 11.157470703125, 12.28662109375, 13.415771484375, 14.544921875, 15.674072265625, 16.80322265625, 17.932373046875, 19.0615234375, 20.190673828125, 21.31982421875, 22.448974609375, 23.578125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 6.0, 9.0, 19.0, 22.0, 20.0, 30.0, 49.0, 56.0, 96.0, 111.0, 107.0, 122.0, 91.0, 82.0, 52.0, 50.0, 35.0, 26.0, 12.0, 11.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1875, -6.89794921875, -6.6083984375, -6.31884765625, -6.029296875, -5.73974609375, -5.4501953125, -5.16064453125, -4.87109375, -4.58154296875, -4.2919921875, -4.00244140625, -3.712890625, -3.42333984375, -3.1337890625, -2.84423828125, -2.5546875, -2.26513671875, -1.9755859375, -1.68603515625, -1.396484375, -1.10693359375, -0.8173828125, -0.52783203125, -0.23828125, 0.05126953125, 0.3408203125, 0.63037109375, 0.919921875, 1.20947265625, 1.4990234375, 1.78857421875, 2.078125, 2.36767578125, 2.6572265625, 2.94677734375, 3.236328125, 3.52587890625, 3.8154296875, 4.10498046875, 4.39453125, 4.68408203125, 4.9736328125, 5.26318359375, 5.552734375, 5.84228515625, 6.1318359375, 6.42138671875, 6.7109375, 7.00048828125, 7.2900390625, 7.57958984375, 7.869140625, 8.15869140625, 8.4482421875, 8.73779296875, 9.02734375, 9.31689453125, 9.6064453125, 9.89599609375, 10.185546875, 10.47509765625, 10.7646484375, 11.05419921875, 11.34375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 7.0, 11.0, 11.0, 18.0, 44.0, 53.0, 86.0, 148.0, 250.0, 583.0, 1172.0, 3057.0, 8199.0, 32604.0, 430058.0, 3567374.0, 122346.0, 18370.0, 5831.0, 2267.0, 944.0, 404.0, 189.0, 92.0, 52.0, 32.0, 23.0, 14.0, 19.0, 6.0, 8.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7578125, -7.4931640625, -7.228515625, -6.9638671875, -6.69921875, -6.4345703125, -6.169921875, -5.9052734375, -5.640625, -5.3759765625, -5.111328125, -4.8466796875, -4.58203125, -4.3173828125, -4.052734375, -3.7880859375, -3.5234375, -3.2587890625, -2.994140625, -2.7294921875, -2.46484375, -2.2001953125, -1.935546875, -1.6708984375, -1.40625, -1.1416015625, -0.876953125, -0.6123046875, -0.34765625, -0.0830078125, 0.181640625, 0.4462890625, 0.7109375, 0.9755859375, 1.240234375, 1.5048828125, 1.76953125, 2.0341796875, 2.298828125, 2.5634765625, 2.828125, 3.0927734375, 3.357421875, 3.6220703125, 3.88671875, 4.1513671875, 4.416015625, 4.6806640625, 4.9453125, 5.2099609375, 5.474609375, 5.7392578125, 6.00390625, 6.2685546875, 6.533203125, 6.7978515625, 7.0625, 7.3271484375, 7.591796875, 7.8564453125, 8.12109375, 8.3857421875, 8.650390625, 8.9150390625, 9.1796875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 2.0, 6.0, 4.0, 8.0, 19.0, 17.0, 33.0, 69.0, 138.0, 374.0, 966.0, 1301.0, 681.0, 225.0, 84.0, 46.0, 25.0, 14.0, 16.0, 7.0, 7.0, 5.0, 5.0, 3.0, 7.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.859375, -11.5328369140625, -11.206298828125, -10.8797607421875, -10.55322265625, -10.2266845703125, -9.900146484375, -9.5736083984375, -9.2470703125, -8.9205322265625, -8.593994140625, -8.2674560546875, -7.94091796875, -7.6143798828125, -7.287841796875, -6.9613037109375, -6.634765625, -6.3082275390625, -5.981689453125, -5.6551513671875, -5.32861328125, -5.0020751953125, -4.675537109375, -4.3489990234375, -4.0224609375, -3.6959228515625, -3.369384765625, -3.0428466796875, -2.71630859375, -2.3897705078125, -2.063232421875, -1.7366943359375, -1.41015625, -1.0836181640625, -0.757080078125, -0.4305419921875, -0.10400390625, 0.2225341796875, 0.549072265625, 0.8756103515625, 1.2021484375, 1.5286865234375, 1.855224609375, 2.1817626953125, 2.50830078125, 2.8348388671875, 3.161376953125, 3.4879150390625, 3.814453125, 4.1409912109375, 4.467529296875, 4.7940673828125, 5.12060546875, 5.4471435546875, 5.773681640625, 6.1002197265625, 6.4267578125, 6.7532958984375, 7.079833984375, 7.4063720703125, 7.73291015625, 8.0594482421875, 8.385986328125, 8.7125244140625, 9.0390625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 5.0, 25.0, 27.0, 58.0, 142.0, 241.0, 279.0, 135.0, 40.0, 14.0, 14.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.29788208007812, -64.89727783203125, -62.496665954589844, -60.09606170654297, -57.69545364379883, -55.29484558105469, -52.89423751831055, -50.493629455566406, -48.09302520751953, -45.69241714477539, -43.29180908203125, -40.891204833984375, -38.490596771240234, -36.089988708496094, -33.68938064575195, -31.288774490356445, -28.888164520263672, -26.48755645751953, -24.086950302124023, -21.686342239379883, -19.285736083984375, -16.885128021240234, -14.484519958496094, -12.083913803100586, -9.683305740356445, -7.282698631286621, -4.882091045379639, -2.4814834594726562, -0.08087635040283203, 2.319730758666992, 4.720338821411133, 7.120944976806641, 9.521553039550781, 11.922160148620605, 14.32276725769043, 16.72337532043457, 19.123981475830078, 21.52458953857422, 23.92519760131836, 26.325803756713867, 28.726411819458008, 31.12701988220215, 33.527626037597656, 35.9282341003418, 38.32884216308594, 40.72944641113281, 43.13005828857422, 45.530662536621094, 47.931270599365234, 50.331878662109375, 52.732486724853516, 55.133094787597656, 57.53369903564453, 59.93430709838867, 62.33491516113281, 64.73551940917969, 67.1361312866211, 69.53673553466797, 71.93734741210938, 74.33795166015625, 76.73856353759766, 79.13916778564453, 81.53977966308594, 83.94038391113281, 86.34098815917969]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 7.0, 3.0, 6.0, 8.0, 8.0, 14.0, 21.0, 18.0, 29.0, 37.0, 37.0, 47.0, 46.0, 48.0, 54.0, 58.0, 74.0, 54.0, 61.0, 61.0, 52.0, 41.0, 35.0, 37.0, 24.0, 27.0, 22.0, 14.0, 14.0, 12.0, 13.0, 2.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-49.101783752441406, -47.84418869018555, -46.58659744262695, -45.329002380371094, -44.0714111328125, -42.81381607055664, -41.55622482299805, -40.29862976074219, -39.041038513183594, -37.783443450927734, -36.52585220336914, -35.26825714111328, -34.01066589355469, -32.75307083129883, -31.4954776763916, -30.237884521484375, -28.980289459228516, -27.72269630432129, -26.465103149414062, -25.207509994506836, -23.94991683959961, -22.69232177734375, -21.434728622436523, -20.177135467529297, -18.91954231262207, -17.661949157714844, -16.404356002807617, -15.146761894226074, -13.889168739318848, -12.631575584411621, -11.373981475830078, -10.116388320922852, -8.85879898071289, -7.601205825805664, -6.343612194061279, -5.0860185623168945, -3.828425407409668, -2.5708322525024414, -1.3132386207580566, -0.055644989013671875, 1.2019481658935547, 2.4595415592193604, 3.717134952545166, 4.974728584289551, 6.232321739196777, 7.489914894104004, 8.747509002685547, 10.005102157592773, 11.2626953125, 12.520288467407227, 13.777881622314453, 15.035475730895996, 16.293067932128906, 17.550662994384766, 18.808256149291992, 20.06584930419922, 21.323442459106445, 22.581035614013672, 23.8386287689209, 25.096221923828125, 26.353816986083984, 27.611408233642578, 28.869003295898438, 30.126596450805664, 31.38418960571289]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 11.0, 8.0, 18.0, 27.0, 47.0, 86.0, 105.0, 202.0, 314.0, 620.0, 1275.0, 2759.0, 6511.0, 16896.0, 47903.0, 153000.0, 449187.0, 254078.0, 74085.0, 25010.0, 9057.0, 3773.0, 1705.0, 860.0, 391.0, 242.0, 149.0, 91.0, 51.0, 30.0, 15.0, 19.0, 8.0, 4.0, 5.0, 3.0, 0.0, 3.0, 3.0, 3.0], "bins": [-8.9765625, -8.7559814453125, -8.535400390625, -8.3148193359375, -8.09423828125, -7.8736572265625, -7.653076171875, -7.4324951171875, -7.2119140625, -6.9913330078125, -6.770751953125, -6.5501708984375, -6.32958984375, -6.1090087890625, -5.888427734375, -5.6678466796875, -5.447265625, -5.2266845703125, -5.006103515625, -4.7855224609375, -4.56494140625, -4.3443603515625, -4.123779296875, -3.9031982421875, -3.6826171875, -3.4620361328125, -3.241455078125, -3.0208740234375, -2.80029296875, -2.5797119140625, -2.359130859375, -2.1385498046875, -1.91796875, -1.6973876953125, -1.476806640625, -1.2562255859375, -1.03564453125, -0.8150634765625, -0.594482421875, -0.3739013671875, -0.1533203125, 0.0672607421875, 0.287841796875, 0.5084228515625, 0.72900390625, 0.9495849609375, 1.170166015625, 1.3907470703125, 1.611328125, 1.8319091796875, 2.052490234375, 2.2730712890625, 2.49365234375, 2.7142333984375, 2.934814453125, 3.1553955078125, 3.3759765625, 3.5965576171875, 3.817138671875, 4.0377197265625, 4.25830078125, 4.4788818359375, 4.699462890625, 4.9200439453125, 5.140625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 10.0, 7.0, 22.0, 16.0, 18.0, 28.0, 29.0, 47.0, 32.0, 62.0, 63.0, 69.0, 66.0, 70.0, 77.0, 85.0, 53.0, 47.0, 54.0, 33.0, 33.0, 18.0, 15.0, 15.0, 13.0, 4.0, 2.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.71875, -5.5345458984375, -5.350341796875, -5.1661376953125, -4.98193359375, -4.7977294921875, -4.613525390625, -4.4293212890625, -4.2451171875, -4.0609130859375, -3.876708984375, -3.6925048828125, -3.50830078125, -3.3240966796875, -3.139892578125, -2.9556884765625, -2.771484375, -2.5872802734375, -2.403076171875, -2.2188720703125, -2.03466796875, -1.8504638671875, -1.666259765625, -1.4820556640625, -1.2978515625, -1.1136474609375, -0.929443359375, -0.7452392578125, -0.56103515625, -0.3768310546875, -0.192626953125, -0.0084228515625, 0.17578125, 0.3599853515625, 0.544189453125, 0.7283935546875, 0.91259765625, 1.0968017578125, 1.281005859375, 1.4652099609375, 1.6494140625, 1.8336181640625, 2.017822265625, 2.2020263671875, 2.38623046875, 2.5704345703125, 2.754638671875, 2.9388427734375, 3.123046875, 3.3072509765625, 3.491455078125, 3.6756591796875, 3.85986328125, 4.0440673828125, 4.228271484375, 4.4124755859375, 4.5966796875, 4.7808837890625, 4.965087890625, 5.1492919921875, 5.33349609375, 5.5177001953125, 5.701904296875, 5.8861083984375, 6.0703125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 15.0, 15.0, 18.0, 25.0, 31.0, 40.0, 42.0, 61.0, 99.0, 127.0, 179.0, 263.0, 437.0, 696.0, 1332.0, 2742.0, 6914.0, 20878.0, 81273.0, 467663.0, 363643.0, 70951.0, 18998.0, 6337.0, 2559.0, 1205.0, 660.0, 385.0, 299.0, 177.0, 127.0, 105.0, 58.0, 41.0, 36.0, 23.0, 21.0, 21.0, 11.0, 15.0, 6.0, 1.0, 4.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-8.390625, -8.1280517578125, -7.865478515625, -7.6029052734375, -7.34033203125, -7.0777587890625, -6.815185546875, -6.5526123046875, -6.2900390625, -6.0274658203125, -5.764892578125, -5.5023193359375, -5.23974609375, -4.9771728515625, -4.714599609375, -4.4520263671875, -4.189453125, -3.9268798828125, -3.664306640625, -3.4017333984375, -3.13916015625, -2.8765869140625, -2.614013671875, -2.3514404296875, -2.0888671875, -1.8262939453125, -1.563720703125, -1.3011474609375, -1.03857421875, -0.7760009765625, -0.513427734375, -0.2508544921875, 0.01171875, 0.2742919921875, 0.536865234375, 0.7994384765625, 1.06201171875, 1.3245849609375, 1.587158203125, 1.8497314453125, 2.1123046875, 2.3748779296875, 2.637451171875, 2.9000244140625, 3.16259765625, 3.4251708984375, 3.687744140625, 3.9503173828125, 4.212890625, 4.4754638671875, 4.738037109375, 5.0006103515625, 5.26318359375, 5.5257568359375, 5.788330078125, 6.0509033203125, 6.3134765625, 6.5760498046875, 6.838623046875, 7.1011962890625, 7.36376953125, 7.6263427734375, 7.888916015625, 8.1514892578125, 8.4140625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 2.0, 6.0, 6.0, 13.0, 12.0, 10.0, 7.0, 11.0, 16.0, 13.0, 29.0, 20.0, 34.0, 24.0, 34.0, 38.0, 43.0, 40.0, 53.0, 48.0, 41.0, 47.0, 43.0, 40.0, 49.0, 42.0, 39.0, 31.0, 26.0, 33.0, 24.0, 18.0, 12.0, 14.0, 17.0, 20.0, 6.0, 9.0, 7.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.1796875, -13.740234375, -13.30078125, -12.861328125, -12.421875, -11.982421875, -11.54296875, -11.103515625, -10.6640625, -10.224609375, -9.78515625, -9.345703125, -8.90625, -8.466796875, -8.02734375, -7.587890625, -7.1484375, -6.708984375, -6.26953125, -5.830078125, -5.390625, -4.951171875, -4.51171875, -4.072265625, -3.6328125, -3.193359375, -2.75390625, -2.314453125, -1.875, -1.435546875, -0.99609375, -0.556640625, -0.1171875, 0.322265625, 0.76171875, 1.201171875, 1.640625, 2.080078125, 2.51953125, 2.958984375, 3.3984375, 3.837890625, 4.27734375, 4.716796875, 5.15625, 5.595703125, 6.03515625, 6.474609375, 6.9140625, 7.353515625, 7.79296875, 8.232421875, 8.671875, 9.111328125, 9.55078125, 9.990234375, 10.4296875, 10.869140625, 11.30859375, 11.748046875, 12.1875, 12.626953125, 13.06640625, 13.505859375, 13.9453125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 1.0, 8.0, 2.0, 5.0, 7.0, 13.0, 32.0, 31.0, 56.0, 78.0, 153.0, 378.0, 1087.0, 4900.0, 89167.0, 930038.0, 18872.0, 2417.0, 723.0, 244.0, 135.0, 46.0, 45.0, 34.0, 18.0, 17.0, 8.0, 7.0, 9.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.0078125, -8.719970703125, -8.43212890625, -8.144287109375, -7.8564453125, -7.568603515625, -7.28076171875, -6.992919921875, -6.705078125, -6.417236328125, -6.12939453125, -5.841552734375, -5.5537109375, -5.265869140625, -4.97802734375, -4.690185546875, -4.40234375, -4.114501953125, -3.82666015625, -3.538818359375, -3.2509765625, -2.963134765625, -2.67529296875, -2.387451171875, -2.099609375, -1.811767578125, -1.52392578125, -1.236083984375, -0.9482421875, -0.660400390625, -0.37255859375, -0.084716796875, 0.203125, 0.490966796875, 0.77880859375, 1.066650390625, 1.3544921875, 1.642333984375, 1.93017578125, 2.218017578125, 2.505859375, 2.793701171875, 3.08154296875, 3.369384765625, 3.6572265625, 3.945068359375, 4.23291015625, 4.520751953125, 4.80859375, 5.096435546875, 5.38427734375, 5.672119140625, 5.9599609375, 6.247802734375, 6.53564453125, 6.823486328125, 7.111328125, 7.399169921875, 7.68701171875, 7.974853515625, 8.2626953125, 8.550537109375, 8.83837890625, 9.126220703125, 9.4140625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 10.0, 12.0, 22.0, 25.0, 38.0, 65.0, 114.0, 178.0, 178.0, 133.0, 72.0, 57.0, 34.0, 16.0, 15.0, 6.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006918907165527344, -0.0006663650274276733, -0.0006408393383026123, -0.0006153136491775513, -0.0005897879600524902, -0.0005642622709274292, -0.0005387365818023682, -0.0005132108926773071, -0.0004876852035522461, -0.00046215951442718506, -0.000436633825302124, -0.000411108136177063, -0.00038558244705200195, -0.0003600567579269409, -0.0003345310688018799, -0.00030900537967681885, -0.0002834796905517578, -0.0002579540014266968, -0.00023242831230163574, -0.0002069026231765747, -0.00018137693405151367, -0.00015585124492645264, -0.0001303255558013916, -0.00010479986667633057, -7.927417755126953e-05, -5.3748488426208496e-05, -2.822279930114746e-05, -2.6971101760864258e-06, 2.282857894897461e-05, 4.8354268074035645e-05, 7.387995719909668e-05, 9.940564632415771e-05, 0.00012493133544921875, 0.00015045702457427979, 0.00017598271369934082, 0.00020150840282440186, 0.0002270340919494629, 0.0002525597810745239, 0.00027808547019958496, 0.000303611159324646, 0.00032913684844970703, 0.00035466253757476807, 0.0003801882266998291, 0.00040571391582489014, 0.00043123960494995117, 0.0004567652940750122, 0.00048229098320007324, 0.0005078166723251343, 0.0005333423614501953, 0.0005588680505752563, 0.0005843937397003174, 0.0006099194288253784, 0.0006354451179504395, 0.0006609708070755005, 0.0006864964962005615, 0.0007120221853256226, 0.0007375478744506836, 0.0007630735635757446, 0.0007885992527008057, 0.0008141249418258667, 0.0008396506309509277, 0.0008651763200759888, 0.0008907020092010498, 0.0009162276983261108, 0.0009417533874511719]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 9.0, 7.0, 15.0, 14.0, 17.0, 29.0, 51.0, 79.0, 90.0, 177.0, 290.0, 574.0, 1212.0, 3020.0, 10014.0, 60939.0, 739191.0, 203385.0, 20684.0, 5155.0, 1830.0, 758.0, 389.0, 211.0, 145.0, 99.0, 63.0, 37.0, 23.0, 17.0, 7.0, 6.0, 4.0, 2.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-4.7890625, -4.655029296875, -4.52099609375, -4.386962890625, -4.2529296875, -4.118896484375, -3.98486328125, -3.850830078125, -3.716796875, -3.582763671875, -3.44873046875, -3.314697265625, -3.1806640625, -3.046630859375, -2.91259765625, -2.778564453125, -2.64453125, -2.510498046875, -2.37646484375, -2.242431640625, -2.1083984375, -1.974365234375, -1.84033203125, -1.706298828125, -1.572265625, -1.438232421875, -1.30419921875, -1.170166015625, -1.0361328125, -0.902099609375, -0.76806640625, -0.634033203125, -0.5, -0.365966796875, -0.23193359375, -0.097900390625, 0.0361328125, 0.170166015625, 0.30419921875, 0.438232421875, 0.572265625, 0.706298828125, 0.84033203125, 0.974365234375, 1.1083984375, 1.242431640625, 1.37646484375, 1.510498046875, 1.64453125, 1.778564453125, 1.91259765625, 2.046630859375, 2.1806640625, 2.314697265625, 2.44873046875, 2.582763671875, 2.716796875, 2.850830078125, 2.98486328125, 3.118896484375, 3.2529296875, 3.386962890625, 3.52099609375, 3.655029296875, 3.7890625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 7.0, 16.0, 10.0, 20.0, 35.0, 49.0, 52.0, 59.0, 93.0, 90.0, 99.0, 99.0, 86.0, 71.0, 56.0, 33.0, 25.0, 23.0, 12.0, 27.0, 11.0, 9.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.806640625, -3.6900634765625, -3.573486328125, -3.4569091796875, -3.34033203125, -3.2237548828125, -3.107177734375, -2.9906005859375, -2.8740234375, -2.7574462890625, -2.640869140625, -2.5242919921875, -2.40771484375, -2.2911376953125, -2.174560546875, -2.0579833984375, -1.94140625, -1.8248291015625, -1.708251953125, -1.5916748046875, -1.47509765625, -1.3585205078125, -1.241943359375, -1.1253662109375, -1.0087890625, -0.8922119140625, -0.775634765625, -0.6590576171875, -0.54248046875, -0.4259033203125, -0.309326171875, -0.1927490234375, -0.076171875, 0.0404052734375, 0.156982421875, 0.2735595703125, 0.39013671875, 0.5067138671875, 0.623291015625, 0.7398681640625, 0.8564453125, 0.9730224609375, 1.089599609375, 1.2061767578125, 1.32275390625, 1.4393310546875, 1.555908203125, 1.6724853515625, 1.7890625, 1.9056396484375, 2.022216796875, 2.1387939453125, 2.25537109375, 2.3719482421875, 2.488525390625, 2.6051025390625, 2.7216796875, 2.8382568359375, 2.954833984375, 3.0714111328125, 3.18798828125, 3.3045654296875, 3.421142578125, 3.5377197265625, 3.654296875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 10.0, 39.0, 124.0, 292.0, 268.0, 137.0, 65.0, 30.0, 19.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-134.95684814453125, -131.083740234375, -127.21063232421875, -123.3375244140625, -119.46442413330078, -115.59131622314453, -111.71820831298828, -107.84510040283203, -103.97199249267578, -100.09888458251953, -96.22577667236328, -92.35267639160156, -88.47956848144531, -84.60646057128906, -80.73335266113281, -76.86024475097656, -72.98713684082031, -69.11402893066406, -65.24092102050781, -61.36781692504883, -57.49470901489258, -53.621604919433594, -49.748497009277344, -45.875389099121094, -42.002288818359375, -38.129180908203125, -34.25607681274414, -30.38296890258789, -26.50986099243164, -22.636754989624023, -18.763648986816406, -14.890541076660156, -11.017433166503906, -7.144326210021973, -3.2712197303771973, 0.6018867492675781, 4.474993705749512, 8.348100662231445, 12.221206665039062, 16.094314575195312, 19.96742057800293, 23.840526580810547, 27.713634490966797, 31.586740493774414, 35.45984649658203, 39.33295440673828, 43.20606231689453, 47.07917022705078, 50.952274322509766, 54.825382232666016, 58.698486328125, 62.57159423828125, 66.4447021484375, 70.31781005859375, 74.19091796875, 78.06402587890625, 81.93712615966797, 85.81023406982422, 89.68334197998047, 93.55644226074219, 97.42955017089844, 101.30265808105469, 105.17576599121094, 109.04887390136719, 112.92198181152344]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 9.0, 5.0, 6.0, 5.0, 7.0, 6.0, 12.0, 11.0, 20.0, 34.0, 35.0, 33.0, 35.0, 39.0, 37.0, 39.0, 56.0, 67.0, 67.0, 74.0, 46.0, 50.0, 40.0, 36.0, 36.0, 31.0, 31.0, 28.0, 23.0, 15.0, 13.0, 10.0, 4.0, 13.0, 8.0, 9.0, 7.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0], "bins": [-81.96810913085938, -79.84973907470703, -77.73136901855469, -75.61299133300781, -73.49462127685547, -71.37625122070312, -69.25787353515625, -67.1395034790039, -65.02113342285156, -62.90276336669922, -60.78438949584961, -58.666015625, -56.547645568847656, -54.42927551269531, -52.3109016418457, -50.192527770996094, -48.07415771484375, -45.955787658691406, -43.8374137878418, -41.71903991699219, -39.600669860839844, -37.4822998046875, -35.36392593383789, -33.24555206298828, -31.127182006835938, -29.00881004333496, -26.890438079833984, -24.772066116333008, -22.65369415283203, -20.535322189331055, -18.416950225830078, -16.2985782623291, -14.180206298828125, -12.061834335327148, -9.943462371826172, -7.825090408325195, -5.706718444824219, -3.588346481323242, -1.4699745178222656, 0.6483974456787109, 2.7667694091796875, 4.885141372680664, 7.003513336181641, 9.121885299682617, 11.240257263183594, 13.35862922668457, 15.477001190185547, 17.595373153686523, 19.7137451171875, 21.832117080688477, 23.950489044189453, 26.06886100769043, 28.187232971191406, 30.305604934692383, 32.42397689819336, 34.54235076904297, 36.66072082519531, 38.779090881347656, 40.897464752197266, 43.015838623046875, 45.13420867919922, 47.25257873535156, 49.37095260620117, 51.48932647705078, 53.607696533203125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 3.0, 5.0, 10.0, 17.0, 26.0, 45.0, 84.0, 210.0, 493.0, 1521.0, 6843.0, 71952.0, 3686439.0, 407794.0, 15139.0, 2587.0, 652.0, 244.0, 104.0, 43.0, 26.0, 14.0, 9.0, 5.0, 6.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9453125, -12.63482666015625, -12.3243408203125, -12.01385498046875, -11.703369140625, -11.39288330078125, -11.0823974609375, -10.77191162109375, -10.46142578125, -10.15093994140625, -9.8404541015625, -9.52996826171875, -9.219482421875, -8.90899658203125, -8.5985107421875, -8.28802490234375, -7.9775390625, -7.66705322265625, -7.3565673828125, -7.04608154296875, -6.735595703125, -6.42510986328125, -6.1146240234375, -5.80413818359375, -5.49365234375, -5.18316650390625, -4.8726806640625, -4.56219482421875, -4.251708984375, -3.94122314453125, -3.6307373046875, -3.32025146484375, -3.009765625, -2.69927978515625, -2.3887939453125, -2.07830810546875, -1.767822265625, -1.45733642578125, -1.1468505859375, -0.83636474609375, -0.52587890625, -0.21539306640625, 0.0950927734375, 0.40557861328125, 0.716064453125, 1.02655029296875, 1.3370361328125, 1.64752197265625, 1.9580078125, 2.26849365234375, 2.5789794921875, 2.88946533203125, 3.199951171875, 3.51043701171875, 3.8209228515625, 4.13140869140625, 4.44189453125, 4.75238037109375, 5.0628662109375, 5.37335205078125, 5.683837890625, 5.99432373046875, 6.3048095703125, 6.61529541015625, 6.92578125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 9.0, 8.0, 5.0, 7.0, 14.0, 15.0, 32.0, 23.0, 38.0, 37.0, 42.0, 54.0, 61.0, 89.0, 78.0, 70.0, 64.0, 63.0, 51.0, 51.0, 50.0, 31.0, 29.0, 25.0, 20.0, 14.0, 8.0, 8.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.8125, -6.657135009765625, -6.50177001953125, -6.346405029296875, -6.1910400390625, -6.035675048828125, -5.88031005859375, -5.724945068359375, -5.569580078125, -5.414215087890625, -5.25885009765625, -5.103485107421875, -4.9481201171875, -4.792755126953125, -4.63739013671875, -4.482025146484375, -4.32666015625, -4.171295166015625, -4.01593017578125, -3.860565185546875, -3.7052001953125, -3.549835205078125, -3.39447021484375, -3.239105224609375, -3.083740234375, -2.928375244140625, -2.77301025390625, -2.617645263671875, -2.4622802734375, -2.306915283203125, -2.15155029296875, -1.996185302734375, -1.8408203125, -1.685455322265625, -1.53009033203125, -1.374725341796875, -1.2193603515625, -1.063995361328125, -0.90863037109375, -0.753265380859375, -0.597900390625, -0.442535400390625, -0.28717041015625, -0.131805419921875, 0.0235595703125, 0.178924560546875, 0.33428955078125, 0.489654541015625, 0.64501953125, 0.800384521484375, 0.95574951171875, 1.111114501953125, 1.2664794921875, 1.421844482421875, 1.57720947265625, 1.732574462890625, 1.887939453125, 2.043304443359375, 2.19866943359375, 2.354034423828125, 2.5093994140625, 2.664764404296875, 2.82012939453125, 2.975494384765625, 3.130859375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 1.0, 8.0, 4.0, 7.0, 8.0, 19.0, 21.0, 39.0, 67.0, 129.0, 235.0, 584.0, 1487.0, 5575.0, 33157.0, 731710.0, 3318507.0, 86601.0, 11736.0, 2772.0, 883.0, 317.0, 163.0, 97.0, 53.0, 32.0, 23.0, 10.0, 11.0, 10.0, 4.0, 2.0, 7.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.046875, -10.757568359375, -10.46826171875, -10.178955078125, -9.8896484375, -9.600341796875, -9.31103515625, -9.021728515625, -8.732421875, -8.443115234375, -8.15380859375, -7.864501953125, -7.5751953125, -7.285888671875, -6.99658203125, -6.707275390625, -6.41796875, -6.128662109375, -5.83935546875, -5.550048828125, -5.2607421875, -4.971435546875, -4.68212890625, -4.392822265625, -4.103515625, -3.814208984375, -3.52490234375, -3.235595703125, -2.9462890625, -2.656982421875, -2.36767578125, -2.078369140625, -1.7890625, -1.499755859375, -1.21044921875, -0.921142578125, -0.6318359375, -0.342529296875, -0.05322265625, 0.236083984375, 0.525390625, 0.814697265625, 1.10400390625, 1.393310546875, 1.6826171875, 1.971923828125, 2.26123046875, 2.550537109375, 2.83984375, 3.129150390625, 3.41845703125, 3.707763671875, 3.9970703125, 4.286376953125, 4.57568359375, 4.864990234375, 5.154296875, 5.443603515625, 5.73291015625, 6.022216796875, 6.3115234375, 6.600830078125, 6.89013671875, 7.179443359375, 7.46875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 8.0, 5.0, 6.0, 7.0, 19.0, 13.0, 24.0, 34.0, 74.0, 95.0, 144.0, 261.0, 474.0, 831.0, 838.0, 477.0, 273.0, 140.0, 97.0, 59.0, 46.0, 29.0, 28.0, 22.0, 12.0, 9.0, 8.0, 3.0, 8.0, 8.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.5234375, -8.29327392578125, -8.0631103515625, -7.83294677734375, -7.602783203125, -7.37261962890625, -7.1424560546875, -6.91229248046875, -6.68212890625, -6.45196533203125, -6.2218017578125, -5.99163818359375, -5.761474609375, -5.53131103515625, -5.3011474609375, -5.07098388671875, -4.8408203125, -4.61065673828125, -4.3804931640625, -4.15032958984375, -3.920166015625, -3.69000244140625, -3.4598388671875, -3.22967529296875, -2.99951171875, -2.76934814453125, -2.5391845703125, -2.30902099609375, -2.078857421875, -1.84869384765625, -1.6185302734375, -1.38836669921875, -1.158203125, -0.92803955078125, -0.6978759765625, -0.46771240234375, -0.237548828125, -0.00738525390625, 0.2227783203125, 0.45294189453125, 0.68310546875, 0.91326904296875, 1.1434326171875, 1.37359619140625, 1.603759765625, 1.83392333984375, 2.0640869140625, 2.29425048828125, 2.5244140625, 2.75457763671875, 2.9847412109375, 3.21490478515625, 3.445068359375, 3.67523193359375, 3.9053955078125, 4.13555908203125, 4.36572265625, 4.59588623046875, 4.8260498046875, 5.05621337890625, 5.286376953125, 5.51654052734375, 5.7467041015625, 5.97686767578125, 6.20703125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 9.0, 23.0, 67.0, 161.0, 307.0, 247.0, 111.0, 33.0, 13.0, 4.0, 8.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.417694091796875, -56.069366455078125, -52.72104263305664, -49.37271499633789, -46.02438735961914, -42.676063537597656, -39.327735900878906, -35.979408264160156, -32.631080627441406, -29.28275489807129, -25.93442726135254, -22.586101531982422, -19.237773895263672, -15.889448165893555, -12.541122436523438, -9.192794799804688, -5.844470977783203, -2.4961445331573486, 0.8521819114685059, 4.200508117675781, 7.548834800720215, 10.897161483764648, 14.245487213134766, 17.593814849853516, 20.942140579223633, 24.29046630859375, 27.6387939453125, 30.987119674682617, 34.335445404052734, 37.683773040771484, 41.03209686279297, 44.38042449951172, 47.72875213623047, 51.07707977294922, 54.4254035949707, 57.77373123168945, 61.1220588684082, 64.47038269042969, 67.81871032714844, 71.16703796386719, 74.51536560058594, 77.86369323730469, 81.21202087402344, 84.56034851074219, 87.9086685180664, 91.25699615478516, 94.6053237915039, 97.95365142822266, 101.30197143554688, 104.65029907226562, 107.99862670898438, 111.34695434570312, 114.69527435302734, 118.0436019897461, 121.39192962646484, 124.7402572631836, 128.08859252929688, 131.43692016601562, 134.78524780273438, 138.13357543945312, 141.48190307617188, 144.83023071289062, 148.17855834960938, 151.52688598632812, 154.8751983642578]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 0.0, 6.0, 7.0, 8.0, 7.0, 11.0, 11.0, 16.0, 28.0, 26.0, 31.0, 43.0, 62.0, 72.0, 70.0, 55.0, 83.0, 77.0, 64.0, 67.0, 55.0, 45.0, 43.0, 35.0, 19.0, 19.0, 10.0, 4.0, 11.0, 8.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.949920654296875, -46.214561462402344, -44.47920608520508, -42.74384689331055, -41.00849151611328, -39.27313232421875, -37.537776947021484, -35.80241775512695, -34.06706237792969, -32.331703186035156, -30.59634780883789, -28.860990524291992, -27.125633239746094, -25.390274047851562, -23.654918670654297, -21.919559478759766, -20.184202194213867, -18.44884490966797, -16.71348762512207, -14.978130340576172, -13.242773056030273, -11.507414817810059, -9.77205753326416, -8.036700248718262, -6.301342964172363, -4.565985679626465, -2.8306281566619873, -1.0952706336975098, 0.6400866508483887, 2.3754444122314453, 4.110801696777344, 5.846158981323242, 7.581516265869141, 9.316873550415039, 11.052230834960938, 12.787588119506836, 14.522945404052734, 16.258304595947266, 17.99365997314453, 19.729019165039062, 21.464374542236328, 23.199731826782227, 24.935089111328125, 26.670446395874023, 28.405803680419922, 30.141162872314453, 31.87651824951172, 33.61187744140625, 35.34723663330078, 37.08259582519531, 38.81795120239258, 40.55331039428711, 42.288665771484375, 44.024024963378906, 45.75938034057617, 47.4947395324707, 49.23009490966797, 50.9654541015625, 52.700809478759766, 54.4361686706543, 56.17152404785156, 57.906883239746094, 59.64223861694336, 61.37759780883789, 63.112953186035156]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 7.0, 9.0, 16.0, 23.0, 40.0, 58.0, 84.0, 137.0, 280.0, 460.0, 904.0, 1883.0, 3956.0, 9144.0, 21565.0, 54437.0, 141897.0, 332014.0, 288761.0, 116216.0, 44478.0, 17918.0, 7414.0, 3434.0, 1619.0, 811.0, 407.0, 248.0, 124.0, 78.0, 46.0, 35.0, 16.0, 10.0, 6.0, 9.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-5.625, -5.4725341796875, -5.320068359375, -5.1676025390625, -5.01513671875, -4.8626708984375, -4.710205078125, -4.5577392578125, -4.4052734375, -4.2528076171875, -4.100341796875, -3.9478759765625, -3.79541015625, -3.6429443359375, -3.490478515625, -3.3380126953125, -3.185546875, -3.0330810546875, -2.880615234375, -2.7281494140625, -2.57568359375, -2.4232177734375, -2.270751953125, -2.1182861328125, -1.9658203125, -1.8133544921875, -1.660888671875, -1.5084228515625, -1.35595703125, -1.2034912109375, -1.051025390625, -0.8985595703125, -0.74609375, -0.5936279296875, -0.441162109375, -0.2886962890625, -0.13623046875, 0.0162353515625, 0.168701171875, 0.3211669921875, 0.4736328125, 0.6260986328125, 0.778564453125, 0.9310302734375, 1.08349609375, 1.2359619140625, 1.388427734375, 1.5408935546875, 1.693359375, 1.8458251953125, 1.998291015625, 2.1507568359375, 2.30322265625, 2.4556884765625, 2.608154296875, 2.7606201171875, 2.9130859375, 3.0655517578125, 3.218017578125, 3.3704833984375, 3.52294921875, 3.6754150390625, 3.827880859375, 3.9803466796875, 4.1328125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 5.0, 9.0, 7.0, 7.0, 12.0, 9.0, 7.0, 15.0, 16.0, 12.0, 17.0, 18.0, 24.0, 12.0, 32.0, 20.0, 49.0, 30.0, 38.0, 38.0, 43.0, 47.0, 47.0, 45.0, 42.0, 47.0, 33.0, 43.0, 25.0, 30.0, 26.0, 19.0, 23.0, 22.0, 23.0, 20.0, 10.0, 11.0, 12.0, 11.0, 9.0, 7.0, 7.0, 6.0, 7.0, 1.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.89453125, -2.8079833984375, -2.721435546875, -2.6348876953125, -2.54833984375, -2.4617919921875, -2.375244140625, -2.2886962890625, -2.2021484375, -2.1156005859375, -2.029052734375, -1.9425048828125, -1.85595703125, -1.7694091796875, -1.682861328125, -1.5963134765625, -1.509765625, -1.4232177734375, -1.336669921875, -1.2501220703125, -1.16357421875, -1.0770263671875, -0.990478515625, -0.9039306640625, -0.8173828125, -0.7308349609375, -0.644287109375, -0.5577392578125, -0.47119140625, -0.3846435546875, -0.298095703125, -0.2115478515625, -0.125, -0.0384521484375, 0.048095703125, 0.1346435546875, 0.22119140625, 0.3077392578125, 0.394287109375, 0.4808349609375, 0.5673828125, 0.6539306640625, 0.740478515625, 0.8270263671875, 0.91357421875, 1.0001220703125, 1.086669921875, 1.1732177734375, 1.259765625, 1.3463134765625, 1.432861328125, 1.5194091796875, 1.60595703125, 1.6925048828125, 1.779052734375, 1.8656005859375, 1.9521484375, 2.0386962890625, 2.125244140625, 2.2117919921875, 2.29833984375, 2.3848876953125, 2.471435546875, 2.5579833984375, 2.64453125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 9.0, 5.0, 10.0, 16.0, 32.0, 30.0, 66.0, 82.0, 155.0, 197.0, 392.0, 573.0, 984.0, 1789.0, 5035.0, 27416.0, 352283.0, 611139.0, 37753.0, 5921.0, 2063.0, 986.0, 593.0, 341.0, 249.0, 144.0, 100.0, 56.0, 40.0, 34.0, 14.0, 17.0, 9.0, 8.0, 6.0, 5.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5234375, -11.1129150390625, -10.702392578125, -10.2918701171875, -9.88134765625, -9.4708251953125, -9.060302734375, -8.6497802734375, -8.2392578125, -7.8287353515625, -7.418212890625, -7.0076904296875, -6.59716796875, -6.1866455078125, -5.776123046875, -5.3656005859375, -4.955078125, -4.5445556640625, -4.134033203125, -3.7235107421875, -3.31298828125, -2.9024658203125, -2.491943359375, -2.0814208984375, -1.6708984375, -1.2603759765625, -0.849853515625, -0.4393310546875, -0.02880859375, 0.3817138671875, 0.792236328125, 1.2027587890625, 1.61328125, 2.0238037109375, 2.434326171875, 2.8448486328125, 3.25537109375, 3.6658935546875, 4.076416015625, 4.4869384765625, 4.8974609375, 5.3079833984375, 5.718505859375, 6.1290283203125, 6.53955078125, 6.9500732421875, 7.360595703125, 7.7711181640625, 8.181640625, 8.5921630859375, 9.002685546875, 9.4132080078125, 9.82373046875, 10.2342529296875, 10.644775390625, 11.0552978515625, 11.4658203125, 11.8763427734375, 12.286865234375, 12.6973876953125, 13.10791015625, 13.5184326171875, 13.928955078125, 14.3394775390625, 14.75]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 4.0, 7.0, 12.0, 9.0, 16.0, 16.0, 23.0, 11.0, 34.0, 33.0, 28.0, 31.0, 49.0, 35.0, 45.0, 45.0, 41.0, 47.0, 39.0, 49.0, 47.0, 45.0, 37.0, 46.0, 39.0, 35.0, 27.0, 25.0, 23.0, 17.0, 10.0, 16.0, 5.0, 16.0, 4.0, 8.0, 5.0, 6.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.7734375, -12.35400390625, -11.9345703125, -11.51513671875, -11.095703125, -10.67626953125, -10.2568359375, -9.83740234375, -9.41796875, -8.99853515625, -8.5791015625, -8.15966796875, -7.740234375, -7.32080078125, -6.9013671875, -6.48193359375, -6.0625, -5.64306640625, -5.2236328125, -4.80419921875, -4.384765625, -3.96533203125, -3.5458984375, -3.12646484375, -2.70703125, -2.28759765625, -1.8681640625, -1.44873046875, -1.029296875, -0.60986328125, -0.1904296875, 0.22900390625, 0.6484375, 1.06787109375, 1.4873046875, 1.90673828125, 2.326171875, 2.74560546875, 3.1650390625, 3.58447265625, 4.00390625, 4.42333984375, 4.8427734375, 5.26220703125, 5.681640625, 6.10107421875, 6.5205078125, 6.93994140625, 7.359375, 7.77880859375, 8.1982421875, 8.61767578125, 9.037109375, 9.45654296875, 9.8759765625, 10.29541015625, 10.71484375, 11.13427734375, 11.5537109375, 11.97314453125, 12.392578125, 12.81201171875, 13.2314453125, 13.65087890625, 14.0703125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 3.0, 11.0, 8.0, 13.0, 18.0, 24.0, 38.0, 58.0, 88.0, 184.0, 380.0, 860.0, 2600.0, 10772.0, 101778.0, 836427.0, 81879.0, 9504.0, 2303.0, 785.0, 354.0, 165.0, 98.0, 49.0, 43.0, 34.0, 18.0, 13.0, 12.0, 11.0, 5.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.4140625, -4.278076171875, -4.14208984375, -4.006103515625, -3.8701171875, -3.734130859375, -3.59814453125, -3.462158203125, -3.326171875, -3.190185546875, -3.05419921875, -2.918212890625, -2.7822265625, -2.646240234375, -2.51025390625, -2.374267578125, -2.23828125, -2.102294921875, -1.96630859375, -1.830322265625, -1.6943359375, -1.558349609375, -1.42236328125, -1.286376953125, -1.150390625, -1.014404296875, -0.87841796875, -0.742431640625, -0.6064453125, -0.470458984375, -0.33447265625, -0.198486328125, -0.0625, 0.073486328125, 0.20947265625, 0.345458984375, 0.4814453125, 0.617431640625, 0.75341796875, 0.889404296875, 1.025390625, 1.161376953125, 1.29736328125, 1.433349609375, 1.5693359375, 1.705322265625, 1.84130859375, 1.977294921875, 2.11328125, 2.249267578125, 2.38525390625, 2.521240234375, 2.6572265625, 2.793212890625, 2.92919921875, 3.065185546875, 3.201171875, 3.337158203125, 3.47314453125, 3.609130859375, 3.7451171875, 3.881103515625, 4.01708984375, 4.153076171875, 4.2890625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 11.0, 5.0, 7.0, 11.0, 19.0, 20.0, 14.0, 20.0, 23.0, 24.0, 33.0, 30.0, 56.0, 64.0, 81.0, 109.0, 93.0, 72.0, 55.0, 54.0, 22.0, 33.0, 19.0, 16.0, 13.0, 19.0, 22.0, 12.0, 9.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004258155822753906, -0.00041143596172332764, -0.00039705634117126465, -0.00038267672061920166, -0.00036829710006713867, -0.0003539174795150757, -0.0003395378589630127, -0.0003251582384109497, -0.0003107786178588867, -0.00029639899730682373, -0.00028201937675476074, -0.00026763975620269775, -0.00025326013565063477, -0.00023888051509857178, -0.0002245008945465088, -0.0002101212739944458, -0.0001957416534423828, -0.00018136203289031982, -0.00016698241233825684, -0.00015260279178619385, -0.00013822317123413086, -0.00012384355068206787, -0.00010946393013000488, -9.50843095779419e-05, -8.07046890258789e-05, -6.632506847381592e-05, -5.194544792175293e-05, -3.756582736968994e-05, -2.3186206817626953e-05, -8.806586265563965e-06, 5.5730342864990234e-06, 1.9952654838562012e-05, 3.4332275390625e-05, 4.871189594268799e-05, 6.309151649475098e-05, 7.747113704681396e-05, 9.185075759887695e-05, 0.00010623037815093994, 0.00012060999870300293, 0.00013498961925506592, 0.0001493692398071289, 0.0001637488603591919, 0.00017812848091125488, 0.00019250810146331787, 0.00020688772201538086, 0.00022126734256744385, 0.00023564696311950684, 0.0002500265836715698, 0.0002644062042236328, 0.0002787858247756958, 0.0002931654453277588, 0.0003075450658798218, 0.00032192468643188477, 0.00033630430698394775, 0.00035068392753601074, 0.00036506354808807373, 0.0003794431686401367, 0.0003938227891921997, 0.0004082024097442627, 0.0004225820302963257, 0.00043696165084838867, 0.00045134127140045166, 0.00046572089195251465, 0.00048010051250457764, 0.0004944801330566406]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 1.0, 3.0, 7.0, 13.0, 13.0, 33.0, 44.0, 92.0, 156.0, 301.0, 691.0, 1815.0, 6852.0, 53318.0, 879099.0, 92943.0, 9509.0, 2149.0, 754.0, 336.0, 176.0, 89.0, 64.0, 43.0, 17.0, 11.0, 3.0, 6.0, 4.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.82421875, -3.662109375, -3.5, -3.337890625, -3.17578125, -3.013671875, -2.8515625, -2.689453125, -2.52734375, -2.365234375, -2.203125, -2.041015625, -1.87890625, -1.716796875, -1.5546875, -1.392578125, -1.23046875, -1.068359375, -0.90625, -0.744140625, -0.58203125, -0.419921875, -0.2578125, -0.095703125, 0.06640625, 0.228515625, 0.390625, 0.552734375, 0.71484375, 0.876953125, 1.0390625, 1.201171875, 1.36328125, 1.525390625, 1.6875, 1.849609375, 2.01171875, 2.173828125, 2.3359375, 2.498046875, 2.66015625, 2.822265625, 2.984375, 3.146484375, 3.30859375, 3.470703125, 3.6328125, 3.794921875, 3.95703125, 4.119140625, 4.28125, 4.443359375, 4.60546875, 4.767578125, 4.9296875, 5.091796875, 5.25390625, 5.416015625, 5.578125, 5.740234375, 5.90234375, 6.064453125, 6.2265625, 6.388671875, 6.55078125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 1.0, 4.0, 9.0, 6.0, 9.0, 19.0, 18.0, 16.0, 23.0, 28.0, 43.0, 55.0, 67.0, 60.0, 77.0, 85.0, 83.0, 73.0, 86.0, 52.0, 34.0, 35.0, 23.0, 18.0, 16.0, 12.0, 8.0, 7.0, 4.0, 3.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.916015625, -2.82293701171875, -2.7298583984375, -2.63677978515625, -2.543701171875, -2.45062255859375, -2.3575439453125, -2.26446533203125, -2.17138671875, -2.07830810546875, -1.9852294921875, -1.89215087890625, -1.799072265625, -1.70599365234375, -1.6129150390625, -1.51983642578125, -1.4267578125, -1.33367919921875, -1.2406005859375, -1.14752197265625, -1.054443359375, -0.96136474609375, -0.8682861328125, -0.77520751953125, -0.68212890625, -0.58905029296875, -0.4959716796875, -0.40289306640625, -0.309814453125, -0.21673583984375, -0.1236572265625, -0.03057861328125, 0.0625, 0.15557861328125, 0.2486572265625, 0.34173583984375, 0.434814453125, 0.52789306640625, 0.6209716796875, 0.71405029296875, 0.80712890625, 0.90020751953125, 0.9932861328125, 1.08636474609375, 1.179443359375, 1.27252197265625, 1.3656005859375, 1.45867919921875, 1.5517578125, 1.64483642578125, 1.7379150390625, 1.83099365234375, 1.924072265625, 2.01715087890625, 2.1102294921875, 2.20330810546875, 2.29638671875, 2.38946533203125, 2.4825439453125, 2.57562255859375, 2.668701171875, 2.76177978515625, 2.8548583984375, 2.94793701171875, 3.041015625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 20.0, 21.0, 139.0, 407.0, 256.0, 96.0, 38.0, 13.0, 10.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-197.58197021484375, -193.25399780273438, -188.926025390625, -184.59803771972656, -180.2700653076172, -175.9420928955078, -171.61412048339844, -167.2861328125, -162.95816040039062, -158.63018798828125, -154.30221557617188, -149.97422790527344, -145.64625549316406, -141.3182830810547, -136.9903106689453, -132.66232299804688, -128.3343505859375, -124.00637817382812, -119.67839813232422, -115.35042572021484, -111.02244567871094, -106.69447326660156, -102.36650085449219, -98.03852081298828, -93.71055603027344, -89.38258361816406, -85.05460357666016, -80.72663116455078, -76.39865112304688, -72.0706787109375, -67.74270629882812, -63.41472625732422, -59.08674621582031, -54.75876998901367, -50.43079376220703, -46.102821350097656, -41.77484130859375, -37.446868896484375, -33.118892669677734, -28.790916442871094, -24.462940216064453, -20.134963989257812, -15.806988716125488, -11.479013442993164, -7.151037216186523, -2.823060989379883, 1.504913330078125, 5.832889556884766, 10.160865783691406, 14.488842010498047, 18.816818237304688, 23.144792556762695, 27.472768783569336, 31.800745010375977, 36.128719329833984, 40.456695556640625, 44.784671783447266, 49.112648010253906, 53.44062423706055, 57.76860046386719, 62.09657287597656, 66.42455291748047, 70.75252532958984, 75.08050537109375, 79.40847778320312]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 7.0, 8.0, 9.0, 12.0, 20.0, 14.0, 17.0, 18.0, 27.0, 27.0, 29.0, 31.0, 35.0, 44.0, 50.0, 49.0, 68.0, 75.0, 63.0, 52.0, 49.0, 41.0, 34.0, 29.0, 23.0, 29.0, 27.0, 17.0, 18.0, 12.0, 15.0, 16.0, 9.0, 7.0, 5.0, 2.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.953636169433594, -49.27656555175781, -47.59949493408203, -45.92242431640625, -44.24535369873047, -42.56828308105469, -40.891212463378906, -39.214141845703125, -37.537071228027344, -35.86000061035156, -34.18292999267578, -32.505859375, -30.82878875732422, -29.151718139648438, -27.474645614624023, -25.797574996948242, -24.120502471923828, -22.443431854248047, -20.766361236572266, -19.089290618896484, -17.412220001220703, -15.735148429870605, -14.058076858520508, -12.381006240844727, -10.703935623168945, -9.026865005493164, -7.349793910980225, -5.672722816467285, -3.995652198791504, -2.3185815811157227, -0.641510009765625, 1.0355606079101562, 2.712635040283203, 4.389705657958984, 6.066776752471924, 7.743847846984863, 9.420918464660645, 11.097989082336426, 12.775060653686523, 14.452131271362305, 16.129201889038086, 17.806272506713867, 19.48334312438965, 21.160415649414062, 22.837486267089844, 24.514556884765625, 26.191627502441406, 27.868698120117188, 29.54576873779297, 31.22283935546875, 32.89990997314453, 34.57698059082031, 36.254051208496094, 37.931121826171875, 39.608192443847656, 41.28526306152344, 42.96233367919922, 44.639404296875, 46.31647491455078, 47.99354553222656, 49.670616149902344, 51.347686767578125, 53.024757385253906, 54.70182800292969, 56.378902435302734]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 6.0, 10.0, 12.0, 18.0, 22.0, 38.0, 70.0, 107.0, 161.0, 215.0, 350.0, 600.0, 987.0, 1780.0, 3768.0, 8070.0, 21521.0, 78129.0, 487274.0, 2426653.0, 968952.0, 143254.0, 31616.0, 10832.0, 4646.0, 2209.0, 1191.0, 688.0, 368.0, 275.0, 149.0, 102.0, 55.0, 47.0, 44.0, 17.0, 14.0, 9.0, 5.0, 7.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.130859375, -3.028778076171875, -2.92669677734375, -2.824615478515625, -2.7225341796875, -2.620452880859375, -2.51837158203125, -2.416290283203125, -2.314208984375, -2.212127685546875, -2.11004638671875, -2.007965087890625, -1.9058837890625, -1.803802490234375, -1.70172119140625, -1.599639892578125, -1.49755859375, -1.395477294921875, -1.29339599609375, -1.191314697265625, -1.0892333984375, -0.987152099609375, -0.88507080078125, -0.782989501953125, -0.680908203125, -0.578826904296875, -0.47674560546875, -0.374664306640625, -0.2725830078125, -0.170501708984375, -0.06842041015625, 0.033660888671875, 0.1357421875, 0.237823486328125, 0.33990478515625, 0.441986083984375, 0.5440673828125, 0.646148681640625, 0.74822998046875, 0.850311279296875, 0.952392578125, 1.054473876953125, 1.15655517578125, 1.258636474609375, 1.3607177734375, 1.462799072265625, 1.56488037109375, 1.666961669921875, 1.76904296875, 1.871124267578125, 1.97320556640625, 2.075286865234375, 2.1773681640625, 2.279449462890625, 2.38153076171875, 2.483612060546875, 2.585693359375, 2.687774658203125, 2.78985595703125, 2.891937255859375, 2.9940185546875, 3.096099853515625, 3.19818115234375, 3.300262451171875, 3.40234375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 3.0, 12.0, 3.0, 7.0, 18.0, 21.0, 15.0, 24.0, 19.0, 28.0, 35.0, 37.0, 57.0, 44.0, 54.0, 46.0, 51.0, 66.0, 55.0, 63.0, 42.0, 50.0, 46.0, 34.0, 45.0, 29.0, 23.0, 16.0, 11.0, 16.0, 6.0, 10.0, 2.0, 5.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.89453125, -2.783203125, -2.671875, -2.560546875, -2.44921875, -2.337890625, -2.2265625, -2.115234375, -2.00390625, -1.892578125, -1.78125, -1.669921875, -1.55859375, -1.447265625, -1.3359375, -1.224609375, -1.11328125, -1.001953125, -0.890625, -0.779296875, -0.66796875, -0.556640625, -0.4453125, -0.333984375, -0.22265625, -0.111328125, 0.0, 0.111328125, 0.22265625, 0.333984375, 0.4453125, 0.556640625, 0.66796875, 0.779296875, 0.890625, 1.001953125, 1.11328125, 1.224609375, 1.3359375, 1.447265625, 1.55859375, 1.669921875, 1.78125, 1.892578125, 2.00390625, 2.115234375, 2.2265625, 2.337890625, 2.44921875, 2.560546875, 2.671875, 2.783203125, 2.89453125, 3.005859375, 3.1171875, 3.228515625, 3.33984375, 3.451171875, 3.5625, 3.673828125, 3.78515625, 3.896484375, 4.0078125, 4.119140625, 4.23046875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 8.0, 3.0, 13.0, 21.0, 30.0, 75.0, 107.0, 188.0, 343.0, 983.0, 6321.0, 215751.0, 3934167.0, 32409.0, 2810.0, 673.0, 224.0, 76.0, 47.0, 20.0, 12.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.078125, -17.617919921875, -17.15771484375, -16.697509765625, -16.2373046875, -15.777099609375, -15.31689453125, -14.856689453125, -14.396484375, -13.936279296875, -13.47607421875, -13.015869140625, -12.5556640625, -12.095458984375, -11.63525390625, -11.175048828125, -10.71484375, -10.254638671875, -9.79443359375, -9.334228515625, -8.8740234375, -8.413818359375, -7.95361328125, -7.493408203125, -7.033203125, -6.572998046875, -6.11279296875, -5.652587890625, -5.1923828125, -4.732177734375, -4.27197265625, -3.811767578125, -3.3515625, -2.891357421875, -2.43115234375, -1.970947265625, -1.5107421875, -1.050537109375, -0.59033203125, -0.130126953125, 0.330078125, 0.790283203125, 1.25048828125, 1.710693359375, 2.1708984375, 2.631103515625, 3.09130859375, 3.551513671875, 4.01171875, 4.471923828125, 4.93212890625, 5.392333984375, 5.8525390625, 6.312744140625, 6.77294921875, 7.233154296875, 7.693359375, 8.153564453125, 8.61376953125, 9.073974609375, 9.5341796875, 9.994384765625, 10.45458984375, 10.914794921875, 11.375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 11.0, 18.0, 28.0, 41.0, 90.0, 214.0, 658.0, 1419.0, 990.0, 302.0, 149.0, 57.0, 37.0, 19.0, 9.0, 13.0, 4.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.375, -14.0130615234375, -13.651123046875, -13.2891845703125, -12.92724609375, -12.5653076171875, -12.203369140625, -11.8414306640625, -11.4794921875, -11.1175537109375, -10.755615234375, -10.3936767578125, -10.03173828125, -9.6697998046875, -9.307861328125, -8.9459228515625, -8.583984375, -8.2220458984375, -7.860107421875, -7.4981689453125, -7.13623046875, -6.7742919921875, -6.412353515625, -6.0504150390625, -5.6884765625, -5.3265380859375, -4.964599609375, -4.6026611328125, -4.24072265625, -3.8787841796875, -3.516845703125, -3.1549072265625, -2.79296875, -2.4310302734375, -2.069091796875, -1.7071533203125, -1.34521484375, -0.9832763671875, -0.621337890625, -0.2593994140625, 0.1025390625, 0.4644775390625, 0.826416015625, 1.1883544921875, 1.55029296875, 1.9122314453125, 2.274169921875, 2.6361083984375, 2.998046875, 3.3599853515625, 3.721923828125, 4.0838623046875, 4.44580078125, 4.8077392578125, 5.169677734375, 5.5316162109375, 5.8935546875, 6.2554931640625, 6.617431640625, 6.9793701171875, 7.34130859375, 7.7032470703125, 8.065185546875, 8.4271240234375, 8.7890625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 6.0, 7.0, 18.0, 43.0, 128.0, 253.0, 280.0, 149.0, 61.0, 20.0, 10.0, 8.0, 4.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.3783950805664, -89.4103775024414, -86.44236755371094, -83.47434997558594, -80.50634002685547, -77.53832244873047, -74.5703125, -71.602294921875, -68.63427734375, -65.666259765625, -62.69824981689453, -59.73023223876953, -56.7622184753418, -53.79420471191406, -50.82619094848633, -47.858177185058594, -44.89016342163086, -41.922149658203125, -38.95413589477539, -35.986122131347656, -33.018104553222656, -30.050090789794922, -27.082077026367188, -24.11406135559082, -21.146047592163086, -18.17803382873535, -15.210018157958984, -12.24200439453125, -9.2739896774292, -6.305974960327148, -3.337961196899414, -0.3699455261230469, 2.5980682373046875, 5.566082954406738, 8.534097671508789, 11.502111434936523, 14.470126152038574, 17.438140869140625, 20.40615463256836, 23.374170303344727, 26.34218406677246, 29.310197830200195, 32.27821350097656, 35.2462272644043, 38.21424102783203, 41.18225860595703, 44.1502685546875, 47.1182861328125, 50.086299896240234, 53.05431365966797, 56.0223274230957, 58.99034118652344, 61.95835876464844, 64.92637634277344, 67.8943862915039, 70.8624038696289, 73.83041381835938, 76.79843139648438, 79.76644134521484, 82.73445892333984, 85.70246887207031, 88.67048645019531, 91.63850402832031, 94.60651397705078, 97.57453155517578]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 6.0, 1.0, 3.0, 2.0, 1.0, 6.0, 10.0, 8.0, 7.0, 7.0, 16.0, 22.0, 19.0, 23.0, 37.0, 42.0, 34.0, 36.0, 36.0, 33.0, 49.0, 54.0, 53.0, 54.0, 54.0, 59.0, 53.0, 48.0, 44.0, 46.0, 12.0, 25.0, 19.0, 22.0, 16.0, 10.0, 6.0, 7.0, 11.0, 8.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-38.88356018066406, -37.798431396484375, -36.71330261230469, -35.628173828125, -34.54304504394531, -33.457916259765625, -32.37278747558594, -31.28765869140625, -30.202529907226562, -29.117401123046875, -28.032272338867188, -26.9471435546875, -25.862014770507812, -24.776885986328125, -23.691757202148438, -22.60662841796875, -21.521501541137695, -20.436372756958008, -19.35124397277832, -18.266115188598633, -17.180986404418945, -16.095857620239258, -15.010729789733887, -13.9256010055542, -12.840472221374512, -11.755343437194824, -10.670214653015137, -9.585086822509766, -8.499958038330078, -7.414828777313232, -6.329700469970703, -5.244571685791016, -4.159440994262695, -3.074312210083008, -1.9891836643218994, -0.904055118560791, 0.18107366561889648, 1.266202449798584, 2.3513307571411133, 3.436459541320801, 4.521588325500488, 5.606717109680176, 6.691845893859863, 7.776974201202393, 8.862102508544922, 9.94723129272461, 11.032360076904297, 12.117488861083984, 13.202617645263672, 14.28774642944336, 15.372875213623047, 16.458003997802734, 17.543132781982422, 18.62826156616211, 19.713390350341797, 20.798519134521484, 21.883647918701172, 22.96877670288086, 24.053905487060547, 25.139034271240234, 26.224163055419922, 27.30929183959961, 28.394420623779297, 29.479549407958984, 30.56467628479004]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 4.0, 4.0, 3.0, 1.0, 7.0, 13.0, 13.0, 20.0, 25.0, 35.0, 89.0, 138.0, 227.0, 389.0, 679.0, 1278.0, 2521.0, 5399.0, 11620.0, 28929.0, 75390.0, 206902.0, 387281.0, 203116.0, 73830.0, 28320.0, 11678.0, 5325.0, 2467.0, 1322.0, 634.0, 361.0, 215.0, 107.0, 80.0, 42.0, 31.0, 16.0, 11.0, 14.0, 6.0, 5.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.82421875, -4.6710205078125, -4.517822265625, -4.3646240234375, -4.21142578125, -4.0582275390625, -3.905029296875, -3.7518310546875, -3.5986328125, -3.4454345703125, -3.292236328125, -3.1390380859375, -2.98583984375, -2.8326416015625, -2.679443359375, -2.5262451171875, -2.373046875, -2.2198486328125, -2.066650390625, -1.9134521484375, -1.76025390625, -1.6070556640625, -1.453857421875, -1.3006591796875, -1.1474609375, -0.9942626953125, -0.841064453125, -0.6878662109375, -0.53466796875, -0.3814697265625, -0.228271484375, -0.0750732421875, 0.078125, 0.2313232421875, 0.384521484375, 0.5377197265625, 0.69091796875, 0.8441162109375, 0.997314453125, 1.1505126953125, 1.3037109375, 1.4569091796875, 1.610107421875, 1.7633056640625, 1.91650390625, 2.0697021484375, 2.222900390625, 2.3760986328125, 2.529296875, 2.6824951171875, 2.835693359375, 2.9888916015625, 3.14208984375, 3.2952880859375, 3.448486328125, 3.6016845703125, 3.7548828125, 3.9080810546875, 4.061279296875, 4.2144775390625, 4.36767578125, 4.5208740234375, 4.674072265625, 4.8272705078125, 4.98046875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 3.0, 9.0, 6.0, 11.0, 16.0, 14.0, 15.0, 16.0, 20.0, 20.0, 25.0, 24.0, 30.0, 22.0, 39.0, 38.0, 36.0, 39.0, 39.0, 44.0, 42.0, 46.0, 32.0, 37.0, 60.0, 39.0, 32.0, 31.0, 38.0, 25.0, 18.0, 23.0, 24.0, 20.0, 14.0, 12.0, 11.0, 7.0, 9.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.09375, -3.00579833984375, -2.9178466796875, -2.82989501953125, -2.741943359375, -2.65399169921875, -2.5660400390625, -2.47808837890625, -2.39013671875, -2.30218505859375, -2.2142333984375, -2.12628173828125, -2.038330078125, -1.95037841796875, -1.8624267578125, -1.77447509765625, -1.6865234375, -1.59857177734375, -1.5106201171875, -1.42266845703125, -1.334716796875, -1.24676513671875, -1.1588134765625, -1.07086181640625, -0.98291015625, -0.89495849609375, -0.8070068359375, -0.71905517578125, -0.631103515625, -0.54315185546875, -0.4552001953125, -0.36724853515625, -0.279296875, -0.19134521484375, -0.1033935546875, -0.01544189453125, 0.072509765625, 0.16046142578125, 0.2484130859375, 0.33636474609375, 0.42431640625, 0.51226806640625, 0.6002197265625, 0.68817138671875, 0.776123046875, 0.86407470703125, 0.9520263671875, 1.03997802734375, 1.1279296875, 1.21588134765625, 1.3038330078125, 1.39178466796875, 1.479736328125, 1.56768798828125, 1.6556396484375, 1.74359130859375, 1.83154296875, 1.91949462890625, 2.0074462890625, 2.09539794921875, 2.183349609375, 2.27130126953125, 2.3592529296875, 2.44720458984375, 2.53515625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 7.0, 13.0, 4.0, 12.0, 14.0, 28.0, 39.0, 60.0, 106.0, 143.0, 214.0, 408.0, 603.0, 1034.0, 2091.0, 6537.0, 32596.0, 273079.0, 655251.0, 59936.0, 10222.0, 2963.0, 1281.0, 658.0, 415.0, 284.0, 183.0, 125.0, 75.0, 58.0, 32.0, 27.0, 21.0, 10.0, 7.0, 6.0, 3.0, 2.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.125, -10.7679443359375, -10.410888671875, -10.0538330078125, -9.69677734375, -9.3397216796875, -8.982666015625, -8.6256103515625, -8.2685546875, -7.9114990234375, -7.554443359375, -7.1973876953125, -6.84033203125, -6.4832763671875, -6.126220703125, -5.7691650390625, -5.412109375, -5.0550537109375, -4.697998046875, -4.3409423828125, -3.98388671875, -3.6268310546875, -3.269775390625, -2.9127197265625, -2.5556640625, -2.1986083984375, -1.841552734375, -1.4844970703125, -1.12744140625, -0.7703857421875, -0.413330078125, -0.0562744140625, 0.30078125, 0.6578369140625, 1.014892578125, 1.3719482421875, 1.72900390625, 2.0860595703125, 2.443115234375, 2.8001708984375, 3.1572265625, 3.5142822265625, 3.871337890625, 4.2283935546875, 4.58544921875, 4.9425048828125, 5.299560546875, 5.6566162109375, 6.013671875, 6.3707275390625, 6.727783203125, 7.0848388671875, 7.44189453125, 7.7989501953125, 8.156005859375, 8.5130615234375, 8.8701171875, 9.2271728515625, 9.584228515625, 9.9412841796875, 10.29833984375, 10.6553955078125, 11.012451171875, 11.3695068359375, 11.7265625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 2.0, 4.0, 11.0, 11.0, 9.0, 14.0, 18.0, 9.0, 25.0, 32.0, 28.0, 30.0, 40.0, 43.0, 41.0, 48.0, 63.0, 60.0, 52.0, 45.0, 40.0, 47.0, 38.0, 54.0, 31.0, 33.0, 34.0, 20.0, 21.0, 11.0, 17.0, 17.0, 18.0, 8.0, 9.0, 7.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.7265625, -12.3299560546875, -11.933349609375, -11.5367431640625, -11.14013671875, -10.7435302734375, -10.346923828125, -9.9503173828125, -9.5537109375, -9.1571044921875, -8.760498046875, -8.3638916015625, -7.96728515625, -7.5706787109375, -7.174072265625, -6.7774658203125, -6.380859375, -5.9842529296875, -5.587646484375, -5.1910400390625, -4.79443359375, -4.3978271484375, -4.001220703125, -3.6046142578125, -3.2080078125, -2.8114013671875, -2.414794921875, -2.0181884765625, -1.62158203125, -1.2249755859375, -0.828369140625, -0.4317626953125, -0.03515625, 0.3614501953125, 0.758056640625, 1.1546630859375, 1.55126953125, 1.9478759765625, 2.344482421875, 2.7410888671875, 3.1376953125, 3.5343017578125, 3.930908203125, 4.3275146484375, 4.72412109375, 5.1207275390625, 5.517333984375, 5.9139404296875, 6.310546875, 6.7071533203125, 7.103759765625, 7.5003662109375, 7.89697265625, 8.2935791015625, 8.690185546875, 9.0867919921875, 9.4833984375, 9.8800048828125, 10.276611328125, 10.6732177734375, 11.06982421875, 11.4664306640625, 11.863037109375, 12.2596435546875, 12.65625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 6.0, 17.0, 16.0, 24.0, 35.0, 81.0, 106.0, 293.0, 1033.0, 7094.0, 240511.0, 782966.0, 14047.0, 1548.0, 394.0, 146.0, 84.0, 45.0, 23.0, 21.0, 9.0, 12.0, 3.0, 9.0, 3.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.43359375, -5.24041748046875, -5.0472412109375, -4.85406494140625, -4.660888671875, -4.46771240234375, -4.2745361328125, -4.08135986328125, -3.88818359375, -3.69500732421875, -3.5018310546875, -3.30865478515625, -3.115478515625, -2.92230224609375, -2.7291259765625, -2.53594970703125, -2.3427734375, -2.14959716796875, -1.9564208984375, -1.76324462890625, -1.570068359375, -1.37689208984375, -1.1837158203125, -0.99053955078125, -0.79736328125, -0.60418701171875, -0.4110107421875, -0.21783447265625, -0.024658203125, 0.16851806640625, 0.3616943359375, 0.55487060546875, 0.748046875, 0.94122314453125, 1.1343994140625, 1.32757568359375, 1.520751953125, 1.71392822265625, 1.9071044921875, 2.10028076171875, 2.29345703125, 2.48663330078125, 2.6798095703125, 2.87298583984375, 3.066162109375, 3.25933837890625, 3.4525146484375, 3.64569091796875, 3.8388671875, 4.03204345703125, 4.2252197265625, 4.41839599609375, 4.611572265625, 4.80474853515625, 4.9979248046875, 5.19110107421875, 5.38427734375, 5.57745361328125, 5.7706298828125, 5.96380615234375, 6.156982421875, 6.35015869140625, 6.5433349609375, 6.73651123046875, 6.9296875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 13.0, 8.0, 15.0, 19.0, 20.0, 40.0, 33.0, 54.0, 65.0, 113.0, 137.0, 139.0, 94.0, 66.0, 37.0, 25.0, 28.0, 20.0, 14.0, 10.0, 14.0, 11.0, 7.0, 3.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0007143020629882812, -0.0006948858499526978, -0.0006754696369171143, -0.0006560534238815308, -0.0006366372108459473, -0.0006172209978103638, -0.0005978047847747803, -0.0005783885717391968, -0.0005589723587036133, -0.0005395561456680298, -0.0005201399326324463, -0.0005007237195968628, -0.0004813075065612793, -0.0004618912935256958, -0.0004424750804901123, -0.0004230588674545288, -0.0004036426544189453, -0.0003842264413833618, -0.0003648102283477783, -0.0003453940153121948, -0.00032597780227661133, -0.00030656158924102783, -0.00028714537620544434, -0.00026772916316986084, -0.00024831295013427734, -0.00022889673709869385, -0.00020948052406311035, -0.00019006431102752686, -0.00017064809799194336, -0.00015123188495635986, -0.00013181567192077637, -0.00011239945888519287, -9.298324584960938e-05, -7.356703281402588e-05, -5.415081977844238e-05, -3.473460674285889e-05, -1.531839370727539e-05, 4.0978193283081055e-06, 2.35140323638916e-05, 4.29302453994751e-05, 6.23464584350586e-05, 8.176267147064209e-05, 0.00010117888450622559, 0.00012059509754180908, 0.00014001131057739258, 0.00015942752361297607, 0.00017884373664855957, 0.00019825994968414307, 0.00021767616271972656, 0.00023709237575531006, 0.00025650858879089355, 0.00027592480182647705, 0.00029534101486206055, 0.00031475722789764404, 0.00033417344093322754, 0.00035358965396881104, 0.00037300586700439453, 0.00039242208003997803, 0.0004118382930755615, 0.000431254506111145, 0.0004506707191467285, 0.000470086932182312, 0.0004895031452178955, 0.000508919358253479, 0.0005283355712890625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 8.0, 13.0, 17.0, 31.0, 25.0, 46.0, 53.0, 96.0, 152.0, 242.0, 392.0, 740.0, 1707.0, 4369.0, 15892.0, 99826.0, 716707.0, 173909.0, 24165.0, 5995.0, 2058.0, 921.0, 446.0, 267.0, 156.0, 94.0, 63.0, 38.0, 30.0, 33.0, 17.0, 9.0, 6.0, 8.0, 5.0, 6.0, 4.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.841796875, -2.75469970703125, -2.6676025390625, -2.58050537109375, -2.493408203125, -2.40631103515625, -2.3192138671875, -2.23211669921875, -2.14501953125, -2.05792236328125, -1.9708251953125, -1.88372802734375, -1.796630859375, -1.70953369140625, -1.6224365234375, -1.53533935546875, -1.4482421875, -1.36114501953125, -1.2740478515625, -1.18695068359375, -1.099853515625, -1.01275634765625, -0.9256591796875, -0.83856201171875, -0.75146484375, -0.66436767578125, -0.5772705078125, -0.49017333984375, -0.403076171875, -0.31597900390625, -0.2288818359375, -0.14178466796875, -0.0546875, 0.03240966796875, 0.1195068359375, 0.20660400390625, 0.293701171875, 0.38079833984375, 0.4678955078125, 0.55499267578125, 0.64208984375, 0.72918701171875, 0.8162841796875, 0.90338134765625, 0.990478515625, 1.07757568359375, 1.1646728515625, 1.25177001953125, 1.3388671875, 1.42596435546875, 1.5130615234375, 1.60015869140625, 1.687255859375, 1.77435302734375, 1.8614501953125, 1.94854736328125, 2.03564453125, 2.12274169921875, 2.2098388671875, 2.29693603515625, 2.384033203125, 2.47113037109375, 2.5582275390625, 2.64532470703125, 2.732421875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 9.0, 4.0, 9.0, 12.0, 22.0, 18.0, 29.0, 44.0, 62.0, 68.0, 82.0, 94.0, 83.0, 92.0, 90.0, 68.0, 43.0, 49.0, 36.0, 19.0, 18.0, 11.0, 9.0, 10.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.076171875, -2.9820556640625, -2.887939453125, -2.7938232421875, -2.69970703125, -2.6055908203125, -2.511474609375, -2.4173583984375, -2.3232421875, -2.2291259765625, -2.135009765625, -2.0408935546875, -1.94677734375, -1.8526611328125, -1.758544921875, -1.6644287109375, -1.5703125, -1.4761962890625, -1.382080078125, -1.2879638671875, -1.19384765625, -1.0997314453125, -1.005615234375, -0.9114990234375, -0.8173828125, -0.7232666015625, -0.629150390625, -0.5350341796875, -0.44091796875, -0.3468017578125, -0.252685546875, -0.1585693359375, -0.064453125, 0.0296630859375, 0.123779296875, 0.2178955078125, 0.31201171875, 0.4061279296875, 0.500244140625, 0.5943603515625, 0.6884765625, 0.7825927734375, 0.876708984375, 0.9708251953125, 1.06494140625, 1.1590576171875, 1.253173828125, 1.3472900390625, 1.44140625, 1.5355224609375, 1.629638671875, 1.7237548828125, 1.81787109375, 1.9119873046875, 2.006103515625, 2.1002197265625, 2.1943359375, 2.2884521484375, 2.382568359375, 2.4766845703125, 2.57080078125, 2.6649169921875, 2.759033203125, 2.8531494140625, 2.947265625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 13.0, 43.0, 106.0, 307.0, 301.0, 125.0, 47.0, 20.0, 13.0, 10.0, 4.0, 0.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.4957275390625, -112.189453125, -108.8831787109375, -105.576904296875, -102.2706298828125, -98.96435546875, -95.65808868408203, -92.35181427001953, -89.04553985595703, -85.73926544189453, -82.43299102783203, -79.12671661376953, -75.82044982910156, -72.51417541503906, -69.20790100097656, -65.90162658691406, -62.59535217285156, -59.28907775878906, -55.98280334472656, -52.67653274536133, -49.37025833129883, -46.06398391723633, -42.757713317871094, -39.451438903808594, -36.145164489746094, -32.838890075683594, -29.532617568969727, -26.22634506225586, -22.92007064819336, -19.61379623413086, -16.307523727416992, -13.001251220703125, -9.694969177246094, -6.38869571685791, -3.0824222564697266, 0.22385120391845703, 3.5301246643066406, 6.836399078369141, 10.142671585083008, 13.448944091796875, 16.755218505859375, 20.061492919921875, 23.367765426635742, 26.67403793334961, 29.98031234741211, 33.28658676147461, 36.592857360839844, 39.899131774902344, 43.205406188964844, 46.511680603027344, 49.817955017089844, 53.12422561645508, 56.43050003051758, 59.73677444458008, 63.04304504394531, 66.34931945800781, 69.65559387207031, 72.96186828613281, 76.26814270019531, 79.57441711425781, 82.88069152832031, 86.18696594238281, 89.49323272705078, 92.79950714111328, 96.10578155517578]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 7.0, 8.0, 4.0, 6.0, 6.0, 11.0, 18.0, 11.0, 16.0, 16.0, 19.0, 25.0, 26.0, 24.0, 38.0, 26.0, 37.0, 47.0, 75.0, 94.0, 94.0, 77.0, 37.0, 36.0, 39.0, 39.0, 32.0, 25.0, 18.0, 21.0, 14.0, 14.0, 14.0, 14.0, 6.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.325225830078125, -46.54090881347656, -44.756591796875, -42.97227478027344, -41.187957763671875, -39.40364074707031, -37.619319915771484, -35.83500289916992, -34.05068588256836, -32.2663688659668, -30.482051849365234, -28.69773292541504, -26.913415908813477, -25.129098892211914, -23.34477996826172, -21.560462951660156, -19.776145935058594, -17.99182891845703, -16.20751190185547, -14.423192977905273, -12.638875961303711, -10.854558944702148, -9.07024097442627, -7.285923004150391, -5.501605987548828, -3.7172884941101074, -1.9329710006713867, -0.14865350723266602, 1.6356639862060547, 3.419981002807617, 5.204298973083496, 6.988616943359375, 8.772933959960938, 10.5572509765625, 12.341568946838379, 14.125886917114258, 15.91020393371582, 17.694520950317383, 19.478839874267578, 21.26315689086914, 23.047473907470703, 24.831790924072266, 26.616107940673828, 28.400426864624023, 30.184743881225586, 31.96906089782715, 33.753379821777344, 35.537696838378906, 37.32201385498047, 39.10633087158203, 40.890647888183594, 42.674964904785156, 44.45928192138672, 46.24359893798828, 48.02791976928711, 49.81223678588867, 51.596553802490234, 53.3808708190918, 55.16518783569336, 56.94950485229492, 58.73382568359375, 60.51814270019531, 62.302459716796875, 64.08677673339844, 65.87109375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 8.0, 4.0, 16.0, 16.0, 36.0, 53.0, 82.0, 150.0, 302.0, 658.0, 2125.0, 11598.0, 319038.0, 3737807.0, 112908.0, 6910.0, 1462.0, 545.0, 258.0, 118.0, 63.0, 52.0, 31.0, 11.0, 9.0, 9.0, 8.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1796875, -5.9454345703125, -5.711181640625, -5.4769287109375, -5.24267578125, -5.0084228515625, -4.774169921875, -4.5399169921875, -4.3056640625, -4.0714111328125, -3.837158203125, -3.6029052734375, -3.36865234375, -3.1343994140625, -2.900146484375, -2.6658935546875, -2.431640625, -2.1973876953125, -1.963134765625, -1.7288818359375, -1.49462890625, -1.2603759765625, -1.026123046875, -0.7918701171875, -0.5576171875, -0.3233642578125, -0.089111328125, 0.1451416015625, 0.37939453125, 0.6136474609375, 0.847900390625, 1.0821533203125, 1.31640625, 1.5506591796875, 1.784912109375, 2.0191650390625, 2.25341796875, 2.4876708984375, 2.721923828125, 2.9561767578125, 3.1904296875, 3.4246826171875, 3.658935546875, 3.8931884765625, 4.12744140625, 4.3616943359375, 4.595947265625, 4.8302001953125, 5.064453125, 5.2987060546875, 5.532958984375, 5.7672119140625, 6.00146484375, 6.2357177734375, 6.469970703125, 6.7042236328125, 6.9384765625, 7.1727294921875, 7.406982421875, 7.6412353515625, 7.87548828125, 8.1097412109375, 8.343994140625, 8.5782470703125, 8.8125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 2.0, 5.0, 5.0, 8.0, 8.0, 16.0, 14.0, 11.0, 19.0, 21.0, 25.0, 24.0, 25.0, 36.0, 46.0, 37.0, 31.0, 45.0, 41.0, 37.0, 48.0, 44.0, 45.0, 56.0, 41.0, 43.0, 38.0, 36.0, 31.0, 26.0, 22.0, 27.0, 22.0, 17.0, 16.0, 9.0, 7.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.92578125, -2.835723876953125, -2.74566650390625, -2.655609130859375, -2.5655517578125, -2.475494384765625, -2.38543701171875, -2.295379638671875, -2.205322265625, -2.115264892578125, -2.02520751953125, -1.935150146484375, -1.8450927734375, -1.755035400390625, -1.66497802734375, -1.574920654296875, -1.48486328125, -1.394805908203125, -1.30474853515625, -1.214691162109375, -1.1246337890625, -1.034576416015625, -0.94451904296875, -0.854461669921875, -0.764404296875, -0.674346923828125, -0.58428955078125, -0.494232177734375, -0.4041748046875, -0.314117431640625, -0.22406005859375, -0.134002685546875, -0.0439453125, 0.046112060546875, 0.13616943359375, 0.226226806640625, 0.3162841796875, 0.406341552734375, 0.49639892578125, 0.586456298828125, 0.676513671875, 0.766571044921875, 0.85662841796875, 0.946685791015625, 1.0367431640625, 1.126800537109375, 1.21685791015625, 1.306915283203125, 1.39697265625, 1.487030029296875, 1.57708740234375, 1.667144775390625, 1.7572021484375, 1.847259521484375, 1.93731689453125, 2.027374267578125, 2.117431640625, 2.207489013671875, 2.29754638671875, 2.387603759765625, 2.4776611328125, 2.567718505859375, 2.65777587890625, 2.747833251953125, 2.837890625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 11.0, 11.0, 21.0, 25.0, 42.0, 54.0, 106.0, 184.0, 511.0, 1617.0, 8549.0, 198929.0, 3933507.0, 44887.0, 4286.0, 907.0, 294.0, 154.0, 69.0, 38.0, 30.0, 16.0, 15.0, 16.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.015625, -12.6668701171875, -12.318115234375, -11.9693603515625, -11.62060546875, -11.2718505859375, -10.923095703125, -10.5743408203125, -10.2255859375, -9.8768310546875, -9.528076171875, -9.1793212890625, -8.83056640625, -8.4818115234375, -8.133056640625, -7.7843017578125, -7.435546875, -7.0867919921875, -6.738037109375, -6.3892822265625, -6.04052734375, -5.6917724609375, -5.343017578125, -4.9942626953125, -4.6455078125, -4.2967529296875, -3.947998046875, -3.5992431640625, -3.25048828125, -2.9017333984375, -2.552978515625, -2.2042236328125, -1.85546875, -1.5067138671875, -1.157958984375, -0.8092041015625, -0.46044921875, -0.1116943359375, 0.237060546875, 0.5858154296875, 0.9345703125, 1.2833251953125, 1.632080078125, 1.9808349609375, 2.32958984375, 2.6783447265625, 3.027099609375, 3.3758544921875, 3.724609375, 4.0733642578125, 4.422119140625, 4.7708740234375, 5.11962890625, 5.4683837890625, 5.817138671875, 6.1658935546875, 6.5146484375, 6.8634033203125, 7.212158203125, 7.5609130859375, 7.90966796875, 8.2584228515625, 8.607177734375, 8.9559326171875, 9.3046875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 11.0, 8.0, 12.0, 11.0, 20.0, 22.0, 43.0, 58.0, 95.0, 185.0, 389.0, 650.0, 885.0, 757.0, 414.0, 209.0, 106.0, 56.0, 42.0, 23.0, 11.0, 16.0, 10.0, 12.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4375, -6.25689697265625, -6.0762939453125, -5.89569091796875, -5.715087890625, -5.53448486328125, -5.3538818359375, -5.17327880859375, -4.99267578125, -4.81207275390625, -4.6314697265625, -4.45086669921875, -4.270263671875, -4.08966064453125, -3.9090576171875, -3.72845458984375, -3.5478515625, -3.36724853515625, -3.1866455078125, -3.00604248046875, -2.825439453125, -2.64483642578125, -2.4642333984375, -2.28363037109375, -2.10302734375, -1.92242431640625, -1.7418212890625, -1.56121826171875, -1.380615234375, -1.20001220703125, -1.0194091796875, -0.83880615234375, -0.658203125, -0.47760009765625, -0.2969970703125, -0.11639404296875, 0.064208984375, 0.24481201171875, 0.4254150390625, 0.60601806640625, 0.78662109375, 0.96722412109375, 1.1478271484375, 1.32843017578125, 1.509033203125, 1.68963623046875, 1.8702392578125, 2.05084228515625, 2.2314453125, 2.41204833984375, 2.5926513671875, 2.77325439453125, 2.953857421875, 3.13446044921875, 3.3150634765625, 3.49566650390625, 3.67626953125, 3.85687255859375, 4.0374755859375, 4.21807861328125, 4.398681640625, 4.57928466796875, 4.7598876953125, 4.94049072265625, 5.12109375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 9.0, 18.0, 40.0, 88.0, 219.0, 278.0, 187.0, 83.0, 39.0, 15.0, 9.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-85.0141372680664, -82.90987396240234, -80.80561828613281, -78.70135498046875, -76.59709167480469, -74.49282836914062, -72.3885726928711, -70.28430938720703, -68.18004608154297, -66.0757827758789, -63.97152328491211, -61.86726379394531, -59.76300048828125, -57.65874099731445, -55.554481506347656, -53.450218200683594, -51.3459587097168, -49.24169921875, -47.13743591308594, -45.03317642211914, -42.92891311645508, -40.82465362548828, -38.72039031982422, -36.61613082885742, -34.511871337890625, -32.40761184692383, -30.303348541259766, -28.19908905029297, -26.094825744628906, -23.99056625366211, -21.88630485534668, -19.78204345703125, -17.677776336669922, -15.573514938354492, -13.469253540039062, -11.36499309539795, -9.26073169708252, -7.15647029876709, -5.052209854125977, -2.947948455810547, -0.8436870574951172, 1.2605741024017334, 3.364835262298584, 5.4690961837768555, 7.573357582092285, 9.677618980407715, 11.781879425048828, 13.886140823364258, 15.990402221679688, 18.094663619995117, 20.198925018310547, 22.303184509277344, 24.407447814941406, 26.511707305908203, 28.615968704223633, 30.720230102539062, 32.824493408203125, 34.92875289916992, 37.033016204833984, 39.13727569580078, 41.241539001464844, 43.34579849243164, 45.45005798339844, 47.5543212890625, 49.6585807800293]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 9.0, 17.0, 17.0, 24.0, 16.0, 31.0, 33.0, 41.0, 50.0, 63.0, 68.0, 75.0, 70.0, 58.0, 68.0, 74.0, 62.0, 51.0, 28.0, 33.0, 26.0, 15.0, 14.0, 12.0, 9.0, 10.0, 7.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-40.15859603881836, -39.11202621459961, -38.065460205078125, -37.018890380859375, -35.972320556640625, -34.925750732421875, -33.87918472290039, -32.83261489868164, -31.786046981811523, -30.739479064941406, -29.692909240722656, -28.64634132385254, -27.599773406982422, -26.553203582763672, -25.506635665893555, -24.460067749023438, -23.413497924804688, -22.36693000793457, -21.32036018371582, -20.273792266845703, -19.227222442626953, -18.180654525756836, -17.13408660888672, -16.08751678466797, -15.040948867797852, -13.994379997253418, -12.947811126708984, -11.901243209838867, -10.854674339294434, -9.80810546875, -8.761537551879883, -7.714968681335449, -6.66839599609375, -5.621827125549316, -4.575258731842041, -3.5286900997161865, -2.482121467590332, -1.4355525970458984, -0.38898420333862305, 0.6575841903686523, 1.704153060913086, 2.7507216930389404, 3.797290325164795, 4.84385871887207, 5.890427589416504, 6.9369964599609375, 7.983564853668213, 9.030133247375488, 10.076702117919922, 11.123270988464355, 12.169839859008789, 13.216407775878906, 14.26297664642334, 15.309545516967773, 16.35611343383789, 17.40268325805664, 18.449251174926758, 19.495819091796875, 20.542388916015625, 21.588956832885742, 22.63552474975586, 23.68209457397461, 24.728662490844727, 25.775230407714844, 26.821800231933594]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 13.0, 6.0, 9.0, 15.0, 16.0, 29.0, 28.0, 53.0, 83.0, 149.0, 296.0, 622.0, 1515.0, 4041.0, 12148.0, 41649.0, 166625.0, 479996.0, 252298.0, 62169.0, 17640.0, 5556.0, 1998.0, 795.0, 338.0, 190.0, 89.0, 69.0, 36.0, 25.0, 14.0, 10.0, 11.0, 8.0, 3.0, 5.0, 2.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9921875, -5.8028564453125, -5.613525390625, -5.4241943359375, -5.23486328125, -5.0455322265625, -4.856201171875, -4.6668701171875, -4.4775390625, -4.2882080078125, -4.098876953125, -3.9095458984375, -3.72021484375, -3.5308837890625, -3.341552734375, -3.1522216796875, -2.962890625, -2.7735595703125, -2.584228515625, -2.3948974609375, -2.20556640625, -2.0162353515625, -1.826904296875, -1.6375732421875, -1.4482421875, -1.2589111328125, -1.069580078125, -0.8802490234375, -0.69091796875, -0.5015869140625, -0.312255859375, -0.1229248046875, 0.06640625, 0.2557373046875, 0.445068359375, 0.6343994140625, 0.82373046875, 1.0130615234375, 1.202392578125, 1.3917236328125, 1.5810546875, 1.7703857421875, 1.959716796875, 2.1490478515625, 2.33837890625, 2.5277099609375, 2.717041015625, 2.9063720703125, 3.095703125, 3.2850341796875, 3.474365234375, 3.6636962890625, 3.85302734375, 4.0423583984375, 4.231689453125, 4.4210205078125, 4.6103515625, 4.7996826171875, 4.989013671875, 5.1783447265625, 5.36767578125, 5.5570068359375, 5.746337890625, 5.9356689453125, 6.125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 5.0, 3.0, 8.0, 12.0, 9.0, 14.0, 24.0, 25.0, 21.0, 23.0, 18.0, 30.0, 30.0, 32.0, 39.0, 46.0, 41.0, 48.0, 44.0, 56.0, 57.0, 61.0, 58.0, 45.0, 36.0, 30.0, 40.0, 27.0, 24.0, 19.0, 23.0, 9.0, 16.0, 18.0, 6.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.00390625, -2.906524658203125, -2.80914306640625, -2.711761474609375, -2.6143798828125, -2.516998291015625, -2.41961669921875, -2.322235107421875, -2.224853515625, -2.127471923828125, -2.03009033203125, -1.932708740234375, -1.8353271484375, -1.737945556640625, -1.64056396484375, -1.543182373046875, -1.44580078125, -1.348419189453125, -1.25103759765625, -1.153656005859375, -1.0562744140625, -0.958892822265625, -0.86151123046875, -0.764129638671875, -0.666748046875, -0.569366455078125, -0.47198486328125, -0.374603271484375, -0.2772216796875, -0.179840087890625, -0.08245849609375, 0.014923095703125, 0.1123046875, 0.209686279296875, 0.30706787109375, 0.404449462890625, 0.5018310546875, 0.599212646484375, 0.69659423828125, 0.793975830078125, 0.891357421875, 0.988739013671875, 1.08612060546875, 1.183502197265625, 1.2808837890625, 1.378265380859375, 1.47564697265625, 1.573028564453125, 1.67041015625, 1.767791748046875, 1.86517333984375, 1.962554931640625, 2.0599365234375, 2.157318115234375, 2.25469970703125, 2.352081298828125, 2.449462890625, 2.546844482421875, 2.64422607421875, 2.741607666015625, 2.8389892578125, 2.936370849609375, 3.03375244140625, 3.131134033203125, 3.228515625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 10.0, 8.0, 11.0, 16.0, 34.0, 52.0, 74.0, 114.0, 251.0, 497.0, 1469.0, 5109.0, 23529.0, 166944.0, 722151.0, 105964.0, 16423.0, 3727.0, 1152.0, 469.0, 196.0, 116.0, 69.0, 58.0, 35.0, 19.0, 17.0, 12.0, 9.0, 4.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0], "bins": [-10.53125, -10.2569580078125, -9.982666015625, -9.7083740234375, -9.43408203125, -9.1597900390625, -8.885498046875, -8.6112060546875, -8.3369140625, -8.0626220703125, -7.788330078125, -7.5140380859375, -7.23974609375, -6.9654541015625, -6.691162109375, -6.4168701171875, -6.142578125, -5.8682861328125, -5.593994140625, -5.3197021484375, -5.04541015625, -4.7711181640625, -4.496826171875, -4.2225341796875, -3.9482421875, -3.6739501953125, -3.399658203125, -3.1253662109375, -2.85107421875, -2.5767822265625, -2.302490234375, -2.0281982421875, -1.75390625, -1.4796142578125, -1.205322265625, -0.9310302734375, -0.65673828125, -0.3824462890625, -0.108154296875, 0.1661376953125, 0.4404296875, 0.7147216796875, 0.989013671875, 1.2633056640625, 1.53759765625, 1.8118896484375, 2.086181640625, 2.3604736328125, 2.634765625, 2.9090576171875, 3.183349609375, 3.4576416015625, 3.73193359375, 4.0062255859375, 4.280517578125, 4.5548095703125, 4.8291015625, 5.1033935546875, 5.377685546875, 5.6519775390625, 5.92626953125, 6.2005615234375, 6.474853515625, 6.7491455078125, 7.0234375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 1.0, 7.0, 3.0, 4.0, 12.0, 15.0, 12.0, 12.0, 25.0, 22.0, 32.0, 23.0, 28.0, 35.0, 29.0, 43.0, 49.0, 56.0, 46.0, 34.0, 48.0, 45.0, 44.0, 43.0, 39.0, 39.0, 40.0, 43.0, 29.0, 24.0, 18.0, 26.0, 18.0, 11.0, 6.0, 5.0, 8.0, 9.0, 6.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.3828125, -9.09375, -8.8046875, -8.515625, -8.2265625, -7.9375, -7.6484375, -7.359375, -7.0703125, -6.78125, -6.4921875, -6.203125, -5.9140625, -5.625, -5.3359375, -5.046875, -4.7578125, -4.46875, -4.1796875, -3.890625, -3.6015625, -3.3125, -3.0234375, -2.734375, -2.4453125, -2.15625, -1.8671875, -1.578125, -1.2890625, -1.0, -0.7109375, -0.421875, -0.1328125, 0.15625, 0.4453125, 0.734375, 1.0234375, 1.3125, 1.6015625, 1.890625, 2.1796875, 2.46875, 2.7578125, 3.046875, 3.3359375, 3.625, 3.9140625, 4.203125, 4.4921875, 4.78125, 5.0703125, 5.359375, 5.6484375, 5.9375, 6.2265625, 6.515625, 6.8046875, 7.09375, 7.3828125, 7.671875, 7.9609375, 8.25, 8.5390625, 8.828125, 9.1171875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 2.0, 8.0, 9.0, 7.0, 12.0, 13.0, 15.0, 39.0, 40.0, 61.0, 104.0, 192.0, 340.0, 643.0, 1580.0, 4497.0, 14376.0, 55070.0, 242588.0, 585020.0, 106187.0, 25755.0, 7415.0, 2551.0, 955.0, 436.0, 243.0, 138.0, 80.0, 46.0, 25.0, 33.0, 15.0, 20.0, 11.0, 7.0, 4.0, 2.0, 8.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2724609375, -1.2257232666015625, -1.178985595703125, -1.1322479248046875, -1.08551025390625, -1.0387725830078125, -0.992034912109375, -0.9452972412109375, -0.8985595703125, -0.8518218994140625, -0.805084228515625, -0.7583465576171875, -0.71160888671875, -0.6648712158203125, -0.618133544921875, -0.5713958740234375, -0.524658203125, -0.4779205322265625, -0.431182861328125, -0.3844451904296875, -0.33770751953125, -0.2909698486328125, -0.244232177734375, -0.1974945068359375, -0.1507568359375, -0.1040191650390625, -0.057281494140625, -0.0105438232421875, 0.03619384765625, 0.0829315185546875, 0.129669189453125, 0.1764068603515625, 0.22314453125, 0.2698822021484375, 0.316619873046875, 0.3633575439453125, 0.41009521484375, 0.4568328857421875, 0.503570556640625, 0.5503082275390625, 0.5970458984375, 0.6437835693359375, 0.690521240234375, 0.7372589111328125, 0.78399658203125, 0.8307342529296875, 0.877471923828125, 0.9242095947265625, 0.970947265625, 1.0176849365234375, 1.064422607421875, 1.1111602783203125, 1.15789794921875, 1.2046356201171875, 1.251373291015625, 1.2981109619140625, 1.3448486328125, 1.3915863037109375, 1.438323974609375, 1.4850616455078125, 1.53179931640625, 1.5785369873046875, 1.625274658203125, 1.6720123291015625, 1.71875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 9.0, 11.0, 22.0, 21.0, 33.0, 55.0, 63.0, 84.0, 101.0, 106.0, 120.0, 95.0, 67.0, 54.0, 37.0, 30.0, 28.0, 18.0, 13.0, 8.0, 11.0, 1.0, 2.0, 2.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004391670227050781, -0.00042612478137016296, -0.0004130825400352478, -0.00040004029870033264, -0.0003869980573654175, -0.0003739558160305023, -0.00036091357469558716, -0.000347871333360672, -0.00033482909202575684, -0.0003217868506908417, -0.0003087446093559265, -0.00029570236802101135, -0.0002826601266860962, -0.00026961788535118103, -0.00025657564401626587, -0.0002435334026813507, -0.00023049116134643555, -0.00021744892001152039, -0.00020440667867660522, -0.00019136443734169006, -0.0001783221960067749, -0.00016527995467185974, -0.00015223771333694458, -0.00013919547200202942, -0.00012615323066711426, -0.0001131109893321991, -0.00010006874799728394, -8.702650666236877e-05, -7.398426532745361e-05, -6.094202399253845e-05, -4.789978265762329e-05, -3.485754132270813e-05, -2.181529998779297e-05, -8.773058652877808e-06, 4.2691826820373535e-06, 1.7311424016952515e-05, 3.0353665351867676e-05, 4.339590668678284e-05, 5.6438148021698e-05, 6.948038935661316e-05, 8.252263069152832e-05, 9.556487202644348e-05, 0.00010860711336135864, 0.0001216493546962738, 0.00013469159603118896, 0.00014773383736610413, 0.0001607760787010193, 0.00017381832003593445, 0.0001868605613708496, 0.00019990280270576477, 0.00021294504404067993, 0.0002259872853755951, 0.00023902952671051025, 0.0002520717680454254, 0.0002651140093803406, 0.00027815625071525574, 0.0002911984920501709, 0.00030424073338508606, 0.0003172829747200012, 0.0003303252160549164, 0.00034336745738983154, 0.0003564096987247467, 0.00036945194005966187, 0.000382494181394577, 0.0003955364227294922]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 16.0, 8.0, 19.0, 30.0, 60.0, 95.0, 198.0, 467.0, 1126.0, 3836.0, 17246.0, 127863.0, 741223.0, 133118.0, 17478.0, 3639.0, 1185.0, 449.0, 229.0, 105.0, 63.0, 35.0, 20.0, 16.0, 9.0, 6.0, 9.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5029296875, -1.4258880615234375, -1.348846435546875, -1.2718048095703125, -1.19476318359375, -1.1177215576171875, -1.040679931640625, -0.9636383056640625, -0.8865966796875, -0.8095550537109375, -0.732513427734375, -0.6554718017578125, -0.57843017578125, -0.5013885498046875, -0.424346923828125, -0.3473052978515625, -0.270263671875, -0.1932220458984375, -0.116180419921875, -0.0391387939453125, 0.03790283203125, 0.1149444580078125, 0.191986083984375, 0.2690277099609375, 0.3460693359375, 0.4231109619140625, 0.500152587890625, 0.5771942138671875, 0.65423583984375, 0.7312774658203125, 0.808319091796875, 0.8853607177734375, 0.96240234375, 1.0394439697265625, 1.116485595703125, 1.1935272216796875, 1.27056884765625, 1.3476104736328125, 1.424652099609375, 1.5016937255859375, 1.5787353515625, 1.6557769775390625, 1.732818603515625, 1.8098602294921875, 1.88690185546875, 1.9639434814453125, 2.040985107421875, 2.1180267333984375, 2.195068359375, 2.2721099853515625, 2.349151611328125, 2.4261932373046875, 2.50323486328125, 2.5802764892578125, 2.657318115234375, 2.7343597412109375, 2.8114013671875, 2.8884429931640625, 2.965484619140625, 3.0425262451171875, 3.11956787109375, 3.1966094970703125, 3.273651123046875, 3.3506927490234375, 3.427734375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 7.0, 16.0, 18.0, 16.0, 54.0, 70.0, 83.0, 106.0, 117.0, 133.0, 101.0, 69.0, 71.0, 38.0, 34.0, 19.0, 12.0, 13.0, 5.0, 6.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.556640625, -2.4814453125, -2.40625, -2.3310546875, -2.255859375, -2.1806640625, -2.10546875, -2.0302734375, -1.955078125, -1.8798828125, -1.8046875, -1.7294921875, -1.654296875, -1.5791015625, -1.50390625, -1.4287109375, -1.353515625, -1.2783203125, -1.203125, -1.1279296875, -1.052734375, -0.9775390625, -0.90234375, -0.8271484375, -0.751953125, -0.6767578125, -0.6015625, -0.5263671875, -0.451171875, -0.3759765625, -0.30078125, -0.2255859375, -0.150390625, -0.0751953125, 0.0, 0.0751953125, 0.150390625, 0.2255859375, 0.30078125, 0.3759765625, 0.451171875, 0.5263671875, 0.6015625, 0.6767578125, 0.751953125, 0.8271484375, 0.90234375, 0.9775390625, 1.052734375, 1.1279296875, 1.203125, 1.2783203125, 1.353515625, 1.4287109375, 1.50390625, 1.5791015625, 1.654296875, 1.7294921875, 1.8046875, 1.8798828125, 1.955078125, 2.0302734375, 2.10546875, 2.1806640625, 2.255859375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 7.0, 12.0, 7.0, 9.0, 16.0, 30.0, 58.0, 80.0, 100.0, 191.0, 189.0, 102.0, 57.0, 53.0, 38.0, 18.0, 8.0, 9.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.0823917388916, -27.87055206298828, -26.65871238708496, -25.44687271118164, -24.23503303527832, -23.023193359375, -21.811351776123047, -20.59951400756836, -19.387672424316406, -18.175832748413086, -16.963993072509766, -15.752153396606445, -14.540313720703125, -13.328474044799805, -12.116633415222168, -10.904793739318848, -9.692955017089844, -8.481115341186523, -7.269275665283203, -6.057435512542725, -4.845595836639404, -3.633756160736084, -2.4219160079956055, -1.2100763320922852, 0.0017633438110351562, 1.213603138923645, 2.425442934036255, 3.6372828483581543, 4.849122524261475, 6.060962200164795, 7.272802352905273, 8.484642028808594, 9.696483612060547, 10.908323287963867, 12.120162963867188, 13.332002639770508, 14.543842315673828, 15.755681991577148, 16.96752166748047, 18.179363250732422, 19.39120101928711, 20.60304069519043, 21.81488037109375, 23.02672004699707, 24.23855972290039, 25.45039939880371, 26.66223907470703, 27.874080657958984, 29.085920333862305, 30.297760009765625, 31.509599685668945, 32.721439361572266, 33.93328094482422, 35.145118713378906, 36.35696029663086, 37.56879806518555, 38.7806396484375, 39.99248123168945, 41.20431900024414, 42.416160583496094, 43.62799835205078, 44.839839935302734, 46.05167770385742, 47.263519287109375, 48.47535705566406]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 8.0, 3.0, 7.0, 13.0, 12.0, 13.0, 13.0, 23.0, 23.0, 26.0, 29.0, 28.0, 42.0, 35.0, 32.0, 48.0, 55.0, 64.0, 83.0, 64.0, 59.0, 48.0, 24.0, 27.0, 18.0, 23.0, 22.0, 30.0, 24.0, 16.0, 13.0, 10.0, 11.0, 17.0, 7.0, 7.0, 3.0, 7.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-40.69568634033203, -39.576744079589844, -38.45780563354492, -37.3388671875, -36.21992492675781, -35.100982666015625, -33.9820442199707, -32.86310577392578, -31.744163513183594, -30.62522315979004, -29.506282806396484, -28.38734245300293, -27.268402099609375, -26.14946174621582, -25.030521392822266, -23.91158103942871, -22.792640686035156, -21.6737003326416, -20.554759979248047, -19.435819625854492, -18.316879272460938, -17.197938919067383, -16.078998565673828, -14.960058212280273, -13.841117858886719, -12.722177505493164, -11.60323715209961, -10.484296798706055, -9.3653564453125, -8.246416091918945, -7.127475738525391, -6.008535385131836, -4.889596939086914, -3.7706565856933594, -2.6517162322998047, -1.53277587890625, -0.4138355255126953, 0.7051048278808594, 1.824045181274414, 2.9429855346679688, 4.061925888061523, 5.180866241455078, 6.299806594848633, 7.4187469482421875, 8.537687301635742, 9.656627655029297, 10.775568008422852, 11.894508361816406, 13.013448715209961, 14.132389068603516, 15.25132942199707, 16.370269775390625, 17.48921012878418, 18.608150482177734, 19.72709083557129, 20.846031188964844, 21.9649715423584, 23.083911895751953, 24.202852249145508, 25.321792602539062, 26.440732955932617, 27.559673309326172, 28.678613662719727, 29.79755401611328, 30.916494369506836]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 8.0, 6.0, 11.0, 17.0, 52.0, 77.0, 143.0, 316.0, 714.0, 1704.0, 5211.0, 24775.0, 374511.0, 3341066.0, 410406.0, 27055.0, 5230.0, 1619.0, 688.0, 291.0, 156.0, 94.0, 46.0, 28.0, 20.0, 11.0, 11.0, 9.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5234375, -4.37518310546875, -4.2269287109375, -4.07867431640625, -3.930419921875, -3.78216552734375, -3.6339111328125, -3.48565673828125, -3.33740234375, -3.18914794921875, -3.0408935546875, -2.89263916015625, -2.744384765625, -2.59613037109375, -2.4478759765625, -2.29962158203125, -2.1513671875, -2.00311279296875, -1.8548583984375, -1.70660400390625, -1.558349609375, -1.41009521484375, -1.2618408203125, -1.11358642578125, -0.96533203125, -0.81707763671875, -0.6688232421875, -0.52056884765625, -0.372314453125, -0.22406005859375, -0.0758056640625, 0.07244873046875, 0.220703125, 0.36895751953125, 0.5172119140625, 0.66546630859375, 0.813720703125, 0.96197509765625, 1.1102294921875, 1.25848388671875, 1.40673828125, 1.55499267578125, 1.7032470703125, 1.85150146484375, 1.999755859375, 2.14801025390625, 2.2962646484375, 2.44451904296875, 2.5927734375, 2.74102783203125, 2.8892822265625, 3.03753662109375, 3.185791015625, 3.33404541015625, 3.4822998046875, 3.63055419921875, 3.77880859375, 3.92706298828125, 4.0753173828125, 4.22357177734375, 4.371826171875, 4.52008056640625, 4.6683349609375, 4.81658935546875, 4.96484375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 7.0, 5.0, 10.0, 6.0, 15.0, 22.0, 23.0, 16.0, 23.0, 33.0, 24.0, 39.0, 43.0, 43.0, 59.0, 57.0, 47.0, 67.0, 42.0, 59.0, 50.0, 44.0, 47.0, 35.0, 34.0, 29.0, 25.0, 27.0, 23.0, 17.0, 12.0, 5.0, 9.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.943359375, -2.849212646484375, -2.75506591796875, -2.660919189453125, -2.5667724609375, -2.472625732421875, -2.37847900390625, -2.284332275390625, -2.190185546875, -2.096038818359375, -2.00189208984375, -1.907745361328125, -1.8135986328125, -1.719451904296875, -1.62530517578125, -1.531158447265625, -1.43701171875, -1.342864990234375, -1.24871826171875, -1.154571533203125, -1.0604248046875, -0.966278076171875, -0.87213134765625, -0.777984619140625, -0.683837890625, -0.589691162109375, -0.49554443359375, -0.401397705078125, -0.3072509765625, -0.213104248046875, -0.11895751953125, -0.024810791015625, 0.0693359375, 0.163482666015625, 0.25762939453125, 0.351776123046875, 0.4459228515625, 0.540069580078125, 0.63421630859375, 0.728363037109375, 0.822509765625, 0.916656494140625, 1.01080322265625, 1.104949951171875, 1.1990966796875, 1.293243408203125, 1.38739013671875, 1.481536865234375, 1.57568359375, 1.669830322265625, 1.76397705078125, 1.858123779296875, 1.9522705078125, 2.046417236328125, 2.14056396484375, 2.234710693359375, 2.328857421875, 2.423004150390625, 2.51715087890625, 2.611297607421875, 2.7054443359375, 2.799591064453125, 2.89373779296875, 2.987884521484375, 3.08203125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 9.0, 5.0, 4.0, 5.0, 17.0, 14.0, 17.0, 21.0, 37.0, 68.0, 81.0, 191.0, 376.0, 893.0, 2779.0, 12253.0, 105383.0, 3474313.0, 560746.0, 28926.0, 5379.0, 1542.0, 589.0, 275.0, 110.0, 77.0, 45.0, 29.0, 26.0, 18.0, 8.0, 10.0, 7.0, 6.0, 8.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.828125, -5.63848876953125, -5.4488525390625, -5.25921630859375, -5.069580078125, -4.87994384765625, -4.6903076171875, -4.50067138671875, -4.31103515625, -4.12139892578125, -3.9317626953125, -3.74212646484375, -3.552490234375, -3.36285400390625, -3.1732177734375, -2.98358154296875, -2.7939453125, -2.60430908203125, -2.4146728515625, -2.22503662109375, -2.035400390625, -1.84576416015625, -1.6561279296875, -1.46649169921875, -1.27685546875, -1.08721923828125, -0.8975830078125, -0.70794677734375, -0.518310546875, -0.32867431640625, -0.1390380859375, 0.05059814453125, 0.240234375, 0.42987060546875, 0.6195068359375, 0.80914306640625, 0.998779296875, 1.18841552734375, 1.3780517578125, 1.56768798828125, 1.75732421875, 1.94696044921875, 2.1365966796875, 2.32623291015625, 2.515869140625, 2.70550537109375, 2.8951416015625, 3.08477783203125, 3.2744140625, 3.46405029296875, 3.6536865234375, 3.84332275390625, 4.032958984375, 4.22259521484375, 4.4122314453125, 4.60186767578125, 4.79150390625, 4.98114013671875, 5.1707763671875, 5.36041259765625, 5.550048828125, 5.73968505859375, 5.9293212890625, 6.11895751953125, 6.30859375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 4.0, 2.0, 1.0, 6.0, 10.0, 14.0, 20.0, 25.0, 36.0, 56.0, 108.0, 167.0, 264.0, 480.0, 729.0, 779.0, 593.0, 311.0, 190.0, 103.0, 53.0, 38.0, 29.0, 11.0, 14.0, 5.0, 4.0, 11.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.46875, -4.31549072265625, -4.1622314453125, -4.00897216796875, -3.855712890625, -3.70245361328125, -3.5491943359375, -3.39593505859375, -3.24267578125, -3.08941650390625, -2.9361572265625, -2.78289794921875, -2.629638671875, -2.47637939453125, -2.3231201171875, -2.16986083984375, -2.0166015625, -1.86334228515625, -1.7100830078125, -1.55682373046875, -1.403564453125, -1.25030517578125, -1.0970458984375, -0.94378662109375, -0.79052734375, -0.63726806640625, -0.4840087890625, -0.33074951171875, -0.177490234375, -0.02423095703125, 0.1290283203125, 0.28228759765625, 0.435546875, 0.58880615234375, 0.7420654296875, 0.89532470703125, 1.048583984375, 1.20184326171875, 1.3551025390625, 1.50836181640625, 1.66162109375, 1.81488037109375, 1.9681396484375, 2.12139892578125, 2.274658203125, 2.42791748046875, 2.5811767578125, 2.73443603515625, 2.8876953125, 3.04095458984375, 3.1942138671875, 3.34747314453125, 3.500732421875, 3.65399169921875, 3.8072509765625, 3.96051025390625, 4.11376953125, 4.26702880859375, 4.4202880859375, 4.57354736328125, 4.726806640625, 4.88006591796875, 5.0333251953125, 5.18658447265625, 5.33984375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 20.0, 57.0, 160.0, 365.0, 257.0, 90.0, 24.0, 15.0, 9.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.72824096679688, -96.36182403564453, -93.99540710449219, -91.62898254394531, -89.26256561279297, -86.89614868164062, -84.52973175048828, -82.16331481933594, -79.79689025878906, -77.43047332763672, -75.06405639648438, -72.6976318359375, -70.33121490478516, -67.96479797363281, -65.59838104248047, -63.231964111328125, -60.86554718017578, -58.49913024902344, -56.13270950317383, -53.766292572021484, -51.399871826171875, -49.03345489501953, -46.66703796386719, -44.300621032714844, -41.934200286865234, -39.56778335571289, -37.20136260986328, -34.83494567871094, -32.468528747558594, -30.102108001708984, -27.73569107055664, -25.369272232055664, -23.00286102294922, -20.636442184448242, -18.270023345947266, -15.903606414794922, -13.537187576293945, -11.170768737792969, -8.804350852966309, -6.437932968139648, -4.071514129638672, -1.7050957679748535, 0.6613225936889648, 3.027740955352783, 5.394159317016602, 7.760578155517578, 10.126996040344238, 12.493413925170898, 14.859832763671875, 17.22625160217285, 19.592670440673828, 21.959087371826172, 24.32550621032715, 26.691925048828125, 29.05834197998047, 31.424760818481445, 33.79117965698242, 36.157596588134766, 38.524017333984375, 40.89043426513672, 43.25685119628906, 45.62327194213867, 47.989688873291016, 50.356109619140625, 52.72252655029297]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 4.0, 5.0, 7.0, 7.0, 1.0, 7.0, 15.0, 8.0, 16.0, 15.0, 21.0, 26.0, 23.0, 36.0, 30.0, 31.0, 33.0, 49.0, 44.0, 43.0, 44.0, 50.0, 49.0, 52.0, 29.0, 38.0, 39.0, 30.0, 34.0, 27.0, 34.0, 19.0, 23.0, 19.0, 21.0, 15.0, 10.0, 8.0, 7.0, 3.0, 7.0, 5.0, 5.0, 6.0, 0.0, 4.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.181236267089844, -15.639416694641113, -15.0975980758667, -14.555778503417969, -14.013959884643555, -13.472140312194824, -12.930320739746094, -12.38850212097168, -11.846683502197266, -11.304863929748535, -10.763045310974121, -10.22122573852539, -9.679407119750977, -9.137587547302246, -8.595767974853516, -8.053949356079102, -7.512129783630371, -6.970310688018799, -6.428491592407227, -5.886672019958496, -5.344853401184082, -4.803033828735352, -4.261214733123779, -3.719395637512207, -3.1775765419006348, -2.6357574462890625, -2.0939383506774902, -1.5521190166473389, -1.0102999210357666, -0.46848082542419434, 0.07333850860595703, 0.6151576042175293, 1.1569766998291016, 1.6987957954406738, 2.240614891052246, 2.7824342250823975, 3.3242533206939697, 3.866072416305542, 4.407891750335693, 4.949710845947266, 5.491529941558838, 6.03334903717041, 6.575168132781982, 7.116987228393555, 7.658806800842285, 8.2006254196167, 8.74244499206543, 9.284263610839844, 9.826083183288574, 10.367902755737305, 10.909721374511719, 11.45154094696045, 11.993359565734863, 12.535179138183594, 13.076997756958008, 13.618817329406738, 14.160636901855469, 14.7024564743042, 15.244275093078613, 15.786094665527344, 16.327913284301758, 16.869731903076172, 17.41155242919922, 17.953371047973633, 18.495189666748047]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 6.0, 11.0, 11.0, 18.0, 24.0, 38.0, 52.0, 94.0, 176.0, 303.0, 635.0, 1296.0, 2633.0, 6128.0, 15416.0, 44231.0, 137083.0, 401500.0, 297632.0, 91409.0, 29885.0, 11174.0, 4633.0, 2043.0, 981.0, 474.0, 275.0, 140.0, 79.0, 66.0, 30.0, 26.0, 11.0, 11.0, 5.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.59375, -4.45794677734375, -4.3221435546875, -4.18634033203125, -4.050537109375, -3.91473388671875, -3.7789306640625, -3.64312744140625, -3.50732421875, -3.37152099609375, -3.2357177734375, -3.09991455078125, -2.964111328125, -2.82830810546875, -2.6925048828125, -2.55670166015625, -2.4208984375, -2.28509521484375, -2.1492919921875, -2.01348876953125, -1.877685546875, -1.74188232421875, -1.6060791015625, -1.47027587890625, -1.33447265625, -1.19866943359375, -1.0628662109375, -0.92706298828125, -0.791259765625, -0.65545654296875, -0.5196533203125, -0.38385009765625, -0.248046875, -0.11224365234375, 0.0235595703125, 0.15936279296875, 0.295166015625, 0.43096923828125, 0.5667724609375, 0.70257568359375, 0.83837890625, 0.97418212890625, 1.1099853515625, 1.24578857421875, 1.381591796875, 1.51739501953125, 1.6531982421875, 1.78900146484375, 1.9248046875, 2.06060791015625, 2.1964111328125, 2.33221435546875, 2.468017578125, 2.60382080078125, 2.7396240234375, 2.87542724609375, 3.01123046875, 3.14703369140625, 3.2828369140625, 3.41864013671875, 3.554443359375, 3.69024658203125, 3.8260498046875, 3.96185302734375, 4.09765625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 7.0, 4.0, 7.0, 5.0, 14.0, 12.0, 15.0, 22.0, 23.0, 16.0, 33.0, 33.0, 41.0, 43.0, 38.0, 44.0, 53.0, 70.0, 53.0, 53.0, 51.0, 55.0, 51.0, 44.0, 33.0, 29.0, 28.0, 23.0, 22.0, 23.0, 15.0, 12.0, 9.0, 15.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.962890625, -2.86822509765625, -2.7735595703125, -2.67889404296875, -2.584228515625, -2.48956298828125, -2.3948974609375, -2.30023193359375, -2.20556640625, -2.11090087890625, -2.0162353515625, -1.92156982421875, -1.826904296875, -1.73223876953125, -1.6375732421875, -1.54290771484375, -1.4482421875, -1.35357666015625, -1.2589111328125, -1.16424560546875, -1.069580078125, -0.97491455078125, -0.8802490234375, -0.78558349609375, -0.69091796875, -0.59625244140625, -0.5015869140625, -0.40692138671875, -0.312255859375, -0.21759033203125, -0.1229248046875, -0.02825927734375, 0.06640625, 0.16107177734375, 0.2557373046875, 0.35040283203125, 0.445068359375, 0.53973388671875, 0.6343994140625, 0.72906494140625, 0.82373046875, 0.91839599609375, 1.0130615234375, 1.10772705078125, 1.202392578125, 1.29705810546875, 1.3917236328125, 1.48638916015625, 1.5810546875, 1.67572021484375, 1.7703857421875, 1.86505126953125, 1.959716796875, 2.05438232421875, 2.1490478515625, 2.24371337890625, 2.33837890625, 2.43304443359375, 2.5277099609375, 2.62237548828125, 2.717041015625, 2.81170654296875, 2.9063720703125, 3.00103759765625, 3.095703125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 5.0, 8.0, 4.0, 10.0, 16.0, 18.0, 28.0, 32.0, 34.0, 60.0, 73.0, 113.0, 152.0, 260.0, 376.0, 637.0, 1274.0, 2823.0, 8278.0, 31533.0, 167683.0, 682594.0, 117367.0, 23774.0, 6328.0, 2387.0, 1057.0, 587.0, 328.0, 206.0, 141.0, 112.0, 68.0, 49.0, 45.0, 23.0, 22.0, 10.0, 11.0, 11.0, 7.0, 4.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.48046875, -6.28643798828125, -6.0924072265625, -5.89837646484375, -5.704345703125, -5.51031494140625, -5.3162841796875, -5.12225341796875, -4.92822265625, -4.73419189453125, -4.5401611328125, -4.34613037109375, -4.152099609375, -3.95806884765625, -3.7640380859375, -3.57000732421875, -3.3759765625, -3.18194580078125, -2.9879150390625, -2.79388427734375, -2.599853515625, -2.40582275390625, -2.2117919921875, -2.01776123046875, -1.82373046875, -1.62969970703125, -1.4356689453125, -1.24163818359375, -1.047607421875, -0.85357666015625, -0.6595458984375, -0.46551513671875, -0.271484375, -0.07745361328125, 0.1165771484375, 0.31060791015625, 0.504638671875, 0.69866943359375, 0.8927001953125, 1.08673095703125, 1.28076171875, 1.47479248046875, 1.6688232421875, 1.86285400390625, 2.056884765625, 2.25091552734375, 2.4449462890625, 2.63897705078125, 2.8330078125, 3.02703857421875, 3.2210693359375, 3.41510009765625, 3.609130859375, 3.80316162109375, 3.9971923828125, 4.19122314453125, 4.38525390625, 4.57928466796875, 4.7733154296875, 4.96734619140625, 5.161376953125, 5.35540771484375, 5.5494384765625, 5.74346923828125, 5.9375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 5.0, 5.0, 7.0, 8.0, 5.0, 19.0, 18.0, 25.0, 25.0, 37.0, 35.0, 29.0, 33.0, 37.0, 50.0, 48.0, 44.0, 41.0, 57.0, 38.0, 46.0, 62.0, 53.0, 36.0, 42.0, 27.0, 29.0, 26.0, 18.0, 14.0, 16.0, 9.0, 8.0, 13.0, 7.0, 5.0, 7.0, 1.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1484375, -6.8687744140625, -6.589111328125, -6.3094482421875, -6.02978515625, -5.7501220703125, -5.470458984375, -5.1907958984375, -4.9111328125, -4.6314697265625, -4.351806640625, -4.0721435546875, -3.79248046875, -3.5128173828125, -3.233154296875, -2.9534912109375, -2.673828125, -2.3941650390625, -2.114501953125, -1.8348388671875, -1.55517578125, -1.2755126953125, -0.995849609375, -0.7161865234375, -0.4365234375, -0.1568603515625, 0.122802734375, 0.4024658203125, 0.68212890625, 0.9617919921875, 1.241455078125, 1.5211181640625, 1.80078125, 2.0804443359375, 2.360107421875, 2.6397705078125, 2.91943359375, 3.1990966796875, 3.478759765625, 3.7584228515625, 4.0380859375, 4.3177490234375, 4.597412109375, 4.8770751953125, 5.15673828125, 5.4364013671875, 5.716064453125, 5.9957275390625, 6.275390625, 6.5550537109375, 6.834716796875, 7.1143798828125, 7.39404296875, 7.6737060546875, 7.953369140625, 8.2330322265625, 8.5126953125, 8.7923583984375, 9.072021484375, 9.3516845703125, 9.63134765625, 9.9110107421875, 10.190673828125, 10.4703369140625, 10.75]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 5.0, 16.0, 11.0, 20.0, 29.0, 35.0, 54.0, 89.0, 159.0, 263.0, 652.0, 1682.0, 5683.0, 24915.0, 159605.0, 762547.0, 73188.0, 13775.0, 3595.0, 1183.0, 449.0, 231.0, 128.0, 72.0, 46.0, 40.0, 25.0, 12.0, 12.0, 10.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.25390625, -2.1882171630859375, -2.122528076171875, -2.0568389892578125, -1.99114990234375, -1.9254608154296875, -1.859771728515625, -1.7940826416015625, -1.7283935546875, -1.6627044677734375, -1.597015380859375, -1.5313262939453125, -1.46563720703125, -1.3999481201171875, -1.334259033203125, -1.2685699462890625, -1.202880859375, -1.1371917724609375, -1.071502685546875, -1.0058135986328125, -0.94012451171875, -0.8744354248046875, -0.808746337890625, -0.7430572509765625, -0.6773681640625, -0.6116790771484375, -0.545989990234375, -0.4803009033203125, -0.41461181640625, -0.3489227294921875, -0.283233642578125, -0.2175445556640625, -0.15185546875, -0.0861663818359375, -0.020477294921875, 0.0452117919921875, 0.11090087890625, 0.1765899658203125, 0.242279052734375, 0.3079681396484375, 0.3736572265625, 0.4393463134765625, 0.505035400390625, 0.5707244873046875, 0.63641357421875, 0.7021026611328125, 0.767791748046875, 0.8334808349609375, 0.899169921875, 0.9648590087890625, 1.030548095703125, 1.0962371826171875, 1.16192626953125, 1.2276153564453125, 1.293304443359375, 1.3589935302734375, 1.4246826171875, 1.4903717041015625, 1.556060791015625, 1.6217498779296875, 1.68743896484375, 1.7531280517578125, 1.818817138671875, 1.8845062255859375, 1.9501953125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 5.0, 5.0, 2.0, 6.0, 0.0, 9.0, 17.0, 17.0, 15.0, 17.0, 23.0, 29.0, 36.0, 53.0, 73.0, 101.0, 121.0, 113.0, 93.0, 58.0, 33.0, 27.0, 20.0, 32.0, 19.0, 18.0, 6.0, 6.0, 4.0, 11.0, 6.0, 11.0, 6.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002930164337158203, -0.0002831853926181793, -0.00027335435152053833, -0.00026352331042289734, -0.00025369226932525635, -0.00024386122822761536, -0.00023403018712997437, -0.00022419914603233337, -0.00021436810493469238, -0.0002045370638370514, -0.0001947060227394104, -0.0001848749816417694, -0.00017504394054412842, -0.00016521289944648743, -0.00015538185834884644, -0.00014555081725120544, -0.00013571977615356445, -0.00012588873505592346, -0.00011605769395828247, -0.00010622665286064148, -9.639561176300049e-05, -8.65645706653595e-05, -7.67335295677185e-05, -6.690248847007751e-05, -5.7071447372436523e-05, -4.724040627479553e-05, -3.740936517715454e-05, -2.757832407951355e-05, -1.774728298187256e-05, -7.916241884231567e-06, 1.914799213409424e-06, 1.1745840311050415e-05, 2.1576881408691406e-05, 3.14079225063324e-05, 4.123896360397339e-05, 5.107000470161438e-05, 6.090104579925537e-05, 7.073208689689636e-05, 8.056312799453735e-05, 9.039416909217834e-05, 0.00010022521018981934, 0.00011005625128746033, 0.00011988729238510132, 0.0001297183334827423, 0.0001395493745803833, 0.0001493804156780243, 0.00015921145677566528, 0.00016904249787330627, 0.00017887353897094727, 0.00018870458006858826, 0.00019853562116622925, 0.00020836666226387024, 0.00021819770336151123, 0.00022802874445915222, 0.0002378597855567932, 0.0002476908266544342, 0.0002575218677520752, 0.0002673529088497162, 0.0002771839499473572, 0.00028701499104499817, 0.00029684603214263916, 0.00030667707324028015, 0.00031650811433792114, 0.00032633915543556213, 0.0003361701965332031]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 9.0, 19.0, 15.0, 26.0, 26.0, 41.0, 70.0, 109.0, 142.0, 189.0, 293.0, 533.0, 950.0, 1844.0, 4051.0, 9956.0, 27631.0, 92880.0, 608658.0, 217870.0, 53260.0, 17290.0, 6508.0, 2857.0, 1355.0, 759.0, 404.0, 277.0, 156.0, 117.0, 79.0, 44.0, 40.0, 26.0, 17.0, 8.0, 13.0, 13.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.5712890625, -1.527374267578125, -1.48345947265625, -1.439544677734375, -1.3956298828125, -1.351715087890625, -1.30780029296875, -1.263885498046875, -1.219970703125, -1.176055908203125, -1.13214111328125, -1.088226318359375, -1.0443115234375, -1.000396728515625, -0.95648193359375, -0.912567138671875, -0.86865234375, -0.824737548828125, -0.78082275390625, -0.736907958984375, -0.6929931640625, -0.649078369140625, -0.60516357421875, -0.561248779296875, -0.517333984375, -0.473419189453125, -0.42950439453125, -0.385589599609375, -0.3416748046875, -0.297760009765625, -0.25384521484375, -0.209930419921875, -0.166015625, -0.122100830078125, -0.07818603515625, -0.034271240234375, 0.0096435546875, 0.053558349609375, 0.09747314453125, 0.141387939453125, 0.185302734375, 0.229217529296875, 0.27313232421875, 0.317047119140625, 0.3609619140625, 0.404876708984375, 0.44879150390625, 0.492706298828125, 0.53662109375, 0.580535888671875, 0.62445068359375, 0.668365478515625, 0.7122802734375, 0.756195068359375, 0.80010986328125, 0.844024658203125, 0.887939453125, 0.931854248046875, 0.97576904296875, 1.019683837890625, 1.0635986328125, 1.107513427734375, 1.15142822265625, 1.195343017578125, 1.2392578125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 12.0, 6.0, 18.0, 13.0, 19.0, 21.0, 30.0, 35.0, 57.0, 77.0, 76.0, 106.0, 110.0, 115.0, 66.0, 51.0, 36.0, 31.0, 26.0, 18.0, 11.0, 13.0, 11.0, 9.0, 9.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.228515625, -2.16845703125, -2.1083984375, -2.04833984375, -1.98828125, -1.92822265625, -1.8681640625, -1.80810546875, -1.748046875, -1.68798828125, -1.6279296875, -1.56787109375, -1.5078125, -1.44775390625, -1.3876953125, -1.32763671875, -1.267578125, -1.20751953125, -1.1474609375, -1.08740234375, -1.02734375, -0.96728515625, -0.9072265625, -0.84716796875, -0.787109375, -0.72705078125, -0.6669921875, -0.60693359375, -0.546875, -0.48681640625, -0.4267578125, -0.36669921875, -0.306640625, -0.24658203125, -0.1865234375, -0.12646484375, -0.06640625, -0.00634765625, 0.0537109375, 0.11376953125, 0.173828125, 0.23388671875, 0.2939453125, 0.35400390625, 0.4140625, 0.47412109375, 0.5341796875, 0.59423828125, 0.654296875, 0.71435546875, 0.7744140625, 0.83447265625, 0.89453125, 0.95458984375, 1.0146484375, 1.07470703125, 1.134765625, 1.19482421875, 1.2548828125, 1.31494140625, 1.375, 1.43505859375, 1.4951171875, 1.55517578125, 1.615234375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 8.0, 4.0, 20.0, 45.0, 99.0, 198.0, 384.0, 129.0, 62.0, 23.0, 18.0, 3.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-73.13159942626953, -71.11799621582031, -69.1043930053711, -67.09078979492188, -65.07719421386719, -63.0635871887207, -61.04998779296875, -59.03638458251953, -57.02278137207031, -55.009178161621094, -52.995574951171875, -50.98197555541992, -48.9683723449707, -46.954769134521484, -44.94116973876953, -42.92756652832031, -40.913963317871094, -38.900360107421875, -36.886756896972656, -34.8731575012207, -32.859554290771484, -30.845951080322266, -28.83234977722168, -26.818748474121094, -24.805145263671875, -22.791542053222656, -20.77794075012207, -18.764339447021484, -16.750736236572266, -14.737133979797363, -12.723531723022461, -10.709929466247559, -8.696327209472656, -6.682724952697754, -4.669122695922852, -2.655520439147949, -0.6419181823730469, 1.3716840744018555, 3.385286331176758, 5.39888858795166, 7.4124908447265625, 9.426093101501465, 11.439695358276367, 13.45329761505127, 15.466899871826172, 17.48050308227539, 19.494104385375977, 21.507705688476562, 23.52130889892578, 25.534912109375, 27.548513412475586, 29.562114715576172, 31.57571792602539, 33.58932113647461, 35.60292053222656, 37.61652374267578, 39.630126953125, 41.64373016357422, 43.65733337402344, 45.67093276977539, 47.68453598022461, 49.69813919067383, 51.71173858642578, 53.725341796875, 55.73894500732422]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 0.0, 3.0, 4.0, 8.0, 9.0, 12.0, 14.0, 19.0, 16.0, 19.0, 23.0, 26.0, 26.0, 32.0, 26.0, 34.0, 31.0, 51.0, 93.0, 111.0, 81.0, 50.0, 57.0, 43.0, 30.0, 27.0, 20.0, 21.0, 23.0, 19.0, 17.0, 10.0, 7.0, 12.0, 6.0, 9.0, 5.0, 5.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-35.92427062988281, -34.7377815246582, -33.55128860473633, -32.36479949951172, -31.17831039428711, -29.991819381713867, -28.805328369140625, -27.618839263916016, -26.432348251342773, -25.24585723876953, -24.059368133544922, -22.87287712097168, -21.686386108398438, -20.499897003173828, -19.313405990600586, -18.126914978027344, -16.940425872802734, -15.753935813903809, -14.567445755004883, -13.38095474243164, -12.194464683532715, -11.007974624633789, -9.821483612060547, -8.634993553161621, -7.448503494262695, -6.2620134353637695, -5.0755228996276855, -3.8890326023101807, -2.702542304992676, -1.51605224609375, -0.329561710357666, 0.856928825378418, 2.043415069580078, 3.229905366897583, 4.416395664215088, 5.602886199951172, 6.789376258850098, 7.975866317749023, 9.162357330322266, 10.348847389221191, 11.535337448120117, 12.721827507019043, 13.908317565917969, 15.094808578491211, 16.281299591064453, 17.467788696289062, 18.654279708862305, 19.840770721435547, 21.027259826660156, 22.2137508392334, 23.400239944458008, 24.58673095703125, 25.77322006225586, 26.9597110748291, 28.146202087402344, 29.332691192626953, 30.519182205200195, 31.705673217773438, 32.89216232299805, 34.078651428222656, 35.26514434814453, 36.45163345336914, 37.63812255859375, 38.824615478515625, 40.011104583740234]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 6.0, 7.0, 16.0, 10.0, 20.0, 20.0, 27.0, 52.0, 68.0, 113.0, 151.0, 206.0, 359.0, 624.0, 1066.0, 1827.0, 3615.0, 7641.0, 20696.0, 76646.0, 359744.0, 1489544.0, 1664994.0, 428151.0, 95243.0, 25399.0, 9187.0, 3929.0, 2105.0, 1119.0, 663.0, 353.0, 220.0, 137.0, 100.0, 71.0, 48.0, 35.0, 30.0, 8.0, 9.0, 5.0, 7.0, 3.0, 2.0, 1.0, 0.0, 6.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.408203125, -2.335357666015625, -2.26251220703125, -2.189666748046875, -2.1168212890625, -2.043975830078125, -1.97113037109375, -1.898284912109375, -1.825439453125, -1.752593994140625, -1.67974853515625, -1.606903076171875, -1.5340576171875, -1.461212158203125, -1.38836669921875, -1.315521240234375, -1.24267578125, -1.169830322265625, -1.09698486328125, -1.024139404296875, -0.9512939453125, -0.878448486328125, -0.80560302734375, -0.732757568359375, -0.659912109375, -0.587066650390625, -0.51422119140625, -0.441375732421875, -0.3685302734375, -0.295684814453125, -0.22283935546875, -0.149993896484375, -0.0771484375, -0.004302978515625, 0.06854248046875, 0.141387939453125, 0.2142333984375, 0.287078857421875, 0.35992431640625, 0.432769775390625, 0.505615234375, 0.578460693359375, 0.65130615234375, 0.724151611328125, 0.7969970703125, 0.869842529296875, 0.94268798828125, 1.015533447265625, 1.08837890625, 1.161224365234375, 1.23406982421875, 1.306915283203125, 1.3797607421875, 1.452606201171875, 1.52545166015625, 1.598297119140625, 1.671142578125, 1.743988037109375, 1.81683349609375, 1.889678955078125, 1.9625244140625, 2.035369873046875, 2.10821533203125, 2.181060791015625, 2.25390625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 4.0, 8.0, 6.0, 11.0, 15.0, 9.0, 12.0, 15.0, 22.0, 18.0, 17.0, 25.0, 32.0, 31.0, 34.0, 36.0, 31.0, 47.0, 41.0, 56.0, 57.0, 37.0, 37.0, 41.0, 33.0, 47.0, 43.0, 40.0, 31.0, 24.0, 24.0, 23.0, 13.0, 12.0, 8.0, 17.0, 12.0, 8.0, 8.0, 6.0, 2.0, 4.0, 0.0, 4.0, 1.0, 1.0, 2.0], "bins": [-2.90234375, -2.8245849609375, -2.746826171875, -2.6690673828125, -2.59130859375, -2.5135498046875, -2.435791015625, -2.3580322265625, -2.2802734375, -2.2025146484375, -2.124755859375, -2.0469970703125, -1.96923828125, -1.8914794921875, -1.813720703125, -1.7359619140625, -1.658203125, -1.5804443359375, -1.502685546875, -1.4249267578125, -1.34716796875, -1.2694091796875, -1.191650390625, -1.1138916015625, -1.0361328125, -0.9583740234375, -0.880615234375, -0.8028564453125, -0.72509765625, -0.6473388671875, -0.569580078125, -0.4918212890625, -0.4140625, -0.3363037109375, -0.258544921875, -0.1807861328125, -0.10302734375, -0.0252685546875, 0.052490234375, 0.1302490234375, 0.2080078125, 0.2857666015625, 0.363525390625, 0.4412841796875, 0.51904296875, 0.5968017578125, 0.674560546875, 0.7523193359375, 0.830078125, 0.9078369140625, 0.985595703125, 1.0633544921875, 1.14111328125, 1.2188720703125, 1.296630859375, 1.3743896484375, 1.4521484375, 1.5299072265625, 1.607666015625, 1.6854248046875, 1.76318359375, 1.8409423828125, 1.918701171875, 1.9964599609375, 2.07421875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 9.0, 6.0, 4.0, 11.0, 12.0, 15.0, 23.0, 22.0, 42.0, 65.0, 102.0, 167.0, 319.0, 672.0, 1806.0, 6048.0, 30541.0, 378550.0, 3507842.0, 236635.0, 23475.0, 4958.0, 1599.0, 614.0, 269.0, 165.0, 85.0, 51.0, 27.0, 35.0, 26.0, 12.0, 21.0, 16.0, 5.0, 2.0, 4.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.296875, -5.133544921875, -4.97021484375, -4.806884765625, -4.6435546875, -4.480224609375, -4.31689453125, -4.153564453125, -3.990234375, -3.826904296875, -3.66357421875, -3.500244140625, -3.3369140625, -3.173583984375, -3.01025390625, -2.846923828125, -2.68359375, -2.520263671875, -2.35693359375, -2.193603515625, -2.0302734375, -1.866943359375, -1.70361328125, -1.540283203125, -1.376953125, -1.213623046875, -1.05029296875, -0.886962890625, -0.7236328125, -0.560302734375, -0.39697265625, -0.233642578125, -0.0703125, 0.093017578125, 0.25634765625, 0.419677734375, 0.5830078125, 0.746337890625, 0.90966796875, 1.072998046875, 1.236328125, 1.399658203125, 1.56298828125, 1.726318359375, 1.8896484375, 2.052978515625, 2.21630859375, 2.379638671875, 2.54296875, 2.706298828125, 2.86962890625, 3.032958984375, 3.1962890625, 3.359619140625, 3.52294921875, 3.686279296875, 3.849609375, 4.012939453125, 4.17626953125, 4.339599609375, 4.5029296875, 4.666259765625, 4.82958984375, 4.992919921875, 5.15625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 7.0, 3.0, 4.0, 2.0, 12.0, 11.0, 25.0, 30.0, 37.0, 76.0, 118.0, 182.0, 271.0, 485.0, 675.0, 729.0, 546.0, 323.0, 202.0, 109.0, 73.0, 39.0, 30.0, 22.0, 18.0, 16.0, 9.0, 13.0, 7.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.73828125, -5.579833984375, -5.42138671875, -5.262939453125, -5.1044921875, -4.946044921875, -4.78759765625, -4.629150390625, -4.470703125, -4.312255859375, -4.15380859375, -3.995361328125, -3.8369140625, -3.678466796875, -3.52001953125, -3.361572265625, -3.203125, -3.044677734375, -2.88623046875, -2.727783203125, -2.5693359375, -2.410888671875, -2.25244140625, -2.093994140625, -1.935546875, -1.777099609375, -1.61865234375, -1.460205078125, -1.3017578125, -1.143310546875, -0.98486328125, -0.826416015625, -0.66796875, -0.509521484375, -0.35107421875, -0.192626953125, -0.0341796875, 0.124267578125, 0.28271484375, 0.441162109375, 0.599609375, 0.758056640625, 0.91650390625, 1.074951171875, 1.2333984375, 1.391845703125, 1.55029296875, 1.708740234375, 1.8671875, 2.025634765625, 2.18408203125, 2.342529296875, 2.5009765625, 2.659423828125, 2.81787109375, 2.976318359375, 3.134765625, 3.293212890625, 3.45166015625, 3.610107421875, 3.7685546875, 3.927001953125, 4.08544921875, 4.243896484375, 4.40234375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 14.0, 14.0, 41.0, 106.0, 241.0, 284.0, 193.0, 64.0, 23.0, 14.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.05078887939453, -76.99044799804688, -74.93010711669922, -72.86976623535156, -70.80943298339844, -68.74909210205078, -66.68875122070312, -64.62841033935547, -62.56806945800781, -60.507728576660156, -58.4473876953125, -56.38705062866211, -54.32670974731445, -52.2663688659668, -50.206031799316406, -48.14569091796875, -46.085350036621094, -44.02500915527344, -41.96466827392578, -39.90433120727539, -37.843990325927734, -35.78364944458008, -33.72331237792969, -31.66297149658203, -29.602630615234375, -27.54228973388672, -25.481950759887695, -23.421611785888672, -21.361270904541016, -19.30093002319336, -17.240591049194336, -15.180251121520996, -13.119911193847656, -11.059571266174316, -8.999231338500977, -6.938891410827637, -4.878551483154297, -2.818211555480957, -0.7578716278076172, 1.3024682998657227, 3.3628082275390625, 5.423148155212402, 7.483488082885742, 9.543828010559082, 11.604167938232422, 13.664507865905762, 15.724847793579102, 17.785186767578125, 19.84552764892578, 21.905868530273438, 23.96620750427246, 26.026546478271484, 28.08688735961914, 30.147228240966797, 32.20756530761719, 34.267906188964844, 36.3282470703125, 38.388587951660156, 40.44892883300781, 42.5092658996582, 44.56960678100586, 46.629947662353516, 48.690284729003906, 50.75062561035156, 52.81096649169922]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 8.0, 2.0, 14.0, 14.0, 23.0, 16.0, 19.0, 23.0, 34.0, 44.0, 47.0, 53.0, 57.0, 38.0, 53.0, 52.0, 46.0, 70.0, 59.0, 43.0, 52.0, 37.0, 27.0, 29.0, 22.0, 31.0, 14.0, 16.0, 10.0, 10.0, 7.0, 9.0, 3.0, 3.0, 3.0, 2.0, 1.0, 5.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-29.087732315063477, -28.290224075317383, -27.492713928222656, -26.695205688476562, -25.89769744873047, -25.100187301635742, -24.30267906188965, -23.505168914794922, -22.707660675048828, -21.910152435302734, -21.112642288208008, -20.315134048461914, -19.517623901367188, -18.720115661621094, -17.922607421875, -17.125099182128906, -16.32758903503418, -15.53007984161377, -14.73257064819336, -13.935062408447266, -13.137553215026855, -12.340044021606445, -11.542535781860352, -10.745026588439941, -9.947517395019531, -9.150008201599121, -8.352499008178711, -7.554990768432617, -6.757481575012207, -5.959972381591797, -5.162463665008545, -4.364954948425293, -3.56744384765625, -2.769934892654419, -1.972425937652588, -1.1749169826507568, -0.3774080276489258, 0.4201009273529053, 1.2176098823547363, 2.0151185989379883, 2.8126277923583984, 3.6101367473602295, 4.4076457023620605, 5.2051544189453125, 6.002663612365723, 6.800172805786133, 7.597681522369385, 8.395190238952637, 9.192699432373047, 9.990208625793457, 10.787717819213867, 11.585226058959961, 12.382735252380371, 13.180244445800781, 13.977752685546875, 14.775261878967285, 15.572771072387695, 16.37027931213379, 17.167789459228516, 17.96529769897461, 18.762805938720703, 19.56031608581543, 20.357824325561523, 21.15533447265625, 21.952842712402344]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 2.0, 4.0, 6.0, 8.0, 3.0, 20.0, 36.0, 49.0, 81.0, 153.0, 271.0, 504.0, 952.0, 2000.0, 4427.0, 10866.0, 30679.0, 108995.0, 437382.0, 333240.0, 79040.0, 23961.0, 8658.0, 3712.0, 1683.0, 820.0, 404.0, 254.0, 135.0, 77.0, 42.0, 27.0, 17.0, 16.0, 13.0, 7.0, 7.0, 4.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-6.6015625, -6.42730712890625, -6.2530517578125, -6.07879638671875, -5.904541015625, -5.73028564453125, -5.5560302734375, -5.38177490234375, -5.20751953125, -5.03326416015625, -4.8590087890625, -4.68475341796875, -4.510498046875, -4.33624267578125, -4.1619873046875, -3.98773193359375, -3.8134765625, -3.63922119140625, -3.4649658203125, -3.29071044921875, -3.116455078125, -2.94219970703125, -2.7679443359375, -2.59368896484375, -2.41943359375, -2.24517822265625, -2.0709228515625, -1.89666748046875, -1.722412109375, -1.54815673828125, -1.3739013671875, -1.19964599609375, -1.025390625, -0.85113525390625, -0.6768798828125, -0.50262451171875, -0.328369140625, -0.15411376953125, 0.0201416015625, 0.19439697265625, 0.36865234375, 0.54290771484375, 0.7171630859375, 0.89141845703125, 1.065673828125, 1.23992919921875, 1.4141845703125, 1.58843994140625, 1.7626953125, 1.93695068359375, 2.1112060546875, 2.28546142578125, 2.459716796875, 2.63397216796875, 2.8082275390625, 2.98248291015625, 3.15673828125, 3.33099365234375, 3.5052490234375, 3.67950439453125, 3.853759765625, 4.02801513671875, 4.2022705078125, 4.37652587890625, 4.55078125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 4.0, 3.0, 5.0, 9.0, 5.0, 9.0, 15.0, 22.0, 26.0, 34.0, 28.0, 35.0, 39.0, 41.0, 52.0, 57.0, 54.0, 81.0, 53.0, 57.0, 59.0, 57.0, 44.0, 49.0, 37.0, 26.0, 23.0, 23.0, 13.0, 12.0, 11.0, 13.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-4.6015625, -4.49371337890625, -4.3858642578125, -4.27801513671875, -4.170166015625, -4.06231689453125, -3.9544677734375, -3.84661865234375, -3.73876953125, -3.63092041015625, -3.5230712890625, -3.41522216796875, -3.307373046875, -3.19952392578125, -3.0916748046875, -2.98382568359375, -2.8759765625, -2.76812744140625, -2.6602783203125, -2.55242919921875, -2.444580078125, -2.33673095703125, -2.2288818359375, -2.12103271484375, -2.01318359375, -1.90533447265625, -1.7974853515625, -1.68963623046875, -1.581787109375, -1.47393798828125, -1.3660888671875, -1.25823974609375, -1.150390625, -1.04254150390625, -0.9346923828125, -0.82684326171875, -0.718994140625, -0.61114501953125, -0.5032958984375, -0.39544677734375, -0.28759765625, -0.17974853515625, -0.0718994140625, 0.03594970703125, 0.143798828125, 0.25164794921875, 0.3594970703125, 0.46734619140625, 0.5751953125, 0.68304443359375, 0.7908935546875, 0.89874267578125, 1.006591796875, 1.11444091796875, 1.2222900390625, 1.33013916015625, 1.43798828125, 1.54583740234375, 1.6536865234375, 1.76153564453125, 1.869384765625, 1.97723388671875, 2.0850830078125, 2.19293212890625, 2.30078125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 3.0, 7.0, 13.0, 11.0, 16.0, 14.0, 26.0, 36.0, 51.0, 71.0, 94.0, 119.0, 166.0, 265.0, 382.0, 652.0, 1241.0, 3178.0, 14094.0, 155440.0, 815560.0, 46062.0, 6522.0, 1997.0, 915.0, 481.0, 316.0, 227.0, 175.0, 122.0, 82.0, 70.0, 39.0, 28.0, 25.0, 16.0, 9.0, 10.0, 8.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.3125, -8.028564453125, -7.74462890625, -7.460693359375, -7.1767578125, -6.892822265625, -6.60888671875, -6.324951171875, -6.041015625, -5.757080078125, -5.47314453125, -5.189208984375, -4.9052734375, -4.621337890625, -4.33740234375, -4.053466796875, -3.76953125, -3.485595703125, -3.20166015625, -2.917724609375, -2.6337890625, -2.349853515625, -2.06591796875, -1.781982421875, -1.498046875, -1.214111328125, -0.93017578125, -0.646240234375, -0.3623046875, -0.078369140625, 0.20556640625, 0.489501953125, 0.7734375, 1.057373046875, 1.34130859375, 1.625244140625, 1.9091796875, 2.193115234375, 2.47705078125, 2.760986328125, 3.044921875, 3.328857421875, 3.61279296875, 3.896728515625, 4.1806640625, 4.464599609375, 4.74853515625, 5.032470703125, 5.31640625, 5.600341796875, 5.88427734375, 6.168212890625, 6.4521484375, 6.736083984375, 7.02001953125, 7.303955078125, 7.587890625, 7.871826171875, 8.15576171875, 8.439697265625, 8.7236328125, 9.007568359375, 9.29150390625, 9.575439453125, 9.859375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 2.0, 5.0, 8.0, 7.0, 8.0, 12.0, 18.0, 29.0, 25.0, 27.0, 21.0, 35.0, 49.0, 49.0, 55.0, 70.0, 63.0, 55.0, 58.0, 50.0, 45.0, 55.0, 36.0, 38.0, 37.0, 25.0, 19.0, 18.0, 11.0, 15.0, 21.0, 8.0, 5.0, 4.0, 5.0, 6.0, 4.0, 3.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-12.8515625, -12.5087890625, -12.166015625, -11.8232421875, -11.48046875, -11.1376953125, -10.794921875, -10.4521484375, -10.109375, -9.7666015625, -9.423828125, -9.0810546875, -8.73828125, -8.3955078125, -8.052734375, -7.7099609375, -7.3671875, -7.0244140625, -6.681640625, -6.3388671875, -5.99609375, -5.6533203125, -5.310546875, -4.9677734375, -4.625, -4.2822265625, -3.939453125, -3.5966796875, -3.25390625, -2.9111328125, -2.568359375, -2.2255859375, -1.8828125, -1.5400390625, -1.197265625, -0.8544921875, -0.51171875, -0.1689453125, 0.173828125, 0.5166015625, 0.859375, 1.2021484375, 1.544921875, 1.8876953125, 2.23046875, 2.5732421875, 2.916015625, 3.2587890625, 3.6015625, 3.9443359375, 4.287109375, 4.6298828125, 4.97265625, 5.3154296875, 5.658203125, 6.0009765625, 6.34375, 6.6865234375, 7.029296875, 7.3720703125, 7.71484375, 8.0576171875, 8.400390625, 8.7431640625, 9.0859375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 4.0, 9.0, 12.0, 7.0, 19.0, 22.0, 40.0, 63.0, 105.0, 225.0, 449.0, 1190.0, 4421.0, 29266.0, 842134.0, 154860.0, 11753.0, 2522.0, 763.0, 308.0, 140.0, 74.0, 63.0, 35.0, 20.0, 16.0, 11.0, 7.0, 2.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8515625, -2.758941650390625, -2.66632080078125, -2.573699951171875, -2.4810791015625, -2.388458251953125, -2.29583740234375, -2.203216552734375, -2.110595703125, -2.017974853515625, -1.92535400390625, -1.832733154296875, -1.7401123046875, -1.647491455078125, -1.55487060546875, -1.462249755859375, -1.36962890625, -1.277008056640625, -1.18438720703125, -1.091766357421875, -0.9991455078125, -0.906524658203125, -0.81390380859375, -0.721282958984375, -0.628662109375, -0.536041259765625, -0.44342041015625, -0.350799560546875, -0.2581787109375, -0.165557861328125, -0.07293701171875, 0.019683837890625, 0.1123046875, 0.204925537109375, 0.29754638671875, 0.390167236328125, 0.4827880859375, 0.575408935546875, 0.66802978515625, 0.760650634765625, 0.853271484375, 0.945892333984375, 1.03851318359375, 1.131134033203125, 1.2237548828125, 1.316375732421875, 1.40899658203125, 1.501617431640625, 1.59423828125, 1.686859130859375, 1.77947998046875, 1.872100830078125, 1.9647216796875, 2.057342529296875, 2.14996337890625, 2.242584228515625, 2.335205078125, 2.427825927734375, 2.52044677734375, 2.613067626953125, 2.7056884765625, 2.798309326171875, 2.89093017578125, 2.983551025390625, 3.076171875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 8.0, 4.0, 5.0, 7.0, 3.0, 10.0, 16.0, 18.0, 25.0, 26.0, 42.0, 42.0, 83.0, 125.0, 143.0, 119.0, 79.0, 68.0, 41.0, 30.0, 26.0, 21.0, 13.0, 10.0, 6.0, 6.0, 2.0, 6.0, 3.0, 3.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00038552284240722656, -0.000372517853975296, -0.0003595128655433655, -0.00034650787711143494, -0.0003335028886795044, -0.00032049790024757385, -0.0003074929118156433, -0.00029448792338371277, -0.0002814829349517822, -0.0002684779465198517, -0.00025547295808792114, -0.0002424679696559906, -0.00022946298122406006, -0.00021645799279212952, -0.00020345300436019897, -0.00019044801592826843, -0.0001774430274963379, -0.00016443803906440735, -0.0001514330506324768, -0.00013842806220054626, -0.00012542307376861572, -0.00011241808533668518, -9.941309690475464e-05, -8.64081084728241e-05, -7.340312004089355e-05, -6.039813160896301e-05, -4.739314317703247e-05, -3.438815474510193e-05, -2.1383166313171387e-05, -8.378177881240845e-06, 4.626810550689697e-06, 1.763179898262024e-05, 3.063678741455078e-05, 4.364177584648132e-05, 5.6646764278411865e-05, 6.965175271034241e-05, 8.265674114227295e-05, 9.566172957420349e-05, 0.00010866671800613403, 0.00012167170643806458, 0.00013467669486999512, 0.00014768168330192566, 0.0001606866717338562, 0.00017369166016578674, 0.00018669664859771729, 0.00019970163702964783, 0.00021270662546157837, 0.0002257116138935089, 0.00023871660232543945, 0.00025172159075737, 0.00026472657918930054, 0.0002777315676212311, 0.0002907365560531616, 0.00030374154448509216, 0.0003167465329170227, 0.00032975152134895325, 0.0003427565097808838, 0.00035576149821281433, 0.0003687664866447449, 0.0003817714750766754, 0.00039477646350860596, 0.0004077814519405365, 0.00042078644037246704, 0.0004337914288043976, 0.0004467964172363281]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 5.0, 6.0, 5.0, 14.0, 13.0, 41.0, 67.0, 152.0, 305.0, 740.0, 2570.0, 12680.0, 174662.0, 818606.0, 32077.0, 4558.0, 1233.0, 429.0, 168.0, 113.0, 51.0, 26.0, 14.0, 9.0, 9.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.46875, -2.3812255859375, -2.293701171875, -2.2061767578125, -2.11865234375, -2.0311279296875, -1.943603515625, -1.8560791015625, -1.7685546875, -1.6810302734375, -1.593505859375, -1.5059814453125, -1.41845703125, -1.3309326171875, -1.243408203125, -1.1558837890625, -1.068359375, -0.9808349609375, -0.893310546875, -0.8057861328125, -0.71826171875, -0.6307373046875, -0.543212890625, -0.4556884765625, -0.3681640625, -0.2806396484375, -0.193115234375, -0.1055908203125, -0.01806640625, 0.0694580078125, 0.156982421875, 0.2445068359375, 0.33203125, 0.4195556640625, 0.507080078125, 0.5946044921875, 0.68212890625, 0.7696533203125, 0.857177734375, 0.9447021484375, 1.0322265625, 1.1197509765625, 1.207275390625, 1.2947998046875, 1.38232421875, 1.4698486328125, 1.557373046875, 1.6448974609375, 1.732421875, 1.8199462890625, 1.907470703125, 1.9949951171875, 2.08251953125, 2.1700439453125, 2.257568359375, 2.3450927734375, 2.4326171875, 2.5201416015625, 2.607666015625, 2.6951904296875, 2.78271484375, 2.8702392578125, 2.957763671875, 3.0452880859375, 3.1328125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 9.0, 10.0, 19.0, 16.0, 28.0, 41.0, 54.0, 100.0, 131.0, 197.0, 137.0, 97.0, 61.0, 37.0, 20.0, 12.0, 13.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.51953125, -3.4364471435546875, -3.353363037109375, -3.2702789306640625, -3.18719482421875, -3.1041107177734375, -3.021026611328125, -2.9379425048828125, -2.8548583984375, -2.7717742919921875, -2.688690185546875, -2.6056060791015625, -2.52252197265625, -2.4394378662109375, -2.356353759765625, -2.2732696533203125, -2.190185546875, -2.1071014404296875, -2.024017333984375, -1.9409332275390625, -1.85784912109375, -1.7747650146484375, -1.691680908203125, -1.6085968017578125, -1.5255126953125, -1.4424285888671875, -1.359344482421875, -1.2762603759765625, -1.19317626953125, -1.1100921630859375, -1.027008056640625, -0.9439239501953125, -0.86083984375, -0.7777557373046875, -0.694671630859375, -0.6115875244140625, -0.52850341796875, -0.4454193115234375, -0.362335205078125, -0.2792510986328125, -0.1961669921875, -0.1130828857421875, -0.029998779296875, 0.0530853271484375, 0.13616943359375, 0.2192535400390625, 0.302337646484375, 0.3854217529296875, 0.468505859375, 0.5515899658203125, 0.634674072265625, 0.7177581787109375, 0.80084228515625, 0.8839263916015625, 0.967010498046875, 1.0500946044921875, 1.1331787109375, 1.2162628173828125, 1.299346923828125, 1.3824310302734375, 1.46551513671875, 1.5485992431640625, 1.631683349609375, 1.7147674560546875, 1.7978515625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 12.0, 30.0, 72.0, 137.0, 419.0, 177.0, 84.0, 26.0, 19.0, 9.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.30963134765625, -66.33072662353516, -64.35182189941406, -62.372920989990234, -60.39401626586914, -58.41511535644531, -56.43621063232422, -54.457305908203125, -52.47840118408203, -50.49949645996094, -48.52059555053711, -46.541690826416016, -44.56278610229492, -42.583885192871094, -40.60498046875, -38.626075744628906, -36.64717102050781, -34.66826629638672, -32.68936538696289, -30.710460662841797, -28.731555938720703, -26.752653121948242, -24.77375030517578, -22.794845581054688, -20.81594467163086, -18.8370418548584, -16.858137130737305, -14.879234313964844, -12.90032958984375, -10.921426773071289, -8.942523002624512, -6.963619232177734, -4.984714508056641, -3.0058107376098633, -1.026907205581665, 0.9519963264465332, 2.9309000968933105, 4.90980339050293, 6.888707160949707, 8.867610931396484, 10.846514701843262, 12.825418472290039, 14.804322242736816, 16.783226013183594, 18.762128829956055, 20.741031646728516, 22.71993637084961, 24.698841094970703, 26.677743911743164, 28.656646728515625, 30.63555145263672, 32.61445617675781, 34.59335708618164, 36.572261810302734, 38.55116653442383, 40.530067443847656, 42.50897216796875, 44.487876892089844, 46.46677780151367, 48.445682525634766, 50.42458724975586, 52.40348815917969, 54.38239288330078, 56.361297607421875, 58.34020233154297]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 15.0, 9.0, 10.0, 8.0, 22.0, 32.0, 36.0, 23.0, 41.0, 28.0, 62.0, 88.0, 209.0, 104.0, 48.0, 58.0, 53.0, 26.0, 34.0, 21.0, 19.0, 18.0, 11.0, 12.0, 5.0, 8.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.12767028808594, -33.41998291015625, -31.712291717529297, -30.00460433959961, -28.29691505432129, -26.58922576904297, -24.88153839111328, -23.17384910583496, -21.46615982055664, -19.75847053527832, -18.05078125, -16.343093872070312, -14.635404586791992, -12.927715301513672, -11.220026969909668, -9.512338638305664, -7.804649353027344, -6.096960544586182, -4.3892717361450195, -2.6815829277038574, -0.9738941192626953, 0.733795166015625, 2.441483497619629, 4.149171829223633, 5.856861114501953, 7.564549922943115, 9.272238731384277, 10.979927062988281, 12.687616348266602, 14.395305633544922, 16.10299301147461, 17.81068229675293, 19.51837158203125, 21.22606086730957, 22.93375015258789, 24.641437530517578, 26.3491268157959, 28.05681610107422, 29.764503479003906, 31.472192764282227, 33.17988204956055, 34.887569427490234, 36.59526062011719, 38.302947998046875, 40.01063537597656, 41.718326568603516, 43.4260139465332, 45.133705139160156, 46.841392517089844, 48.54907989501953, 50.256771087646484, 51.96445846557617, 53.672149658203125, 55.37983703613281, 57.0875244140625, 58.79521179199219, 60.50290298461914, 62.21059036254883, 63.91828155517578, 65.62596893310547, 67.33365631103516, 69.04135131835938, 70.74903869628906, 72.45672607421875, 74.16441345214844]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 17.0, 21.0, 32.0, 63.0, 119.0, 219.0, 368.0, 669.0, 1442.0, 3171.0, 8530.0, 36019.0, 300304.0, 1769918.0, 1715424.0, 302231.0, 41063.0, 8707.0, 3189.0, 1395.0, 684.0, 308.0, 171.0, 95.0, 52.0, 25.0, 13.0, 10.0, 7.0, 3.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.8359375, -4.70159912109375, -4.5672607421875, -4.43292236328125, -4.298583984375, -4.16424560546875, -4.0299072265625, -3.89556884765625, -3.76123046875, -3.62689208984375, -3.4925537109375, -3.35821533203125, -3.223876953125, -3.08953857421875, -2.9552001953125, -2.82086181640625, -2.6865234375, -2.55218505859375, -2.4178466796875, -2.28350830078125, -2.149169921875, -2.01483154296875, -1.8804931640625, -1.74615478515625, -1.61181640625, -1.47747802734375, -1.3431396484375, -1.20880126953125, -1.074462890625, -0.94012451171875, -0.8057861328125, -0.67144775390625, -0.537109375, -0.40277099609375, -0.2684326171875, -0.13409423828125, 0.000244140625, 0.13458251953125, 0.2689208984375, 0.40325927734375, 0.53759765625, 0.67193603515625, 0.8062744140625, 0.94061279296875, 1.074951171875, 1.20928955078125, 1.3436279296875, 1.47796630859375, 1.6123046875, 1.74664306640625, 1.8809814453125, 2.01531982421875, 2.149658203125, 2.28399658203125, 2.4183349609375, 2.55267333984375, 2.68701171875, 2.82135009765625, 2.9556884765625, 3.09002685546875, 3.224365234375, 3.35870361328125, 3.4930419921875, 3.62738037109375, 3.76171875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 9.0, 6.0, 7.0, 11.0, 9.0, 12.0, 15.0, 11.0, 23.0, 20.0, 33.0, 31.0, 30.0, 46.0, 37.0, 36.0, 46.0, 39.0, 49.0, 53.0, 47.0, 45.0, 52.0, 32.0, 49.0, 29.0, 31.0, 25.0, 27.0, 19.0, 15.0, 14.0, 26.0, 12.0, 9.0, 12.0, 4.0, 5.0, 11.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-2.900390625, -2.822113037109375, -2.74383544921875, -2.665557861328125, -2.5872802734375, -2.509002685546875, -2.43072509765625, -2.352447509765625, -2.274169921875, -2.195892333984375, -2.11761474609375, -2.039337158203125, -1.9610595703125, -1.882781982421875, -1.80450439453125, -1.726226806640625, -1.64794921875, -1.569671630859375, -1.49139404296875, -1.413116455078125, -1.3348388671875, -1.256561279296875, -1.17828369140625, -1.100006103515625, -1.021728515625, -0.943450927734375, -0.86517333984375, -0.786895751953125, -0.7086181640625, -0.630340576171875, -0.55206298828125, -0.473785400390625, -0.3955078125, -0.317230224609375, -0.23895263671875, -0.160675048828125, -0.0823974609375, -0.004119873046875, 0.07415771484375, 0.152435302734375, 0.230712890625, 0.308990478515625, 0.38726806640625, 0.465545654296875, 0.5438232421875, 0.622100830078125, 0.70037841796875, 0.778656005859375, 0.85693359375, 0.935211181640625, 1.01348876953125, 1.091766357421875, 1.1700439453125, 1.248321533203125, 1.32659912109375, 1.404876708984375, 1.483154296875, 1.561431884765625, 1.63970947265625, 1.717987060546875, 1.7962646484375, 1.874542236328125, 1.95281982421875, 2.031097412109375, 2.109375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 10.0, 0.0, 5.0, 10.0, 11.0, 24.0, 30.0, 50.0, 96.0, 170.0, 231.0, 453.0, 824.0, 2051.0, 7191.0, 130567.0, 3996056.0, 49028.0, 4532.0, 1417.0, 640.0, 345.0, 191.0, 124.0, 66.0, 50.0, 37.0, 16.0, 14.0, 13.0, 8.0, 4.0, 7.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.265625, -11.848388671875, -11.43115234375, -11.013916015625, -10.5966796875, -10.179443359375, -9.76220703125, -9.344970703125, -8.927734375, -8.510498046875, -8.09326171875, -7.676025390625, -7.2587890625, -6.841552734375, -6.42431640625, -6.007080078125, -5.58984375, -5.172607421875, -4.75537109375, -4.338134765625, -3.9208984375, -3.503662109375, -3.08642578125, -2.669189453125, -2.251953125, -1.834716796875, -1.41748046875, -1.000244140625, -0.5830078125, -0.165771484375, 0.25146484375, 0.668701171875, 1.0859375, 1.503173828125, 1.92041015625, 2.337646484375, 2.7548828125, 3.172119140625, 3.58935546875, 4.006591796875, 4.423828125, 4.841064453125, 5.25830078125, 5.675537109375, 6.0927734375, 6.510009765625, 6.92724609375, 7.344482421875, 7.76171875, 8.178955078125, 8.59619140625, 9.013427734375, 9.4306640625, 9.847900390625, 10.26513671875, 10.682373046875, 11.099609375, 11.516845703125, 11.93408203125, 12.351318359375, 12.7685546875, 13.185791015625, 13.60302734375, 14.020263671875, 14.4375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 4.0, 9.0, 8.0, 8.0, 10.0, 25.0, 27.0, 45.0, 44.0, 74.0, 97.0, 156.0, 225.0, 373.0, 617.0, 676.0, 613.0, 374.0, 247.0, 146.0, 101.0, 74.0, 33.0, 38.0, 14.0, 10.0, 7.0, 7.0, 0.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0], "bins": [-12.3359375, -12.060302734375, -11.78466796875, -11.509033203125, -11.2333984375, -10.957763671875, -10.68212890625, -10.406494140625, -10.130859375, -9.855224609375, -9.57958984375, -9.303955078125, -9.0283203125, -8.752685546875, -8.47705078125, -8.201416015625, -7.92578125, -7.650146484375, -7.37451171875, -7.098876953125, -6.8232421875, -6.547607421875, -6.27197265625, -5.996337890625, -5.720703125, -5.445068359375, -5.16943359375, -4.893798828125, -4.6181640625, -4.342529296875, -4.06689453125, -3.791259765625, -3.515625, -3.239990234375, -2.96435546875, -2.688720703125, -2.4130859375, -2.137451171875, -1.86181640625, -1.586181640625, -1.310546875, -1.034912109375, -0.75927734375, -0.483642578125, -0.2080078125, 0.067626953125, 0.34326171875, 0.618896484375, 0.89453125, 1.170166015625, 1.44580078125, 1.721435546875, 1.9970703125, 2.272705078125, 2.54833984375, 2.823974609375, 3.099609375, 3.375244140625, 3.65087890625, 3.926513671875, 4.2021484375, 4.477783203125, 4.75341796875, 5.029052734375, 5.3046875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 7.0, 5.0, 6.0, 6.0, 34.0, 63.0, 134.0, 256.0, 256.0, 131.0, 50.0, 19.0, 17.0, 7.0, 7.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-180.18360900878906, -176.10751342773438, -172.0314178466797, -167.955322265625, -163.8792266845703, -159.80313110351562, -155.72703552246094, -151.65093994140625, -147.57484436035156, -143.49874877929688, -139.4226531982422, -135.3465576171875, -131.2704620361328, -127.19436645507812, -123.11827087402344, -119.04217529296875, -114.9660873413086, -110.8899917602539, -106.81389617919922, -102.73780059814453, -98.66170501708984, -94.58560943603516, -90.509521484375, -86.43342590332031, -82.35733032226562, -78.28123474121094, -74.20513916015625, -70.12904357910156, -66.05294799804688, -61.97685241699219, -57.900760650634766, -53.82466506958008, -49.748565673828125, -45.67247009277344, -41.59637451171875, -37.52027893066406, -33.444183349609375, -29.36808967590332, -25.291996002197266, -21.215900421142578, -17.13980484008789, -13.063709259033203, -8.987614631652832, -4.911520004272461, -0.8354244232177734, 3.240671157836914, 7.316764831542969, 11.392860412597656, 15.468955993652344, 19.54505157470703, 23.62114715576172, 27.697240829467773, 31.77333641052246, 35.84943389892578, 39.9255256652832, 44.00162124633789, 48.07771682739258, 52.153812408447266, 56.22990798950195, 60.305999755859375, 64.38209533691406, 68.45819091796875, 72.53428649902344, 76.61038208007812, 80.68647766113281]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 10.0, 9.0, 10.0, 11.0, 10.0, 20.0, 22.0, 31.0, 22.0, 49.0, 40.0, 44.0, 56.0, 69.0, 61.0, 63.0, 43.0, 45.0, 51.0, 36.0, 46.0, 39.0, 30.0, 36.0, 18.0, 21.0, 11.0, 25.0, 11.0, 7.0, 9.0, 11.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-50.98793411254883, -49.326019287109375, -47.66410446166992, -46.00218963623047, -44.34027862548828, -42.67836380004883, -41.016448974609375, -39.35453414916992, -37.69261932373047, -36.030704498291016, -34.36878967285156, -32.706878662109375, -31.044963836669922, -29.38304901123047, -27.721134185791016, -26.059219360351562, -24.397308349609375, -22.735393524169922, -21.0734806060791, -19.41156578063965, -17.749652862548828, -16.087738037109375, -14.425823211669922, -12.763909339904785, -11.101995468139648, -9.440081596374512, -7.778167247772217, -6.116252899169922, -4.454339027404785, -2.7924251556396484, -1.1305103302001953, 0.5314035415649414, 2.1933135986328125, 3.8552277088165283, 5.517141819000244, 7.179056167602539, 8.840970039367676, 10.502883911132812, 12.164798736572266, 13.826712608337402, 15.488626480102539, 17.150541305541992, 18.812454223632812, 20.474369049072266, 22.13628387451172, 23.79819679260254, 25.460111618041992, 27.122024536132812, 28.783939361572266, 30.44585418701172, 32.10776901245117, 33.769683837890625, 35.43159484863281, 37.093509674072266, 38.75542449951172, 40.41733932495117, 42.079254150390625, 43.74116897583008, 45.40308380126953, 47.06499481201172, 48.72690963745117, 50.388824462890625, 52.05073928833008, 53.71265411376953, 55.37456512451172]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 5.0, 4.0, 9.0, 13.0, 16.0, 12.0, 21.0, 28.0, 52.0, 77.0, 123.0, 193.0, 323.0, 522.0, 877.0, 1624.0, 3201.0, 6583.0, 15544.0, 46134.0, 191012.0, 606885.0, 119519.0, 32778.0, 11858.0, 5146.0, 2641.0, 1363.0, 819.0, 427.0, 253.0, 165.0, 103.0, 85.0, 45.0, 29.0, 19.0, 12.0, 11.0, 8.0, 8.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.01953125, -3.899017333984375, -3.77850341796875, -3.657989501953125, -3.5374755859375, -3.416961669921875, -3.29644775390625, -3.175933837890625, -3.055419921875, -2.934906005859375, -2.81439208984375, -2.693878173828125, -2.5733642578125, -2.452850341796875, -2.33233642578125, -2.211822509765625, -2.09130859375, -1.970794677734375, -1.85028076171875, -1.729766845703125, -1.6092529296875, -1.488739013671875, -1.36822509765625, -1.247711181640625, -1.127197265625, -1.006683349609375, -0.88616943359375, -0.765655517578125, -0.6451416015625, -0.524627685546875, -0.40411376953125, -0.283599853515625, -0.1630859375, -0.042572021484375, 0.07794189453125, 0.198455810546875, 0.3189697265625, 0.439483642578125, 0.55999755859375, 0.680511474609375, 0.801025390625, 0.921539306640625, 1.04205322265625, 1.162567138671875, 1.2830810546875, 1.403594970703125, 1.52410888671875, 1.644622802734375, 1.76513671875, 1.885650634765625, 2.00616455078125, 2.126678466796875, 2.2471923828125, 2.367706298828125, 2.48822021484375, 2.608734130859375, 2.729248046875, 2.849761962890625, 2.97027587890625, 3.090789794921875, 3.2113037109375, 3.331817626953125, 3.45233154296875, 3.572845458984375, 3.693359375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 1.0, 6.0, 11.0, 11.0, 11.0, 14.0, 18.0, 17.0, 17.0, 29.0, 39.0, 33.0, 48.0, 34.0, 44.0, 47.0, 51.0, 69.0, 49.0, 41.0, 54.0, 41.0, 45.0, 47.0, 40.0, 28.0, 31.0, 26.0, 20.0, 21.0, 12.0, 10.0, 8.0, 6.0, 3.0, 5.0, 2.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.76953125, -3.661773681640625, -3.55401611328125, -3.446258544921875, -3.3385009765625, -3.230743408203125, -3.12298583984375, -3.015228271484375, -2.907470703125, -2.799713134765625, -2.69195556640625, -2.584197998046875, -2.4764404296875, -2.368682861328125, -2.26092529296875, -2.153167724609375, -2.04541015625, -1.937652587890625, -1.82989501953125, -1.722137451171875, -1.6143798828125, -1.506622314453125, -1.39886474609375, -1.291107177734375, -1.183349609375, -1.075592041015625, -0.96783447265625, -0.860076904296875, -0.7523193359375, -0.644561767578125, -0.53680419921875, -0.429046630859375, -0.3212890625, -0.213531494140625, -0.10577392578125, 0.001983642578125, 0.1097412109375, 0.217498779296875, 0.32525634765625, 0.433013916015625, 0.540771484375, 0.648529052734375, 0.75628662109375, 0.864044189453125, 0.9718017578125, 1.079559326171875, 1.18731689453125, 1.295074462890625, 1.40283203125, 1.510589599609375, 1.61834716796875, 1.726104736328125, 1.8338623046875, 1.941619873046875, 2.04937744140625, 2.157135009765625, 2.264892578125, 2.372650146484375, 2.48040771484375, 2.588165283203125, 2.6959228515625, 2.803680419921875, 2.91143798828125, 3.019195556640625, 3.126953125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 3.0, 4.0, 10.0, 12.0, 11.0, 18.0, 21.0, 25.0, 50.0, 45.0, 76.0, 98.0, 155.0, 258.0, 448.0, 907.0, 2760.0, 14787.0, 433423.0, 575451.0, 14883.0, 2829.0, 932.0, 494.0, 255.0, 163.0, 116.0, 98.0, 44.0, 45.0, 24.0, 25.0, 21.0, 12.0, 10.0, 8.0, 6.0, 9.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-7.4453125, -7.238525390625, -7.03173828125, -6.824951171875, -6.6181640625, -6.411376953125, -6.20458984375, -5.997802734375, -5.791015625, -5.584228515625, -5.37744140625, -5.170654296875, -4.9638671875, -4.757080078125, -4.55029296875, -4.343505859375, -4.13671875, -3.929931640625, -3.72314453125, -3.516357421875, -3.3095703125, -3.102783203125, -2.89599609375, -2.689208984375, -2.482421875, -2.275634765625, -2.06884765625, -1.862060546875, -1.6552734375, -1.448486328125, -1.24169921875, -1.034912109375, -0.828125, -0.621337890625, -0.41455078125, -0.207763671875, -0.0009765625, 0.205810546875, 0.41259765625, 0.619384765625, 0.826171875, 1.032958984375, 1.23974609375, 1.446533203125, 1.6533203125, 1.860107421875, 2.06689453125, 2.273681640625, 2.48046875, 2.687255859375, 2.89404296875, 3.100830078125, 3.3076171875, 3.514404296875, 3.72119140625, 3.927978515625, 4.134765625, 4.341552734375, 4.54833984375, 4.755126953125, 4.9619140625, 5.168701171875, 5.37548828125, 5.582275390625, 5.7890625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 7.0, 3.0, 5.0, 6.0, 7.0, 7.0, 7.0, 7.0, 8.0, 5.0, 7.0, 12.0, 15.0, 20.0, 25.0, 27.0, 44.0, 36.0, 48.0, 57.0, 69.0, 65.0, 71.0, 53.0, 53.0, 49.0, 36.0, 43.0, 32.0, 23.0, 22.0, 18.0, 17.0, 20.0, 14.0, 12.0, 14.0, 4.0, 5.0, 3.0, 4.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 2.0], "bins": [-10.734375, -10.401123046875, -10.06787109375, -9.734619140625, -9.4013671875, -9.068115234375, -8.73486328125, -8.401611328125, -8.068359375, -7.735107421875, -7.40185546875, -7.068603515625, -6.7353515625, -6.402099609375, -6.06884765625, -5.735595703125, -5.40234375, -5.069091796875, -4.73583984375, -4.402587890625, -4.0693359375, -3.736083984375, -3.40283203125, -3.069580078125, -2.736328125, -2.403076171875, -2.06982421875, -1.736572265625, -1.4033203125, -1.070068359375, -0.73681640625, -0.403564453125, -0.0703125, 0.262939453125, 0.59619140625, 0.929443359375, 1.2626953125, 1.595947265625, 1.92919921875, 2.262451171875, 2.595703125, 2.928955078125, 3.26220703125, 3.595458984375, 3.9287109375, 4.261962890625, 4.59521484375, 4.928466796875, 5.26171875, 5.594970703125, 5.92822265625, 6.261474609375, 6.5947265625, 6.927978515625, 7.26123046875, 7.594482421875, 7.927734375, 8.260986328125, 8.59423828125, 8.927490234375, 9.2607421875, 9.593994140625, 9.92724609375, 10.260498046875, 10.59375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 17.0, 23.0, 22.0, 37.0, 49.0, 98.0, 164.0, 246.0, 477.0, 1169.0, 3405.0, 15266.0, 168631.0, 827844.0, 23649.0, 4619.0, 1470.0, 588.0, 309.0, 185.0, 109.0, 63.0, 34.0, 16.0, 20.0, 10.0, 7.0, 10.0, 2.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.11328125, -1.08245849609375, -1.0516357421875, -1.02081298828125, -0.989990234375, -0.95916748046875, -0.9283447265625, -0.89752197265625, -0.86669921875, -0.83587646484375, -0.8050537109375, -0.77423095703125, -0.743408203125, -0.71258544921875, -0.6817626953125, -0.65093994140625, -0.6201171875, -0.58929443359375, -0.5584716796875, -0.52764892578125, -0.496826171875, -0.46600341796875, -0.4351806640625, -0.40435791015625, -0.37353515625, -0.34271240234375, -0.3118896484375, -0.28106689453125, -0.250244140625, -0.21942138671875, -0.1885986328125, -0.15777587890625, -0.126953125, -0.09613037109375, -0.0653076171875, -0.03448486328125, -0.003662109375, 0.02716064453125, 0.0579833984375, 0.08880615234375, 0.11962890625, 0.15045166015625, 0.1812744140625, 0.21209716796875, 0.242919921875, 0.27374267578125, 0.3045654296875, 0.33538818359375, 0.3662109375, 0.39703369140625, 0.4278564453125, 0.45867919921875, 0.489501953125, 0.52032470703125, 0.5511474609375, 0.58197021484375, 0.61279296875, 0.64361572265625, 0.6744384765625, 0.70526123046875, 0.736083984375, 0.76690673828125, 0.7977294921875, 0.82855224609375, 0.859375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 3.0, 6.0, 7.0, 7.0, 6.0, 9.0, 17.0, 19.0, 40.0, 54.0, 108.0, 117.0, 169.0, 136.0, 109.0, 49.0, 36.0, 21.0, 17.0, 18.0, 12.0, 8.0, 3.0, 5.0, 5.0, 3.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00026988983154296875, -0.00026272237300872803, -0.0002555549144744873, -0.0002483874559402466, -0.00024121999740600586, -0.00023405253887176514, -0.00022688508033752441, -0.0002197176218032837, -0.00021255016326904297, -0.00020538270473480225, -0.00019821524620056152, -0.0001910477876663208, -0.00018388032913208008, -0.00017671287059783936, -0.00016954541206359863, -0.0001623779535293579, -0.0001552104949951172, -0.00014804303646087646, -0.00014087557792663574, -0.00013370811939239502, -0.0001265406608581543, -0.00011937320232391357, -0.00011220574378967285, -0.00010503828525543213, -9.78708267211914e-05, -9.070336818695068e-05, -8.353590965270996e-05, -7.636845111846924e-05, -6.920099258422852e-05, -6.203353404998779e-05, -5.486607551574707e-05, -4.769861698150635e-05, -4.0531158447265625e-05, -3.33636999130249e-05, -2.619624137878418e-05, -1.9028782844543457e-05, -1.1861324310302734e-05, -4.693865776062012e-06, 2.473592758178711e-06, 9.641051292419434e-06, 1.6808509826660156e-05, 2.397596836090088e-05, 3.11434268951416e-05, 3.8310885429382324e-05, 4.547834396362305e-05, 5.264580249786377e-05, 5.981326103210449e-05, 6.698071956634521e-05, 7.414817810058594e-05, 8.131563663482666e-05, 8.848309516906738e-05, 9.56505537033081e-05, 0.00010281801223754883, 0.00010998547077178955, 0.00011715292930603027, 0.000124320387840271, 0.00013148784637451172, 0.00013865530490875244, 0.00014582276344299316, 0.0001529902219772339, 0.0001601576805114746, 0.00016732513904571533, 0.00017449259757995605, 0.00018166005611419678, 0.0001888275146484375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 3.0, 12.0, 17.0, 16.0, 22.0, 48.0, 83.0, 133.0, 228.0, 417.0, 840.0, 2085.0, 6238.0, 22835.0, 170215.0, 794103.0, 37131.0, 8970.0, 2868.0, 1171.0, 487.0, 259.0, 133.0, 86.0, 54.0, 35.0, 21.0, 14.0, 12.0, 3.0, 4.0, 11.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70654296875, -0.6831130981445312, -0.6596832275390625, -0.6362533569335938, -0.612823486328125, -0.5893936157226562, -0.5659637451171875, -0.5425338745117188, -0.51910400390625, -0.49567413330078125, -0.4722442626953125, -0.44881439208984375, -0.425384521484375, -0.40195465087890625, -0.3785247802734375, -0.35509490966796875, -0.3316650390625, -0.30823516845703125, -0.2848052978515625, -0.26137542724609375, -0.237945556640625, -0.21451568603515625, -0.1910858154296875, -0.16765594482421875, -0.14422607421875, -0.12079620361328125, -0.0973663330078125, -0.07393646240234375, -0.050506591796875, -0.02707672119140625, -0.0036468505859375, 0.01978302001953125, 0.043212890625, 0.06664276123046875, 0.0900726318359375, 0.11350250244140625, 0.136932373046875, 0.16036224365234375, 0.1837921142578125, 0.20722198486328125, 0.23065185546875, 0.25408172607421875, 0.2775115966796875, 0.30094146728515625, 0.324371337890625, 0.34780120849609375, 0.3712310791015625, 0.39466094970703125, 0.4180908203125, 0.44152069091796875, 0.4649505615234375, 0.48838043212890625, 0.511810302734375, 0.5352401733398438, 0.5586700439453125, 0.5820999145507812, 0.60552978515625, 0.6289596557617188, 0.6523895263671875, 0.6758193969726562, 0.699249267578125, 0.7226791381835938, 0.7461090087890625, 0.7695388793945312, 0.79296875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 0.0, 5.0, 7.0, 4.0, 18.0, 15.0, 24.0, 38.0, 44.0, 79.0, 147.0, 145.0, 149.0, 109.0, 81.0, 47.0, 28.0, 13.0, 9.0, 10.0, 11.0, 7.0, 3.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2646484375, -1.2236328125, -1.1826171875, -1.1416015625, -1.1005859375, -1.0595703125, -1.0185546875, -0.9775390625, -0.9365234375, -0.8955078125, -0.8544921875, -0.8134765625, -0.7724609375, -0.7314453125, -0.6904296875, -0.6494140625, -0.6083984375, -0.5673828125, -0.5263671875, -0.4853515625, -0.4443359375, -0.4033203125, -0.3623046875, -0.3212890625, -0.2802734375, -0.2392578125, -0.1982421875, -0.1572265625, -0.1162109375, -0.0751953125, -0.0341796875, 0.0068359375, 0.0478515625, 0.0888671875, 0.1298828125, 0.1708984375, 0.2119140625, 0.2529296875, 0.2939453125, 0.3349609375, 0.3759765625, 0.4169921875, 0.4580078125, 0.4990234375, 0.5400390625, 0.5810546875, 0.6220703125, 0.6630859375, 0.7041015625, 0.7451171875, 0.7861328125, 0.8271484375, 0.8681640625, 0.9091796875, 0.9501953125, 0.9912109375, 1.0322265625, 1.0732421875, 1.1142578125, 1.1552734375, 1.1962890625, 1.2373046875, 1.2783203125, 1.3193359375, 1.3603515625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 10.0, 7.0, 18.0, 19.0, 37.0, 55.0, 82.0, 476.0, 143.0, 53.0, 29.0, 22.0, 17.0, 7.0, 11.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.872047424316406, -38.75520324707031, -37.63835906982422, -36.521514892578125, -35.40467071533203, -34.28782272338867, -33.17097854614258, -32.054134368896484, -30.93729019165039, -29.820446014404297, -28.703601837158203, -27.586755752563477, -26.469911575317383, -25.35306739807129, -24.236221313476562, -23.11937713623047, -22.002532958984375, -20.88568878173828, -19.768844604492188, -18.65199851989746, -17.535154342651367, -16.418310165405273, -15.301465034484863, -14.184619903564453, -13.06777572631836, -11.950931549072266, -10.834086418151855, -9.717241287231445, -8.600397109985352, -7.4835524559021, -6.366707801818848, -5.249863147735596, -4.133022308349609, -3.0161776542663574, -1.8993330001831055, -0.7824883460998535, 0.33435630798339844, 1.4512009620666504, 2.5680456161499023, 3.6848902702331543, 4.801734924316406, 5.918579578399658, 7.03542423248291, 8.15226936340332, 9.269113540649414, 10.385957717895508, 11.502802848815918, 12.619647979736328, 13.736492156982422, 14.853336334228516, 15.970181465148926, 17.087026596069336, 18.20387077331543, 19.320714950561523, 20.43756103515625, 21.554405212402344, 22.671249389648438, 23.78809356689453, 24.904937744140625, 26.02178382873535, 27.138628005981445, 28.25547218322754, 29.372318267822266, 30.48916244506836, 31.606006622314453]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 1.0, 4.0, 5.0, 4.0, 12.0, 18.0, 17.0, 20.0, 25.0, 21.0, 46.0, 37.0, 36.0, 195.0, 295.0, 35.0, 40.0, 30.0, 31.0, 25.0, 29.0, 18.0, 9.0, 13.0, 7.0, 11.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-49.92974853515625, -48.54539108276367, -47.16102981567383, -45.77667236328125, -44.392311096191406, -43.00795364379883, -41.62359619140625, -40.239234924316406, -38.85487747192383, -37.47052001953125, -36.086158752441406, -34.70180130004883, -33.317440032958984, -31.933082580566406, -30.548723220825195, -29.164363861083984, -27.780004501342773, -26.395645141601562, -25.01128578186035, -23.62692642211914, -22.242568969726562, -20.85820960998535, -19.47385025024414, -18.089492797851562, -16.70513153076172, -15.320772171020508, -13.936413764953613, -12.552054405212402, -11.167695999145508, -9.783336639404297, -8.398977279663086, -7.014618873596191, -5.630260467529297, -4.245901584625244, -2.8615424633026123, -1.4771833419799805, -0.09282445907592773, 1.291534423828125, 2.675893783569336, 4.0602521896362305, 5.444611549377441, 6.828970432281494, 8.213329315185547, 9.597688674926758, 10.982048034667969, 12.366406440734863, 13.750765800476074, 15.135124206542969, 16.51948356628418, 17.90384292602539, 19.2882022857666, 20.672561645507812, 22.05691909790039, 23.4412784576416, 24.825637817382812, 26.20999526977539, 27.594356536865234, 28.978715896606445, 30.363075256347656, 31.747432708740234, 33.13179397583008, 34.516151428222656, 35.9005126953125, 37.28487014770508, 38.669227600097656]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 7.0, 7.0, 4.0, 8.0, 6.0, 11.0, 11.0, 11.0, 16.0, 19.0, 20.0, 18.0, 28.0, 22.0, 26.0, 33.0, 59.0, 223.0, 142.0, 66.0, 44.0, 25.0, 22.0, 27.0, 20.0, 17.0, 9.0, 15.0, 17.0, 10.0, 6.0, 6.0, 8.0, 4.0, 7.0, 8.0, 2.0, 5.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.642578125, -2.56195068359375, -2.4813232421875, -2.40069580078125, -2.320068359375, -2.23944091796875, -2.1588134765625, -2.07818603515625, -1.99755859375, -1.91693115234375, -1.8363037109375, -1.75567626953125, -1.675048828125, -1.59442138671875, -1.5137939453125, -1.43316650390625, -1.3525390625, -1.27191162109375, -1.1912841796875, -1.11065673828125, -1.030029296875, -0.94940185546875, -0.8687744140625, -0.78814697265625, -0.70751953125, -0.62689208984375, -0.5462646484375, -0.46563720703125, -0.385009765625, -0.30438232421875, -0.2237548828125, -0.14312744140625, -0.0625, 0.01812744140625, 0.0987548828125, 0.17938232421875, 0.260009765625, 0.34063720703125, 0.4212646484375, 0.50189208984375, 0.58251953125, 0.66314697265625, 0.7437744140625, 0.82440185546875, 0.905029296875, 0.98565673828125, 1.0662841796875, 1.14691162109375, 1.2275390625, 1.30816650390625, 1.3887939453125, 1.46942138671875, 1.550048828125, 1.63067626953125, 1.7113037109375, 1.79193115234375, 1.87255859375, 1.95318603515625, 2.0338134765625, 2.11444091796875, 2.195068359375, 2.27569580078125, 2.3563232421875, 2.43695068359375, 2.517578125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 4.0, 6.0, 20.0, 16.0, 19.0, 30.0, 28.0, 55.0, 98.0, 188.0, 469.0, 1495.0, 8877.0, 8350880.0, 22471.0, 2628.0, 687.0, 242.0, 121.0, 67.0, 45.0, 37.0, 32.0, 7.0, 9.0, 7.0, 3.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 5.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.561927795410156, -25.601804733276367, -24.641681671142578, -23.681560516357422, -22.721437454223633, -21.761314392089844, -20.801191329956055, -19.841068267822266, -18.880945205688477, -17.920822143554688, -16.9606990814209, -16.00057601928711, -15.040453910827637, -14.080331802368164, -13.120208740234375, -12.160085678100586, -11.199963569641113, -10.239840507507324, -9.279718399047852, -8.319595336914062, -7.359472274780273, -6.399349689483643, -5.439227104187012, -4.479104042053223, -3.518981456756592, -2.558858633041382, -1.5987359285354614, -0.638613224029541, 0.32150959968566895, 1.281632423400879, 2.2417550086975098, 3.201878070831299, 4.16200065612793, 5.1221232414245605, 6.08224630355835, 7.0423688888549805, 8.00249195098877, 8.962614059448242, 9.922737121582031, 10.88286018371582, 11.84298324584961, 12.803106307983398, 13.763228416442871, 14.72335147857666, 15.68347454071045, 16.643596649169922, 17.60371971130371, 18.5638427734375, 19.523963928222656, 20.484086990356445, 21.444210052490234, 22.40433120727539, 23.36445426940918, 24.32457733154297, 25.284700393676758, 26.244823455810547, 27.204946517944336, 28.165069580078125, 29.125192642211914, 30.085315704345703, 31.04543685913086, 32.00556182861328, 32.96568298339844, 33.925804138183594, 34.885929107666016]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 3.0, 6.0, 7.0, 7.0, 5.0, 3.0, 6.0, 9.0, 7.0, 3.0, 3.0, 2.0, 4.0, 4.0, 4.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.76301574707031, -38.57502746582031, -37.38703536987305, -36.19904708862305, -35.01105880737305, -33.82306671142578, -32.63507843017578, -31.44709014892578, -30.25909996032715, -29.071109771728516, -27.883121490478516, -26.695131301879883, -25.50714111328125, -24.31915283203125, -23.131162643432617, -21.943172454833984, -20.755184173583984, -19.56719398498535, -18.37920570373535, -17.19121551513672, -16.00322723388672, -14.815237045288086, -13.627246856689453, -12.439257621765137, -11.25126838684082, -10.063279151916504, -8.875289916992188, -7.687299728393555, -6.499310493469238, -5.311321258544922, -4.123331546783447, -2.9353418350219727, -1.7473487854003906, -0.5593593120574951, 0.6286301612854004, 1.816619634628296, 3.0046091079711914, 4.192598342895508, 5.380588054656982, 6.568577766418457, 7.756567001342773, 8.94455623626709, 10.132545471191406, 11.320535659790039, 12.508524894714355, 13.696514129638672, 14.884504318237305, 16.072494506835938, 17.260482788085938, 18.44847297668457, 19.63646125793457, 20.824451446533203, 22.012439727783203, 23.200429916381836, 24.38842010498047, 25.57640838623047, 26.7643985748291, 27.952388763427734, 29.140377044677734, 30.328367233276367, 31.516357421875, 32.704345703125, 33.892333984375, 35.080326080322266, 36.268314361572266]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 2.0, 7.0, 10.0, 14.0, 20.0, 27.0, 33.0, 47.0, 73.0, 117.0, 167.0, 248.0, 458.0, 944.0, 2333.0, 6719.0, 22042.0, 81748.0, 231109.0, 129155.0, 33722.0, 9527.0, 3125.0, 1260.0, 551.0, 318.0, 161.0, 97.0, 76.0, 43.0, 23.0, 28.0, 16.0, 13.0, 14.0, 3.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.75, -19.061279296875, -18.37255859375, -17.683837890625, -16.9951171875, -16.306396484375, -15.61767578125, -14.928955078125, -14.240234375, -13.551513671875, -12.86279296875, -12.174072265625, -11.4853515625, -10.796630859375, -10.10791015625, -9.419189453125, -8.73046875, -8.041748046875, -7.35302734375, -6.664306640625, -5.9755859375, -5.286865234375, -4.59814453125, -3.909423828125, -3.220703125, -2.531982421875, -1.84326171875, -1.154541015625, -0.4658203125, 0.222900390625, 0.91162109375, 1.600341796875, 2.2890625, 2.977783203125, 3.66650390625, 4.355224609375, 5.0439453125, 5.732666015625, 6.42138671875, 7.110107421875, 7.798828125, 8.487548828125, 9.17626953125, 9.864990234375, 10.5537109375, 11.242431640625, 11.93115234375, 12.619873046875, 13.30859375, 13.997314453125, 14.68603515625, 15.374755859375, 16.0634765625, 16.752197265625, 17.44091796875, 18.129638671875, 18.818359375, 19.507080078125, 20.19580078125, 20.884521484375, 21.5732421875, 22.261962890625, 22.95068359375, 23.639404296875, 24.328125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 4.0, 11.0, 11.0, 6.0, 21.0, 28.0, 37.0, 42.0, 47.0, 51.0, 66.0, 82.0, 88.0, 68.0, 70.0, 70.0, 72.0, 50.0, 35.0, 27.0, 17.0, 20.0, 13.0, 17.0, 7.0, 8.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.27734375, -4.1524658203125, -4.027587890625, -3.9027099609375, -3.77783203125, -3.6529541015625, -3.528076171875, -3.4031982421875, -3.2783203125, -3.1534423828125, -3.028564453125, -2.9036865234375, -2.77880859375, -2.6539306640625, -2.529052734375, -2.4041748046875, -2.279296875, -2.1544189453125, -2.029541015625, -1.9046630859375, -1.77978515625, -1.6549072265625, -1.530029296875, -1.4051513671875, -1.2802734375, -1.1553955078125, -1.030517578125, -0.9056396484375, -0.78076171875, -0.6558837890625, -0.531005859375, -0.4061279296875, -0.28125, -0.1563720703125, -0.031494140625, 0.0933837890625, 0.21826171875, 0.3431396484375, 0.468017578125, 0.5928955078125, 0.7177734375, 0.8426513671875, 0.967529296875, 1.0924072265625, 1.21728515625, 1.3421630859375, 1.467041015625, 1.5919189453125, 1.716796875, 1.8416748046875, 1.966552734375, 2.0914306640625, 2.21630859375, 2.3411865234375, 2.466064453125, 2.5909423828125, 2.7158203125, 2.8406982421875, 2.965576171875, 3.0904541015625, 3.21533203125, 3.3402099609375, 3.465087890625, 3.5899658203125, 3.71484375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 5.0, 8.0, 8.0, 4.0, 16.0, 57.0, 143.0, 149.0, 56.0, 18.0, 7.0, 9.0, 7.0, 1.0, 1.0, 1.0], "bins": [-79.52371215820312, -78.08739471435547, -76.65108489990234, -75.21476745605469, -73.77845764160156, -72.3421401977539, -70.90583038330078, -69.46951293945312, -68.033203125, -66.59688568115234, -65.16057586669922, -63.72426223754883, -62.28794860839844, -60.85163116455078, -59.41531753540039, -57.97900390625, -56.542686462402344, -55.10637283325195, -53.67005920410156, -52.23374557495117, -50.79743194580078, -49.361114501953125, -47.924800872802734, -46.488487243652344, -45.05217361450195, -43.61585998535156, -42.17954635620117, -40.74323272705078, -39.306915283203125, -37.870601654052734, -36.434288024902344, -34.99797439575195, -33.56166076660156, -32.12534713745117, -30.68903350830078, -29.252717971801758, -27.816404342651367, -26.380090713500977, -24.943775177001953, -23.507461547851562, -22.071147918701172, -20.63483428955078, -19.19852066040039, -17.762205123901367, -16.325891494750977, -14.889577865600586, -13.453263282775879, -12.016948699951172, -10.580636024475098, -9.14432144165039, -7.7080078125, -6.271693706512451, -4.835379600524902, -3.3990654945373535, -1.9627513885498047, -0.5264368057250977, 0.909876823425293, 2.346190929412842, 3.7825050354003906, 5.2188191413879395, 6.655133247375488, 8.091447830200195, 9.527761459350586, 10.964076042175293, 12.400389671325684]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 0.0, 2.0, 7.0, 3.0, 2.0, 4.0, 16.0, 19.0, 45.0, 78.0, 82.0, 71.0, 45.0, 24.0, 18.0, 6.0, 8.0, 6.0, 8.0, 5.0, 2.0, 4.0, 6.0, 4.0, 5.0, 0.0, 0.0, 3.0, 0.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.969985961914062, -15.434263229370117, -14.898541450500488, -14.36281967163086, -13.827096939086914, -13.291374206542969, -12.75565242767334, -12.219930648803711, -11.684207916259766, -11.14848518371582, -10.612763404846191, -10.077041625976562, -9.541318893432617, -9.005596160888672, -8.469874382019043, -7.934152126312256, -7.398429870605469, -6.862707614898682, -6.3269853591918945, -5.791263103485107, -5.25554084777832, -4.719818592071533, -4.184096336364746, -3.648374080657959, -3.112651824951172, -2.5769295692443848, -2.0412073135375977, -1.5054850578308105, -0.9697628021240234, -0.43404054641723633, 0.10168170928955078, 0.6374039649963379, 1.1731243133544922, 1.7088465690612793, 2.2445688247680664, 2.7802910804748535, 3.3160133361816406, 3.8517355918884277, 4.387457847595215, 4.923180103302002, 5.458902359008789, 5.994624614715576, 6.530346870422363, 7.06606912612915, 7.6017913818359375, 8.137514114379883, 8.673235893249512, 9.20895767211914, 9.744680404663086, 10.280403137207031, 10.81612491607666, 11.351846694946289, 11.887569427490234, 12.42329216003418, 12.959013938903809, 13.494735717773438, 14.030458450317383, 14.566181182861328, 15.101902961730957, 15.637624740600586, 16.17334747314453, 16.709070205688477, 17.244792938232422, 17.780513763427734, 18.31623649597168]}, "eval/loss": 5.962278366088867, "eval/wer": 1.1028163427211424, "eval/runtime": 599.0646, "eval/samples_per_second": 4.41, "eval/steps_per_second": 0.553} \ No newline at end of file