diff --git "a/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" "b/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" --- "a/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" +++ "b/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.4733, "train/learning_rate": 2.396080760095012e-06, "train/epoch": 18.5, "train/global_step": 16500, "_runtime": 107983, "_timestamp": 1646769222, "_step": 16510, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [6.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 6.0, 4.0, 9.0, 10.0, 29843.0, 559.0, 32.0, 7.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-152.375, -148.1171875, -143.859375, -139.6015625, -135.34375, -131.0859375, -126.828125, -122.5703125, -118.3125, -114.0546875, -109.796875, -105.5390625, -101.28125, -97.0234375, -92.765625, -88.5078125, -84.25, -79.9921875, -75.734375, -71.4765625, -67.21875, -62.9609375, -58.703125, -54.4453125, -50.1875, -45.9296875, -41.671875, -37.4140625, -33.15625, -28.8984375, -24.640625, -20.3828125, -16.125, -11.8671875, -7.609375, -3.3515625, 0.90625, 5.1640625, 9.421875, 13.6796875, 17.9375, 22.1953125, 26.453125, 30.7109375, 34.96875, 39.2265625, 43.484375, 47.7421875, 52.0, 56.2578125, 60.515625, 64.7734375, 69.03125, 73.2890625, 77.546875, 81.8046875, 86.0625, 90.3203125, 94.578125, 98.8359375, 103.09375, 107.3515625, 111.609375, 115.8671875, 120.125]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 4.0, 10.0, 20.0, 13.0, 18.0, 20.0, 19.0, 21.0, 35.0, 34.0, 44.0, 48.0, 45.0, 48.0, 44.0, 60.0, 34.0, 58.0, 57.0, 54.0, 59.0, 45.0, 45.0, 39.0, 28.0, 17.0, 17.0, 19.0, 14.0, 8.0, 7.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.37356567382812, -89.39723205566406, -87.4208984375, -85.44456481933594, -83.46823120117188, -81.49189758300781, -79.51555633544922, -77.53922271728516, -75.5628890991211, -73.58655548095703, -71.61022186279297, -69.6338882446289, -67.65755462646484, -65.68121337890625, -63.70488357543945, -61.728546142578125, -59.75221252441406, -57.77587890625, -55.79954528808594, -53.82320785522461, -51.84687423706055, -49.870540618896484, -47.89420700073242, -45.917869567871094, -43.9415397644043, -41.965206146240234, -39.98887252807617, -38.012535095214844, -36.03620147705078, -34.05986785888672, -32.083534240722656, -30.10719871520996, -28.130863189697266, -26.154529571533203, -24.178194046020508, -22.201860427856445, -20.22552490234375, -18.249191284179688, -16.272857666015625, -14.29652214050293, -12.32018756866455, -10.343852996826172, -8.367518424987793, -6.391184329986572, -4.414849758148193, -2.4385156631469727, -0.46218109130859375, 1.5141534805297852, 3.490488052368164, 5.466822624206543, 7.443157196044922, 9.419490814208984, 11.39582633972168, 13.372159957885742, 15.348494529724121, 17.3248291015625, 19.301162719726562, 21.277496337890625, 23.25383186340332, 25.230165481567383, 27.206501007080078, 29.18283462524414, 31.159168243408203, 33.13550567626953, 35.111839294433594]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 4.0, 4.0, 4.0, 4.0, 8.0, 8.0, 9.0, 11.0, 17.0, 11.0, 12.0, 15.0, 18.0, 20.0, 17.0, 28.0, 28.0, 31.0, 35.0, 38.0, 38.0, 42.0, 36.0, 36.0, 37.0, 44.0, 33.0, 33.0, 31.0, 35.0, 23.0, 34.0, 30.0, 35.0, 20.0, 19.0, 24.0, 22.0, 14.0, 17.0, 11.0, 13.0, 9.0, 9.0, 7.0, 8.0, 11.0, 4.0, 4.0, 2.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.794132232666016, -35.45803451538086, -34.12193298339844, -32.78583526611328, -31.44973373413086, -30.113636016845703, -28.777536392211914, -27.441436767578125, -26.105337142944336, -24.769237518310547, -23.433137893676758, -22.09703826904297, -20.760940551757812, -19.42483901977539, -18.088741302490234, -16.752641677856445, -15.416542053222656, -14.080442428588867, -12.744342803955078, -11.408244132995605, -10.072144508361816, -8.736044883728027, -7.399946212768555, -6.063846588134766, -4.727746963500977, -3.3916475772857666, -2.0555481910705566, -0.7194490432739258, 0.6166505813598633, 1.9527502059936523, 3.288848876953125, 4.624948501586914, 5.961051940917969, 7.297151565551758, 8.633251190185547, 9.96934986114502, 11.305449485778809, 12.641549110412598, 13.97764778137207, 15.31374740600586, 16.64984703063965, 17.985946655273438, 19.322046279907227, 20.658145904541016, 21.994243621826172, 23.330345153808594, 24.66644287109375, 26.00254249572754, 27.338642120361328, 28.674741744995117, 30.010841369628906, 31.346939086914062, 32.683040618896484, 34.01913833618164, 35.35523986816406, 36.69133758544922, 38.027435302734375, 39.36353302001953, 40.69963455200195, 42.03573226928711, 43.37183380126953, 44.70793151855469, 46.044029235839844, 47.380130767822266, 48.71623229980469]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 13.0, 13.0, 24.0, 26.0, 56.0, 72.0, 129.0, 197.0, 328.0, 491.0, 764.0, 1168.0, 1827.0, 2862.0, 4224.0, 6468.0, 9429.0, 13568.0, 19808.0, 27758.0, 37523.0, 49670.0, 63077.0, 76823.0, 89742.0, 106775.0, 116325.0, 91238.0, 79377.0, 65309.0, 51533.0, 38934.0, 28801.0, 20435.0, 14370.0, 9832.0, 6658.0, 4510.0, 2917.0, 1975.0, 1319.0, 828.0, 522.0, 319.0, 179.0, 135.0, 78.0, 55.0, 27.0, 19.0, 14.0, 12.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-156.75, -151.861328125, -146.97265625, -142.083984375, -137.1953125, -132.306640625, -127.41796875, -122.529296875, -117.640625, -112.751953125, -107.86328125, -102.974609375, -98.0859375, -93.197265625, -88.30859375, -83.419921875, -78.53125, -73.642578125, -68.75390625, -63.865234375, -58.9765625, -54.087890625, -49.19921875, -44.310546875, -39.421875, -34.533203125, -29.64453125, -24.755859375, -19.8671875, -14.978515625, -10.08984375, -5.201171875, -0.3125, 4.576171875, 9.46484375, 14.353515625, 19.2421875, 24.130859375, 29.01953125, 33.908203125, 38.796875, 43.685546875, 48.57421875, 53.462890625, 58.3515625, 63.240234375, 68.12890625, 73.017578125, 77.90625, 82.794921875, 87.68359375, 92.572265625, 97.4609375, 102.349609375, 107.23828125, 112.126953125, 117.015625, 121.904296875, 126.79296875, 131.681640625, 136.5703125, 141.458984375, 146.34765625, 151.236328125, 156.125]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 6.0, 10.0, 13.0, 14.0, 12.0, 21.0, 15.0, 27.0, 33.0, 40.0, 29.0, 34.0, 40.0, 39.0, 41.0, 29.0, 44.0, 67.0, 51.0, 45.0, 44.0, 36.0, 47.0, 32.0, 36.0, 31.0, 26.0, 22.0, 15.0, 19.0, 7.0, 16.0, 15.0, 9.0, 5.0, 4.0, 8.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.8125, -73.2578125, -70.703125, -68.1484375, -65.59375, -63.0390625, -60.484375, -57.9296875, -55.375, -52.8203125, -50.265625, -47.7109375, -45.15625, -42.6015625, -40.046875, -37.4921875, -34.9375, -32.3828125, -29.828125, -27.2734375, -24.71875, -22.1640625, -19.609375, -17.0546875, -14.5, -11.9453125, -9.390625, -6.8359375, -4.28125, -1.7265625, 0.828125, 3.3828125, 5.9375, 8.4921875, 11.046875, 13.6015625, 16.15625, 18.7109375, 21.265625, 23.8203125, 26.375, 28.9296875, 31.484375, 34.0390625, 36.59375, 39.1484375, 41.703125, 44.2578125, 46.8125, 49.3671875, 51.921875, 54.4765625, 57.03125, 59.5859375, 62.140625, 64.6953125, 67.25, 69.8046875, 72.359375, 74.9140625, 77.46875, 80.0234375, 82.578125, 85.1328125, 87.6875]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 3.0, 7.0, 14.0, 32.0, 16.0, 13.0, 30.0, 26.0, 42.0, 48.0, 44.0, 53.0, 56.0, 50.0, 44.0, 59.0, 54.0, 51.0, 45.0, 36.0, 41.0, 29.0, 30.0, 26.0, 17.0, 19.0, 22.0, 21.0, 18.0, 3.0, 10.0, 7.0, 7.0, 2.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-65.42303466796875, -63.57600021362305, -61.728965759277344, -59.881927490234375, -58.03489303588867, -56.18785858154297, -54.340824127197266, -52.49378967285156, -50.646751403808594, -48.79971694946289, -46.95268249511719, -45.10564422607422, -43.258609771728516, -41.41157531738281, -39.56454086303711, -37.717506408691406, -35.87046813964844, -34.023433685302734, -32.17639923095703, -30.329362869262695, -28.48232650756836, -26.635292053222656, -24.788257598876953, -22.941221237182617, -21.094188690185547, -19.247154235839844, -17.400117874145508, -15.553083419799805, -13.706047058105469, -11.859012603759766, -10.011977195739746, -8.164941787719727, -6.317905426025391, -4.470870018005371, -2.6238348484039307, -0.7767996788024902, 1.0702357292175293, 2.9172706604003906, 4.76430606842041, 6.61134147644043, 8.45837688446045, 10.305412292480469, 12.152447700500488, 13.999483108520508, 15.846517562866211, 17.693553924560547, 19.54058837890625, 21.387622833251953, 23.23465919494629, 25.081693649291992, 26.928730010986328, 28.77576446533203, 30.622800827026367, 32.46983337402344, 34.316871643066406, 36.16390609741211, 38.01094055175781, 39.857975006103516, 41.70500946044922, 43.55204772949219, 45.39908218383789, 47.246116638183594, 49.0931510925293, 50.940185546875, 52.78722381591797]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 5.0, 4.0, 5.0, 6.0, 4.0, 4.0, 5.0, 12.0, 11.0, 12.0, 14.0, 19.0, 23.0, 21.0, 28.0, 32.0, 33.0, 30.0, 28.0, 37.0, 43.0, 36.0, 38.0, 54.0, 46.0, 48.0, 36.0, 23.0, 36.0, 30.0, 29.0, 37.0, 23.0, 35.0, 15.0, 19.0, 26.0, 25.0, 16.0, 14.0, 10.0, 9.0, 2.0, 8.0, 2.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-50.88264846801758, -49.40705871582031, -47.93146896362305, -46.45587921142578, -44.98028564453125, -43.504695892333984, -42.02910614013672, -40.55351638793945, -39.07792663574219, -37.60233688354492, -36.126747131347656, -34.651153564453125, -33.17556381225586, -31.699974060058594, -30.224384307861328, -28.748794555664062, -27.27320098876953, -25.797611236572266, -24.322019577026367, -22.8464298248291, -21.370838165283203, -19.895248413085938, -18.419658660888672, -16.944068908691406, -15.468477249145508, -13.992886543273926, -12.517295837402344, -11.041706085205078, -9.566115379333496, -8.090524673461914, -6.614934921264648, -5.139344215393066, -3.6637496948242188, -2.188159227371216, -0.7125687599182129, 0.7630214691162109, 2.238612174987793, 3.714202880859375, 5.189792633056641, 6.665383338928223, 8.140974044799805, 9.616564750671387, 11.092155456542969, 12.567745208740234, 14.043335914611816, 15.518926620483398, 16.994516372680664, 18.470108032226562, 19.945697784423828, 21.421287536621094, 22.896879196166992, 24.372468948364258, 25.848060607910156, 27.323650360107422, 28.799240112304688, 30.274829864501953, 31.75042152404785, 33.22601318359375, 34.701602935791016, 36.17719268798828, 37.65278244018555, 39.12837219238281, 40.603965759277344, 42.07955551147461, 43.555145263671875]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 6.0, 0.0, 9.0, 13.0, 15.0, 32.0, 58.0, 85.0, 139.0, 202.0, 366.0, 617.0, 961.0, 1654.0, 2701.0, 4324.0, 7131.0, 11835.0, 19698.0, 31826.0, 52893.0, 87757.0, 144813.0, 240014.0, 393268.0, 625653.0, 817063.0, 671117.0, 427333.0, 259498.0, 155774.0, 94216.0, 56348.0, 34108.0, 20619.0, 12445.0, 7630.0, 4643.0, 2879.0, 1673.0, 1125.0, 641.0, 427.0, 252.0, 170.0, 98.0, 57.0, 44.0, 20.0, 18.0, 13.0, 8.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-72.75, -70.291015625, -67.83203125, -65.373046875, -62.9140625, -60.455078125, -57.99609375, -55.537109375, -53.078125, -50.619140625, -48.16015625, -45.701171875, -43.2421875, -40.783203125, -38.32421875, -35.865234375, -33.40625, -30.947265625, -28.48828125, -26.029296875, -23.5703125, -21.111328125, -18.65234375, -16.193359375, -13.734375, -11.275390625, -8.81640625, -6.357421875, -3.8984375, -1.439453125, 1.01953125, 3.478515625, 5.9375, 8.396484375, 10.85546875, 13.314453125, 15.7734375, 18.232421875, 20.69140625, 23.150390625, 25.609375, 28.068359375, 30.52734375, 32.986328125, 35.4453125, 37.904296875, 40.36328125, 42.822265625, 45.28125, 47.740234375, 50.19921875, 52.658203125, 55.1171875, 57.576171875, 60.03515625, 62.494140625, 64.953125, 67.412109375, 69.87109375, 72.330078125, 74.7890625, 77.248046875, 79.70703125, 82.166015625, 84.625]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 3.0, 1.0, 5.0, 6.0, 7.0, 3.0, 7.0, 12.0, 14.0, 11.0, 15.0, 15.0, 30.0, 21.0, 29.0, 36.0, 31.0, 34.0, 33.0, 36.0, 35.0, 47.0, 52.0, 47.0, 48.0, 42.0, 32.0, 32.0, 36.0, 33.0, 37.0, 23.0, 33.0, 36.0, 18.0, 17.0, 16.0, 14.0, 16.0, 10.0, 8.0, 7.0, 7.0, 3.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.09375, -41.681640625, -40.26953125, -38.857421875, -37.4453125, -36.033203125, -34.62109375, -33.208984375, -31.796875, -30.384765625, -28.97265625, -27.560546875, -26.1484375, -24.736328125, -23.32421875, -21.912109375, -20.5, -19.087890625, -17.67578125, -16.263671875, -14.8515625, -13.439453125, -12.02734375, -10.615234375, -9.203125, -7.791015625, -6.37890625, -4.966796875, -3.5546875, -2.142578125, -0.73046875, 0.681640625, 2.09375, 3.505859375, 4.91796875, 6.330078125, 7.7421875, 9.154296875, 10.56640625, 11.978515625, 13.390625, 14.802734375, 16.21484375, 17.626953125, 19.0390625, 20.451171875, 21.86328125, 23.275390625, 24.6875, 26.099609375, 27.51171875, 28.923828125, 30.3359375, 31.748046875, 33.16015625, 34.572265625, 35.984375, 37.396484375, 38.80859375, 40.220703125, 41.6328125, 43.044921875, 44.45703125, 45.869140625, 47.28125]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 6.0, 7.0, 19.0, 28.0, 46.0, 57.0, 121.0, 151.0, 266.0, 375.0, 623.0, 993.0, 1590.0, 2507.0, 4097.0, 6662.0, 11216.0, 18623.0, 30088.0, 49947.0, 81719.0, 129107.0, 203494.0, 311466.0, 457373.0, 615137.0, 666599.0, 538384.0, 380723.0, 253529.0, 162996.0, 103030.0, 63514.0, 38639.0, 23834.0, 14575.0, 8728.0, 5461.0, 3263.0, 1994.0, 1229.0, 728.0, 504.0, 309.0, 189.0, 111.0, 83.0, 46.0, 43.0, 26.0, 13.0, 5.0, 9.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-52.125, -50.5087890625, -48.892578125, -47.2763671875, -45.66015625, -44.0439453125, -42.427734375, -40.8115234375, -39.1953125, -37.5791015625, -35.962890625, -34.3466796875, -32.73046875, -31.1142578125, -29.498046875, -27.8818359375, -26.265625, -24.6494140625, -23.033203125, -21.4169921875, -19.80078125, -18.1845703125, -16.568359375, -14.9521484375, -13.3359375, -11.7197265625, -10.103515625, -8.4873046875, -6.87109375, -5.2548828125, -3.638671875, -2.0224609375, -0.40625, 1.2099609375, 2.826171875, 4.4423828125, 6.05859375, 7.6748046875, 9.291015625, 10.9072265625, 12.5234375, 14.1396484375, 15.755859375, 17.3720703125, 18.98828125, 20.6044921875, 22.220703125, 23.8369140625, 25.453125, 27.0693359375, 28.685546875, 30.3017578125, 31.91796875, 33.5341796875, 35.150390625, 36.7666015625, 38.3828125, 39.9990234375, 41.615234375, 43.2314453125, 44.84765625, 46.4638671875, 48.080078125, 49.6962890625, 51.3125]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 3.0, 3.0, 6.0, 9.0, 11.0, 16.0, 17.0, 28.0, 20.0, 34.0, 37.0, 60.0, 69.0, 81.0, 90.0, 101.0, 114.0, 149.0, 167.0, 208.0, 223.0, 194.0, 227.0, 215.0, 214.0, 230.0, 228.0, 201.0, 179.0, 138.0, 119.0, 129.0, 102.0, 83.0, 74.0, 64.0, 43.0, 37.0, 27.0, 27.0, 20.0, 18.0, 19.0, 9.0, 3.0, 8.0, 5.0, 6.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-20.640625, -19.992919921875, -19.34521484375, -18.697509765625, -18.0498046875, -17.402099609375, -16.75439453125, -16.106689453125, -15.458984375, -14.811279296875, -14.16357421875, -13.515869140625, -12.8681640625, -12.220458984375, -11.57275390625, -10.925048828125, -10.27734375, -9.629638671875, -8.98193359375, -8.334228515625, -7.6865234375, -7.038818359375, -6.39111328125, -5.743408203125, -5.095703125, -4.447998046875, -3.80029296875, -3.152587890625, -2.5048828125, -1.857177734375, -1.20947265625, -0.561767578125, 0.0859375, 0.733642578125, 1.38134765625, 2.029052734375, 2.6767578125, 3.324462890625, 3.97216796875, 4.619873046875, 5.267578125, 5.915283203125, 6.56298828125, 7.210693359375, 7.8583984375, 8.506103515625, 9.15380859375, 9.801513671875, 10.44921875, 11.096923828125, 11.74462890625, 12.392333984375, 13.0400390625, 13.687744140625, 14.33544921875, 14.983154296875, 15.630859375, 16.278564453125, 16.92626953125, 17.573974609375, 18.2216796875, 18.869384765625, 19.51708984375, 20.164794921875, 20.8125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 3.0, 3.0, 5.0, 6.0, 11.0, 17.0, 10.0, 16.0, 24.0, 29.0, 34.0, 32.0, 45.0, 58.0, 47.0, 58.0, 58.0, 58.0, 55.0, 52.0, 64.0, 52.0, 30.0, 43.0, 32.0, 19.0, 29.0, 29.0, 21.0, 12.0, 8.0, 16.0, 7.0, 6.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.025115966796875, -51.130428314208984, -49.23573684692383, -47.34104919433594, -45.44636154174805, -43.551673889160156, -41.656982421875, -39.76229476928711, -37.86760711669922, -35.97291946411133, -34.07822799682617, -32.18354034423828, -30.28885269165039, -28.394163131713867, -26.499473571777344, -24.604785919189453, -22.71009635925293, -20.815406799316406, -18.920719146728516, -17.026029586791992, -15.131341934204102, -13.236652374267578, -11.341963768005371, -9.447275161743164, -7.552586555480957, -5.65789794921875, -3.763209104537964, -1.8685202598571777, 0.026168346405029297, 1.9208574295043945, 3.8155460357666016, 5.710234642028809, 7.604923248291016, 9.499611854553223, 11.39430046081543, 13.288990020751953, 15.183677673339844, 17.078367233276367, 18.97305679321289, 20.86774444580078, 22.762432098388672, 24.657121658325195, 26.551809310913086, 28.44649887084961, 30.3411865234375, 32.235877990722656, 34.13056564331055, 36.02525329589844, 37.919944763183594, 39.814632415771484, 41.70932388305664, 43.60401153564453, 45.49869918823242, 47.39338684082031, 49.28807830810547, 51.18276596069336, 53.07745361328125, 54.97214126586914, 56.8668327331543, 58.76152038574219, 60.65620803833008, 62.55089569091797, 64.44558715820312, 66.34027099609375, 68.2349624633789]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 8.0, 4.0, 14.0, 8.0, 16.0, 15.0, 23.0, 25.0, 27.0, 20.0, 41.0, 42.0, 39.0, 38.0, 33.0, 45.0, 40.0, 44.0, 42.0, 54.0, 39.0, 33.0, 46.0, 49.0, 27.0, 36.0, 30.0, 19.0, 23.0, 22.0, 15.0, 16.0, 13.0, 10.0, 10.0, 10.0, 6.0, 9.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-51.110984802246094, -49.5527458190918, -47.9945068359375, -46.4362678527832, -44.878028869628906, -43.319786071777344, -41.76155090332031, -40.20330810546875, -38.64506912231445, -37.086830139160156, -35.52859115600586, -33.97035217285156, -32.412113189697266, -30.853872299194336, -29.29563331604004, -27.73739242553711, -26.179155349731445, -24.62091636657715, -23.06267738342285, -21.504436492919922, -19.946197509765625, -18.387958526611328, -16.82971954345703, -15.271479606628418, -13.713240623474121, -12.155001640319824, -10.596761703491211, -9.038522720336914, -7.480283260345459, -5.922043800354004, -4.363804817199707, -2.8055648803710938, -1.2473258972167969, 0.31091344356536865, 1.8691527843475342, 3.42739200592041, 4.985631465911865, 6.54387092590332, 8.102109909057617, 9.66034984588623, 11.218588829040527, 12.776827812194824, 14.335067749023438, 15.893306732177734, 17.45154571533203, 19.009784698486328, 20.568023681640625, 22.126264572143555, 23.68450355529785, 25.24274253845215, 26.800981521606445, 28.359222412109375, 29.917461395263672, 31.47570037841797, 33.033939361572266, 34.59217834472656, 36.15041732788086, 37.708656311035156, 39.26689529418945, 40.82513427734375, 42.38337326049805, 43.941612243652344, 45.499855041503906, 47.0580940246582, 48.6163330078125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 3.0, 4.0, 15.0, 23.0, 32.0, 44.0, 73.0, 96.0, 157.0, 248.0, 396.0, 589.0, 920.0, 1469.0, 2392.0, 3856.0, 6127.0, 10113.0, 16022.0, 25536.0, 41061.0, 64380.0, 99191.0, 141595.0, 167529.0, 152642.0, 112334.0, 74454.0, 47626.0, 30105.0, 18746.0, 11643.0, 7161.0, 4525.0, 2804.0, 1726.0, 1059.0, 675.0, 424.0, 261.0, 175.0, 113.0, 71.0, 50.0, 39.0, 16.0, 19.0, 14.0, 6.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.0625, -67.77734375, -65.4921875, -63.20703125, -60.921875, -58.63671875, -56.3515625, -54.06640625, -51.78125, -49.49609375, -47.2109375, -44.92578125, -42.640625, -40.35546875, -38.0703125, -35.78515625, -33.5, -31.21484375, -28.9296875, -26.64453125, -24.359375, -22.07421875, -19.7890625, -17.50390625, -15.21875, -12.93359375, -10.6484375, -8.36328125, -6.078125, -3.79296875, -1.5078125, 0.77734375, 3.0625, 5.34765625, 7.6328125, 9.91796875, 12.203125, 14.48828125, 16.7734375, 19.05859375, 21.34375, 23.62890625, 25.9140625, 28.19921875, 30.484375, 32.76953125, 35.0546875, 37.33984375, 39.625, 41.91015625, 44.1953125, 46.48046875, 48.765625, 51.05078125, 53.3359375, 55.62109375, 57.90625, 60.19140625, 62.4765625, 64.76171875, 67.046875, 69.33203125, 71.6171875, 73.90234375, 76.1875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 2.0, 4.0, 4.0, 8.0, 8.0, 9.0, 14.0, 15.0, 15.0, 19.0, 25.0, 32.0, 34.0, 38.0, 37.0, 34.0, 42.0, 49.0, 42.0, 35.0, 37.0, 38.0, 48.0, 39.0, 32.0, 42.0, 44.0, 43.0, 29.0, 43.0, 24.0, 24.0, 15.0, 15.0, 17.0, 6.0, 12.0, 8.0, 8.0, 4.0, 2.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.8125, -47.40771484375, -46.0029296875, -44.59814453125, -43.193359375, -41.78857421875, -40.3837890625, -38.97900390625, -37.57421875, -36.16943359375, -34.7646484375, -33.35986328125, -31.955078125, -30.55029296875, -29.1455078125, -27.74072265625, -26.3359375, -24.93115234375, -23.5263671875, -22.12158203125, -20.716796875, -19.31201171875, -17.9072265625, -16.50244140625, -15.09765625, -13.69287109375, -12.2880859375, -10.88330078125, -9.478515625, -8.07373046875, -6.6689453125, -5.26416015625, -3.859375, -2.45458984375, -1.0498046875, 0.35498046875, 1.759765625, 3.16455078125, 4.5693359375, 5.97412109375, 7.37890625, 8.78369140625, 10.1884765625, 11.59326171875, 12.998046875, 14.40283203125, 15.8076171875, 17.21240234375, 18.6171875, 20.02197265625, 21.4267578125, 22.83154296875, 24.236328125, 25.64111328125, 27.0458984375, 28.45068359375, 29.85546875, 31.26025390625, 32.6650390625, 34.06982421875, 35.474609375, 36.87939453125, 38.2841796875, 39.68896484375, 41.09375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 4.0, 14.0, 13.0, 26.0, 37.0, 72.0, 92.0, 107.0, 181.0, 215.0, 342.0, 490.0, 779.0, 1210.0, 1768.0, 2678.0, 4109.0, 6199.0, 10165.0, 15909.0, 25812.0, 43268.0, 75312.0, 130976.0, 204790.0, 204443.0, 131067.0, 75118.0, 43207.0, 25931.0, 15873.0, 9891.0, 6455.0, 4074.0, 2661.0, 1782.0, 1066.0, 750.0, 507.0, 349.0, 232.0, 181.0, 118.0, 96.0, 60.0, 39.0, 27.0, 21.0, 17.0, 7.0, 7.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-86.1875, -83.4072265625, -80.626953125, -77.8466796875, -75.06640625, -72.2861328125, -69.505859375, -66.7255859375, -63.9453125, -61.1650390625, -58.384765625, -55.6044921875, -52.82421875, -50.0439453125, -47.263671875, -44.4833984375, -41.703125, -38.9228515625, -36.142578125, -33.3623046875, -30.58203125, -27.8017578125, -25.021484375, -22.2412109375, -19.4609375, -16.6806640625, -13.900390625, -11.1201171875, -8.33984375, -5.5595703125, -2.779296875, 0.0009765625, 2.78125, 5.5615234375, 8.341796875, 11.1220703125, 13.90234375, 16.6826171875, 19.462890625, 22.2431640625, 25.0234375, 27.8037109375, 30.583984375, 33.3642578125, 36.14453125, 38.9248046875, 41.705078125, 44.4853515625, 47.265625, 50.0458984375, 52.826171875, 55.6064453125, 58.38671875, 61.1669921875, 63.947265625, 66.7275390625, 69.5078125, 72.2880859375, 75.068359375, 77.8486328125, 80.62890625, 83.4091796875, 86.189453125, 88.9697265625, 91.75]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 4.0, 8.0, 10.0, 6.0, 14.0, 21.0, 14.0, 15.0, 21.0, 18.0, 24.0, 30.0, 26.0, 31.0, 26.0, 41.0, 39.0, 43.0, 35.0, 50.0, 42.0, 52.0, 41.0, 33.0, 35.0, 45.0, 37.0, 33.0, 28.0, 22.0, 29.0, 28.0, 17.0, 15.0, 15.0, 14.0, 13.0, 9.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.953125, -28.998046875, -28.04296875, -27.087890625, -26.1328125, -25.177734375, -24.22265625, -23.267578125, -22.3125, -21.357421875, -20.40234375, -19.447265625, -18.4921875, -17.537109375, -16.58203125, -15.626953125, -14.671875, -13.716796875, -12.76171875, -11.806640625, -10.8515625, -9.896484375, -8.94140625, -7.986328125, -7.03125, -6.076171875, -5.12109375, -4.166015625, -3.2109375, -2.255859375, -1.30078125, -0.345703125, 0.609375, 1.564453125, 2.51953125, 3.474609375, 4.4296875, 5.384765625, 6.33984375, 7.294921875, 8.25, 9.205078125, 10.16015625, 11.115234375, 12.0703125, 13.025390625, 13.98046875, 14.935546875, 15.890625, 16.845703125, 17.80078125, 18.755859375, 19.7109375, 20.666015625, 21.62109375, 22.576171875, 23.53125, 24.486328125, 25.44140625, 26.396484375, 27.3515625, 28.306640625, 29.26171875, 30.216796875, 31.171875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 7.0, 8.0, 11.0, 20.0, 20.0, 33.0, 32.0, 59.0, 86.0, 143.0, 202.0, 262.0, 384.0, 597.0, 883.0, 1433.0, 2373.0, 3931.0, 7266.0, 13785.0, 28084.0, 61056.0, 138088.0, 277547.0, 267570.0, 130051.0, 57779.0, 26888.0, 12982.0, 6872.0, 3877.0, 2180.0, 1405.0, 841.0, 563.0, 378.0, 267.0, 187.0, 110.0, 96.0, 58.0, 41.0, 33.0, 25.0, 12.0, 11.0, 11.0, 7.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-52.40625, -50.6572265625, -48.908203125, -47.1591796875, -45.41015625, -43.6611328125, -41.912109375, -40.1630859375, -38.4140625, -36.6650390625, -34.916015625, -33.1669921875, -31.41796875, -29.6689453125, -27.919921875, -26.1708984375, -24.421875, -22.6728515625, -20.923828125, -19.1748046875, -17.42578125, -15.6767578125, -13.927734375, -12.1787109375, -10.4296875, -8.6806640625, -6.931640625, -5.1826171875, -3.43359375, -1.6845703125, 0.064453125, 1.8134765625, 3.5625, 5.3115234375, 7.060546875, 8.8095703125, 10.55859375, 12.3076171875, 14.056640625, 15.8056640625, 17.5546875, 19.3037109375, 21.052734375, 22.8017578125, 24.55078125, 26.2998046875, 28.048828125, 29.7978515625, 31.546875, 33.2958984375, 35.044921875, 36.7939453125, 38.54296875, 40.2919921875, 42.041015625, 43.7900390625, 45.5390625, 47.2880859375, 49.037109375, 50.7861328125, 52.53515625, 54.2841796875, 56.033203125, 57.7822265625, 59.53125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 8.0, 4.0, 2.0, 5.0, 7.0, 10.0, 12.0, 20.0, 31.0, 35.0, 71.0, 92.0, 128.0, 149.0, 134.0, 93.0, 67.0, 39.0, 30.0, 19.0, 11.0, 8.0, 7.0, 7.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.007198333740234375, -0.007005929946899414, -0.006813526153564453, -0.006621122360229492, -0.006428718566894531, -0.00623631477355957, -0.006043910980224609, -0.0058515071868896484, -0.0056591033935546875, -0.0054666996002197266, -0.005274295806884766, -0.005081892013549805, -0.004889488220214844, -0.004697084426879883, -0.004504680633544922, -0.004312276840209961, -0.004119873046875, -0.003927469253540039, -0.003735065460205078, -0.003542661666870117, -0.0033502578735351562, -0.0031578540802001953, -0.0029654502868652344, -0.0027730464935302734, -0.0025806427001953125, -0.0023882389068603516, -0.0021958351135253906, -0.0020034313201904297, -0.0018110275268554688, -0.0016186237335205078, -0.0014262199401855469, -0.001233816146850586, -0.001041412353515625, -0.0008490085601806641, -0.0006566047668457031, -0.0004642009735107422, -0.00027179718017578125, -7.939338684082031e-05, 0.00011301040649414062, 0.00030541419982910156, 0.0004978179931640625, 0.0006902217864990234, 0.0008826255798339844, 0.0010750293731689453, 0.0012674331665039062, 0.0014598369598388672, 0.0016522407531738281, 0.001844644546508789, 0.00203704833984375, 0.002229452133178711, 0.002421855926513672, 0.002614259719848633, 0.0028066635131835938, 0.0029990673065185547, 0.0031914710998535156, 0.0033838748931884766, 0.0035762786865234375, 0.0037686824798583984, 0.003961086273193359, 0.00415349006652832, 0.004345893859863281, 0.004538297653198242, 0.004730701446533203, 0.004923105239868164, 0.005115509033203125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 10.0, 10.0, 10.0, 17.0, 18.0, 31.0, 41.0, 45.0, 82.0, 104.0, 154.0, 186.0, 235.0, 395.0, 515.0, 709.0, 1013.0, 1583.0, 2290.0, 3754.0, 6352.0, 11129.0, 20777.0, 42057.0, 85285.0, 160447.0, 234828.0, 212059.0, 127680.0, 64996.0, 31925.0, 16417.0, 8811.0, 5042.0, 3152.0, 1983.0, 1323.0, 885.0, 655.0, 410.0, 332.0, 203.0, 171.0, 125.0, 97.0, 60.0, 42.0, 39.0, 30.0, 17.0, 8.0, 5.0, 9.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0], "bins": [-58.9375, -57.08447265625, -55.2314453125, -53.37841796875, -51.525390625, -49.67236328125, -47.8193359375, -45.96630859375, -44.11328125, -42.26025390625, -40.4072265625, -38.55419921875, -36.701171875, -34.84814453125, -32.9951171875, -31.14208984375, -29.2890625, -27.43603515625, -25.5830078125, -23.72998046875, -21.876953125, -20.02392578125, -18.1708984375, -16.31787109375, -14.46484375, -12.61181640625, -10.7587890625, -8.90576171875, -7.052734375, -5.19970703125, -3.3466796875, -1.49365234375, 0.359375, 2.21240234375, 4.0654296875, 5.91845703125, 7.771484375, 9.62451171875, 11.4775390625, 13.33056640625, 15.18359375, 17.03662109375, 18.8896484375, 20.74267578125, 22.595703125, 24.44873046875, 26.3017578125, 28.15478515625, 30.0078125, 31.86083984375, 33.7138671875, 35.56689453125, 37.419921875, 39.27294921875, 41.1259765625, 42.97900390625, 44.83203125, 46.68505859375, 48.5380859375, 50.39111328125, 52.244140625, 54.09716796875, 55.9501953125, 57.80322265625, 59.65625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 3.0, 7.0, 5.0, 5.0, 7.0, 13.0, 11.0, 16.0, 29.0, 38.0, 46.0, 65.0, 78.0, 77.0, 69.0, 91.0, 65.0, 74.0, 53.0, 55.0, 46.0, 34.0, 33.0, 23.0, 14.0, 7.0, 7.0, 8.0, 4.0, 3.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.375, -23.684326171875, -22.99365234375, -22.302978515625, -21.6123046875, -20.921630859375, -20.23095703125, -19.540283203125, -18.849609375, -18.158935546875, -17.46826171875, -16.777587890625, -16.0869140625, -15.396240234375, -14.70556640625, -14.014892578125, -13.32421875, -12.633544921875, -11.94287109375, -11.252197265625, -10.5615234375, -9.870849609375, -9.18017578125, -8.489501953125, -7.798828125, -7.108154296875, -6.41748046875, -5.726806640625, -5.0361328125, -4.345458984375, -3.65478515625, -2.964111328125, -2.2734375, -1.582763671875, -0.89208984375, -0.201416015625, 0.4892578125, 1.179931640625, 1.87060546875, 2.561279296875, 3.251953125, 3.942626953125, 4.63330078125, 5.323974609375, 6.0146484375, 6.705322265625, 7.39599609375, 8.086669921875, 8.77734375, 9.468017578125, 10.15869140625, 10.849365234375, 11.5400390625, 12.230712890625, 12.92138671875, 13.612060546875, 14.302734375, 14.993408203125, 15.68408203125, 16.374755859375, 17.0654296875, 17.756103515625, 18.44677734375, 19.137451171875, 19.828125]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 10.0, 8.0, 11.0, 12.0, 8.0, 20.0, 20.0, 27.0, 36.0, 38.0, 47.0, 42.0, 46.0, 48.0, 54.0, 59.0, 65.0, 41.0, 61.0, 45.0, 43.0, 37.0, 24.0, 37.0, 33.0, 20.0, 19.0, 16.0, 11.0, 14.0, 10.0, 5.0, 6.0, 2.0, 4.0, 3.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.323360443115234, -46.77022171020508, -45.21708297729492, -43.663944244384766, -42.110809326171875, -40.55767059326172, -39.00453186035156, -37.451393127441406, -35.89825439453125, -34.345115661621094, -32.79197692871094, -31.238840103149414, -29.685701370239258, -28.1325626373291, -26.579425811767578, -25.026287078857422, -23.473148345947266, -21.92000961303711, -20.366870880126953, -18.81373405456543, -17.260595321655273, -15.707456588745117, -14.154318809509277, -12.601181030273438, -11.048042297363281, -9.494903564453125, -7.941765785217285, -6.388627529144287, -4.835489273071289, -3.282351016998291, -1.729212760925293, -0.17607498168945312, 1.3770599365234375, 2.9301981925964355, 4.483336448669434, 6.036474704742432, 7.58961296081543, 9.142751693725586, 10.695889472961426, 12.249027252197266, 13.802165985107422, 15.355304718017578, 16.908443450927734, 18.461580276489258, 20.014719009399414, 21.56785774230957, 23.120994567871094, 24.67413330078125, 26.227272033691406, 27.780410766601562, 29.33354949951172, 30.886686325073242, 32.43982696533203, 33.99296188354492, 35.54610061645508, 37.099239349365234, 38.65237808227539, 40.20551681518555, 41.7586555480957, 43.31179428100586, 44.86492919921875, 46.418067932128906, 47.97120666503906, 49.52434539794922, 51.077484130859375]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 7.0, 6.0, 12.0, 10.0, 15.0, 15.0, 21.0, 18.0, 23.0, 28.0, 28.0, 33.0, 41.0, 38.0, 45.0, 24.0, 31.0, 42.0, 44.0, 43.0, 41.0, 43.0, 40.0, 39.0, 28.0, 46.0, 32.0, 21.0, 26.0, 21.0, 26.0, 19.0, 18.0, 10.0, 11.0, 10.0, 9.0, 13.0, 7.0, 8.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.124786376953125, -38.834556579589844, -37.54433059692383, -36.25410079956055, -34.963871002197266, -33.67364501953125, -32.38341522216797, -31.093185424804688, -29.80295753479004, -28.51272964477539, -27.22249984741211, -25.93227195739746, -24.642044067382812, -23.35181427001953, -22.061586380004883, -20.771358489990234, -19.481128692626953, -18.190900802612305, -16.900671005249023, -15.610443115234375, -14.32021427154541, -13.029985427856445, -11.739757537841797, -10.449528694152832, -9.159299850463867, -7.869071006774902, -6.578842639923096, -5.288614273071289, -3.998385429382324, -2.7081565856933594, -1.4179282188415527, -0.1276998519897461, 1.1625289916992188, 2.4527575969696045, 3.7429862022399902, 5.033214569091797, 6.323443412780762, 7.613672256469727, 8.903900146484375, 10.19412899017334, 11.484357833862305, 12.77458667755127, 14.064815521240234, 15.355043411254883, 16.64527130126953, 17.935501098632812, 19.22572898864746, 20.51595687866211, 21.80618667602539, 23.09641456604004, 24.38664436340332, 25.67687225341797, 26.96710205078125, 28.2573299407959, 29.547557830810547, 30.837787628173828, 32.128013610839844, 33.418243408203125, 34.70846939086914, 35.99869918823242, 37.2889289855957, 38.57915496826172, 39.869384765625, 41.15961456298828, 42.44984436035156]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 6.0, 10.0, 22.0, 25.0, 34.0, 65.0, 92.0, 124.0, 219.0, 334.0, 530.0, 757.0, 1176.0, 1829.0, 2873.0, 4350.0, 6533.0, 9795.0, 14543.0, 21615.0, 30894.0, 43421.0, 58789.0, 77051.0, 95229.0, 109021.0, 113198.0, 106108.0, 91761.0, 73891.0, 55727.0, 40390.0, 28460.0, 19735.0, 13406.0, 8986.0, 6073.0, 3986.0, 2581.0, 1672.0, 1154.0, 748.0, 475.0, 305.0, 220.0, 132.0, 79.0, 54.0, 33.0, 20.0, 12.0, 11.0, 4.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.71875, -44.16357421875, -42.6083984375, -41.05322265625, -39.498046875, -37.94287109375, -36.3876953125, -34.83251953125, -33.27734375, -31.72216796875, -30.1669921875, -28.61181640625, -27.056640625, -25.50146484375, -23.9462890625, -22.39111328125, -20.8359375, -19.28076171875, -17.7255859375, -16.17041015625, -14.615234375, -13.06005859375, -11.5048828125, -9.94970703125, -8.39453125, -6.83935546875, -5.2841796875, -3.72900390625, -2.173828125, -0.61865234375, 0.9365234375, 2.49169921875, 4.046875, 5.60205078125, 7.1572265625, 8.71240234375, 10.267578125, 11.82275390625, 13.3779296875, 14.93310546875, 16.48828125, 18.04345703125, 19.5986328125, 21.15380859375, 22.708984375, 24.26416015625, 25.8193359375, 27.37451171875, 28.9296875, 30.48486328125, 32.0400390625, 33.59521484375, 35.150390625, 36.70556640625, 38.2607421875, 39.81591796875, 41.37109375, 42.92626953125, 44.4814453125, 46.03662109375, 47.591796875, 49.14697265625, 50.7021484375, 52.25732421875, 53.8125]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 5.0, 6.0, 8.0, 8.0, 11.0, 13.0, 16.0, 22.0, 24.0, 27.0, 23.0, 20.0, 42.0, 39.0, 32.0, 40.0, 30.0, 41.0, 36.0, 47.0, 40.0, 41.0, 43.0, 38.0, 33.0, 43.0, 28.0, 36.0, 25.0, 20.0, 30.0, 18.0, 23.0, 15.0, 20.0, 11.0, 9.0, 9.0, 5.0, 5.0, 4.0, 5.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.71875, -39.4833984375, -38.248046875, -37.0126953125, -35.77734375, -34.5419921875, -33.306640625, -32.0712890625, -30.8359375, -29.6005859375, -28.365234375, -27.1298828125, -25.89453125, -24.6591796875, -23.423828125, -22.1884765625, -20.953125, -19.7177734375, -18.482421875, -17.2470703125, -16.01171875, -14.7763671875, -13.541015625, -12.3056640625, -11.0703125, -9.8349609375, -8.599609375, -7.3642578125, -6.12890625, -4.8935546875, -3.658203125, -2.4228515625, -1.1875, 0.0478515625, 1.283203125, 2.5185546875, 3.75390625, 4.9892578125, 6.224609375, 7.4599609375, 8.6953125, 9.9306640625, 11.166015625, 12.4013671875, 13.63671875, 14.8720703125, 16.107421875, 17.3427734375, 18.578125, 19.8134765625, 21.048828125, 22.2841796875, 23.51953125, 24.7548828125, 25.990234375, 27.2255859375, 28.4609375, 29.6962890625, 30.931640625, 32.1669921875, 33.40234375, 34.6376953125, 35.873046875, 37.1083984375, 38.34375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 8.0, 12.0, 17.0, 24.0, 33.0, 55.0, 71.0, 142.0, 207.0, 381.0, 584.0, 1000.0, 1550.0, 2660.0, 4235.0, 6869.0, 10683.0, 16924.0, 26056.0, 39306.0, 56705.0, 77478.0, 99242.0, 116452.0, 122375.0, 116808.0, 100090.0, 78909.0, 57618.0, 39550.0, 26481.0, 17060.0, 10829.0, 6885.0, 4226.0, 2632.0, 1666.0, 1041.0, 657.0, 371.0, 259.0, 138.0, 121.0, 67.0, 30.0, 17.0, 20.0, 7.0, 12.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.09375, -47.5361328125, -45.978515625, -44.4208984375, -42.86328125, -41.3056640625, -39.748046875, -38.1904296875, -36.6328125, -35.0751953125, -33.517578125, -31.9599609375, -30.40234375, -28.8447265625, -27.287109375, -25.7294921875, -24.171875, -22.6142578125, -21.056640625, -19.4990234375, -17.94140625, -16.3837890625, -14.826171875, -13.2685546875, -11.7109375, -10.1533203125, -8.595703125, -7.0380859375, -5.48046875, -3.9228515625, -2.365234375, -0.8076171875, 0.75, 2.3076171875, 3.865234375, 5.4228515625, 6.98046875, 8.5380859375, 10.095703125, 11.6533203125, 13.2109375, 14.7685546875, 16.326171875, 17.8837890625, 19.44140625, 20.9990234375, 22.556640625, 24.1142578125, 25.671875, 27.2294921875, 28.787109375, 30.3447265625, 31.90234375, 33.4599609375, 35.017578125, 36.5751953125, 38.1328125, 39.6904296875, 41.248046875, 42.8056640625, 44.36328125, 45.9208984375, 47.478515625, 49.0361328125, 50.59375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 2.0, 4.0, 7.0, 7.0, 11.0, 8.0, 14.0, 14.0, 14.0, 30.0, 31.0, 35.0, 38.0, 36.0, 41.0, 46.0, 42.0, 48.0, 41.0, 44.0, 33.0, 47.0, 41.0, 41.0, 44.0, 39.0, 32.0, 28.0, 21.0, 25.0, 21.0, 24.0, 12.0, 14.0, 12.0, 9.0, 13.0, 10.0, 8.0, 4.0, 7.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.65625, -25.7744140625, -24.892578125, -24.0107421875, -23.12890625, -22.2470703125, -21.365234375, -20.4833984375, -19.6015625, -18.7197265625, -17.837890625, -16.9560546875, -16.07421875, -15.1923828125, -14.310546875, -13.4287109375, -12.546875, -11.6650390625, -10.783203125, -9.9013671875, -9.01953125, -8.1376953125, -7.255859375, -6.3740234375, -5.4921875, -4.6103515625, -3.728515625, -2.8466796875, -1.96484375, -1.0830078125, -0.201171875, 0.6806640625, 1.5625, 2.4443359375, 3.326171875, 4.2080078125, 5.08984375, 5.9716796875, 6.853515625, 7.7353515625, 8.6171875, 9.4990234375, 10.380859375, 11.2626953125, 12.14453125, 13.0263671875, 13.908203125, 14.7900390625, 15.671875, 16.5537109375, 17.435546875, 18.3173828125, 19.19921875, 20.0810546875, 20.962890625, 21.8447265625, 22.7265625, 23.6083984375, 24.490234375, 25.3720703125, 26.25390625, 27.1357421875, 28.017578125, 28.8994140625, 29.78125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 4.0, 7.0, 10.0, 12.0, 10.0, 20.0, 24.0, 26.0, 50.0, 82.0, 110.0, 180.0, 264.0, 447.0, 674.0, 1102.0, 1866.0, 3084.0, 5350.0, 9154.0, 16577.0, 30117.0, 55293.0, 96902.0, 152385.0, 191425.0, 180564.0, 128160.0, 76956.0, 43129.0, 23697.0, 12963.0, 7333.0, 4182.0, 2379.0, 1464.0, 902.0, 575.0, 379.0, 247.0, 132.0, 99.0, 74.0, 42.0, 34.0, 27.0, 17.0, 13.0, 7.0, 6.0, 1.0, 5.0, 0.0, 1.0, 0.0, 2.0], "bins": [-32.4375, -31.4775390625, -30.517578125, -29.5576171875, -28.59765625, -27.6376953125, -26.677734375, -25.7177734375, -24.7578125, -23.7978515625, -22.837890625, -21.8779296875, -20.91796875, -19.9580078125, -18.998046875, -18.0380859375, -17.078125, -16.1181640625, -15.158203125, -14.1982421875, -13.23828125, -12.2783203125, -11.318359375, -10.3583984375, -9.3984375, -8.4384765625, -7.478515625, -6.5185546875, -5.55859375, -4.5986328125, -3.638671875, -2.6787109375, -1.71875, -0.7587890625, 0.201171875, 1.1611328125, 2.12109375, 3.0810546875, 4.041015625, 5.0009765625, 5.9609375, 6.9208984375, 7.880859375, 8.8408203125, 9.80078125, 10.7607421875, 11.720703125, 12.6806640625, 13.640625, 14.6005859375, 15.560546875, 16.5205078125, 17.48046875, 18.4404296875, 19.400390625, 20.3603515625, 21.3203125, 22.2802734375, 23.240234375, 24.2001953125, 25.16015625, 26.1201171875, 27.080078125, 28.0400390625, 29.0]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 6.0, 11.0, 8.0, 7.0, 12.0, 14.0, 33.0, 21.0, 35.0, 44.0, 51.0, 63.0, 73.0, 79.0, 72.0, 90.0, 71.0, 64.0, 51.0, 49.0, 34.0, 33.0, 18.0, 21.0, 14.0, 11.0, 7.0, 6.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00359344482421875, -0.0034618377685546875, -0.003330230712890625, -0.0031986236572265625, -0.0030670166015625, -0.0029354095458984375, -0.002803802490234375, -0.0026721954345703125, -0.00254058837890625, -0.0024089813232421875, -0.002277374267578125, -0.0021457672119140625, -0.00201416015625, -0.0018825531005859375, -0.001750946044921875, -0.0016193389892578125, -0.00148773193359375, -0.0013561248779296875, -0.001224517822265625, -0.0010929107666015625, -0.0009613037109375, -0.0008296966552734375, -0.000698089599609375, -0.0005664825439453125, -0.00043487548828125, -0.0003032684326171875, -0.000171661376953125, -4.00543212890625e-05, 9.1552734375e-05, 0.0002231597900390625, 0.000354766845703125, 0.0004863739013671875, 0.00061798095703125, 0.0007495880126953125, 0.000881195068359375, 0.0010128021240234375, 0.0011444091796875, 0.0012760162353515625, 0.001407623291015625, 0.0015392303466796875, 0.00167083740234375, 0.0018024444580078125, 0.001934051513671875, 0.0020656585693359375, 0.002197265625, 0.0023288726806640625, 0.002460479736328125, 0.0025920867919921875, 0.00272369384765625, 0.0028553009033203125, 0.002986907958984375, 0.0031185150146484375, 0.0032501220703125, 0.0033817291259765625, 0.003513336181640625, 0.0036449432373046875, 0.00377655029296875, 0.0039081573486328125, 0.004039764404296875, 0.0041713714599609375, 0.004302978515625, 0.0044345855712890625, 0.004566192626953125, 0.0046977996826171875, 0.00482940673828125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 9.0, 9.0, 11.0, 17.0, 22.0, 55.0, 66.0, 91.0, 177.0, 327.0, 505.0, 915.0, 1496.0, 2697.0, 4865.0, 8771.0, 15906.0, 28275.0, 50341.0, 86621.0, 137645.0, 181689.0, 182552.0, 138966.0, 88788.0, 51775.0, 29160.0, 16305.0, 8878.0, 4953.0, 2863.0, 1590.0, 904.0, 521.0, 327.0, 165.0, 112.0, 67.0, 41.0, 28.0, 19.0, 14.0, 6.0, 8.0, 8.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-31.0625, -30.175537109375, -29.28857421875, -28.401611328125, -27.5146484375, -26.627685546875, -25.74072265625, -24.853759765625, -23.966796875, -23.079833984375, -22.19287109375, -21.305908203125, -20.4189453125, -19.531982421875, -18.64501953125, -17.758056640625, -16.87109375, -15.984130859375, -15.09716796875, -14.210205078125, -13.3232421875, -12.436279296875, -11.54931640625, -10.662353515625, -9.775390625, -8.888427734375, -8.00146484375, -7.114501953125, -6.2275390625, -5.340576171875, -4.45361328125, -3.566650390625, -2.6796875, -1.792724609375, -0.90576171875, -0.018798828125, 0.8681640625, 1.755126953125, 2.64208984375, 3.529052734375, 4.416015625, 5.302978515625, 6.18994140625, 7.076904296875, 7.9638671875, 8.850830078125, 9.73779296875, 10.624755859375, 11.51171875, 12.398681640625, 13.28564453125, 14.172607421875, 15.0595703125, 15.946533203125, 16.83349609375, 17.720458984375, 18.607421875, 19.494384765625, 20.38134765625, 21.268310546875, 22.1552734375, 23.042236328125, 23.92919921875, 24.816162109375, 25.703125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 5.0, 4.0, 16.0, 8.0, 6.0, 13.0, 16.0, 21.0, 23.0, 23.0, 21.0, 35.0, 32.0, 36.0, 44.0, 38.0, 39.0, 41.0, 51.0, 39.0, 51.0, 38.0, 43.0, 27.0, 34.0, 37.0, 34.0, 18.0, 31.0, 19.0, 17.0, 21.0, 25.0, 17.0, 6.0, 13.0, 15.0, 7.0, 7.0, 1.0, 8.0, 1.0, 4.0, 4.0, 4.0, 3.0, 2.0], "bins": [-8.2265625, -8.0003662109375, -7.774169921875, -7.5479736328125, -7.32177734375, -7.0955810546875, -6.869384765625, -6.6431884765625, -6.4169921875, -6.1907958984375, -5.964599609375, -5.7384033203125, -5.51220703125, -5.2860107421875, -5.059814453125, -4.8336181640625, -4.607421875, -4.3812255859375, -4.155029296875, -3.9288330078125, -3.70263671875, -3.4764404296875, -3.250244140625, -3.0240478515625, -2.7978515625, -2.5716552734375, -2.345458984375, -2.1192626953125, -1.89306640625, -1.6668701171875, -1.440673828125, -1.2144775390625, -0.98828125, -0.7620849609375, -0.535888671875, -0.3096923828125, -0.08349609375, 0.1427001953125, 0.368896484375, 0.5950927734375, 0.8212890625, 1.0474853515625, 1.273681640625, 1.4998779296875, 1.72607421875, 1.9522705078125, 2.178466796875, 2.4046630859375, 2.630859375, 2.8570556640625, 3.083251953125, 3.3094482421875, 3.53564453125, 3.7618408203125, 3.988037109375, 4.2142333984375, 4.4404296875, 4.6666259765625, 4.892822265625, 5.1190185546875, 5.34521484375, 5.5714111328125, 5.797607421875, 6.0238037109375, 6.25]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 2.0, 4.0, 5.0, 4.0, 9.0, 8.0, 10.0, 12.0, 20.0, 17.0, 18.0, 20.0, 28.0, 35.0, 45.0, 50.0, 37.0, 49.0, 40.0, 51.0, 52.0, 53.0, 64.0, 46.0, 40.0, 44.0, 38.0, 37.0, 25.0, 31.0, 29.0, 13.0, 15.0, 9.0, 15.0, 4.0, 7.0, 5.0, 4.0, 2.0, 4.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.981536865234375, -49.49579620361328, -48.01005554199219, -46.524314880371094, -45.03857421875, -43.55283737182617, -42.06709671020508, -40.581356048583984, -39.09561538696289, -37.6098747253418, -36.1241340637207, -34.63839340209961, -33.15265655517578, -31.666913986206055, -30.181175231933594, -28.6954345703125, -27.209693908691406, -25.723953247070312, -24.23821258544922, -22.752473831176758, -21.266733169555664, -19.78099250793457, -18.29525375366211, -16.809513092041016, -15.323772430419922, -13.838031768798828, -12.35229206085205, -10.866552352905273, -9.38081169128418, -7.895071506500244, -6.409331321716309, -4.923591613769531, -3.4378509521484375, -1.952110767364502, -0.4663705825805664, 1.0193696022033691, 2.5051097869873047, 3.9908499717712402, 5.476590156555176, 6.962329864501953, 8.448070526123047, 9.93381118774414, 11.419550895690918, 12.905290603637695, 14.391031265258789, 15.876771926879883, 17.362510681152344, 18.848251342773438, 20.33399200439453, 21.819732666015625, 23.30547332763672, 24.79121208190918, 26.276952743530273, 27.762693405151367, 29.248432159423828, 30.734172821044922, 32.219913482666016, 33.70565414428711, 35.1913948059082, 36.6771354675293, 38.162872314453125, 39.64861297607422, 41.13435363769531, 42.620094299316406, 44.1058349609375]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 2.0, 3.0, 15.0, 15.0, 10.0, 17.0, 14.0, 19.0, 20.0, 21.0, 11.0, 29.0, 25.0, 35.0, 36.0, 45.0, 39.0, 41.0, 36.0, 40.0, 28.0, 41.0, 46.0, 40.0, 32.0, 33.0, 40.0, 33.0, 32.0, 22.0, 26.0, 22.0, 22.0, 20.0, 19.0, 11.0, 11.0, 7.0, 8.0, 8.0, 6.0, 2.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-38.29981994628906, -37.08195495605469, -35.86408615112305, -34.64622116088867, -33.42835235595703, -32.210487365722656, -30.99262237548828, -29.774755477905273, -28.556888580322266, -27.339021682739258, -26.12115478515625, -24.903289794921875, -23.685422897338867, -22.46755599975586, -21.249691009521484, -20.031824111938477, -18.81395721435547, -17.59609031677246, -16.378223419189453, -15.160358428955078, -13.94249153137207, -12.724624633789062, -11.506758689880371, -10.28889274597168, -9.071025848388672, -7.853159427642822, -6.635293006896973, -5.417426586151123, -4.199560165405273, -2.981693744659424, -1.7638273239135742, -0.5459613800048828, 0.6719093322753906, 1.8897757530212402, 3.10764217376709, 4.3255085945129395, 5.543375015258789, 6.761241436004639, 7.979107856750488, 9.19697380065918, 10.414840698242188, 11.632707595825195, 12.850573539733887, 14.068439483642578, 15.286306381225586, 16.504173278808594, 17.72203826904297, 18.939905166625977, 20.157772064208984, 21.375638961791992, 22.593505859375, 23.811370849609375, 25.029237747192383, 26.24710464477539, 27.464969635009766, 28.682836532592773, 29.90070343017578, 31.11857032775879, 32.3364372253418, 33.55430221557617, 34.77217102050781, 35.99003601074219, 37.20790100097656, 38.42576599121094, 39.64363479614258]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 7.0, 14.0, 14.0, 27.0, 32.0, 53.0, 98.0, 152.0, 244.0, 431.0, 643.0, 972.0, 1822.0, 2874.0, 4797.0, 7849.0, 12910.0, 21224.0, 35494.0, 59015.0, 97620.0, 162853.0, 274503.0, 456357.0, 697170.0, 792942.0, 609792.0, 381767.0, 229022.0, 136434.0, 81559.0, 49406.0, 29688.0, 18009.0, 11093.0, 6715.0, 4018.0, 2559.0, 1595.0, 933.0, 577.0, 393.0, 223.0, 150.0, 98.0, 65.0, 23.0, 21.0, 12.0, 9.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.21875, -46.57373046875, -44.9287109375, -43.28369140625, -41.638671875, -39.99365234375, -38.3486328125, -36.70361328125, -35.05859375, -33.41357421875, -31.7685546875, -30.12353515625, -28.478515625, -26.83349609375, -25.1884765625, -23.54345703125, -21.8984375, -20.25341796875, -18.6083984375, -16.96337890625, -15.318359375, -13.67333984375, -12.0283203125, -10.38330078125, -8.73828125, -7.09326171875, -5.4482421875, -3.80322265625, -2.158203125, -0.51318359375, 1.1318359375, 2.77685546875, 4.421875, 6.06689453125, 7.7119140625, 9.35693359375, 11.001953125, 12.64697265625, 14.2919921875, 15.93701171875, 17.58203125, 19.22705078125, 20.8720703125, 22.51708984375, 24.162109375, 25.80712890625, 27.4521484375, 29.09716796875, 30.7421875, 32.38720703125, 34.0322265625, 35.67724609375, 37.322265625, 38.96728515625, 40.6123046875, 42.25732421875, 43.90234375, 45.54736328125, 47.1923828125, 48.83740234375, 50.482421875, 52.12744140625, 53.7724609375, 55.41748046875, 57.0625]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 2.0, 5.0, 10.0, 10.0, 14.0, 13.0, 9.0, 18.0, 16.0, 18.0, 24.0, 24.0, 22.0, 21.0, 26.0, 35.0, 48.0, 40.0, 29.0, 31.0, 44.0, 33.0, 27.0, 48.0, 48.0, 32.0, 33.0, 41.0, 29.0, 36.0, 26.0, 22.0, 18.0, 19.0, 23.0, 17.0, 15.0, 16.0, 10.0, 12.0, 6.0, 5.0, 6.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-26.421875, -25.588134765625, -24.75439453125, -23.920654296875, -23.0869140625, -22.253173828125, -21.41943359375, -20.585693359375, -19.751953125, -18.918212890625, -18.08447265625, -17.250732421875, -16.4169921875, -15.583251953125, -14.74951171875, -13.915771484375, -13.08203125, -12.248291015625, -11.41455078125, -10.580810546875, -9.7470703125, -8.913330078125, -8.07958984375, -7.245849609375, -6.412109375, -5.578369140625, -4.74462890625, -3.910888671875, -3.0771484375, -2.243408203125, -1.40966796875, -0.575927734375, 0.2578125, 1.091552734375, 1.92529296875, 2.759033203125, 3.5927734375, 4.426513671875, 5.26025390625, 6.093994140625, 6.927734375, 7.761474609375, 8.59521484375, 9.428955078125, 10.2626953125, 11.096435546875, 11.93017578125, 12.763916015625, 13.59765625, 14.431396484375, 15.26513671875, 16.098876953125, 16.9326171875, 17.766357421875, 18.60009765625, 19.433837890625, 20.267578125, 21.101318359375, 21.93505859375, 22.768798828125, 23.6025390625, 24.436279296875, 25.27001953125, 26.103759765625, 26.9375]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 5.0, 11.0, 15.0, 18.0, 36.0, 53.0, 83.0, 110.0, 187.0, 294.0, 440.0, 638.0, 1099.0, 1673.0, 2685.0, 4127.0, 6414.0, 10538.0, 16654.0, 27840.0, 44657.0, 72249.0, 115211.0, 182281.0, 279534.0, 412011.0, 554941.0, 634405.0, 574812.0, 433036.0, 296568.0, 194404.0, 124004.0, 77427.0, 47157.0, 29709.0, 18295.0, 11438.0, 6991.0, 4440.0, 2814.0, 1806.0, 1102.0, 696.0, 486.0, 285.0, 202.0, 127.0, 99.0, 57.0, 34.0, 40.0, 20.0, 13.0, 6.0, 4.0, 5.0, 3.0, 3.0, 0.0, 2.0], "bins": [-33.15625, -32.07177734375, -30.9873046875, -29.90283203125, -28.818359375, -27.73388671875, -26.6494140625, -25.56494140625, -24.48046875, -23.39599609375, -22.3115234375, -21.22705078125, -20.142578125, -19.05810546875, -17.9736328125, -16.88916015625, -15.8046875, -14.72021484375, -13.6357421875, -12.55126953125, -11.466796875, -10.38232421875, -9.2978515625, -8.21337890625, -7.12890625, -6.04443359375, -4.9599609375, -3.87548828125, -2.791015625, -1.70654296875, -0.6220703125, 0.46240234375, 1.546875, 2.63134765625, 3.7158203125, 4.80029296875, 5.884765625, 6.96923828125, 8.0537109375, 9.13818359375, 10.22265625, 11.30712890625, 12.3916015625, 13.47607421875, 14.560546875, 15.64501953125, 16.7294921875, 17.81396484375, 18.8984375, 19.98291015625, 21.0673828125, 22.15185546875, 23.236328125, 24.32080078125, 25.4052734375, 26.48974609375, 27.57421875, 28.65869140625, 29.7431640625, 30.82763671875, 31.912109375, 32.99658203125, 34.0810546875, 35.16552734375, 36.25]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 5.0, 10.0, 5.0, 5.0, 5.0, 11.0, 14.0, 13.0, 14.0, 30.0, 21.0, 31.0, 42.0, 67.0, 75.0, 80.0, 80.0, 86.0, 125.0, 124.0, 167.0, 188.0, 176.0, 212.0, 193.0, 213.0, 223.0, 215.0, 172.0, 188.0, 172.0, 171.0, 151.0, 122.0, 110.0, 110.0, 85.0, 72.0, 55.0, 41.0, 34.0, 42.0, 24.0, 23.0, 15.0, 14.0, 14.0, 8.0, 9.0, 3.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0], "bins": [-13.8828125, -13.4676513671875, -13.052490234375, -12.6373291015625, -12.22216796875, -11.8070068359375, -11.391845703125, -10.9766845703125, -10.5615234375, -10.1463623046875, -9.731201171875, -9.3160400390625, -8.90087890625, -8.4857177734375, -8.070556640625, -7.6553955078125, -7.240234375, -6.8250732421875, -6.409912109375, -5.9947509765625, -5.57958984375, -5.1644287109375, -4.749267578125, -4.3341064453125, -3.9189453125, -3.5037841796875, -3.088623046875, -2.6734619140625, -2.25830078125, -1.8431396484375, -1.427978515625, -1.0128173828125, -0.59765625, -0.1824951171875, 0.232666015625, 0.6478271484375, 1.06298828125, 1.4781494140625, 1.893310546875, 2.3084716796875, 2.7236328125, 3.1387939453125, 3.553955078125, 3.9691162109375, 4.38427734375, 4.7994384765625, 5.214599609375, 5.6297607421875, 6.044921875, 6.4600830078125, 6.875244140625, 7.2904052734375, 7.70556640625, 8.1207275390625, 8.535888671875, 8.9510498046875, 9.3662109375, 9.7813720703125, 10.196533203125, 10.6116943359375, 11.02685546875, 11.4420166015625, 11.857177734375, 12.2723388671875, 12.6875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 10.0, 8.0, 10.0, 17.0, 22.0, 12.0, 20.0, 22.0, 23.0, 27.0, 37.0, 24.0, 49.0, 36.0, 46.0, 49.0, 45.0, 42.0, 52.0, 39.0, 45.0, 56.0, 32.0, 40.0, 41.0, 30.0, 19.0, 23.0, 22.0, 18.0, 25.0, 12.0, 4.0, 16.0, 6.0, 6.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.14870071411133, -34.011474609375, -32.87424850463867, -31.737022399902344, -30.599796295166016, -29.462570190429688, -28.32534408569336, -27.18811798095703, -26.050891876220703, -24.913665771484375, -23.776439666748047, -22.63921356201172, -21.50198745727539, -20.364761352539062, -19.227535247802734, -18.090309143066406, -16.953083038330078, -15.81585693359375, -14.678630828857422, -13.541404724121094, -12.404178619384766, -11.266952514648438, -10.12972640991211, -8.992500305175781, -7.855274200439453, -6.718048095703125, -5.580821990966797, -4.443595886230469, -3.3063697814941406, -2.1691436767578125, -1.0319175720214844, 0.10530853271484375, 1.2425384521484375, 2.3797645568847656, 3.5169906616210938, 4.654216766357422, 5.79144287109375, 6.928668975830078, 8.065895080566406, 9.203121185302734, 10.340347290039062, 11.47757339477539, 12.614799499511719, 13.752025604248047, 14.889251708984375, 16.026477813720703, 17.16370391845703, 18.30093002319336, 19.438156127929688, 20.575382232666016, 21.712608337402344, 22.849834442138672, 23.987060546875, 25.124286651611328, 26.261512756347656, 27.398738861083984, 28.535964965820312, 29.67319107055664, 30.81041717529297, 31.947643280029297, 33.084869384765625, 34.22209548950195, 35.35932159423828, 36.49654769897461, 37.63377380371094]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 5.0, 2.0, 7.0, 3.0, 10.0, 11.0, 12.0, 10.0, 6.0, 20.0, 25.0, 19.0, 25.0, 34.0, 21.0, 41.0, 32.0, 36.0, 38.0, 41.0, 41.0, 36.0, 34.0, 41.0, 28.0, 47.0, 43.0, 42.0, 39.0, 31.0, 23.0, 19.0, 25.0, 23.0, 21.0, 11.0, 15.0, 20.0, 21.0, 7.0, 3.0, 5.0, 9.0, 5.0, 6.0, 2.0, 3.0, 4.0, 0.0, 0.0, 3.0], "bins": [-34.7421989440918, -33.759281158447266, -32.776363372802734, -31.793445587158203, -30.810527801513672, -29.82761001586914, -28.84469223022461, -27.861774444580078, -26.878856658935547, -25.895938873291016, -24.913021087646484, -23.930103302001953, -22.947185516357422, -21.96426773071289, -20.98134994506836, -19.998432159423828, -19.01551628112793, -18.0325984954834, -17.049680709838867, -16.066762924194336, -15.083845138549805, -14.100927352905273, -13.118010520935059, -12.135092735290527, -11.152174949645996, -10.169257164001465, -9.186339378356934, -8.203422546386719, -7.220504283905029, -6.237586498260498, -5.254669189453125, -4.271751403808594, -3.2888355255126953, -2.305917739868164, -1.323000192642212, -0.34008264541625977, 0.6428351402282715, 1.6257529258728027, 2.608670234680176, 3.591588020324707, 4.574505805969238, 5.5574235916137695, 6.540341377258301, 7.523258686065674, 8.506175994873047, 9.489093780517578, 10.47201156616211, 11.45492935180664, 12.437847137451172, 13.420764923095703, 14.403682708740234, 15.386600494384766, 16.369518280029297, 17.352436065673828, 18.33535385131836, 19.31827163696289, 20.301189422607422, 21.284107208251953, 22.267024993896484, 23.249942779541016, 24.232860565185547, 25.215778350830078, 26.19869613647461, 27.18161392211914, 28.16452980041504]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 6.0, 10.0, 14.0, 21.0, 23.0, 32.0, 59.0, 81.0, 143.0, 234.0, 367.0, 557.0, 950.0, 1498.0, 2338.0, 3804.0, 6295.0, 10408.0, 17148.0, 27423.0, 43267.0, 64741.0, 92306.0, 119095.0, 136371.0, 136208.0, 117855.0, 90910.0, 63828.0, 42380.0, 26948.0, 16931.0, 10093.0, 6295.0, 3809.0, 2284.0, 1412.0, 907.0, 561.0, 357.0, 219.0, 139.0, 73.0, 59.0, 38.0, 22.0, 19.0, 8.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-63.4375, -61.3896484375, -59.341796875, -57.2939453125, -55.24609375, -53.1982421875, -51.150390625, -49.1025390625, -47.0546875, -45.0068359375, -42.958984375, -40.9111328125, -38.86328125, -36.8154296875, -34.767578125, -32.7197265625, -30.671875, -28.6240234375, -26.576171875, -24.5283203125, -22.48046875, -20.4326171875, -18.384765625, -16.3369140625, -14.2890625, -12.2412109375, -10.193359375, -8.1455078125, -6.09765625, -4.0498046875, -2.001953125, 0.0458984375, 2.09375, 4.1416015625, 6.189453125, 8.2373046875, 10.28515625, 12.3330078125, 14.380859375, 16.4287109375, 18.4765625, 20.5244140625, 22.572265625, 24.6201171875, 26.66796875, 28.7158203125, 30.763671875, 32.8115234375, 34.859375, 36.9072265625, 38.955078125, 41.0029296875, 43.05078125, 45.0986328125, 47.146484375, 49.1943359375, 51.2421875, 53.2900390625, 55.337890625, 57.3857421875, 59.43359375, 61.4814453125, 63.529296875, 65.5771484375, 67.625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 5.0, 4.0, 4.0, 8.0, 11.0, 13.0, 13.0, 9.0, 13.0, 25.0, 25.0, 17.0, 20.0, 29.0, 24.0, 28.0, 38.0, 38.0, 37.0, 37.0, 38.0, 43.0, 32.0, 32.0, 43.0, 37.0, 40.0, 34.0, 39.0, 35.0, 22.0, 28.0, 18.0, 29.0, 21.0, 17.0, 15.0, 15.0, 8.0, 8.0, 7.0, 10.0, 8.0, 2.0, 4.0, 2.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-21.8125, -21.13916015625, -20.4658203125, -19.79248046875, -19.119140625, -18.44580078125, -17.7724609375, -17.09912109375, -16.42578125, -15.75244140625, -15.0791015625, -14.40576171875, -13.732421875, -13.05908203125, -12.3857421875, -11.71240234375, -11.0390625, -10.36572265625, -9.6923828125, -9.01904296875, -8.345703125, -7.67236328125, -6.9990234375, -6.32568359375, -5.65234375, -4.97900390625, -4.3056640625, -3.63232421875, -2.958984375, -2.28564453125, -1.6123046875, -0.93896484375, -0.265625, 0.40771484375, 1.0810546875, 1.75439453125, 2.427734375, 3.10107421875, 3.7744140625, 4.44775390625, 5.12109375, 5.79443359375, 6.4677734375, 7.14111328125, 7.814453125, 8.48779296875, 9.1611328125, 9.83447265625, 10.5078125, 11.18115234375, 11.8544921875, 12.52783203125, 13.201171875, 13.87451171875, 14.5478515625, 15.22119140625, 15.89453125, 16.56787109375, 17.2412109375, 17.91455078125, 18.587890625, 19.26123046875, 19.9345703125, 20.60791015625, 21.28125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 8.0, 12.0, 16.0, 14.0, 22.0, 35.0, 53.0, 68.0, 102.0, 135.0, 209.0, 335.0, 485.0, 770.0, 1204.0, 1908.0, 3059.0, 5209.0, 8505.0, 14525.0, 24673.0, 43364.0, 73875.0, 123686.0, 185867.0, 201833.0, 144874.0, 88896.0, 51515.0, 29689.0, 17296.0, 10216.0, 6028.0, 3740.0, 2330.0, 1391.0, 924.0, 537.0, 368.0, 232.0, 177.0, 110.0, 85.0, 61.0, 46.0, 22.0, 20.0, 5.0, 7.0, 9.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0], "bins": [-87.8125, -85.1650390625, -82.517578125, -79.8701171875, -77.22265625, -74.5751953125, -71.927734375, -69.2802734375, -66.6328125, -63.9853515625, -61.337890625, -58.6904296875, -56.04296875, -53.3955078125, -50.748046875, -48.1005859375, -45.453125, -42.8056640625, -40.158203125, -37.5107421875, -34.86328125, -32.2158203125, -29.568359375, -26.9208984375, -24.2734375, -21.6259765625, -18.978515625, -16.3310546875, -13.68359375, -11.0361328125, -8.388671875, -5.7412109375, -3.09375, -0.4462890625, 2.201171875, 4.8486328125, 7.49609375, 10.1435546875, 12.791015625, 15.4384765625, 18.0859375, 20.7333984375, 23.380859375, 26.0283203125, 28.67578125, 31.3232421875, 33.970703125, 36.6181640625, 39.265625, 41.9130859375, 44.560546875, 47.2080078125, 49.85546875, 52.5029296875, 55.150390625, 57.7978515625, 60.4453125, 63.0927734375, 65.740234375, 68.3876953125, 71.03515625, 73.6826171875, 76.330078125, 78.9775390625, 81.625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 1.0, 5.0, 3.0, 4.0, 4.0, 5.0, 14.0, 8.0, 17.0, 21.0, 12.0, 27.0, 19.0, 26.0, 33.0, 29.0, 30.0, 32.0, 37.0, 35.0, 39.0, 47.0, 27.0, 45.0, 38.0, 36.0, 43.0, 37.0, 39.0, 26.0, 45.0, 28.0, 19.0, 26.0, 23.0, 25.0, 16.0, 11.0, 14.0, 8.0, 4.0, 8.0, 6.0, 1.0, 9.0, 1.0, 4.0, 1.0, 6.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-17.1875, -16.66455078125, -16.1416015625, -15.61865234375, -15.095703125, -14.57275390625, -14.0498046875, -13.52685546875, -13.00390625, -12.48095703125, -11.9580078125, -11.43505859375, -10.912109375, -10.38916015625, -9.8662109375, -9.34326171875, -8.8203125, -8.29736328125, -7.7744140625, -7.25146484375, -6.728515625, -6.20556640625, -5.6826171875, -5.15966796875, -4.63671875, -4.11376953125, -3.5908203125, -3.06787109375, -2.544921875, -2.02197265625, -1.4990234375, -0.97607421875, -0.453125, 0.06982421875, 0.5927734375, 1.11572265625, 1.638671875, 2.16162109375, 2.6845703125, 3.20751953125, 3.73046875, 4.25341796875, 4.7763671875, 5.29931640625, 5.822265625, 6.34521484375, 6.8681640625, 7.39111328125, 7.9140625, 8.43701171875, 8.9599609375, 9.48291015625, 10.005859375, 10.52880859375, 11.0517578125, 11.57470703125, 12.09765625, 12.62060546875, 13.1435546875, 13.66650390625, 14.189453125, 14.71240234375, 15.2353515625, 15.75830078125, 16.28125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [6.0, 1.0, 1.0, 5.0, 11.0, 10.0, 21.0, 24.0, 25.0, 40.0, 61.0, 112.0, 125.0, 168.0, 261.0, 381.0, 598.0, 927.0, 1362.0, 2084.0, 3203.0, 4990.0, 8069.0, 13036.0, 22977.0, 40316.0, 75764.0, 150583.0, 272433.0, 212684.0, 106720.0, 55556.0, 30286.0, 17504.0, 10365.0, 6394.0, 3956.0, 2584.0, 1603.0, 1085.0, 711.0, 491.0, 328.0, 214.0, 150.0, 106.0, 87.0, 50.0, 28.0, 23.0, 18.0, 10.0, 4.0, 6.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-44.71875, -43.16357421875, -41.6083984375, -40.05322265625, -38.498046875, -36.94287109375, -35.3876953125, -33.83251953125, -32.27734375, -30.72216796875, -29.1669921875, -27.61181640625, -26.056640625, -24.50146484375, -22.9462890625, -21.39111328125, -19.8359375, -18.28076171875, -16.7255859375, -15.17041015625, -13.615234375, -12.06005859375, -10.5048828125, -8.94970703125, -7.39453125, -5.83935546875, -4.2841796875, -2.72900390625, -1.173828125, 0.38134765625, 1.9365234375, 3.49169921875, 5.046875, 6.60205078125, 8.1572265625, 9.71240234375, 11.267578125, 12.82275390625, 14.3779296875, 15.93310546875, 17.48828125, 19.04345703125, 20.5986328125, 22.15380859375, 23.708984375, 25.26416015625, 26.8193359375, 28.37451171875, 29.9296875, 31.48486328125, 33.0400390625, 34.59521484375, 36.150390625, 37.70556640625, 39.2607421875, 40.81591796875, 42.37109375, 43.92626953125, 45.4814453125, 47.03662109375, 48.591796875, 50.14697265625, 51.7021484375, 53.25732421875, 54.8125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 7.0, 7.0, 12.0, 14.0, 17.0, 21.0, 22.0, 25.0, 45.0, 49.0, 65.0, 61.0, 83.0, 84.0, 68.0, 77.0, 74.0, 47.0, 44.0, 29.0, 29.0, 19.0, 22.0, 11.0, 10.0, 9.0, 13.0, 9.0, 6.0, 6.0, 2.0, 3.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00629425048828125, -0.006113946437835693, -0.005933642387390137, -0.00575333833694458, -0.0055730342864990234, -0.005392730236053467, -0.00521242618560791, -0.0050321221351623535, -0.004851818084716797, -0.00467151403427124, -0.004491209983825684, -0.004310905933380127, -0.00413060188293457, -0.003950297832489014, -0.003769993782043457, -0.0035896897315979004, -0.0034093856811523438, -0.003229081630706787, -0.0030487775802612305, -0.002868473529815674, -0.002688169479370117, -0.0025078654289245605, -0.002327561378479004, -0.0021472573280334473, -0.0019669532775878906, -0.001786649227142334, -0.0016063451766967773, -0.0014260411262512207, -0.001245737075805664, -0.0010654330253601074, -0.0008851289749145508, -0.0007048249244689941, -0.0005245208740234375, -0.00034421682357788086, -0.00016391277313232422, 1.6391277313232422e-05, 0.00019669532775878906, 0.0003769993782043457, 0.0005573034286499023, 0.000737607479095459, 0.0009179115295410156, 0.0010982155799865723, 0.001278519630432129, 0.0014588236808776855, 0.0016391277313232422, 0.0018194317817687988, 0.0019997358322143555, 0.002180039882659912, 0.0023603439331054688, 0.0025406479835510254, 0.002720952033996582, 0.0029012560844421387, 0.0030815601348876953, 0.003261864185333252, 0.0034421682357788086, 0.0036224722862243652, 0.003802776336669922, 0.0039830803871154785, 0.004163384437561035, 0.004343688488006592, 0.0045239925384521484, 0.004704296588897705, 0.004884600639343262, 0.005064904689788818, 0.005245208740234375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [6.0, 0.0, 5.0, 3.0, 7.0, 9.0, 12.0, 17.0, 17.0, 30.0, 36.0, 58.0, 94.0, 97.0, 146.0, 242.0, 361.0, 437.0, 687.0, 933.0, 1386.0, 1950.0, 2952.0, 4184.0, 6316.0, 9500.0, 14604.0, 22662.0, 37091.0, 60431.0, 97744.0, 152891.0, 193256.0, 160675.0, 105038.0, 64728.0, 39074.0, 24263.0, 15574.0, 10086.0, 6727.0, 4479.0, 3023.0, 2085.0, 1434.0, 965.0, 613.0, 479.0, 362.0, 236.0, 160.0, 107.0, 80.0, 60.0, 53.0, 31.0, 23.0, 21.0, 11.0, 8.0, 7.0, 4.0, 4.0, 2.0], "bins": [-29.171875, -28.276123046875, -27.38037109375, -26.484619140625, -25.5888671875, -24.693115234375, -23.79736328125, -22.901611328125, -22.005859375, -21.110107421875, -20.21435546875, -19.318603515625, -18.4228515625, -17.527099609375, -16.63134765625, -15.735595703125, -14.83984375, -13.944091796875, -13.04833984375, -12.152587890625, -11.2568359375, -10.361083984375, -9.46533203125, -8.569580078125, -7.673828125, -6.778076171875, -5.88232421875, -4.986572265625, -4.0908203125, -3.195068359375, -2.29931640625, -1.403564453125, -0.5078125, 0.387939453125, 1.28369140625, 2.179443359375, 3.0751953125, 3.970947265625, 4.86669921875, 5.762451171875, 6.658203125, 7.553955078125, 8.44970703125, 9.345458984375, 10.2412109375, 11.136962890625, 12.03271484375, 12.928466796875, 13.82421875, 14.719970703125, 15.61572265625, 16.511474609375, 17.4072265625, 18.302978515625, 19.19873046875, 20.094482421875, 20.990234375, 21.885986328125, 22.78173828125, 23.677490234375, 24.5732421875, 25.468994140625, 26.36474609375, 27.260498046875, 28.15625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 0.0, 3.0, 3.0, 5.0, 6.0, 5.0, 7.0, 6.0, 14.0, 10.0, 11.0, 16.0, 24.0, 18.0, 26.0, 26.0, 30.0, 33.0, 33.0, 49.0, 38.0, 49.0, 60.0, 49.0, 54.0, 57.0, 47.0, 33.0, 36.0, 33.0, 21.0, 34.0, 25.0, 20.0, 20.0, 12.0, 17.0, 10.0, 9.0, 12.0, 9.0, 9.0, 6.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.609375, -8.3157958984375, -8.022216796875, -7.7286376953125, -7.43505859375, -7.1414794921875, -6.847900390625, -6.5543212890625, -6.2607421875, -5.9671630859375, -5.673583984375, -5.3800048828125, -5.08642578125, -4.7928466796875, -4.499267578125, -4.2056884765625, -3.912109375, -3.6185302734375, -3.324951171875, -3.0313720703125, -2.73779296875, -2.4442138671875, -2.150634765625, -1.8570556640625, -1.5634765625, -1.2698974609375, -0.976318359375, -0.6827392578125, -0.38916015625, -0.0955810546875, 0.197998046875, 0.4915771484375, 0.78515625, 1.0787353515625, 1.372314453125, 1.6658935546875, 1.95947265625, 2.2530517578125, 2.546630859375, 2.8402099609375, 3.1337890625, 3.4273681640625, 3.720947265625, 4.0145263671875, 4.30810546875, 4.6016845703125, 4.895263671875, 5.1888427734375, 5.482421875, 5.7760009765625, 6.069580078125, 6.3631591796875, 6.65673828125, 6.9503173828125, 7.243896484375, 7.5374755859375, 7.8310546875, 8.1246337890625, 8.418212890625, 8.7117919921875, 9.00537109375, 9.2989501953125, 9.592529296875, 9.8861083984375, 10.1796875]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 6.0, 2.0, 3.0, 5.0, 4.0, 9.0, 11.0, 14.0, 14.0, 18.0, 18.0, 18.0, 29.0, 30.0, 29.0, 38.0, 39.0, 65.0, 43.0, 40.0, 40.0, 55.0, 52.0, 43.0, 46.0, 38.0, 41.0, 48.0, 27.0, 27.0, 36.0, 18.0, 12.0, 12.0, 15.0, 18.0, 11.0, 7.0, 0.0, 2.0, 4.0, 2.0, 1.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.590118408203125, -25.74036407470703, -24.890609741210938, -24.040857315063477, -23.191102981567383, -22.34134864807129, -21.491596221923828, -20.641841888427734, -19.79208755493164, -18.942333221435547, -18.092578887939453, -17.242826461791992, -16.3930721282959, -15.543317794799805, -14.693564414978027, -13.84381103515625, -12.994056701660156, -12.144302368164062, -11.294548988342285, -10.444795608520508, -9.595041275024414, -8.74528694152832, -7.895533561706543, -7.045779705047607, -6.196025848388672, -5.346271991729736, -4.496518135070801, -3.6467642784118652, -2.7970104217529297, -1.9472565650939941, -1.0975027084350586, -0.24774885177612305, 0.6020069122314453, 1.4517607688903809, 2.3015146255493164, 3.151268482208252, 4.0010223388671875, 4.850776195526123, 5.700530052185059, 6.550283908843994, 7.40003776550293, 8.249792098999023, 9.0995454788208, 9.949298858642578, 10.799053192138672, 11.648807525634766, 12.498560905456543, 13.34831428527832, 14.198068618774414, 15.047822952270508, 15.897576332092285, 16.747329711914062, 17.597084045410156, 18.44683837890625, 19.296592712402344, 20.146345138549805, 20.9960994720459, 21.845853805541992, 22.695606231689453, 23.545360565185547, 24.39511489868164, 25.244869232177734, 26.094623565673828, 26.94437599182129, 27.794130325317383]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 4.0, 11.0, 5.0, 9.0, 7.0, 12.0, 27.0, 17.0, 15.0, 19.0, 25.0, 23.0, 39.0, 35.0, 30.0, 40.0, 25.0, 38.0, 46.0, 39.0, 38.0, 41.0, 40.0, 53.0, 41.0, 34.0, 32.0, 21.0, 27.0, 25.0, 24.0, 20.0, 20.0, 16.0, 17.0, 9.0, 14.0, 12.0, 4.0, 13.0, 3.0, 4.0, 4.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.874345779418945, -22.16553497314453, -21.45672607421875, -20.747915267944336, -20.039104461669922, -19.330293655395508, -18.621482849121094, -17.912673950195312, -17.2038631439209, -16.495052337646484, -15.786242485046387, -15.077432632446289, -14.368621826171875, -13.659811019897461, -12.951001167297363, -12.242191314697266, -11.533380508422852, -10.824569702148438, -10.11575984954834, -9.406949996948242, -8.698139190673828, -7.989328861236572, -7.280518531799316, -6.5717082023620605, -5.862897872924805, -5.154087543487549, -4.445277214050293, -3.736466884613037, -3.0276565551757812, -2.3188462257385254, -1.6100358963012695, -0.9012255668640137, -0.19241714477539062, 0.5163931846618652, 1.225203514099121, 1.934013843536377, 2.642824172973633, 3.3516345024108887, 4.0604448318481445, 4.7692551612854, 5.478065490722656, 6.186875820159912, 6.895686149597168, 7.604496479034424, 8.31330680847168, 9.022117614746094, 9.730927467346191, 10.439737319946289, 11.148548126220703, 11.857358932495117, 12.566168785095215, 13.274978637695312, 13.983789443969727, 14.69260025024414, 15.401410102844238, 16.110219955444336, 16.81903076171875, 17.527841567993164, 18.236652374267578, 18.94546127319336, 19.654272079467773, 20.363082885742188, 21.07189178466797, 21.780702590942383, 22.489513397216797]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 11.0, 20.0, 40.0, 59.0, 81.0, 127.0, 204.0, 334.0, 521.0, 774.0, 1313.0, 2046.0, 3265.0, 5196.0, 7942.0, 12459.0, 19258.0, 29706.0, 44334.0, 63675.0, 86913.0, 111440.0, 127943.0, 129319.0, 112850.0, 89917.0, 66041.0, 46022.0, 30572.0, 20257.0, 13050.0, 8375.0, 5225.0, 3394.0, 2198.0, 1306.0, 852.0, 562.0, 369.0, 223.0, 138.0, 94.0, 47.0, 33.0, 13.0, 15.0, 6.0, 12.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.296875, -20.588134765625, -19.87939453125, -19.170654296875, -18.4619140625, -17.753173828125, -17.04443359375, -16.335693359375, -15.626953125, -14.918212890625, -14.20947265625, -13.500732421875, -12.7919921875, -12.083251953125, -11.37451171875, -10.665771484375, -9.95703125, -9.248291015625, -8.53955078125, -7.830810546875, -7.1220703125, -6.413330078125, -5.70458984375, -4.995849609375, -4.287109375, -3.578369140625, -2.86962890625, -2.160888671875, -1.4521484375, -0.743408203125, -0.03466796875, 0.674072265625, 1.3828125, 2.091552734375, 2.80029296875, 3.509033203125, 4.2177734375, 4.926513671875, 5.63525390625, 6.343994140625, 7.052734375, 7.761474609375, 8.47021484375, 9.178955078125, 9.8876953125, 10.596435546875, 11.30517578125, 12.013916015625, 12.72265625, 13.431396484375, 14.14013671875, 14.848876953125, 15.5576171875, 16.266357421875, 16.97509765625, 17.683837890625, 18.392578125, 19.101318359375, 19.81005859375, 20.518798828125, 21.2275390625, 21.936279296875, 22.64501953125, 23.353759765625, 24.0625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 6.0, 11.0, 7.0, 5.0, 10.0, 8.0, 9.0, 15.0, 18.0, 18.0, 21.0, 23.0, 26.0, 28.0, 26.0, 42.0, 35.0, 43.0, 32.0, 42.0, 39.0, 53.0, 34.0, 41.0, 35.0, 36.0, 37.0, 29.0, 34.0, 38.0, 26.0, 17.0, 23.0, 23.0, 8.0, 14.0, 15.0, 11.0, 11.0, 7.0, 10.0, 7.0, 2.0, 5.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-21.4375, -20.774658203125, -20.11181640625, -19.448974609375, -18.7861328125, -18.123291015625, -17.46044921875, -16.797607421875, -16.134765625, -15.471923828125, -14.80908203125, -14.146240234375, -13.4833984375, -12.820556640625, -12.15771484375, -11.494873046875, -10.83203125, -10.169189453125, -9.50634765625, -8.843505859375, -8.1806640625, -7.517822265625, -6.85498046875, -6.192138671875, -5.529296875, -4.866455078125, -4.20361328125, -3.540771484375, -2.8779296875, -2.215087890625, -1.55224609375, -0.889404296875, -0.2265625, 0.436279296875, 1.09912109375, 1.761962890625, 2.4248046875, 3.087646484375, 3.75048828125, 4.413330078125, 5.076171875, 5.739013671875, 6.40185546875, 7.064697265625, 7.7275390625, 8.390380859375, 9.05322265625, 9.716064453125, 10.37890625, 11.041748046875, 11.70458984375, 12.367431640625, 13.0302734375, 13.693115234375, 14.35595703125, 15.018798828125, 15.681640625, 16.344482421875, 17.00732421875, 17.670166015625, 18.3330078125, 18.995849609375, 19.65869140625, 20.321533203125, 20.984375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 9.0, 9.0, 21.0, 43.0, 48.0, 83.0, 126.0, 154.0, 295.0, 424.0, 777.0, 1230.0, 2023.0, 3193.0, 5300.0, 8592.0, 14011.0, 22927.0, 37107.0, 58574.0, 87670.0, 122809.0, 151272.0, 151534.0, 126653.0, 91761.0, 60990.0, 38877.0, 23782.0, 14914.0, 9060.0, 5516.0, 3265.0, 2073.0, 1296.0, 803.0, 472.0, 339.0, 195.0, 130.0, 76.0, 47.0, 23.0, 24.0, 8.0, 14.0, 6.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.3125, -26.432861328125, -25.55322265625, -24.673583984375, -23.7939453125, -22.914306640625, -22.03466796875, -21.155029296875, -20.275390625, -19.395751953125, -18.51611328125, -17.636474609375, -16.7568359375, -15.877197265625, -14.99755859375, -14.117919921875, -13.23828125, -12.358642578125, -11.47900390625, -10.599365234375, -9.7197265625, -8.840087890625, -7.96044921875, -7.080810546875, -6.201171875, -5.321533203125, -4.44189453125, -3.562255859375, -2.6826171875, -1.802978515625, -0.92333984375, -0.043701171875, 0.8359375, 1.715576171875, 2.59521484375, 3.474853515625, 4.3544921875, 5.234130859375, 6.11376953125, 6.993408203125, 7.873046875, 8.752685546875, 9.63232421875, 10.511962890625, 11.3916015625, 12.271240234375, 13.15087890625, 14.030517578125, 14.91015625, 15.789794921875, 16.66943359375, 17.549072265625, 18.4287109375, 19.308349609375, 20.18798828125, 21.067626953125, 21.947265625, 22.826904296875, 23.70654296875, 24.586181640625, 25.4658203125, 26.345458984375, 27.22509765625, 28.104736328125, 28.984375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 7.0, 3.0, 1.0, 6.0, 9.0, 5.0, 7.0, 8.0, 17.0, 20.0, 24.0, 28.0, 20.0, 27.0, 34.0, 11.0, 27.0, 38.0, 31.0, 36.0, 35.0, 35.0, 52.0, 40.0, 41.0, 37.0, 34.0, 33.0, 33.0, 32.0, 40.0, 32.0, 21.0, 22.0, 19.0, 22.0, 23.0, 11.0, 16.0, 11.0, 15.0, 10.0, 5.0, 8.0, 8.0, 5.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 5.0, 1.0], "bins": [-16.171875, -15.698486328125, -15.22509765625, -14.751708984375, -14.2783203125, -13.804931640625, -13.33154296875, -12.858154296875, -12.384765625, -11.911376953125, -11.43798828125, -10.964599609375, -10.4912109375, -10.017822265625, -9.54443359375, -9.071044921875, -8.59765625, -8.124267578125, -7.65087890625, -7.177490234375, -6.7041015625, -6.230712890625, -5.75732421875, -5.283935546875, -4.810546875, -4.337158203125, -3.86376953125, -3.390380859375, -2.9169921875, -2.443603515625, -1.97021484375, -1.496826171875, -1.0234375, -0.550048828125, -0.07666015625, 0.396728515625, 0.8701171875, 1.343505859375, 1.81689453125, 2.290283203125, 2.763671875, 3.237060546875, 3.71044921875, 4.183837890625, 4.6572265625, 5.130615234375, 5.60400390625, 6.077392578125, 6.55078125, 7.024169921875, 7.49755859375, 7.970947265625, 8.4443359375, 8.917724609375, 9.39111328125, 9.864501953125, 10.337890625, 10.811279296875, 11.28466796875, 11.758056640625, 12.2314453125, 12.704833984375, 13.17822265625, 13.651611328125, 14.125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 5.0, 9.0, 12.0, 24.0, 35.0, 52.0, 67.0, 88.0, 122.0, 216.0, 296.0, 468.0, 736.0, 1181.0, 2031.0, 3690.0, 7434.0, 15823.0, 37305.0, 93890.0, 226332.0, 328168.0, 193503.0, 77735.0, 31130.0, 13556.0, 6455.0, 3311.0, 1820.0, 1038.0, 640.0, 439.0, 304.0, 197.0, 140.0, 98.0, 68.0, 53.0, 26.0, 23.0, 10.0, 8.0, 9.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.65625, -32.47119140625, -31.2861328125, -30.10107421875, -28.916015625, -27.73095703125, -26.5458984375, -25.36083984375, -24.17578125, -22.99072265625, -21.8056640625, -20.62060546875, -19.435546875, -18.25048828125, -17.0654296875, -15.88037109375, -14.6953125, -13.51025390625, -12.3251953125, -11.14013671875, -9.955078125, -8.77001953125, -7.5849609375, -6.39990234375, -5.21484375, -4.02978515625, -2.8447265625, -1.65966796875, -0.474609375, 0.71044921875, 1.8955078125, 3.08056640625, 4.265625, 5.45068359375, 6.6357421875, 7.82080078125, 9.005859375, 10.19091796875, 11.3759765625, 12.56103515625, 13.74609375, 14.93115234375, 16.1162109375, 17.30126953125, 18.486328125, 19.67138671875, 20.8564453125, 22.04150390625, 23.2265625, 24.41162109375, 25.5966796875, 26.78173828125, 27.966796875, 29.15185546875, 30.3369140625, 31.52197265625, 32.70703125, 33.89208984375, 35.0771484375, 36.26220703125, 37.447265625, 38.63232421875, 39.8173828125, 41.00244140625, 42.1875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 4.0, 3.0, 4.0, 7.0, 9.0, 13.0, 6.0, 17.0, 23.0, 34.0, 41.0, 66.0, 66.0, 66.0, 65.0, 88.0, 85.0, 72.0, 80.0, 54.0, 51.0, 36.0, 24.0, 22.0, 13.0, 17.0, 14.0, 12.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00267791748046875, -0.0025843679904937744, -0.002490818500518799, -0.0023972690105438232, -0.0023037195205688477, -0.002210170030593872, -0.0021166205406188965, -0.002023071050643921, -0.0019295215606689453, -0.0018359720706939697, -0.0017424225807189941, -0.0016488730907440186, -0.001555323600769043, -0.0014617741107940674, -0.0013682246208190918, -0.0012746751308441162, -0.0011811256408691406, -0.001087576150894165, -0.0009940266609191895, -0.0009004771709442139, -0.0008069276809692383, -0.0007133781909942627, -0.0006198287010192871, -0.0005262792110443115, -0.00043272972106933594, -0.00033918023109436035, -0.00024563074111938477, -0.00015208125114440918, -5.8531761169433594e-05, 3.501772880554199e-05, 0.00012856721878051758, 0.00022211670875549316, 0.00031566619873046875, 0.00040921568870544434, 0.0005027651786804199, 0.0005963146686553955, 0.0006898641586303711, 0.0007834136486053467, 0.0008769631385803223, 0.0009705126285552979, 0.0010640621185302734, 0.001157611608505249, 0.0012511610984802246, 0.0013447105884552002, 0.0014382600784301758, 0.0015318095684051514, 0.001625359058380127, 0.0017189085483551025, 0.0018124580383300781, 0.0019060075283050537, 0.0019995570182800293, 0.002093106508255005, 0.0021866559982299805, 0.002280205488204956, 0.0023737549781799316, 0.0024673044681549072, 0.002560853958129883, 0.0026544034481048584, 0.002747952938079834, 0.0028415024280548096, 0.002935051918029785, 0.0030286014080047607, 0.0031221508979797363, 0.003215700387954712, 0.0033092498779296875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 10.0, 15.0, 13.0, 32.0, 32.0, 42.0, 72.0, 108.0, 123.0, 165.0, 265.0, 378.0, 569.0, 855.0, 1403.0, 2232.0, 3779.0, 6572.0, 12301.0, 23380.0, 46768.0, 92495.0, 167042.0, 230618.0, 201879.0, 124093.0, 64306.0, 31377.0, 16330.0, 8788.0, 4843.0, 2773.0, 1625.0, 1033.0, 682.0, 460.0, 335.0, 226.0, 127.0, 113.0, 89.0, 54.0, 49.0, 42.0, 20.0, 13.0, 4.0, 5.0, 7.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0], "bins": [-23.96875, -23.236328125, -22.50390625, -21.771484375, -21.0390625, -20.306640625, -19.57421875, -18.841796875, -18.109375, -17.376953125, -16.64453125, -15.912109375, -15.1796875, -14.447265625, -13.71484375, -12.982421875, -12.25, -11.517578125, -10.78515625, -10.052734375, -9.3203125, -8.587890625, -7.85546875, -7.123046875, -6.390625, -5.658203125, -4.92578125, -4.193359375, -3.4609375, -2.728515625, -1.99609375, -1.263671875, -0.53125, 0.201171875, 0.93359375, 1.666015625, 2.3984375, 3.130859375, 3.86328125, 4.595703125, 5.328125, 6.060546875, 6.79296875, 7.525390625, 8.2578125, 8.990234375, 9.72265625, 10.455078125, 11.1875, 11.919921875, 12.65234375, 13.384765625, 14.1171875, 14.849609375, 15.58203125, 16.314453125, 17.046875, 17.779296875, 18.51171875, 19.244140625, 19.9765625, 20.708984375, 21.44140625, 22.173828125, 22.90625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 6.0, 3.0, 7.0, 9.0, 22.0, 18.0, 29.0, 27.0, 30.0, 43.0, 54.0, 53.0, 59.0, 58.0, 67.0, 70.0, 66.0, 69.0, 58.0, 48.0, 31.0, 35.0, 29.0, 17.0, 20.0, 10.0, 12.0, 10.0, 7.0, 5.0, 7.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.34375, -8.08990478515625, -7.8360595703125, -7.58221435546875, -7.328369140625, -7.07452392578125, -6.8206787109375, -6.56683349609375, -6.31298828125, -6.05914306640625, -5.8052978515625, -5.55145263671875, -5.297607421875, -5.04376220703125, -4.7899169921875, -4.53607177734375, -4.2822265625, -4.02838134765625, -3.7745361328125, -3.52069091796875, -3.266845703125, -3.01300048828125, -2.7591552734375, -2.50531005859375, -2.25146484375, -1.99761962890625, -1.7437744140625, -1.48992919921875, -1.236083984375, -0.98223876953125, -0.7283935546875, -0.47454833984375, -0.220703125, 0.03314208984375, 0.2869873046875, 0.54083251953125, 0.794677734375, 1.04852294921875, 1.3023681640625, 1.55621337890625, 1.81005859375, 2.06390380859375, 2.3177490234375, 2.57159423828125, 2.825439453125, 3.07928466796875, 3.3331298828125, 3.58697509765625, 3.8408203125, 4.09466552734375, 4.3485107421875, 4.60235595703125, 4.856201171875, 5.11004638671875, 5.3638916015625, 5.61773681640625, 5.87158203125, 6.12542724609375, 6.3792724609375, 6.63311767578125, 6.886962890625, 7.14080810546875, 7.3946533203125, 7.64849853515625, 7.90234375]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 3.0, 4.0, 2.0, 9.0, 16.0, 15.0, 16.0, 17.0, 15.0, 21.0, 19.0, 23.0, 38.0, 34.0, 37.0, 48.0, 59.0, 58.0, 51.0, 55.0, 58.0, 56.0, 53.0, 34.0, 37.0, 33.0, 29.0, 24.0, 21.0, 26.0, 21.0, 12.0, 7.0, 14.0, 6.0, 3.0, 3.0, 6.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.149505615234375, -26.284074783325195, -25.418643951416016, -24.553211212158203, -23.687780380249023, -22.822349548339844, -21.95691680908203, -21.09148597717285, -20.226055145263672, -19.360624313354492, -18.495193481445312, -17.6297607421875, -16.76432991027832, -15.89889907836914, -15.033467292785645, -14.168035507202148, -13.302604675292969, -12.437173843383789, -11.571742057800293, -10.706310272216797, -9.840879440307617, -8.975448608398438, -8.110016822814941, -7.2445855140686035, -6.379154205322266, -5.513722896575928, -4.64829158782959, -3.782860279083252, -2.917428970336914, -2.051997661590576, -1.1865663528442383, -0.3211350440979004, 0.5442943572998047, 1.4097256660461426, 2.2751569747924805, 3.1405882835388184, 4.006019592285156, 4.871450901031494, 5.736882209777832, 6.60231351852417, 7.467744827270508, 8.333175659179688, 9.198607444763184, 10.06403923034668, 10.92947006225586, 11.794900894165039, 12.660332679748535, 13.525764465332031, 14.391195297241211, 15.25662612915039, 16.122058868408203, 16.987489700317383, 17.852920532226562, 18.718351364135742, 19.583782196044922, 20.449214935302734, 21.314645767211914, 22.180076599121094, 23.045509338378906, 23.910940170288086, 24.776371002197266, 25.641801834106445, 26.507232666015625, 27.372665405273438, 28.238096237182617]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 3.0, 4.0, 3.0, 7.0, 7.0, 10.0, 7.0, 10.0, 6.0, 19.0, 19.0, 15.0, 7.0, 21.0, 25.0, 31.0, 31.0, 38.0, 26.0, 40.0, 39.0, 30.0, 50.0, 43.0, 42.0, 42.0, 33.0, 49.0, 38.0, 42.0, 27.0, 34.0, 20.0, 21.0, 32.0, 11.0, 18.0, 13.0, 26.0, 12.0, 10.0, 9.0, 8.0, 6.0, 5.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0], "bins": [-25.594215393066406, -24.87730598449707, -24.160396575927734, -23.443485260009766, -22.72657585144043, -22.009666442871094, -21.292757034301758, -20.575847625732422, -19.858936309814453, -19.142026901245117, -18.42511749267578, -17.708206176757812, -16.991296768188477, -16.27438735961914, -15.557477951049805, -14.840567588806152, -14.123658180236816, -13.40674877166748, -12.689838409423828, -11.972929000854492, -11.25601863861084, -10.539109230041504, -9.822198867797852, -9.105289459228516, -8.38838005065918, -7.6714701652526855, -6.954560279846191, -6.2376508712768555, -5.520740509033203, -4.803831100463867, -4.086921215057373, -3.370011329650879, -2.6531009674072266, -1.9361910820007324, -1.2192813158035278, -0.5023715496063232, 0.2145383358001709, 0.931448221206665, 1.64835786819458, 2.365267753601074, 3.0821776390075684, 3.7990875244140625, 4.515997409820557, 5.232907295227051, 5.949816703796387, 6.666727066040039, 7.383636474609375, 8.100545883178711, 8.817456245422363, 9.5343656539917, 10.251276016235352, 10.968185424804688, 11.68509578704834, 12.402005195617676, 13.118915557861328, 13.835824966430664, 14.552734375, 15.269643783569336, 15.986554145812988, 16.70346450805664, 17.420373916625977, 18.137283325195312, 18.85419273376465, 19.571102142333984, 20.288013458251953]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 10.0, 16.0, 19.0, 29.0, 40.0, 40.0, 73.0, 135.0, 203.0, 392.0, 638.0, 1095.0, 1944.0, 3739.0, 7189.0, 14545.0, 29801.0, 64075.0, 140770.0, 328985.0, 757380.0, 1198534.0, 902649.0, 411310.0, 176298.0, 79609.0, 37178.0, 18053.0, 8925.0, 4641.0, 2539.0, 1422.0, 746.0, 473.0, 294.0, 164.0, 109.0, 68.0, 49.0, 34.0, 22.0, 18.0, 10.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-30.0625, -29.0126953125, -27.962890625, -26.9130859375, -25.86328125, -24.8134765625, -23.763671875, -22.7138671875, -21.6640625, -20.6142578125, -19.564453125, -18.5146484375, -17.46484375, -16.4150390625, -15.365234375, -14.3154296875, -13.265625, -12.2158203125, -11.166015625, -10.1162109375, -9.06640625, -8.0166015625, -6.966796875, -5.9169921875, -4.8671875, -3.8173828125, -2.767578125, -1.7177734375, -0.66796875, 0.3818359375, 1.431640625, 2.4814453125, 3.53125, 4.5810546875, 5.630859375, 6.6806640625, 7.73046875, 8.7802734375, 9.830078125, 10.8798828125, 11.9296875, 12.9794921875, 14.029296875, 15.0791015625, 16.12890625, 17.1787109375, 18.228515625, 19.2783203125, 20.328125, 21.3779296875, 22.427734375, 23.4775390625, 24.52734375, 25.5771484375, 26.626953125, 27.6767578125, 28.7265625, 29.7763671875, 30.826171875, 31.8759765625, 32.92578125, 33.9755859375, 35.025390625, 36.0751953125, 37.125]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 6.0, 7.0, 6.0, 3.0, 15.0, 12.0, 14.0, 18.0, 16.0, 16.0, 20.0, 30.0, 34.0, 26.0, 31.0, 37.0, 37.0, 40.0, 39.0, 48.0, 37.0, 48.0, 34.0, 42.0, 28.0, 32.0, 46.0, 45.0, 32.0, 40.0, 24.0, 16.0, 21.0, 19.0, 14.0, 16.0, 7.0, 11.0, 10.0, 7.0, 8.0, 6.0, 0.0, 1.0, 2.0, 0.0, 6.0, 1.0, 4.0], "bins": [-20.140625, -19.5838623046875, -19.027099609375, -18.4703369140625, -17.91357421875, -17.3568115234375, -16.800048828125, -16.2432861328125, -15.6865234375, -15.1297607421875, -14.572998046875, -14.0162353515625, -13.45947265625, -12.9027099609375, -12.345947265625, -11.7891845703125, -11.232421875, -10.6756591796875, -10.118896484375, -9.5621337890625, -9.00537109375, -8.4486083984375, -7.891845703125, -7.3350830078125, -6.7783203125, -6.2215576171875, -5.664794921875, -5.1080322265625, -4.55126953125, -3.9945068359375, -3.437744140625, -2.8809814453125, -2.32421875, -1.7674560546875, -1.210693359375, -0.6539306640625, -0.09716796875, 0.4595947265625, 1.016357421875, 1.5731201171875, 2.1298828125, 2.6866455078125, 3.243408203125, 3.8001708984375, 4.35693359375, 4.9136962890625, 5.470458984375, 6.0272216796875, 6.583984375, 7.1407470703125, 7.697509765625, 8.2542724609375, 8.81103515625, 9.3677978515625, 9.924560546875, 10.4813232421875, 11.0380859375, 11.5948486328125, 12.151611328125, 12.7083740234375, 13.26513671875, 13.8218994140625, 14.378662109375, 14.9354248046875, 15.4921875]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 8.0, 8.0, 8.0, 13.0, 22.0, 37.0, 47.0, 94.0, 125.0, 200.0, 389.0, 600.0, 1098.0, 2135.0, 3979.0, 7384.0, 14308.0, 28427.0, 56037.0, 110949.0, 219489.0, 422902.0, 746622.0, 972283.0, 742610.0, 420364.0, 218103.0, 110824.0, 56435.0, 28199.0, 14584.0, 7456.0, 3878.0, 2027.0, 1090.0, 603.0, 341.0, 193.0, 151.0, 82.0, 49.0, 45.0, 25.0, 14.0, 9.0, 13.0, 4.0, 4.0, 3.0, 4.0, 1.0, 6.0, 0.0, 1.0], "bins": [-29.546875, -28.664794921875, -27.78271484375, -26.900634765625, -26.0185546875, -25.136474609375, -24.25439453125, -23.372314453125, -22.490234375, -21.608154296875, -20.72607421875, -19.843994140625, -18.9619140625, -18.079833984375, -17.19775390625, -16.315673828125, -15.43359375, -14.551513671875, -13.66943359375, -12.787353515625, -11.9052734375, -11.023193359375, -10.14111328125, -9.259033203125, -8.376953125, -7.494873046875, -6.61279296875, -5.730712890625, -4.8486328125, -3.966552734375, -3.08447265625, -2.202392578125, -1.3203125, -0.438232421875, 0.44384765625, 1.325927734375, 2.2080078125, 3.090087890625, 3.97216796875, 4.854248046875, 5.736328125, 6.618408203125, 7.50048828125, 8.382568359375, 9.2646484375, 10.146728515625, 11.02880859375, 11.910888671875, 12.79296875, 13.675048828125, 14.55712890625, 15.439208984375, 16.3212890625, 17.203369140625, 18.08544921875, 18.967529296875, 19.849609375, 20.731689453125, 21.61376953125, 22.495849609375, 23.3779296875, 24.260009765625, 25.14208984375, 26.024169921875, 26.90625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 9.0, 11.0, 14.0, 24.0, 24.0, 29.0, 34.0, 50.0, 50.0, 62.0, 83.0, 108.0, 119.0, 169.0, 169.0, 184.0, 211.0, 261.0, 263.0, 260.0, 264.0, 261.0, 225.0, 226.0, 178.0, 152.0, 128.0, 108.0, 92.0, 66.0, 59.0, 47.0, 35.0, 33.0, 16.0, 19.0, 15.0, 6.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0], "bins": [-11.265625, -10.98223876953125, -10.6988525390625, -10.41546630859375, -10.132080078125, -9.84869384765625, -9.5653076171875, -9.28192138671875, -8.99853515625, -8.71514892578125, -8.4317626953125, -8.14837646484375, -7.864990234375, -7.58160400390625, -7.2982177734375, -7.01483154296875, -6.7314453125, -6.44805908203125, -6.1646728515625, -5.88128662109375, -5.597900390625, -5.31451416015625, -5.0311279296875, -4.74774169921875, -4.46435546875, -4.18096923828125, -3.8975830078125, -3.61419677734375, -3.330810546875, -3.04742431640625, -2.7640380859375, -2.48065185546875, -2.197265625, -1.91387939453125, -1.6304931640625, -1.34710693359375, -1.063720703125, -0.78033447265625, -0.4969482421875, -0.21356201171875, 0.06982421875, 0.35321044921875, 0.6365966796875, 0.91998291015625, 1.203369140625, 1.48675537109375, 1.7701416015625, 2.05352783203125, 2.3369140625, 2.62030029296875, 2.9036865234375, 3.18707275390625, 3.470458984375, 3.75384521484375, 4.0372314453125, 4.32061767578125, 4.60400390625, 4.88739013671875, 5.1707763671875, 5.45416259765625, 5.737548828125, 6.02093505859375, 6.3043212890625, 6.58770751953125, 6.87109375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 4.0, 3.0, 9.0, 8.0, 16.0, 10.0, 17.0, 18.0, 25.0, 30.0, 30.0, 44.0, 32.0, 35.0, 52.0, 49.0, 54.0, 57.0, 62.0, 48.0, 60.0, 54.0, 51.0, 34.0, 31.0, 24.0, 29.0, 23.0, 22.0, 15.0, 12.0, 15.0, 9.0, 7.0, 6.0, 0.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.61591148376465, -25.807968139648438, -25.000022888183594, -24.192079544067383, -23.384136199951172, -22.576190948486328, -21.768247604370117, -20.960304260253906, -20.152359008789062, -19.34441566467285, -18.536470413208008, -17.728527069091797, -16.920581817626953, -16.112638473510742, -15.304695129394531, -14.496750831604004, -13.688806533813477, -12.88086223602295, -12.072917938232422, -11.264974594116211, -10.457030296325684, -9.649085998535156, -8.841142654418945, -8.033198356628418, -7.225254058837891, -6.417309761047363, -5.609365940093994, -4.801422119140625, -3.9934778213500977, -3.1855335235595703, -2.377589702606201, -1.569645881652832, -0.7617034912109375, 0.04624056816101074, 0.854184627532959, 1.6621286869049072, 2.4700727462768555, 3.278017044067383, 4.085960865020752, 4.893904685974121, 5.701848983764648, 6.509793281555176, 7.317737102508545, 8.125680923461914, 8.933625221252441, 9.741569519042969, 10.54951286315918, 11.357457160949707, 12.165401458740234, 12.973345756530762, 13.781290054321289, 14.5892333984375, 15.397177696228027, 16.205121994018555, 17.013065338134766, 17.82101058959961, 18.62895393371582, 19.43689727783203, 20.244842529296875, 21.052785873413086, 21.860729217529297, 22.66867446899414, 23.47661781311035, 24.284561157226562, 25.092506408691406]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 3.0, 5.0, 6.0, 15.0, 8.0, 10.0, 8.0, 15.0, 19.0, 10.0, 13.0, 20.0, 14.0, 21.0, 24.0, 35.0, 37.0, 26.0, 27.0, 26.0, 33.0, 43.0, 24.0, 38.0, 39.0, 34.0, 41.0, 44.0, 32.0, 26.0, 39.0, 27.0, 23.0, 21.0, 28.0, 24.0, 27.0, 27.0, 25.0, 16.0, 10.0, 3.0, 8.0, 7.0, 4.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0], "bins": [-18.963850021362305, -18.39661979675293, -17.829391479492188, -17.262161254882812, -16.694931030273438, -16.127700805664062, -15.56047248840332, -14.993242263793945, -14.426012992858887, -13.858783721923828, -13.291553497314453, -12.724324226379395, -12.157094955444336, -11.589864730834961, -11.022635459899902, -10.455406188964844, -9.888175964355469, -9.32094669342041, -8.753716468811035, -8.186487197875977, -7.61925745010376, -7.052027702331543, -6.484798431396484, -5.917568683624268, -5.350338935852051, -4.783109188079834, -4.215879440307617, -3.6486501693725586, -3.081420421600342, -2.514190673828125, -1.9469611644744873, -1.3797316551208496, -0.8125038146972656, -0.24527418613433838, 0.32195544242858887, 0.8891850709915161, 1.4564146995544434, 2.02364444732666, 2.590873956680298, 3.1581034660339355, 3.7253332138061523, 4.292562961578369, 4.859792709350586, 5.4270219802856445, 5.994251728057861, 6.561481475830078, 7.128710746765137, 7.6959404945373535, 8.26317024230957, 8.830399513244629, 9.397629737854004, 9.964859008789062, 10.532089233398438, 11.099318504333496, 11.666547775268555, 12.23377799987793, 12.801007270812988, 13.368236541748047, 13.935466766357422, 14.50269603729248, 15.069925308227539, 15.637155532836914, 16.20438575744629, 16.77161407470703, 17.338844299316406]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 8.0, 8.0, 14.0, 19.0, 26.0, 39.0, 58.0, 93.0, 152.0, 204.0, 334.0, 495.0, 743.0, 1109.0, 1628.0, 2787.0, 4120.0, 6520.0, 10517.0, 17327.0, 27917.0, 45801.0, 73928.0, 116221.0, 165047.0, 180387.0, 143419.0, 94948.0, 59323.0, 36292.0, 21903.0, 13584.0, 8538.0, 5369.0, 3271.0, 2237.0, 1384.0, 964.0, 604.0, 414.0, 283.0, 166.0, 131.0, 84.0, 55.0, 26.0, 25.0, 17.0, 9.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0], "bins": [-55.03125, -53.42529296875, -51.8193359375, -50.21337890625, -48.607421875, -47.00146484375, -45.3955078125, -43.78955078125, -42.18359375, -40.57763671875, -38.9716796875, -37.36572265625, -35.759765625, -34.15380859375, -32.5478515625, -30.94189453125, -29.3359375, -27.72998046875, -26.1240234375, -24.51806640625, -22.912109375, -21.30615234375, -19.7001953125, -18.09423828125, -16.48828125, -14.88232421875, -13.2763671875, -11.67041015625, -10.064453125, -8.45849609375, -6.8525390625, -5.24658203125, -3.640625, -2.03466796875, -0.4287109375, 1.17724609375, 2.783203125, 4.38916015625, 5.9951171875, 7.60107421875, 9.20703125, 10.81298828125, 12.4189453125, 14.02490234375, 15.630859375, 17.23681640625, 18.8427734375, 20.44873046875, 22.0546875, 23.66064453125, 25.2666015625, 26.87255859375, 28.478515625, 30.08447265625, 31.6904296875, 33.29638671875, 34.90234375, 36.50830078125, 38.1142578125, 39.72021484375, 41.326171875, 42.93212890625, 44.5380859375, 46.14404296875, 47.75]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 8.0, 11.0, 15.0, 11.0, 18.0, 18.0, 20.0, 20.0, 20.0, 23.0, 32.0, 27.0, 24.0, 33.0, 31.0, 55.0, 38.0, 33.0, 36.0, 47.0, 37.0, 45.0, 53.0, 31.0, 45.0, 28.0, 33.0, 33.0, 23.0, 28.0, 27.0, 18.0, 14.0, 16.0, 17.0, 7.0, 5.0, 5.0, 1.0, 4.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.734375, -19.167236328125, -18.60009765625, -18.032958984375, -17.4658203125, -16.898681640625, -16.33154296875, -15.764404296875, -15.197265625, -14.630126953125, -14.06298828125, -13.495849609375, -12.9287109375, -12.361572265625, -11.79443359375, -11.227294921875, -10.66015625, -10.093017578125, -9.52587890625, -8.958740234375, -8.3916015625, -7.824462890625, -7.25732421875, -6.690185546875, -6.123046875, -5.555908203125, -4.98876953125, -4.421630859375, -3.8544921875, -3.287353515625, -2.72021484375, -2.153076171875, -1.5859375, -1.018798828125, -0.45166015625, 0.115478515625, 0.6826171875, 1.249755859375, 1.81689453125, 2.384033203125, 2.951171875, 3.518310546875, 4.08544921875, 4.652587890625, 5.2197265625, 5.786865234375, 6.35400390625, 6.921142578125, 7.48828125, 8.055419921875, 8.62255859375, 9.189697265625, 9.7568359375, 10.323974609375, 10.89111328125, 11.458251953125, 12.025390625, 12.592529296875, 13.15966796875, 13.726806640625, 14.2939453125, 14.861083984375, 15.42822265625, 15.995361328125, 16.5625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 8.0, 13.0, 20.0, 23.0, 33.0, 55.0, 50.0, 110.0, 195.0, 278.0, 390.0, 628.0, 999.0, 1556.0, 2499.0, 4050.0, 6426.0, 10859.0, 17719.0, 29636.0, 51209.0, 89309.0, 151029.0, 218621.0, 186587.0, 114507.0, 66139.0, 38094.0, 22564.0, 13515.0, 8048.0, 4951.0, 3092.0, 1924.0, 1239.0, 788.0, 476.0, 342.0, 204.0, 129.0, 82.0, 61.0, 32.0, 24.0, 12.0, 15.0, 8.0, 4.0, 3.0, 1.0, 3.0, 1.0], "bins": [-55.25, -53.70361328125, -52.1572265625, -50.61083984375, -49.064453125, -47.51806640625, -45.9716796875, -44.42529296875, -42.87890625, -41.33251953125, -39.7861328125, -38.23974609375, -36.693359375, -35.14697265625, -33.6005859375, -32.05419921875, -30.5078125, -28.96142578125, -27.4150390625, -25.86865234375, -24.322265625, -22.77587890625, -21.2294921875, -19.68310546875, -18.13671875, -16.59033203125, -15.0439453125, -13.49755859375, -11.951171875, -10.40478515625, -8.8583984375, -7.31201171875, -5.765625, -4.21923828125, -2.6728515625, -1.12646484375, 0.419921875, 1.96630859375, 3.5126953125, 5.05908203125, 6.60546875, 8.15185546875, 9.6982421875, 11.24462890625, 12.791015625, 14.33740234375, 15.8837890625, 17.43017578125, 18.9765625, 20.52294921875, 22.0693359375, 23.61572265625, 25.162109375, 26.70849609375, 28.2548828125, 29.80126953125, 31.34765625, 32.89404296875, 34.4404296875, 35.98681640625, 37.533203125, 39.07958984375, 40.6259765625, 42.17236328125, 43.71875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 10.0, 10.0, 10.0, 8.0, 17.0, 16.0, 28.0, 18.0, 26.0, 31.0, 42.0, 26.0, 47.0, 44.0, 42.0, 44.0, 53.0, 51.0, 41.0, 54.0, 37.0, 39.0, 36.0, 43.0, 41.0, 19.0, 31.0, 25.0, 23.0, 12.0, 13.0, 12.0, 12.0, 11.0, 6.0, 4.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.203125, -12.738525390625, -12.27392578125, -11.809326171875, -11.3447265625, -10.880126953125, -10.41552734375, -9.950927734375, -9.486328125, -9.021728515625, -8.55712890625, -8.092529296875, -7.6279296875, -7.163330078125, -6.69873046875, -6.234130859375, -5.76953125, -5.304931640625, -4.84033203125, -4.375732421875, -3.9111328125, -3.446533203125, -2.98193359375, -2.517333984375, -2.052734375, -1.588134765625, -1.12353515625, -0.658935546875, -0.1943359375, 0.270263671875, 0.73486328125, 1.199462890625, 1.6640625, 2.128662109375, 2.59326171875, 3.057861328125, 3.5224609375, 3.987060546875, 4.45166015625, 4.916259765625, 5.380859375, 5.845458984375, 6.31005859375, 6.774658203125, 7.2392578125, 7.703857421875, 8.16845703125, 8.633056640625, 9.09765625, 9.562255859375, 10.02685546875, 10.491455078125, 10.9560546875, 11.420654296875, 11.88525390625, 12.349853515625, 12.814453125, 13.279052734375, 13.74365234375, 14.208251953125, 14.6728515625, 15.137451171875, 15.60205078125, 16.066650390625, 16.53125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 7.0, 4.0, 5.0, 12.0, 14.0, 8.0, 23.0, 39.0, 36.0, 54.0, 119.0, 160.0, 270.0, 448.0, 712.0, 1374.0, 2695.0, 5023.0, 10373.0, 23981.0, 59545.0, 173257.0, 422047.0, 221130.0, 73494.0, 28639.0, 12327.0, 5922.0, 3004.0, 1594.0, 866.0, 538.0, 292.0, 169.0, 124.0, 95.0, 54.0, 34.0, 19.0, 14.0, 7.0, 9.0, 7.0, 9.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.6875, -46.1787109375, -44.669921875, -43.1611328125, -41.65234375, -40.1435546875, -38.634765625, -37.1259765625, -35.6171875, -34.1083984375, -32.599609375, -31.0908203125, -29.58203125, -28.0732421875, -26.564453125, -25.0556640625, -23.546875, -22.0380859375, -20.529296875, -19.0205078125, -17.51171875, -16.0029296875, -14.494140625, -12.9853515625, -11.4765625, -9.9677734375, -8.458984375, -6.9501953125, -5.44140625, -3.9326171875, -2.423828125, -0.9150390625, 0.59375, 2.1025390625, 3.611328125, 5.1201171875, 6.62890625, 8.1376953125, 9.646484375, 11.1552734375, 12.6640625, 14.1728515625, 15.681640625, 17.1904296875, 18.69921875, 20.2080078125, 21.716796875, 23.2255859375, 24.734375, 26.2431640625, 27.751953125, 29.2607421875, 30.76953125, 32.2783203125, 33.787109375, 35.2958984375, 36.8046875, 38.3134765625, 39.822265625, 41.3310546875, 42.83984375, 44.3486328125, 45.857421875, 47.3662109375, 48.875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 2.0, 4.0, 8.0, 10.0, 12.0, 26.0, 18.0, 39.0, 75.0, 101.0, 154.0, 179.0, 123.0, 84.0, 45.0, 43.0, 23.0, 13.0, 13.0, 5.0, 4.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0063323974609375, -0.006166338920593262, -0.0060002803802490234, -0.005834221839904785, -0.005668163299560547, -0.005502104759216309, -0.00533604621887207, -0.005169987678527832, -0.005003929138183594, -0.0048378705978393555, -0.004671812057495117, -0.004505753517150879, -0.004339694976806641, -0.004173636436462402, -0.004007577896118164, -0.0038415193557739258, -0.0036754608154296875, -0.0035094022750854492, -0.003343343734741211, -0.0031772851943969727, -0.0030112266540527344, -0.002845168113708496, -0.002679109573364258, -0.0025130510330200195, -0.0023469924926757812, -0.002180933952331543, -0.0020148754119873047, -0.0018488168716430664, -0.0016827583312988281, -0.0015166997909545898, -0.0013506412506103516, -0.0011845827102661133, -0.001018524169921875, -0.0008524656295776367, -0.0006864070892333984, -0.0005203485488891602, -0.0003542900085449219, -0.0001882314682006836, -2.2172927856445312e-05, 0.00014388561248779297, 0.00030994415283203125, 0.00047600269317626953, 0.0006420612335205078, 0.0008081197738647461, 0.0009741783142089844, 0.0011402368545532227, 0.001306295394897461, 0.0014723539352416992, 0.0016384124755859375, 0.0018044710159301758, 0.001970529556274414, 0.0021365880966186523, 0.0023026466369628906, 0.002468705177307129, 0.002634763717651367, 0.0028008222579956055, 0.0029668807983398438, 0.003132939338684082, 0.0032989978790283203, 0.0034650564193725586, 0.003631114959716797, 0.003797173500061035, 0.0039632320404052734, 0.004129290580749512, 0.00429534912109375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 6.0, 12.0, 16.0, 14.0, 26.0, 38.0, 57.0, 103.0, 148.0, 232.0, 370.0, 579.0, 952.0, 1470.0, 2456.0, 3779.0, 6862.0, 11724.0, 20516.0, 36638.0, 66921.0, 121261.0, 197310.0, 222119.0, 155425.0, 88166.0, 48194.0, 26423.0, 14909.0, 8535.0, 5194.0, 3051.0, 1879.0, 1195.0, 691.0, 454.0, 297.0, 184.0, 111.0, 75.0, 57.0, 38.0, 18.0, 17.0, 12.0, 4.0, 7.0, 7.0, 3.0, 3.0, 1.0, 2.0], "bins": [-24.046875, -23.3642578125, -22.681640625, -21.9990234375, -21.31640625, -20.6337890625, -19.951171875, -19.2685546875, -18.5859375, -17.9033203125, -17.220703125, -16.5380859375, -15.85546875, -15.1728515625, -14.490234375, -13.8076171875, -13.125, -12.4423828125, -11.759765625, -11.0771484375, -10.39453125, -9.7119140625, -9.029296875, -8.3466796875, -7.6640625, -6.9814453125, -6.298828125, -5.6162109375, -4.93359375, -4.2509765625, -3.568359375, -2.8857421875, -2.203125, -1.5205078125, -0.837890625, -0.1552734375, 0.52734375, 1.2099609375, 1.892578125, 2.5751953125, 3.2578125, 3.9404296875, 4.623046875, 5.3056640625, 5.98828125, 6.6708984375, 7.353515625, 8.0361328125, 8.71875, 9.4013671875, 10.083984375, 10.7666015625, 11.44921875, 12.1318359375, 12.814453125, 13.4970703125, 14.1796875, 14.8623046875, 15.544921875, 16.2275390625, 16.91015625, 17.5927734375, 18.275390625, 18.9580078125, 19.640625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 1.0, 5.0, 1.0, 3.0, 9.0, 8.0, 7.0, 16.0, 11.0, 16.0, 19.0, 22.0, 38.0, 35.0, 31.0, 38.0, 41.0, 66.0, 61.0, 57.0, 60.0, 64.0, 56.0, 36.0, 50.0, 43.0, 31.0, 31.0, 32.0, 26.0, 17.0, 15.0, 11.0, 10.0, 7.0, 7.0, 7.0, 3.0, 0.0, 3.0, 2.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.12109375, -5.89984130859375, -5.6785888671875, -5.45733642578125, -5.236083984375, -5.01483154296875, -4.7935791015625, -4.57232666015625, -4.35107421875, -4.12982177734375, -3.9085693359375, -3.68731689453125, -3.466064453125, -3.24481201171875, -3.0235595703125, -2.80230712890625, -2.5810546875, -2.35980224609375, -2.1385498046875, -1.91729736328125, -1.696044921875, -1.47479248046875, -1.2535400390625, -1.03228759765625, -0.81103515625, -0.58978271484375, -0.3685302734375, -0.14727783203125, 0.073974609375, 0.29522705078125, 0.5164794921875, 0.73773193359375, 0.958984375, 1.18023681640625, 1.4014892578125, 1.62274169921875, 1.843994140625, 2.06524658203125, 2.2864990234375, 2.50775146484375, 2.72900390625, 2.95025634765625, 3.1715087890625, 3.39276123046875, 3.614013671875, 3.83526611328125, 4.0565185546875, 4.27777099609375, 4.4990234375, 4.72027587890625, 4.9415283203125, 5.16278076171875, 5.384033203125, 5.60528564453125, 5.8265380859375, 6.04779052734375, 6.26904296875, 6.49029541015625, 6.7115478515625, 6.93280029296875, 7.154052734375, 7.37530517578125, 7.5965576171875, 7.81781005859375, 8.0390625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 2.0, 5.0, 2.0, 7.0, 3.0, 11.0, 17.0, 21.0, 12.0, 14.0, 18.0, 28.0, 41.0, 28.0, 40.0, 42.0, 42.0, 46.0, 60.0, 53.0, 58.0, 47.0, 49.0, 48.0, 44.0, 32.0, 30.0, 28.0, 34.0, 22.0, 17.0, 13.0, 16.0, 13.0, 13.0, 14.0, 8.0, 2.0, 6.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.716218948364258, -17.10547637939453, -16.494731903076172, -15.883988380432129, -15.273244857788086, -14.66250228881836, -14.051758766174316, -13.441015243530273, -12.83027172088623, -12.219528198242188, -11.608784675598145, -10.998041152954102, -10.387298583984375, -9.776554107666016, -9.165811538696289, -8.555068016052246, -7.944324493408203, -7.33358097076416, -6.722837448120117, -6.112094402313232, -5.5013508796691895, -4.8906073570251465, -4.279864311218262, -3.6691207885742188, -3.058377265930176, -2.447633743286133, -1.836890459060669, -1.2261470556259155, -0.6154036521911621, -0.004660129547119141, 0.6060831546783447, 1.2168264389038086, 1.8275699615478516, 2.4383134841918945, 3.0490567684173584, 3.6598000526428223, 4.270543575286865, 4.881287097930908, 5.492030143737793, 6.102773666381836, 6.713517189025879, 7.324260711669922, 7.935004234313965, 8.545747756958008, 9.156490325927734, 9.767234802246094, 10.37797737121582, 10.988720893859863, 11.599464416503906, 12.21020793914795, 12.820951461791992, 13.431694984436035, 14.042438507080078, 14.653181076049805, 15.263924598693848, 15.87466812133789, 16.48541259765625, 17.096155166625977, 17.706899642944336, 18.317642211914062, 18.928386688232422, 19.53912925720215, 20.149873733520508, 20.760616302490234, 21.37135887145996]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 6.0, 3.0, 10.0, 3.0, 11.0, 7.0, 11.0, 9.0, 16.0, 19.0, 25.0, 7.0, 20.0, 16.0, 16.0, 31.0, 28.0, 25.0, 27.0, 26.0, 31.0, 38.0, 37.0, 48.0, 34.0, 33.0, 34.0, 38.0, 40.0, 24.0, 26.0, 36.0, 30.0, 39.0, 28.0, 26.0, 23.0, 20.0, 16.0, 14.0, 14.0, 11.0, 7.0, 10.0, 3.0, 8.0, 5.0, 3.0, 5.0, 4.0, 0.0, 2.0, 2.0, 2.0], "bins": [-15.952142715454102, -15.489089965820312, -15.026036262512207, -14.562983512878418, -14.099930763244629, -13.636877059936523, -13.173824310302734, -12.710771560668945, -12.247718811035156, -11.784666061401367, -11.321612358093262, -10.858559608459473, -10.395506858825684, -9.932453155517578, -9.469400405883789, -9.00634765625, -8.543293952941895, -8.080241203308105, -7.617187976837158, -7.154134750366211, -6.691082000732422, -6.228028774261475, -5.764975547790527, -5.301922798156738, -4.838869571685791, -4.375816345214844, -3.9127635955810547, -3.4497103691101074, -2.9866573810577393, -2.523604393005371, -2.060551166534424, -1.5974981784820557, -1.1344451904296875, -0.6713921427726746, -0.20833909511566162, 0.2547140121459961, 0.7177670001983643, 1.1808199882507324, 1.6438732147216797, 2.106926202774048, 2.569979190826416, 3.033032178878784, 3.4960851669311523, 3.9591383934020996, 4.422191619873047, 4.885244369506836, 5.348297595977783, 5.8113508224487305, 6.2744035720825195, 6.737456798553467, 7.200509548187256, 7.663562774658203, 8.126615524291992, 8.589668273925781, 9.052721977233887, 9.515774726867676, 9.978828430175781, 10.44188117980957, 10.904934883117676, 11.367987632751465, 11.831040382385254, 12.29409408569336, 12.757146835327148, 13.220199584960938, 13.683252334594727]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 5.0, 0.0, 3.0, 9.0, 16.0, 19.0, 29.0, 47.0, 55.0, 109.0, 171.0, 228.0, 376.0, 600.0, 933.0, 1345.0, 2104.0, 3200.0, 4914.0, 7927.0, 11628.0, 17931.0, 26828.0, 39293.0, 56017.0, 76647.0, 97887.0, 116202.0, 122878.0, 115679.0, 97586.0, 75650.0, 55746.0, 39352.0, 26012.0, 17682.0, 11662.0, 7668.0, 4910.0, 3145.0, 2144.0, 1325.0, 860.0, 589.0, 427.0, 249.0, 151.0, 98.0, 66.0, 62.0, 39.0, 33.0, 10.0, 5.0, 6.0, 7.0, 4.0, 1.0, 1.0, 2.0], "bins": [-14.1015625, -13.66748046875, -13.2333984375, -12.79931640625, -12.365234375, -11.93115234375, -11.4970703125, -11.06298828125, -10.62890625, -10.19482421875, -9.7607421875, -9.32666015625, -8.892578125, -8.45849609375, -8.0244140625, -7.59033203125, -7.15625, -6.72216796875, -6.2880859375, -5.85400390625, -5.419921875, -4.98583984375, -4.5517578125, -4.11767578125, -3.68359375, -3.24951171875, -2.8154296875, -2.38134765625, -1.947265625, -1.51318359375, -1.0791015625, -0.64501953125, -0.2109375, 0.22314453125, 0.6572265625, 1.09130859375, 1.525390625, 1.95947265625, 2.3935546875, 2.82763671875, 3.26171875, 3.69580078125, 4.1298828125, 4.56396484375, 4.998046875, 5.43212890625, 5.8662109375, 6.30029296875, 6.734375, 7.16845703125, 7.6025390625, 8.03662109375, 8.470703125, 8.90478515625, 9.3388671875, 9.77294921875, 10.20703125, 10.64111328125, 11.0751953125, 11.50927734375, 11.943359375, 12.37744140625, 12.8115234375, 13.24560546875, 13.6796875]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 7.0, 7.0, 11.0, 10.0, 12.0, 13.0, 13.0, 15.0, 26.0, 21.0, 26.0, 22.0, 19.0, 26.0, 31.0, 33.0, 45.0, 34.0, 38.0, 26.0, 41.0, 36.0, 34.0, 41.0, 46.0, 41.0, 38.0, 31.0, 39.0, 35.0, 24.0, 22.0, 26.0, 18.0, 24.0, 12.0, 13.0, 6.0, 8.0, 3.0, 4.0, 9.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-17.0, -16.5118408203125, -16.023681640625, -15.5355224609375, -15.04736328125, -14.5592041015625, -14.071044921875, -13.5828857421875, -13.0947265625, -12.6065673828125, -12.118408203125, -11.6302490234375, -11.14208984375, -10.6539306640625, -10.165771484375, -9.6776123046875, -9.189453125, -8.7012939453125, -8.213134765625, -7.7249755859375, -7.23681640625, -6.7486572265625, -6.260498046875, -5.7723388671875, -5.2841796875, -4.7960205078125, -4.307861328125, -3.8197021484375, -3.33154296875, -2.8433837890625, -2.355224609375, -1.8670654296875, -1.37890625, -0.8907470703125, -0.402587890625, 0.0855712890625, 0.57373046875, 1.0618896484375, 1.550048828125, 2.0382080078125, 2.5263671875, 3.0145263671875, 3.502685546875, 3.9908447265625, 4.47900390625, 4.9671630859375, 5.455322265625, 5.9434814453125, 6.431640625, 6.9197998046875, 7.407958984375, 7.8961181640625, 8.38427734375, 8.8724365234375, 9.360595703125, 9.8487548828125, 10.3369140625, 10.8250732421875, 11.313232421875, 11.8013916015625, 12.28955078125, 12.7777099609375, 13.265869140625, 13.7540283203125, 14.2421875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 11.0, 18.0, 26.0, 38.0, 65.0, 96.0, 138.0, 245.0, 403.0, 635.0, 1006.0, 1641.0, 2600.0, 4256.0, 7128.0, 11837.0, 19805.0, 33984.0, 56633.0, 90273.0, 131245.0, 162559.0, 163079.0, 131186.0, 89765.0, 56385.0, 33461.0, 19884.0, 11973.0, 7049.0, 4295.0, 2544.0, 1616.0, 994.0, 577.0, 409.0, 243.0, 167.0, 112.0, 60.0, 45.0, 26.0, 16.0, 8.0, 8.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0], "bins": [-18.9375, -18.3963623046875, -17.855224609375, -17.3140869140625, -16.77294921875, -16.2318115234375, -15.690673828125, -15.1495361328125, -14.6083984375, -14.0672607421875, -13.526123046875, -12.9849853515625, -12.44384765625, -11.9027099609375, -11.361572265625, -10.8204345703125, -10.279296875, -9.7381591796875, -9.197021484375, -8.6558837890625, -8.11474609375, -7.5736083984375, -7.032470703125, -6.4913330078125, -5.9501953125, -5.4090576171875, -4.867919921875, -4.3267822265625, -3.78564453125, -3.2445068359375, -2.703369140625, -2.1622314453125, -1.62109375, -1.0799560546875, -0.538818359375, 0.0023193359375, 0.54345703125, 1.0845947265625, 1.625732421875, 2.1668701171875, 2.7080078125, 3.2491455078125, 3.790283203125, 4.3314208984375, 4.87255859375, 5.4136962890625, 5.954833984375, 6.4959716796875, 7.037109375, 7.5782470703125, 8.119384765625, 8.6605224609375, 9.20166015625, 9.7427978515625, 10.283935546875, 10.8250732421875, 11.3662109375, 11.9073486328125, 12.448486328125, 12.9896240234375, 13.53076171875, 14.0718994140625, 14.613037109375, 15.1541748046875, 15.6953125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 5.0, 9.0, 6.0, 8.0, 13.0, 7.0, 11.0, 16.0, 20.0, 31.0, 26.0, 29.0, 24.0, 42.0, 57.0, 40.0, 39.0, 28.0, 37.0, 36.0, 51.0, 46.0, 37.0, 39.0, 52.0, 41.0, 38.0, 25.0, 30.0, 25.0, 21.0, 17.0, 20.0, 20.0, 10.0, 10.0, 11.0, 7.0, 7.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0], "bins": [-12.0859375, -11.73095703125, -11.3759765625, -11.02099609375, -10.666015625, -10.31103515625, -9.9560546875, -9.60107421875, -9.24609375, -8.89111328125, -8.5361328125, -8.18115234375, -7.826171875, -7.47119140625, -7.1162109375, -6.76123046875, -6.40625, -6.05126953125, -5.6962890625, -5.34130859375, -4.986328125, -4.63134765625, -4.2763671875, -3.92138671875, -3.56640625, -3.21142578125, -2.8564453125, -2.50146484375, -2.146484375, -1.79150390625, -1.4365234375, -1.08154296875, -0.7265625, -0.37158203125, -0.0166015625, 0.33837890625, 0.693359375, 1.04833984375, 1.4033203125, 1.75830078125, 2.11328125, 2.46826171875, 2.8232421875, 3.17822265625, 3.533203125, 3.88818359375, 4.2431640625, 4.59814453125, 4.953125, 5.30810546875, 5.6630859375, 6.01806640625, 6.373046875, 6.72802734375, 7.0830078125, 7.43798828125, 7.79296875, 8.14794921875, 8.5029296875, 8.85791015625, 9.212890625, 9.56787109375, 9.9228515625, 10.27783203125, 10.6328125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 7.0, 10.0, 11.0, 11.0, 16.0, 45.0, 49.0, 67.0, 116.0, 182.0, 265.0, 416.0, 721.0, 1105.0, 1865.0, 3070.0, 5470.0, 9774.0, 18251.0, 36446.0, 75226.0, 151489.0, 243525.0, 230707.0, 134680.0, 65333.0, 32259.0, 16489.0, 8825.0, 4873.0, 2820.0, 1666.0, 1007.0, 639.0, 410.0, 247.0, 168.0, 100.0, 66.0, 53.0, 30.0, 15.0, 9.0, 6.0, 5.0, 1.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.203125, -14.67724609375, -14.1513671875, -13.62548828125, -13.099609375, -12.57373046875, -12.0478515625, -11.52197265625, -10.99609375, -10.47021484375, -9.9443359375, -9.41845703125, -8.892578125, -8.36669921875, -7.8408203125, -7.31494140625, -6.7890625, -6.26318359375, -5.7373046875, -5.21142578125, -4.685546875, -4.15966796875, -3.6337890625, -3.10791015625, -2.58203125, -2.05615234375, -1.5302734375, -1.00439453125, -0.478515625, 0.04736328125, 0.5732421875, 1.09912109375, 1.625, 2.15087890625, 2.6767578125, 3.20263671875, 3.728515625, 4.25439453125, 4.7802734375, 5.30615234375, 5.83203125, 6.35791015625, 6.8837890625, 7.40966796875, 7.935546875, 8.46142578125, 8.9873046875, 9.51318359375, 10.0390625, 10.56494140625, 11.0908203125, 11.61669921875, 12.142578125, 12.66845703125, 13.1943359375, 13.72021484375, 14.24609375, 14.77197265625, 15.2978515625, 15.82373046875, 16.349609375, 16.87548828125, 17.4013671875, 17.92724609375, 18.453125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 10.0, 8.0, 8.0, 12.0, 16.0, 27.0, 28.0, 47.0, 38.0, 59.0, 71.0, 82.0, 73.0, 90.0, 77.0, 64.0, 57.0, 42.0, 46.0, 39.0, 28.0, 18.0, 11.0, 8.0, 12.0, 8.0, 4.0, 2.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019388198852539062, -0.0018799751996994019, -0.0018211305141448975, -0.001762285828590393, -0.0017034411430358887, -0.0016445964574813843, -0.0015857517719268799, -0.0015269070863723755, -0.001468062400817871, -0.0014092177152633667, -0.0013503730297088623, -0.001291528344154358, -0.0012326836585998535, -0.0011738389730453491, -0.0011149942874908447, -0.0010561496019363403, -0.000997304916381836, -0.0009384602308273315, -0.0008796155452728271, -0.0008207708597183228, -0.0007619261741638184, -0.000703081488609314, -0.0006442368030548096, -0.0005853921175003052, -0.0005265474319458008, -0.0004677027463912964, -0.000408858060836792, -0.0003500133752822876, -0.0002911686897277832, -0.0002323240041732788, -0.00017347931861877441, -0.00011463463306427002, -5.5789947509765625e-05, 3.0547380447387695e-06, 6.189942359924316e-05, 0.00012074410915374756, 0.00017958879470825195, 0.00023843348026275635, 0.00029727816581726074, 0.00035612285137176514, 0.00041496753692626953, 0.0004738122224807739, 0.0005326569080352783, 0.0005915015935897827, 0.0006503462791442871, 0.0007091909646987915, 0.0007680356502532959, 0.0008268803358078003, 0.0008857250213623047, 0.0009445697069168091, 0.0010034143924713135, 0.0010622590780258179, 0.0011211037635803223, 0.0011799484491348267, 0.001238793134689331, 0.0012976378202438354, 0.0013564825057983398, 0.0014153271913528442, 0.0014741718769073486, 0.001533016562461853, 0.0015918612480163574, 0.0016507059335708618, 0.0017095506191253662, 0.0017683953046798706, 0.001827239990234375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 9.0, 7.0, 14.0, 17.0, 28.0, 33.0, 44.0, 73.0, 77.0, 131.0, 203.0, 269.0, 393.0, 583.0, 917.0, 1412.0, 2358.0, 3821.0, 6765.0, 11526.0, 21451.0, 39784.0, 74939.0, 134561.0, 205545.0, 213045.0, 148133.0, 83228.0, 44121.0, 23500.0, 13006.0, 7272.0, 4198.0, 2532.0, 1511.0, 1013.0, 617.0, 451.0, 293.0, 203.0, 160.0, 101.0, 48.0, 57.0, 28.0, 21.0, 21.0, 9.0, 11.0, 10.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-14.7890625, -14.328125, -13.8671875, -13.40625, -12.9453125, -12.484375, -12.0234375, -11.5625, -11.1015625, -10.640625, -10.1796875, -9.71875, -9.2578125, -8.796875, -8.3359375, -7.875, -7.4140625, -6.953125, -6.4921875, -6.03125, -5.5703125, -5.109375, -4.6484375, -4.1875, -3.7265625, -3.265625, -2.8046875, -2.34375, -1.8828125, -1.421875, -0.9609375, -0.5, -0.0390625, 0.421875, 0.8828125, 1.34375, 1.8046875, 2.265625, 2.7265625, 3.1875, 3.6484375, 4.109375, 4.5703125, 5.03125, 5.4921875, 5.953125, 6.4140625, 6.875, 7.3359375, 7.796875, 8.2578125, 8.71875, 9.1796875, 9.640625, 10.1015625, 10.5625, 11.0234375, 11.484375, 11.9453125, 12.40625, 12.8671875, 13.328125, 13.7890625, 14.25, 14.7109375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 4.0, 7.0, 4.0, 6.0, 4.0, 8.0, 13.0, 16.0, 14.0, 16.0, 22.0, 27.0, 35.0, 43.0, 39.0, 35.0, 48.0, 52.0, 57.0, 58.0, 47.0, 48.0, 51.0, 48.0, 47.0, 29.0, 38.0, 39.0, 35.0, 22.0, 9.0, 18.0, 9.0, 7.0, 11.0, 7.0, 6.0, 8.0, 3.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0390625, -3.91998291015625, -3.8009033203125, -3.68182373046875, -3.562744140625, -3.44366455078125, -3.3245849609375, -3.20550537109375, -3.08642578125, -2.96734619140625, -2.8482666015625, -2.72918701171875, -2.610107421875, -2.49102783203125, -2.3719482421875, -2.25286865234375, -2.1337890625, -2.01470947265625, -1.8956298828125, -1.77655029296875, -1.657470703125, -1.53839111328125, -1.4193115234375, -1.30023193359375, -1.18115234375, -1.06207275390625, -0.9429931640625, -0.82391357421875, -0.704833984375, -0.58575439453125, -0.4666748046875, -0.34759521484375, -0.228515625, -0.10943603515625, 0.0096435546875, 0.12872314453125, 0.247802734375, 0.36688232421875, 0.4859619140625, 0.60504150390625, 0.72412109375, 0.84320068359375, 0.9622802734375, 1.08135986328125, 1.200439453125, 1.31951904296875, 1.4385986328125, 1.55767822265625, 1.6767578125, 1.79583740234375, 1.9149169921875, 2.03399658203125, 2.153076171875, 2.27215576171875, 2.3912353515625, 2.51031494140625, 2.62939453125, 2.74847412109375, 2.8675537109375, 2.98663330078125, 3.105712890625, 3.22479248046875, 3.3438720703125, 3.46295166015625, 3.58203125]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 7.0, 8.0, 9.0, 14.0, 13.0, 20.0, 21.0, 16.0, 24.0, 41.0, 44.0, 29.0, 54.0, 54.0, 49.0, 49.0, 61.0, 53.0, 53.0, 38.0, 56.0, 35.0, 31.0, 33.0, 23.0, 34.0, 19.0, 20.0, 22.0, 9.0, 7.0, 11.0, 6.0, 6.0, 3.0, 7.0, 7.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.620800018310547, -17.036314010620117, -16.451826095581055, -15.867340087890625, -15.282854080200195, -14.69836711883545, -14.113880157470703, -13.529394149780273, -12.944907188415527, -12.360420227050781, -11.775934219360352, -11.191447257995605, -10.60696029663086, -10.02247428894043, -9.437987327575684, -8.853500366210938, -8.269014358520508, -7.68452787399292, -7.100041389465332, -6.515554428100586, -5.931067943572998, -5.34658145904541, -4.762094497680664, -4.177608013153076, -3.5931215286254883, -3.0086350440979004, -2.4241483211517334, -1.839661717414856, -1.2551751136779785, -0.6706886291503906, -0.08620190620422363, 0.49828481674194336, 1.082773208618164, 1.6672598123550415, 2.251746416091919, 2.836233139038086, 3.420719623565674, 4.005206108093262, 4.589693069458008, 5.174179553985596, 5.758666038513184, 6.3431525230407715, 6.927639007568359, 7.5121259689331055, 8.096612930297852, 8.681098937988281, 9.265585899353027, 9.850072860717773, 10.434558868408203, 11.01904582977295, 11.603531837463379, 12.188018798828125, 12.772504806518555, 13.3569917678833, 13.941478729248047, 14.525964736938477, 15.110451698303223, 15.694938659667969, 16.2794246673584, 16.863910675048828, 17.44839859008789, 18.03288459777832, 18.61737060546875, 19.201858520507812, 19.786344528198242]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 9.0, 5.0, 10.0, 12.0, 11.0, 7.0, 16.0, 13.0, 12.0, 15.0, 19.0, 21.0, 24.0, 18.0, 24.0, 31.0, 31.0, 28.0, 30.0, 32.0, 36.0, 39.0, 38.0, 34.0, 37.0, 33.0, 42.0, 35.0, 36.0, 29.0, 34.0, 34.0, 21.0, 28.0, 23.0, 21.0, 24.0, 14.0, 11.0, 13.0, 18.0, 10.0, 4.0, 3.0, 5.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-14.68523120880127, -14.213888168334961, -13.742544174194336, -13.271201133728027, -12.799858093261719, -12.328514099121094, -11.857171058654785, -11.385828018188477, -10.914484024047852, -10.443140983581543, -9.971796989440918, -9.50045394897461, -9.029109954833984, -8.557766914367676, -8.086423873901367, -7.6150803565979, -7.143736839294434, -6.672393321990967, -6.2010498046875, -5.729706764221191, -5.258363246917725, -4.787019729614258, -4.315676689147949, -3.8443331718444824, -3.3729896545410156, -2.901646137237549, -2.430302858352661, -1.9589594602584839, -1.4876160621643066, -1.0162725448608398, -0.5449292659759521, -0.07358598709106445, 0.39775657653808594, 0.8690999746322632, 1.3404433727264404, 1.8117867708206177, 2.283130168914795, 2.7544736862182617, 3.2258169651031494, 3.697160243988037, 4.168503761291504, 4.639847278594971, 5.1111907958984375, 5.582533836364746, 6.053877353668213, 6.52522087097168, 6.996563911437988, 7.467907428741455, 7.939250946044922, 8.41059398651123, 8.881937980651855, 9.353281021118164, 9.824625015258789, 10.295968055725098, 10.767311096191406, 11.238655090332031, 11.70999813079834, 12.181341171264648, 12.652685165405273, 13.124028205871582, 13.59537124633789, 14.066715240478516, 14.538058280944824, 15.009401321411133, 15.480745315551758]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 11.0, 30.0, 21.0, 30.0, 45.0, 78.0, 125.0, 181.0, 256.0, 409.0, 629.0, 987.0, 1613.0, 2600.0, 3996.0, 6389.0, 10570.0, 17536.0, 29591.0, 52230.0, 95677.0, 185083.0, 375865.0, 697923.0, 940429.0, 801701.0, 469654.0, 231632.0, 117300.0, 62804.0, 35188.0, 20507.0, 12638.0, 7662.0, 4791.0, 2964.0, 1800.0, 1173.0, 777.0, 508.0, 308.0, 203.0, 125.0, 93.0, 58.0, 29.0, 23.0, 13.0, 10.0, 6.0, 8.0, 1.0, 0.0, 3.0], "bins": [-16.5625, -16.084716796875, -15.60693359375, -15.129150390625, -14.6513671875, -14.173583984375, -13.69580078125, -13.218017578125, -12.740234375, -12.262451171875, -11.78466796875, -11.306884765625, -10.8291015625, -10.351318359375, -9.87353515625, -9.395751953125, -8.91796875, -8.440185546875, -7.96240234375, -7.484619140625, -7.0068359375, -6.529052734375, -6.05126953125, -5.573486328125, -5.095703125, -4.617919921875, -4.14013671875, -3.662353515625, -3.1845703125, -2.706787109375, -2.22900390625, -1.751220703125, -1.2734375, -0.795654296875, -0.31787109375, 0.159912109375, 0.6376953125, 1.115478515625, 1.59326171875, 2.071044921875, 2.548828125, 3.026611328125, 3.50439453125, 3.982177734375, 4.4599609375, 4.937744140625, 5.41552734375, 5.893310546875, 6.37109375, 6.848876953125, 7.32666015625, 7.804443359375, 8.2822265625, 8.760009765625, 9.23779296875, 9.715576171875, 10.193359375, 10.671142578125, 11.14892578125, 11.626708984375, 12.1044921875, 12.582275390625, 13.06005859375, 13.537841796875, 14.015625]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 7.0, 7.0, 12.0, 11.0, 10.0, 11.0, 12.0, 17.0, 18.0, 32.0, 22.0, 23.0, 25.0, 22.0, 29.0, 38.0, 26.0, 41.0, 40.0, 50.0, 35.0, 39.0, 39.0, 44.0, 38.0, 35.0, 43.0, 30.0, 28.0, 31.0, 21.0, 34.0, 26.0, 14.0, 20.0, 11.0, 10.0, 9.0, 9.0, 7.0, 6.0, 5.0, 3.0, 4.0, 1.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.015625, -11.651123046875, -11.28662109375, -10.922119140625, -10.5576171875, -10.193115234375, -9.82861328125, -9.464111328125, -9.099609375, -8.735107421875, -8.37060546875, -8.006103515625, -7.6416015625, -7.277099609375, -6.91259765625, -6.548095703125, -6.18359375, -5.819091796875, -5.45458984375, -5.090087890625, -4.7255859375, -4.361083984375, -3.99658203125, -3.632080078125, -3.267578125, -2.903076171875, -2.53857421875, -2.174072265625, -1.8095703125, -1.445068359375, -1.08056640625, -0.716064453125, -0.3515625, 0.012939453125, 0.37744140625, 0.741943359375, 1.1064453125, 1.470947265625, 1.83544921875, 2.199951171875, 2.564453125, 2.928955078125, 3.29345703125, 3.657958984375, 4.0224609375, 4.386962890625, 4.75146484375, 5.115966796875, 5.48046875, 5.844970703125, 6.20947265625, 6.573974609375, 6.9384765625, 7.302978515625, 7.66748046875, 8.031982421875, 8.396484375, 8.760986328125, 9.12548828125, 9.489990234375, 9.8544921875, 10.218994140625, 10.58349609375, 10.947998046875, 11.3125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 14.0, 18.0, 25.0, 33.0, 62.0, 110.0, 158.0, 211.0, 351.0, 505.0, 831.0, 1294.0, 2048.0, 3141.0, 4922.0, 8049.0, 12843.0, 21172.0, 35686.0, 60859.0, 103867.0, 179548.0, 311525.0, 527289.0, 787556.0, 801985.0, 548323.0, 326000.0, 188539.0, 108952.0, 63584.0, 37184.0, 22432.0, 13162.0, 8182.0, 5080.0, 3242.0, 2012.0, 1257.0, 820.0, 518.0, 330.0, 228.0, 122.0, 70.0, 54.0, 36.0, 18.0, 12.0, 10.0, 6.0, 5.0, 6.0, 2.0], "bins": [-15.984375, -15.5281982421875, -15.072021484375, -14.6158447265625, -14.15966796875, -13.7034912109375, -13.247314453125, -12.7911376953125, -12.3349609375, -11.8787841796875, -11.422607421875, -10.9664306640625, -10.51025390625, -10.0540771484375, -9.597900390625, -9.1417236328125, -8.685546875, -8.2293701171875, -7.773193359375, -7.3170166015625, -6.86083984375, -6.4046630859375, -5.948486328125, -5.4923095703125, -5.0361328125, -4.5799560546875, -4.123779296875, -3.6676025390625, -3.21142578125, -2.7552490234375, -2.299072265625, -1.8428955078125, -1.38671875, -0.9305419921875, -0.474365234375, -0.0181884765625, 0.43798828125, 0.8941650390625, 1.350341796875, 1.8065185546875, 2.2626953125, 2.7188720703125, 3.175048828125, 3.6312255859375, 4.08740234375, 4.5435791015625, 4.999755859375, 5.4559326171875, 5.912109375, 6.3682861328125, 6.824462890625, 7.2806396484375, 7.73681640625, 8.1929931640625, 8.649169921875, 9.1053466796875, 9.5615234375, 10.0177001953125, 10.473876953125, 10.9300537109375, 11.38623046875, 11.8424072265625, 12.298583984375, 12.7547607421875, 13.2109375]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 9.0, 5.0, 13.0, 16.0, 16.0, 29.0, 33.0, 39.0, 51.0, 65.0, 96.0, 113.0, 118.0, 152.0, 189.0, 217.0, 217.0, 226.0, 276.0, 251.0, 289.0, 236.0, 225.0, 205.0, 167.0, 132.0, 134.0, 102.0, 85.0, 88.0, 53.0, 40.0, 28.0, 34.0, 25.0, 19.0, 21.0, 13.0, 12.0, 12.0, 7.0, 4.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.8671875, -5.6893310546875, -5.511474609375, -5.3336181640625, -5.15576171875, -4.9779052734375, -4.800048828125, -4.6221923828125, -4.4443359375, -4.2664794921875, -4.088623046875, -3.9107666015625, -3.73291015625, -3.5550537109375, -3.377197265625, -3.1993408203125, -3.021484375, -2.8436279296875, -2.665771484375, -2.4879150390625, -2.31005859375, -2.1322021484375, -1.954345703125, -1.7764892578125, -1.5986328125, -1.4207763671875, -1.242919921875, -1.0650634765625, -0.88720703125, -0.7093505859375, -0.531494140625, -0.3536376953125, -0.17578125, 0.0020751953125, 0.179931640625, 0.3577880859375, 0.53564453125, 0.7135009765625, 0.891357421875, 1.0692138671875, 1.2470703125, 1.4249267578125, 1.602783203125, 1.7806396484375, 1.95849609375, 2.1363525390625, 2.314208984375, 2.4920654296875, 2.669921875, 2.8477783203125, 3.025634765625, 3.2034912109375, 3.38134765625, 3.5592041015625, 3.737060546875, 3.9149169921875, 4.0927734375, 4.2706298828125, 4.448486328125, 4.6263427734375, 4.80419921875, 4.9820556640625, 5.159912109375, 5.3377685546875, 5.515625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 2.0, 8.0, 8.0, 17.0, 14.0, 21.0, 23.0, 20.0, 29.0, 42.0, 27.0, 38.0, 53.0, 50.0, 50.0, 53.0, 52.0, 57.0, 53.0, 52.0, 46.0, 47.0, 42.0, 37.0, 26.0, 26.0, 21.0, 16.0, 12.0, 19.0, 10.0, 10.0, 6.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.505298614501953, -13.981097221374512, -13.45689582824707, -12.932694435119629, -12.408493041992188, -11.88429069519043, -11.360089302062988, -10.835887908935547, -10.311686515808105, -9.787485122680664, -9.263283729553223, -8.739082336425781, -8.214879989624023, -7.69067907333374, -7.166477203369141, -6.642275810241699, -6.118074417114258, -5.593873023986816, -5.069671630859375, -4.545469760894775, -4.021268367767334, -3.4970669746398926, -2.972865343093872, -2.4486637115478516, -1.9244623184204102, -1.4002608060836792, -0.8760592937469482, -0.3518577814102173, 0.17234373092651367, 0.6965451240539551, 1.2207467555999756, 1.744948387145996, 2.2691497802734375, 2.793351173400879, 3.3175528049468994, 3.84175443649292, 4.365955829620361, 4.890157222747803, 5.414359092712402, 5.938560485839844, 6.462761878967285, 6.986963272094727, 7.511164665222168, 8.03536605834961, 8.559568405151367, 9.083768844604492, 9.60797119140625, 10.132172584533691, 10.656373977661133, 11.180575370788574, 11.704776763916016, 12.228978157043457, 12.753179550170898, 13.277381896972656, 13.801583290100098, 14.325784683227539, 14.84998607635498, 15.374187469482422, 15.898388862609863, 16.422590255737305, 16.946792602539062, 17.470993041992188, 17.995195388793945, 18.519397735595703, 19.043598175048828]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 7.0, 11.0, 10.0, 9.0, 8.0, 10.0, 14.0, 14.0, 16.0, 12.0, 21.0, 38.0, 21.0, 32.0, 33.0, 30.0, 37.0, 42.0, 43.0, 41.0, 45.0, 42.0, 36.0, 46.0, 47.0, 27.0, 42.0, 44.0, 30.0, 28.0, 25.0, 19.0, 19.0, 21.0, 14.0, 15.0, 10.0, 13.0, 8.0, 6.0, 8.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-15.387277603149414, -14.947333335876465, -14.507389068603516, -14.067444801330566, -13.627500534057617, -13.187556266784668, -12.747611999511719, -12.30766773223877, -11.86772346496582, -11.427779197692871, -10.987834930419922, -10.547890663146973, -10.107946395874023, -9.668002128601074, -9.228057861328125, -8.788113594055176, -8.348169326782227, -7.908225059509277, -7.468280792236328, -7.028336524963379, -6.58839225769043, -6.1484479904174805, -5.708503723144531, -5.268559455871582, -4.828614234924316, -4.388669967651367, -3.948725700378418, -3.5087814331054688, -3.0688371658325195, -2.628892660140991, -2.188948392868042, -1.7490041255950928, -1.3090600967407227, -0.8691158294677734, -0.42917150259017944, 0.01077282428741455, 0.45071709156036377, 0.8906614780426025, 1.3306057453155518, 1.770550012588501, 2.21049427986145, 2.6504385471343994, 3.0903828144073486, 3.530327320098877, 3.970271587371826, 4.410215854644775, 4.850160121917725, 5.290104389190674, 5.730048656463623, 6.169992923736572, 6.6099371910095215, 7.049881458282471, 7.48982572555542, 7.929770469665527, 8.369714736938477, 8.809659004211426, 9.249603271484375, 9.689547538757324, 10.129491806030273, 10.569436073303223, 11.009380340576172, 11.449324607849121, 11.88926887512207, 12.32921314239502, 12.769157409667969]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 7.0, 10.0, 13.0, 27.0, 27.0, 34.0, 59.0, 93.0, 116.0, 147.0, 186.0, 262.0, 399.0, 612.0, 923.0, 1307.0, 1826.0, 2898.0, 4759.0, 7747.0, 13245.0, 23766.0, 46432.0, 95602.0, 198380.0, 276168.0, 185866.0, 88857.0, 43253.0, 22529.0, 12530.0, 7337.0, 4540.0, 2825.0, 1807.0, 1236.0, 824.0, 553.0, 408.0, 288.0, 197.0, 128.0, 93.0, 65.0, 58.0, 30.0, 26.0, 17.0, 14.0, 8.0, 10.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-33.09375, -32.04150390625, -30.9892578125, -29.93701171875, -28.884765625, -27.83251953125, -26.7802734375, -25.72802734375, -24.67578125, -23.62353515625, -22.5712890625, -21.51904296875, -20.466796875, -19.41455078125, -18.3623046875, -17.31005859375, -16.2578125, -15.20556640625, -14.1533203125, -13.10107421875, -12.048828125, -10.99658203125, -9.9443359375, -8.89208984375, -7.83984375, -6.78759765625, -5.7353515625, -4.68310546875, -3.630859375, -2.57861328125, -1.5263671875, -0.47412109375, 0.578125, 1.63037109375, 2.6826171875, 3.73486328125, 4.787109375, 5.83935546875, 6.8916015625, 7.94384765625, 8.99609375, 10.04833984375, 11.1005859375, 12.15283203125, 13.205078125, 14.25732421875, 15.3095703125, 16.36181640625, 17.4140625, 18.46630859375, 19.5185546875, 20.57080078125, 21.623046875, 22.67529296875, 23.7275390625, 24.77978515625, 25.83203125, 26.88427734375, 27.9365234375, 28.98876953125, 30.041015625, 31.09326171875, 32.1455078125, 33.19775390625, 34.25]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 6.0, 12.0, 6.0, 17.0, 7.0, 8.0, 14.0, 14.0, 13.0, 22.0, 21.0, 27.0, 32.0, 35.0, 38.0, 43.0, 36.0, 54.0, 39.0, 39.0, 38.0, 46.0, 40.0, 46.0, 43.0, 41.0, 39.0, 36.0, 27.0, 25.0, 22.0, 23.0, 14.0, 17.0, 16.0, 11.0, 11.0, 10.0, 6.0, 2.0, 7.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.203125, -14.77294921875, -14.3427734375, -13.91259765625, -13.482421875, -13.05224609375, -12.6220703125, -12.19189453125, -11.76171875, -11.33154296875, -10.9013671875, -10.47119140625, -10.041015625, -9.61083984375, -9.1806640625, -8.75048828125, -8.3203125, -7.89013671875, -7.4599609375, -7.02978515625, -6.599609375, -6.16943359375, -5.7392578125, -5.30908203125, -4.87890625, -4.44873046875, -4.0185546875, -3.58837890625, -3.158203125, -2.72802734375, -2.2978515625, -1.86767578125, -1.4375, -1.00732421875, -0.5771484375, -0.14697265625, 0.283203125, 0.71337890625, 1.1435546875, 1.57373046875, 2.00390625, 2.43408203125, 2.8642578125, 3.29443359375, 3.724609375, 4.15478515625, 4.5849609375, 5.01513671875, 5.4453125, 5.87548828125, 6.3056640625, 6.73583984375, 7.166015625, 7.59619140625, 8.0263671875, 8.45654296875, 8.88671875, 9.31689453125, 9.7470703125, 10.17724609375, 10.607421875, 11.03759765625, 11.4677734375, 11.89794921875, 12.328125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 7.0, 5.0, 9.0, 12.0, 9.0, 27.0, 35.0, 42.0, 84.0, 89.0, 132.0, 211.0, 263.0, 389.0, 588.0, 859.0, 1283.0, 1930.0, 2967.0, 4638.0, 7539.0, 11937.0, 20456.0, 36812.0, 71375.0, 146917.0, 266219.0, 228071.0, 114650.0, 56152.0, 29907.0, 16871.0, 10020.0, 6206.0, 3929.0, 2624.0, 1740.0, 1072.0, 771.0, 519.0, 373.0, 237.0, 172.0, 125.0, 78.0, 52.0, 50.0, 35.0, 26.0, 14.0, 11.0, 11.0, 8.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.359375, -26.442138671875, -25.52490234375, -24.607666015625, -23.6904296875, -22.773193359375, -21.85595703125, -20.938720703125, -20.021484375, -19.104248046875, -18.18701171875, -17.269775390625, -16.3525390625, -15.435302734375, -14.51806640625, -13.600830078125, -12.68359375, -11.766357421875, -10.84912109375, -9.931884765625, -9.0146484375, -8.097412109375, -7.18017578125, -6.262939453125, -5.345703125, -4.428466796875, -3.51123046875, -2.593994140625, -1.6767578125, -0.759521484375, 0.15771484375, 1.074951171875, 1.9921875, 2.909423828125, 3.82666015625, 4.743896484375, 5.6611328125, 6.578369140625, 7.49560546875, 8.412841796875, 9.330078125, 10.247314453125, 11.16455078125, 12.081787109375, 12.9990234375, 13.916259765625, 14.83349609375, 15.750732421875, 16.66796875, 17.585205078125, 18.50244140625, 19.419677734375, 20.3369140625, 21.254150390625, 22.17138671875, 23.088623046875, 24.005859375, 24.923095703125, 25.84033203125, 26.757568359375, 27.6748046875, 28.592041015625, 29.50927734375, 30.426513671875, 31.34375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 7.0, 3.0, 5.0, 8.0, 9.0, 12.0, 13.0, 19.0, 15.0, 11.0, 19.0, 21.0, 21.0, 22.0, 28.0, 28.0, 37.0, 36.0, 47.0, 47.0, 42.0, 44.0, 45.0, 47.0, 30.0, 50.0, 35.0, 35.0, 30.0, 35.0, 34.0, 22.0, 21.0, 22.0, 15.0, 22.0, 11.0, 11.0, 11.0, 4.0, 9.0, 7.0, 5.0, 2.0, 1.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-9.453125, -9.178466796875, -8.90380859375, -8.629150390625, -8.3544921875, -8.079833984375, -7.80517578125, -7.530517578125, -7.255859375, -6.981201171875, -6.70654296875, -6.431884765625, -6.1572265625, -5.882568359375, -5.60791015625, -5.333251953125, -5.05859375, -4.783935546875, -4.50927734375, -4.234619140625, -3.9599609375, -3.685302734375, -3.41064453125, -3.135986328125, -2.861328125, -2.586669921875, -2.31201171875, -2.037353515625, -1.7626953125, -1.488037109375, -1.21337890625, -0.938720703125, -0.6640625, -0.389404296875, -0.11474609375, 0.159912109375, 0.4345703125, 0.709228515625, 0.98388671875, 1.258544921875, 1.533203125, 1.807861328125, 2.08251953125, 2.357177734375, 2.6318359375, 2.906494140625, 3.18115234375, 3.455810546875, 3.73046875, 4.005126953125, 4.27978515625, 4.554443359375, 4.8291015625, 5.103759765625, 5.37841796875, 5.653076171875, 5.927734375, 6.202392578125, 6.47705078125, 6.751708984375, 7.0263671875, 7.301025390625, 7.57568359375, 7.850341796875, 8.125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 15.0, 10.0, 13.0, 22.0, 35.0, 30.0, 66.0, 75.0, 92.0, 175.0, 229.0, 402.0, 639.0, 965.0, 1491.0, 2669.0, 4641.0, 8698.0, 17820.0, 39572.0, 95947.0, 240864.0, 342642.0, 168155.0, 65911.0, 27937.0, 13161.0, 6754.0, 3739.0, 2122.0, 1328.0, 800.0, 497.0, 328.0, 195.0, 155.0, 95.0, 81.0, 54.0, 44.0, 23.0, 13.0, 13.0, 13.0, 7.0, 5.0, 5.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.828125, -15.3056640625, -14.783203125, -14.2607421875, -13.73828125, -13.2158203125, -12.693359375, -12.1708984375, -11.6484375, -11.1259765625, -10.603515625, -10.0810546875, -9.55859375, -9.0361328125, -8.513671875, -7.9912109375, -7.46875, -6.9462890625, -6.423828125, -5.9013671875, -5.37890625, -4.8564453125, -4.333984375, -3.8115234375, -3.2890625, -2.7666015625, -2.244140625, -1.7216796875, -1.19921875, -0.6767578125, -0.154296875, 0.3681640625, 0.890625, 1.4130859375, 1.935546875, 2.4580078125, 2.98046875, 3.5029296875, 4.025390625, 4.5478515625, 5.0703125, 5.5927734375, 6.115234375, 6.6376953125, 7.16015625, 7.6826171875, 8.205078125, 8.7275390625, 9.25, 9.7724609375, 10.294921875, 10.8173828125, 11.33984375, 11.8623046875, 12.384765625, 12.9072265625, 13.4296875, 13.9521484375, 14.474609375, 14.9970703125, 15.51953125, 16.0419921875, 16.564453125, 17.0869140625, 17.609375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 3.0, 1.0, 9.0, 15.0, 18.0, 21.0, 41.0, 48.0, 94.0, 139.0, 159.0, 133.0, 102.0, 81.0, 36.0, 19.0, 19.0, 14.0, 14.0, 11.0, 4.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017681121826171875, -0.0017173439264297485, -0.0016665756702423096, -0.0016158074140548706, -0.0015650391578674316, -0.0015142709016799927, -0.0014635026454925537, -0.0014127343893051147, -0.0013619661331176758, -0.0013111978769302368, -0.0012604296207427979, -0.0012096613645553589, -0.00115889310836792, -0.001108124852180481, -0.001057356595993042, -0.001006588339805603, -0.0009558200836181641, -0.0009050518274307251, -0.0008542835712432861, -0.0008035153150558472, -0.0007527470588684082, -0.0007019788026809692, -0.0006512105464935303, -0.0006004422903060913, -0.0005496740341186523, -0.0004989057779312134, -0.0004481375217437744, -0.00039736926555633545, -0.0003466010093688965, -0.0002958327531814575, -0.00024506449699401855, -0.0001942962408065796, -0.00014352798461914062, -9.275972843170166e-05, -4.1991472244262695e-05, 8.77678394317627e-06, 5.9545040130615234e-05, 0.0001103132963180542, 0.00016108155250549316, 0.00021184980869293213, 0.0002626180648803711, 0.00031338632106781006, 0.000364154577255249, 0.000414922833442688, 0.00046569108963012695, 0.0005164593458175659, 0.0005672276020050049, 0.0006179958581924438, 0.0006687641143798828, 0.0007195323705673218, 0.0007703006267547607, 0.0008210688829421997, 0.0008718371391296387, 0.0009226053953170776, 0.0009733736515045166, 0.0010241419076919556, 0.0010749101638793945, 0.0011256784200668335, 0.0011764466762542725, 0.0012272149324417114, 0.0012779831886291504, 0.0013287514448165894, 0.0013795197010040283, 0.0014302879571914673, 0.0014810562133789062]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 5.0, 6.0, 8.0, 16.0, 21.0, 24.0, 35.0, 42.0, 65.0, 90.0, 111.0, 199.0, 268.0, 386.0, 546.0, 809.0, 1258.0, 1930.0, 3094.0, 5016.0, 8425.0, 14298.0, 25466.0, 46627.0, 87067.0, 152642.0, 216686.0, 198496.0, 126866.0, 69326.0, 37567.0, 20630.0, 11877.0, 6947.0, 4130.0, 2626.0, 1626.0, 1033.0, 721.0, 458.0, 317.0, 226.0, 180.0, 112.0, 73.0, 53.0, 43.0, 33.0, 27.0, 19.0, 14.0, 8.0, 7.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0], "bins": [-10.9140625, -10.5599365234375, -10.205810546875, -9.8516845703125, -9.49755859375, -9.1434326171875, -8.789306640625, -8.4351806640625, -8.0810546875, -7.7269287109375, -7.372802734375, -7.0186767578125, -6.66455078125, -6.3104248046875, -5.956298828125, -5.6021728515625, -5.248046875, -4.8939208984375, -4.539794921875, -4.1856689453125, -3.83154296875, -3.4774169921875, -3.123291015625, -2.7691650390625, -2.4150390625, -2.0609130859375, -1.706787109375, -1.3526611328125, -0.99853515625, -0.6444091796875, -0.290283203125, 0.0638427734375, 0.41796875, 0.7720947265625, 1.126220703125, 1.4803466796875, 1.83447265625, 2.1885986328125, 2.542724609375, 2.8968505859375, 3.2509765625, 3.6051025390625, 3.959228515625, 4.3133544921875, 4.66748046875, 5.0216064453125, 5.375732421875, 5.7298583984375, 6.083984375, 6.4381103515625, 6.792236328125, 7.1463623046875, 7.50048828125, 7.8546142578125, 8.208740234375, 8.5628662109375, 8.9169921875, 9.2711181640625, 9.625244140625, 9.9793701171875, 10.33349609375, 10.6876220703125, 11.041748046875, 11.3958740234375, 11.75]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 9.0, 10.0, 9.0, 12.0, 20.0, 25.0, 20.0, 32.0, 30.0, 43.0, 63.0, 60.0, 67.0, 79.0, 77.0, 65.0, 72.0, 53.0, 56.0, 49.0, 35.0, 22.0, 22.0, 17.0, 19.0, 11.0, 8.0, 4.0, 3.0, 1.0, 1.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.68359375, -4.53759765625, -4.3916015625, -4.24560546875, -4.099609375, -3.95361328125, -3.8076171875, -3.66162109375, -3.515625, -3.36962890625, -3.2236328125, -3.07763671875, -2.931640625, -2.78564453125, -2.6396484375, -2.49365234375, -2.34765625, -2.20166015625, -2.0556640625, -1.90966796875, -1.763671875, -1.61767578125, -1.4716796875, -1.32568359375, -1.1796875, -1.03369140625, -0.8876953125, -0.74169921875, -0.595703125, -0.44970703125, -0.3037109375, -0.15771484375, -0.01171875, 0.13427734375, 0.2802734375, 0.42626953125, 0.572265625, 0.71826171875, 0.8642578125, 1.01025390625, 1.15625, 1.30224609375, 1.4482421875, 1.59423828125, 1.740234375, 1.88623046875, 2.0322265625, 2.17822265625, 2.32421875, 2.47021484375, 2.6162109375, 2.76220703125, 2.908203125, 3.05419921875, 3.2001953125, 3.34619140625, 3.4921875, 3.63818359375, 3.7841796875, 3.93017578125, 4.076171875, 4.22216796875, 4.3681640625, 4.51416015625, 4.66015625]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 9.0, 5.0, 9.0, 12.0, 18.0, 19.0, 19.0, 32.0, 36.0, 28.0, 35.0, 42.0, 47.0, 57.0, 58.0, 32.0, 42.0, 52.0, 57.0, 33.0, 39.0, 47.0, 37.0, 34.0, 30.0, 27.0, 23.0, 22.0, 19.0, 11.0, 10.0, 14.0, 14.0, 2.0, 5.0, 4.0, 3.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.578789710998535, -12.14874267578125, -11.718695640563965, -11.28864860534668, -10.858601570129395, -10.42855453491211, -9.998507499694824, -9.568460464477539, -9.138413429260254, -8.708366394042969, -8.278319358825684, -7.848272323608398, -7.418225288391113, -6.988178253173828, -6.558131217956543, -6.128084182739258, -5.698037147521973, -5.2679901123046875, -4.837943077087402, -4.407896041870117, -3.977849006652832, -3.547801971435547, -3.1177549362182617, -2.6877079010009766, -2.2576608657836914, -1.8276138305664062, -1.397566795349121, -0.9675197601318359, -0.5374727249145508, -0.10742568969726562, 0.32262134552001953, 0.7526683807373047, 1.1827163696289062, 1.6127634048461914, 2.0428104400634766, 2.4728574752807617, 2.902904510498047, 3.332951545715332, 3.762998580932617, 4.193045616149902, 4.6230926513671875, 5.053139686584473, 5.483186721801758, 5.913233757019043, 6.343280792236328, 6.773327827453613, 7.203374862670898, 7.633421897888184, 8.063468933105469, 8.493515968322754, 8.923563003540039, 9.353610038757324, 9.78365707397461, 10.213704109191895, 10.64375114440918, 11.073798179626465, 11.50384521484375, 11.933892250061035, 12.36393928527832, 12.793986320495605, 13.22403335571289, 13.654080390930176, 14.084127426147461, 14.514174461364746, 14.944221496582031]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 11.0, 6.0, 6.0, 12.0, 15.0, 8.0, 11.0, 14.0, 24.0, 19.0, 32.0, 29.0, 34.0, 25.0, 30.0, 44.0, 37.0, 43.0, 43.0, 46.0, 46.0, 31.0, 33.0, 40.0, 43.0, 33.0, 44.0, 30.0, 39.0, 32.0, 18.0, 20.0, 17.0, 19.0, 12.0, 10.0, 13.0, 10.0, 5.0, 1.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-14.63601016998291, -14.240499496459961, -13.844987869262695, -13.449477195739746, -13.053966522216797, -12.658454895019531, -12.262944221496582, -11.867433547973633, -11.471921920776367, -11.076411247253418, -10.680899620056152, -10.285388946533203, -9.889877319335938, -9.494366645812988, -9.098855972290039, -8.703344345092773, -8.307833671569824, -7.912322521209717, -7.516811370849609, -7.12130069732666, -6.725789546966553, -6.330278396606445, -5.934767723083496, -5.539256572723389, -5.143745422363281, -4.748234272003174, -4.352723121643066, -3.957212448120117, -3.5617012977600098, -3.1661901473999023, -2.770679235458374, -2.3751683235168457, -1.9796571731567383, -1.5841461420059204, -1.1886351108551025, -0.7931240797042847, -0.3976130485534668, -0.0021020174026489258, 0.39340901374816895, 0.7889199256896973, 1.1844310760498047, 1.5799421072006226, 1.9754531383514404, 2.3709640502929688, 2.766475200653076, 3.1619863510131836, 3.557497262954712, 3.9530081748962402, 4.348519325256348, 4.744030475616455, 5.1395416259765625, 5.535052299499512, 5.930563449859619, 6.326074600219727, 6.721585273742676, 7.117096424102783, 7.512607574462891, 7.908118724822998, 8.303629875183105, 8.699140548706055, 9.09465217590332, 9.49016284942627, 9.885673522949219, 10.281185150146484, 10.676695823669434]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 4.0, 7.0, 15.0, 16.0, 31.0, 31.0, 70.0, 80.0, 144.0, 210.0, 282.0, 394.0, 624.0, 907.0, 1482.0, 2297.0, 3690.0, 6124.0, 10139.0, 16718.0, 28431.0, 47503.0, 77761.0, 117695.0, 155682.0, 167804.0, 143378.0, 102504.0, 65265.0, 39603.0, 23519.0, 13893.0, 8438.0, 5120.0, 3115.0, 1946.0, 1234.0, 772.0, 541.0, 363.0, 220.0, 147.0, 105.0, 76.0, 54.0, 38.0, 25.0, 25.0, 13.0, 10.0, 3.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.078125, -11.651611328125, -11.22509765625, -10.798583984375, -10.3720703125, -9.945556640625, -9.51904296875, -9.092529296875, -8.666015625, -8.239501953125, -7.81298828125, -7.386474609375, -6.9599609375, -6.533447265625, -6.10693359375, -5.680419921875, -5.25390625, -4.827392578125, -4.40087890625, -3.974365234375, -3.5478515625, -3.121337890625, -2.69482421875, -2.268310546875, -1.841796875, -1.415283203125, -0.98876953125, -0.562255859375, -0.1357421875, 0.290771484375, 0.71728515625, 1.143798828125, 1.5703125, 1.996826171875, 2.42333984375, 2.849853515625, 3.2763671875, 3.702880859375, 4.12939453125, 4.555908203125, 4.982421875, 5.408935546875, 5.83544921875, 6.261962890625, 6.6884765625, 7.114990234375, 7.54150390625, 7.968017578125, 8.39453125, 8.821044921875, 9.24755859375, 9.674072265625, 10.1005859375, 10.527099609375, 10.95361328125, 11.380126953125, 11.806640625, 12.233154296875, 12.65966796875, 13.086181640625, 13.5126953125, 13.939208984375, 14.36572265625, 14.792236328125, 15.21875]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 9.0, 2.0, 4.0, 6.0, 7.0, 10.0, 8.0, 13.0, 17.0, 15.0, 28.0, 24.0, 26.0, 23.0, 36.0, 45.0, 29.0, 43.0, 29.0, 43.0, 33.0, 35.0, 42.0, 42.0, 42.0, 46.0, 29.0, 39.0, 31.0, 39.0, 31.0, 24.0, 26.0, 25.0, 16.0, 19.0, 15.0, 17.0, 12.0, 8.0, 4.0, 6.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.140625, -12.7667236328125, -12.392822265625, -12.0189208984375, -11.64501953125, -11.2711181640625, -10.897216796875, -10.5233154296875, -10.1494140625, -9.7755126953125, -9.401611328125, -9.0277099609375, -8.65380859375, -8.2799072265625, -7.906005859375, -7.5321044921875, -7.158203125, -6.7843017578125, -6.410400390625, -6.0364990234375, -5.66259765625, -5.2886962890625, -4.914794921875, -4.5408935546875, -4.1669921875, -3.7930908203125, -3.419189453125, -3.0452880859375, -2.67138671875, -2.2974853515625, -1.923583984375, -1.5496826171875, -1.17578125, -0.8018798828125, -0.427978515625, -0.0540771484375, 0.31982421875, 0.6937255859375, 1.067626953125, 1.4415283203125, 1.8154296875, 2.1893310546875, 2.563232421875, 2.9371337890625, 3.31103515625, 3.6849365234375, 4.058837890625, 4.4327392578125, 4.806640625, 5.1805419921875, 5.554443359375, 5.9283447265625, 6.30224609375, 6.6761474609375, 7.050048828125, 7.4239501953125, 7.7978515625, 8.1717529296875, 8.545654296875, 8.9195556640625, 9.29345703125, 9.6673583984375, 10.041259765625, 10.4151611328125, 10.7890625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 7.0, 13.0, 17.0, 20.0, 48.0, 58.0, 68.0, 113.0, 180.0, 271.0, 413.0, 627.0, 961.0, 1566.0, 2298.0, 3713.0, 6050.0, 9960.0, 16559.0, 27015.0, 44098.0, 70615.0, 106525.0, 143676.0, 163237.0, 146870.0, 110821.0, 73704.0, 46668.0, 28161.0, 17125.0, 10179.0, 6204.0, 3937.0, 2462.0, 1533.0, 962.0, 613.0, 432.0, 261.0, 184.0, 109.0, 75.0, 44.0, 41.0, 24.0, 13.0, 11.0, 8.0, 8.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.8828125, -11.506103515625, -11.12939453125, -10.752685546875, -10.3759765625, -9.999267578125, -9.62255859375, -9.245849609375, -8.869140625, -8.492431640625, -8.11572265625, -7.739013671875, -7.3623046875, -6.985595703125, -6.60888671875, -6.232177734375, -5.85546875, -5.478759765625, -5.10205078125, -4.725341796875, -4.3486328125, -3.971923828125, -3.59521484375, -3.218505859375, -2.841796875, -2.465087890625, -2.08837890625, -1.711669921875, -1.3349609375, -0.958251953125, -0.58154296875, -0.204833984375, 0.171875, 0.548583984375, 0.92529296875, 1.302001953125, 1.6787109375, 2.055419921875, 2.43212890625, 2.808837890625, 3.185546875, 3.562255859375, 3.93896484375, 4.315673828125, 4.6923828125, 5.069091796875, 5.44580078125, 5.822509765625, 6.19921875, 6.575927734375, 6.95263671875, 7.329345703125, 7.7060546875, 8.082763671875, 8.45947265625, 8.836181640625, 9.212890625, 9.589599609375, 9.96630859375, 10.343017578125, 10.7197265625, 11.096435546875, 11.47314453125, 11.849853515625, 12.2265625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 5.0, 5.0, 8.0, 9.0, 5.0, 9.0, 10.0, 13.0, 14.0, 17.0, 27.0, 21.0, 27.0, 37.0, 39.0, 32.0, 39.0, 49.0, 39.0, 38.0, 56.0, 38.0, 39.0, 41.0, 44.0, 46.0, 49.0, 32.0, 31.0, 27.0, 26.0, 24.0, 17.0, 20.0, 24.0, 13.0, 8.0, 6.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.6484375, -8.39251708984375, -8.1365966796875, -7.88067626953125, -7.624755859375, -7.36883544921875, -7.1129150390625, -6.85699462890625, -6.60107421875, -6.34515380859375, -6.0892333984375, -5.83331298828125, -5.577392578125, -5.32147216796875, -5.0655517578125, -4.80963134765625, -4.5537109375, -4.29779052734375, -4.0418701171875, -3.78594970703125, -3.530029296875, -3.27410888671875, -3.0181884765625, -2.76226806640625, -2.50634765625, -2.25042724609375, -1.9945068359375, -1.73858642578125, -1.482666015625, -1.22674560546875, -0.9708251953125, -0.71490478515625, -0.458984375, -0.20306396484375, 0.0528564453125, 0.30877685546875, 0.564697265625, 0.82061767578125, 1.0765380859375, 1.33245849609375, 1.58837890625, 1.84429931640625, 2.1002197265625, 2.35614013671875, 2.612060546875, 2.86798095703125, 3.1239013671875, 3.37982177734375, 3.6357421875, 3.89166259765625, 4.1475830078125, 4.40350341796875, 4.659423828125, 4.91534423828125, 5.1712646484375, 5.42718505859375, 5.68310546875, 5.93902587890625, 6.1949462890625, 6.45086669921875, 6.706787109375, 6.96270751953125, 7.2186279296875, 7.47454833984375, 7.73046875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 9.0, 2.0, 6.0, 20.0, 26.0, 33.0, 70.0, 82.0, 161.0, 224.0, 352.0, 528.0, 848.0, 1361.0, 2393.0, 3981.0, 7199.0, 13620.0, 26235.0, 54431.0, 113385.0, 209110.0, 254724.0, 177759.0, 91318.0, 43414.0, 21381.0, 11179.0, 5907.0, 3563.0, 2030.0, 1202.0, 740.0, 460.0, 282.0, 185.0, 116.0, 87.0, 45.0, 41.0, 19.0, 11.0, 11.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.53125, -10.2056884765625, -9.880126953125, -9.5545654296875, -9.22900390625, -8.9034423828125, -8.577880859375, -8.2523193359375, -7.9267578125, -7.6011962890625, -7.275634765625, -6.9500732421875, -6.62451171875, -6.2989501953125, -5.973388671875, -5.6478271484375, -5.322265625, -4.9967041015625, -4.671142578125, -4.3455810546875, -4.02001953125, -3.6944580078125, -3.368896484375, -3.0433349609375, -2.7177734375, -2.3922119140625, -2.066650390625, -1.7410888671875, -1.41552734375, -1.0899658203125, -0.764404296875, -0.4388427734375, -0.11328125, 0.2122802734375, 0.537841796875, 0.8634033203125, 1.18896484375, 1.5145263671875, 1.840087890625, 2.1656494140625, 2.4912109375, 2.8167724609375, 3.142333984375, 3.4678955078125, 3.79345703125, 4.1190185546875, 4.444580078125, 4.7701416015625, 5.095703125, 5.4212646484375, 5.746826171875, 6.0723876953125, 6.39794921875, 6.7235107421875, 7.049072265625, 7.3746337890625, 7.7001953125, 8.0257568359375, 8.351318359375, 8.6768798828125, 9.00244140625, 9.3280029296875, 9.653564453125, 9.9791259765625, 10.3046875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 8.0, 9.0, 17.0, 25.0, 46.0, 47.0, 73.0, 94.0, 133.0, 116.0, 92.0, 97.0, 65.0, 53.0, 42.0, 24.0, 26.0, 11.0, 7.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0021343231201171875, -0.0020851343870162964, -0.0020359456539154053, -0.001986756920814514, -0.001937568187713623, -0.001888379454612732, -0.0018391907215118408, -0.0017900019884109497, -0.0017408132553100586, -0.0016916245222091675, -0.0016424357891082764, -0.0015932470560073853, -0.0015440583229064941, -0.001494869589805603, -0.001445680856704712, -0.0013964921236038208, -0.0013473033905029297, -0.0012981146574020386, -0.0012489259243011475, -0.0011997371912002563, -0.0011505484580993652, -0.0011013597249984741, -0.001052170991897583, -0.001002982258796692, -0.0009537935256958008, -0.0009046047925949097, -0.0008554160594940186, -0.0008062273263931274, -0.0007570385932922363, -0.0007078498601913452, -0.0006586611270904541, -0.000609472393989563, -0.0005602836608886719, -0.0005110949277877808, -0.00046190619468688965, -0.00041271746158599854, -0.0003635287284851074, -0.0003143399953842163, -0.0002651512622833252, -0.00021596252918243408, -0.00016677379608154297, -0.00011758506298065186, -6.839632987976074e-05, -1.920759677886963e-05, 2.9981136322021484e-05, 7.91698694229126e-05, 0.0001283586025238037, 0.00017754733562469482, 0.00022673606872558594, 0.00027592480182647705, 0.00032511353492736816, 0.0003743022680282593, 0.0004234910011291504, 0.0004726797342300415, 0.0005218684673309326, 0.0005710572004318237, 0.0006202459335327148, 0.000669434666633606, 0.0007186233997344971, 0.0007678121328353882, 0.0008170008659362793, 0.0008661895990371704, 0.0009153783321380615, 0.0009645670652389526, 0.0010137557983398438]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 10.0, 14.0, 19.0, 17.0, 37.0, 50.0, 85.0, 128.0, 192.0, 300.0, 442.0, 725.0, 1097.0, 1782.0, 2842.0, 4494.0, 7609.0, 12551.0, 21610.0, 38563.0, 68470.0, 119530.0, 179449.0, 199626.0, 157692.0, 99249.0, 55819.0, 31591.0, 17762.0, 10454.0, 6131.0, 3799.0, 2372.0, 1442.0, 922.0, 601.0, 367.0, 264.0, 159.0, 108.0, 62.0, 39.0, 33.0, 17.0, 9.0, 10.0, 3.0, 6.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-8.328125, -8.08544921875, -7.8427734375, -7.60009765625, -7.357421875, -7.11474609375, -6.8720703125, -6.62939453125, -6.38671875, -6.14404296875, -5.9013671875, -5.65869140625, -5.416015625, -5.17333984375, -4.9306640625, -4.68798828125, -4.4453125, -4.20263671875, -3.9599609375, -3.71728515625, -3.474609375, -3.23193359375, -2.9892578125, -2.74658203125, -2.50390625, -2.26123046875, -2.0185546875, -1.77587890625, -1.533203125, -1.29052734375, -1.0478515625, -0.80517578125, -0.5625, -0.31982421875, -0.0771484375, 0.16552734375, 0.408203125, 0.65087890625, 0.8935546875, 1.13623046875, 1.37890625, 1.62158203125, 1.8642578125, 2.10693359375, 2.349609375, 2.59228515625, 2.8349609375, 3.07763671875, 3.3203125, 3.56298828125, 3.8056640625, 4.04833984375, 4.291015625, 4.53369140625, 4.7763671875, 5.01904296875, 5.26171875, 5.50439453125, 5.7470703125, 5.98974609375, 6.232421875, 6.47509765625, 6.7177734375, 6.96044921875, 7.203125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 6.0, 2.0, 3.0, 12.0, 12.0, 16.0, 24.0, 24.0, 21.0, 26.0, 34.0, 57.0, 57.0, 47.0, 58.0, 50.0, 72.0, 79.0, 57.0, 57.0, 43.0, 37.0, 29.0, 30.0, 26.0, 18.0, 17.0, 18.0, 18.0, 8.0, 5.0, 4.0, 6.0, 3.0, 5.0, 4.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.50390625, -2.424346923828125, -2.34478759765625, -2.265228271484375, -2.1856689453125, -2.106109619140625, -2.02655029296875, -1.946990966796875, -1.867431640625, -1.787872314453125, -1.70831298828125, -1.628753662109375, -1.5491943359375, -1.469635009765625, -1.39007568359375, -1.310516357421875, -1.23095703125, -1.151397705078125, -1.07183837890625, -0.992279052734375, -0.9127197265625, -0.833160400390625, -0.75360107421875, -0.674041748046875, -0.594482421875, -0.514923095703125, -0.43536376953125, -0.355804443359375, -0.2762451171875, -0.196685791015625, -0.11712646484375, -0.037567138671875, 0.0419921875, 0.121551513671875, 0.20111083984375, 0.280670166015625, 0.3602294921875, 0.439788818359375, 0.51934814453125, 0.598907470703125, 0.678466796875, 0.758026123046875, 0.83758544921875, 0.917144775390625, 0.9967041015625, 1.076263427734375, 1.15582275390625, 1.235382080078125, 1.31494140625, 1.394500732421875, 1.47406005859375, 1.553619384765625, 1.6331787109375, 1.712738037109375, 1.79229736328125, 1.871856689453125, 1.951416015625, 2.030975341796875, 2.11053466796875, 2.190093994140625, 2.2696533203125, 2.349212646484375, 2.42877197265625, 2.508331298828125, 2.587890625]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 6.0, 6.0, 9.0, 14.0, 14.0, 19.0, 17.0, 27.0, 31.0, 29.0, 45.0, 45.0, 41.0, 45.0, 47.0, 46.0, 50.0, 55.0, 37.0, 57.0, 43.0, 29.0, 41.0, 33.0, 31.0, 24.0, 19.0, 22.0, 11.0, 22.0, 13.0, 9.0, 8.0, 6.0, 15.0, 2.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.397566795349121, -10.998830795288086, -10.600095748901367, -10.201360702514648, -9.802624702453613, -9.403888702392578, -9.00515365600586, -8.60641860961914, -8.207682609558105, -7.8089470863342285, -7.410211563110352, -7.011476039886475, -6.612740516662598, -6.214004993438721, -5.815269470214844, -5.416533946990967, -5.01779842376709, -4.619062900543213, -4.220327377319336, -3.821591854095459, -3.422856330871582, -3.024120807647705, -2.625385284423828, -2.226649761199951, -1.8279142379760742, -1.4291787147521973, -1.0304431915283203, -0.6317076683044434, -0.2329721450805664, 0.16576337814331055, 0.5644989013671875, 0.9632344245910645, 1.3619709014892578, 1.7607064247131348, 2.1594419479370117, 2.5581774711608887, 2.9569129943847656, 3.3556485176086426, 3.7543840408325195, 4.1531195640563965, 4.551855087280273, 4.95059061050415, 5.349326133728027, 5.748061656951904, 6.146797180175781, 6.545532703399658, 6.944268226623535, 7.343003749847412, 7.741739273071289, 8.140474319458008, 8.539210319519043, 8.937946319580078, 9.336681365966797, 9.735416412353516, 10.13415241241455, 10.532888412475586, 10.931623458862305, 11.330358505249023, 11.729094505310059, 12.127830505371094, 12.526565551757812, 12.925300598144531, 13.324036598205566, 13.722772598266602, 14.12150764465332]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 7.0, 4.0, 5.0, 5.0, 7.0, 12.0, 15.0, 15.0, 10.0, 17.0, 25.0, 24.0, 26.0, 35.0, 37.0, 33.0, 42.0, 33.0, 43.0, 41.0, 40.0, 35.0, 43.0, 50.0, 37.0, 33.0, 36.0, 34.0, 38.0, 32.0, 35.0, 23.0, 14.0, 16.0, 18.0, 15.0, 17.0, 9.0, 11.0, 10.0, 6.0, 7.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.395416259765625, -12.01191234588623, -11.628408432006836, -11.244904518127441, -10.861400604248047, -10.477897644042969, -10.094393730163574, -9.71088981628418, -9.327385902404785, -8.94388198852539, -8.560378074645996, -8.176874160766602, -7.793370723724365, -7.409866809844971, -7.026363372802734, -6.64285945892334, -6.259355545043945, -5.875851631164551, -5.492347717285156, -5.10884428024292, -4.725340366363525, -4.341836452484131, -3.9583327770233154, -3.5748291015625, -3.1913251876831055, -2.807821273803711, -2.4243175983428955, -2.04081392288208, -1.6573100090026855, -1.2738062143325806, -0.8903024196624756, -0.5067987442016602, -0.12329387664794922, 0.26020991802215576, 0.6437137126922607, 1.0272175073623657, 1.4107213020324707, 1.7942250967025757, 2.1777288913726807, 2.561232566833496, 2.9447364807128906, 3.328240394592285, 3.7117440700531006, 4.095247745513916, 4.4787516593933105, 4.862255573272705, 5.245759010314941, 5.629262924194336, 6.0127668380737305, 6.396270751953125, 6.7797746658325195, 7.163278102874756, 7.54678201675415, 7.930285930633545, 8.313789367675781, 8.697293281555176, 9.08079719543457, 9.464301109313965, 9.84780502319336, 10.231308937072754, 10.614812850952148, 10.998315811157227, 11.381819725036621, 11.765323638916016, 12.14882755279541]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 7.0, 6.0, 11.0, 17.0, 29.0, 33.0, 41.0, 82.0, 121.0, 191.0, 276.0, 397.0, 603.0, 1008.0, 1611.0, 2398.0, 3763.0, 6099.0, 9619.0, 15834.0, 26346.0, 45316.0, 80786.0, 152619.0, 304567.0, 592754.0, 899280.0, 878975.0, 559437.0, 283765.0, 143461.0, 76367.0, 43122.0, 25189.0, 15179.0, 9206.0, 5683.0, 3611.0, 2309.0, 1471.0, 922.0, 635.0, 383.0, 245.0, 173.0, 120.0, 84.0, 45.0, 36.0, 21.0, 11.0, 9.0, 6.0, 7.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-10.84375, -10.493408203125, -10.14306640625, -9.792724609375, -9.4423828125, -9.092041015625, -8.74169921875, -8.391357421875, -8.041015625, -7.690673828125, -7.34033203125, -6.989990234375, -6.6396484375, -6.289306640625, -5.93896484375, -5.588623046875, -5.23828125, -4.887939453125, -4.53759765625, -4.187255859375, -3.8369140625, -3.486572265625, -3.13623046875, -2.785888671875, -2.435546875, -2.085205078125, -1.73486328125, -1.384521484375, -1.0341796875, -0.683837890625, -0.33349609375, 0.016845703125, 0.3671875, 0.717529296875, 1.06787109375, 1.418212890625, 1.7685546875, 2.118896484375, 2.46923828125, 2.819580078125, 3.169921875, 3.520263671875, 3.87060546875, 4.220947265625, 4.5712890625, 4.921630859375, 5.27197265625, 5.622314453125, 5.97265625, 6.322998046875, 6.67333984375, 7.023681640625, 7.3740234375, 7.724365234375, 8.07470703125, 8.425048828125, 8.775390625, 9.125732421875, 9.47607421875, 9.826416015625, 10.1767578125, 10.527099609375, 10.87744140625, 11.227783203125, 11.578125]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 7.0, 5.0, 7.0, 8.0, 8.0, 17.0, 17.0, 20.0, 18.0, 28.0, 30.0, 20.0, 25.0, 38.0, 37.0, 40.0, 33.0, 52.0, 35.0, 45.0, 55.0, 32.0, 41.0, 31.0, 27.0, 46.0, 31.0, 33.0, 26.0, 27.0, 26.0, 35.0, 19.0, 14.0, 9.0, 8.0, 11.0, 9.0, 2.0, 9.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5, -8.2330322265625, -7.966064453125, -7.6990966796875, -7.43212890625, -7.1651611328125, -6.898193359375, -6.6312255859375, -6.3642578125, -6.0972900390625, -5.830322265625, -5.5633544921875, -5.29638671875, -5.0294189453125, -4.762451171875, -4.4954833984375, -4.228515625, -3.9615478515625, -3.694580078125, -3.4276123046875, -3.16064453125, -2.8936767578125, -2.626708984375, -2.3597412109375, -2.0927734375, -1.8258056640625, -1.558837890625, -1.2918701171875, -1.02490234375, -0.7579345703125, -0.490966796875, -0.2239990234375, 0.04296875, 0.3099365234375, 0.576904296875, 0.8438720703125, 1.11083984375, 1.3778076171875, 1.644775390625, 1.9117431640625, 2.1787109375, 2.4456787109375, 2.712646484375, 2.9796142578125, 3.24658203125, 3.5135498046875, 3.780517578125, 4.0474853515625, 4.314453125, 4.5814208984375, 4.848388671875, 5.1153564453125, 5.38232421875, 5.6492919921875, 5.916259765625, 6.1832275390625, 6.4501953125, 6.7171630859375, 6.984130859375, 7.2510986328125, 7.51806640625, 7.7850341796875, 8.052001953125, 8.3189697265625, 8.5859375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 8.0, 14.0, 20.0, 18.0, 42.0, 67.0, 110.0, 153.0, 242.0, 348.0, 553.0, 799.0, 1235.0, 1933.0, 3030.0, 4760.0, 7380.0, 11968.0, 19924.0, 32950.0, 55844.0, 96219.0, 167308.0, 294294.0, 507852.0, 776066.0, 824888.0, 578420.0, 340347.0, 193891.0, 111207.0, 64525.0, 37841.0, 23028.0, 13783.0, 8461.0, 5401.0, 3304.0, 2121.0, 1442.0, 871.0, 527.0, 379.0, 251.0, 155.0, 107.0, 66.0, 47.0, 44.0, 16.0, 13.0, 5.0, 3.0, 5.0, 3.0, 1.0, 2.0], "bins": [-10.984375, -10.65283203125, -10.3212890625, -9.98974609375, -9.658203125, -9.32666015625, -8.9951171875, -8.66357421875, -8.33203125, -8.00048828125, -7.6689453125, -7.33740234375, -7.005859375, -6.67431640625, -6.3427734375, -6.01123046875, -5.6796875, -5.34814453125, -5.0166015625, -4.68505859375, -4.353515625, -4.02197265625, -3.6904296875, -3.35888671875, -3.02734375, -2.69580078125, -2.3642578125, -2.03271484375, -1.701171875, -1.36962890625, -1.0380859375, -0.70654296875, -0.375, -0.04345703125, 0.2880859375, 0.61962890625, 0.951171875, 1.28271484375, 1.6142578125, 1.94580078125, 2.27734375, 2.60888671875, 2.9404296875, 3.27197265625, 3.603515625, 3.93505859375, 4.2666015625, 4.59814453125, 4.9296875, 5.26123046875, 5.5927734375, 5.92431640625, 6.255859375, 6.58740234375, 6.9189453125, 7.25048828125, 7.58203125, 7.91357421875, 8.2451171875, 8.57666015625, 8.908203125, 9.23974609375, 9.5712890625, 9.90283203125, 10.234375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 10.0, 7.0, 11.0, 8.0, 9.0, 30.0, 20.0, 37.0, 42.0, 57.0, 61.0, 99.0, 99.0, 145.0, 175.0, 238.0, 273.0, 290.0, 305.0, 295.0, 290.0, 294.0, 233.0, 215.0, 164.0, 138.0, 131.0, 86.0, 75.0, 64.0, 49.0, 32.0, 27.0, 20.0, 11.0, 10.0, 7.0, 5.0, 4.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.62109375, -4.47296142578125, -4.3248291015625, -4.17669677734375, -4.028564453125, -3.88043212890625, -3.7322998046875, -3.58416748046875, -3.43603515625, -3.28790283203125, -3.1397705078125, -2.99163818359375, -2.843505859375, -2.69537353515625, -2.5472412109375, -2.39910888671875, -2.2509765625, -2.10284423828125, -1.9547119140625, -1.80657958984375, -1.658447265625, -1.51031494140625, -1.3621826171875, -1.21405029296875, -1.06591796875, -0.91778564453125, -0.7696533203125, -0.62152099609375, -0.473388671875, -0.32525634765625, -0.1771240234375, -0.02899169921875, 0.119140625, 0.26727294921875, 0.4154052734375, 0.56353759765625, 0.711669921875, 0.85980224609375, 1.0079345703125, 1.15606689453125, 1.30419921875, 1.45233154296875, 1.6004638671875, 1.74859619140625, 1.896728515625, 2.04486083984375, 2.1929931640625, 2.34112548828125, 2.4892578125, 2.63739013671875, 2.7855224609375, 2.93365478515625, 3.081787109375, 3.22991943359375, 3.3780517578125, 3.52618408203125, 3.67431640625, 3.82244873046875, 3.9705810546875, 4.11871337890625, 4.266845703125, 4.41497802734375, 4.5631103515625, 4.71124267578125, 4.859375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 8.0, 10.0, 9.0, 16.0, 9.0, 19.0, 27.0, 28.0, 36.0, 40.0, 38.0, 46.0, 44.0, 52.0, 52.0, 50.0, 49.0, 57.0, 48.0, 51.0, 49.0, 39.0, 29.0, 27.0, 25.0, 31.0, 18.0, 19.0, 16.0, 11.0, 10.0, 8.0, 6.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.619545936584473, -11.259020805358887, -10.8984956741333, -10.537969589233398, -10.177444458007812, -9.816919326782227, -9.45639419555664, -9.095869064331055, -8.735343933105469, -8.374818801879883, -8.014293670654297, -7.653768062591553, -7.293242454528809, -6.932717323303223, -6.572192192077637, -6.211667060852051, -5.851140975952148, -5.4906158447265625, -5.130090236663818, -4.769565105438232, -4.409039497375488, -4.048514366149902, -3.6879892349243164, -3.3274638652801514, -2.9669384956359863, -2.6064131259918213, -2.2458877563476562, -1.8853626251220703, -1.5248372554779053, -1.1643118858337402, -0.8037867546081543, -0.44326138496398926, -0.08273601531982422, 0.27778929471969604, 0.6383146047592163, 0.9988398551940918, 1.3593652248382568, 1.7198905944824219, 2.080415725708008, 2.440941095352173, 2.801466464996338, 3.161991834640503, 3.522517204284668, 3.883042335510254, 4.24356746673584, 4.604093074798584, 4.96461820602417, 5.325143814086914, 5.6856689453125, 6.046194076538086, 6.40671968460083, 6.767244815826416, 7.12777042388916, 7.488295555114746, 7.848820686340332, 8.209345817565918, 8.56987190246582, 8.930397033691406, 9.290922164916992, 9.651447296142578, 10.01197338104248, 10.372498512268066, 10.733023643493652, 11.093548774719238, 11.454073905944824]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 5.0, 5.0, 6.0, 4.0, 5.0, 18.0, 11.0, 12.0, 20.0, 20.0, 30.0, 37.0, 30.0, 34.0, 24.0, 37.0, 34.0, 32.0, 46.0, 43.0, 39.0, 46.0, 29.0, 49.0, 27.0, 45.0, 31.0, 41.0, 31.0, 24.0, 24.0, 23.0, 28.0, 18.0, 16.0, 15.0, 8.0, 11.0, 10.0, 9.0, 2.0, 11.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.037527084350586, -9.726256370544434, -9.414985656738281, -9.103713989257812, -8.79244327545166, -8.481172561645508, -8.169900894165039, -7.858630180358887, -7.547359466552734, -7.236088752746582, -6.9248175621032715, -6.613546371459961, -6.302275657653809, -5.991004943847656, -5.679733753204346, -5.368462562561035, -5.057191848754883, -4.7459211349487305, -4.43464994430542, -4.123378753662109, -3.812108039855957, -3.5008370876312256, -3.189566135406494, -2.8782951831817627, -2.5670242309570312, -2.2557532787323, -1.9444823265075684, -1.633211374282837, -1.3219404220581055, -1.010669469833374, -0.6993985176086426, -0.38812756538391113, -0.07685661315917969, 0.23441433906555176, 0.5456852912902832, 0.8569562435150146, 1.168227195739746, 1.4794981479644775, 1.790769100189209, 2.1020400524139404, 2.413311004638672, 2.7245819568634033, 3.0358529090881348, 3.347123861312866, 3.6583948135375977, 3.969665765762329, 4.2809367179870605, 4.592207908630371, 4.903478622436523, 5.214749336242676, 5.526020526885986, 5.837291717529297, 6.148562431335449, 6.459833145141602, 6.771104335784912, 7.082375526428223, 7.393646240234375, 7.704916954040527, 8.01618766784668, 8.327459335327148, 8.6387300491333, 8.950000762939453, 9.261272430419922, 9.572543144226074, 9.883813858032227]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 8.0, 8.0, 36.0, 33.0, 52.0, 77.0, 101.0, 134.0, 178.0, 293.0, 417.0, 586.0, 935.0, 1276.0, 1850.0, 2864.0, 4375.0, 6599.0, 9638.0, 14367.0, 21960.0, 33026.0, 48157.0, 70267.0, 97131.0, 122556.0, 136834.0, 128011.0, 104503.0, 77274.0, 54280.0, 37025.0, 24495.0, 16119.0, 10863.0, 7317.0, 4799.0, 3349.0, 2141.0, 1463.0, 1035.0, 660.0, 441.0, 335.0, 241.0, 132.0, 99.0, 67.0, 37.0, 40.0, 22.0, 25.0, 7.0, 12.0, 6.0, 3.0, 0.0, 4.0], "bins": [-9.71875, -9.4210205078125, -9.123291015625, -8.8255615234375, -8.52783203125, -8.2301025390625, -7.932373046875, -7.6346435546875, -7.3369140625, -7.0391845703125, -6.741455078125, -6.4437255859375, -6.14599609375, -5.8482666015625, -5.550537109375, -5.2528076171875, -4.955078125, -4.6573486328125, -4.359619140625, -4.0618896484375, -3.76416015625, -3.4664306640625, -3.168701171875, -2.8709716796875, -2.5732421875, -2.2755126953125, -1.977783203125, -1.6800537109375, -1.38232421875, -1.0845947265625, -0.786865234375, -0.4891357421875, -0.19140625, 0.1063232421875, 0.404052734375, 0.7017822265625, 0.99951171875, 1.2972412109375, 1.594970703125, 1.8927001953125, 2.1904296875, 2.4881591796875, 2.785888671875, 3.0836181640625, 3.38134765625, 3.6790771484375, 3.976806640625, 4.2745361328125, 4.572265625, 4.8699951171875, 5.167724609375, 5.4654541015625, 5.76318359375, 6.0609130859375, 6.358642578125, 6.6563720703125, 6.9541015625, 7.2518310546875, 7.549560546875, 7.8472900390625, 8.14501953125, 8.4427490234375, 8.740478515625, 9.0382080078125, 9.3359375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 7.0, 5.0, 5.0, 2.0, 5.0, 4.0, 5.0, 8.0, 6.0, 13.0, 8.0, 17.0, 17.0, 19.0, 23.0, 28.0, 23.0, 27.0, 37.0, 35.0, 42.0, 32.0, 34.0, 32.0, 39.0, 31.0, 36.0, 38.0, 37.0, 32.0, 37.0, 27.0, 35.0, 35.0, 33.0, 33.0, 25.0, 20.0, 19.0, 14.0, 12.0, 11.0, 11.0, 14.0, 10.0, 5.0, 10.0, 3.0, 3.0, 7.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.1015625, -8.8089599609375, -8.516357421875, -8.2237548828125, -7.93115234375, -7.6385498046875, -7.345947265625, -7.0533447265625, -6.7607421875, -6.4681396484375, -6.175537109375, -5.8829345703125, -5.59033203125, -5.2977294921875, -5.005126953125, -4.7125244140625, -4.419921875, -4.1273193359375, -3.834716796875, -3.5421142578125, -3.24951171875, -2.9569091796875, -2.664306640625, -2.3717041015625, -2.0791015625, -1.7864990234375, -1.493896484375, -1.2012939453125, -0.90869140625, -0.6160888671875, -0.323486328125, -0.0308837890625, 0.26171875, 0.5543212890625, 0.846923828125, 1.1395263671875, 1.43212890625, 1.7247314453125, 2.017333984375, 2.3099365234375, 2.6025390625, 2.8951416015625, 3.187744140625, 3.4803466796875, 3.77294921875, 4.0655517578125, 4.358154296875, 4.6507568359375, 4.943359375, 5.2359619140625, 5.528564453125, 5.8211669921875, 6.11376953125, 6.4063720703125, 6.698974609375, 6.9915771484375, 7.2841796875, 7.5767822265625, 7.869384765625, 8.1619873046875, 8.45458984375, 8.7471923828125, 9.039794921875, 9.3323974609375, 9.625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 8.0, 6.0, 14.0, 22.0, 27.0, 49.0, 57.0, 84.0, 126.0, 174.0, 242.0, 306.0, 514.0, 778.0, 1208.0, 1875.0, 3174.0, 5432.0, 9791.0, 18925.0, 38520.0, 81819.0, 173019.0, 284674.0, 217106.0, 107364.0, 49922.0, 24185.0, 12439.0, 6473.0, 3757.0, 2264.0, 1387.0, 922.0, 615.0, 347.0, 280.0, 208.0, 139.0, 75.0, 80.0, 35.0, 35.0, 15.0, 16.0, 13.0, 11.0, 9.0, 8.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0], "bins": [-20.421875, -19.796875, -19.171875, -18.546875, -17.921875, -17.296875, -16.671875, -16.046875, -15.421875, -14.796875, -14.171875, -13.546875, -12.921875, -12.296875, -11.671875, -11.046875, -10.421875, -9.796875, -9.171875, -8.546875, -7.921875, -7.296875, -6.671875, -6.046875, -5.421875, -4.796875, -4.171875, -3.546875, -2.921875, -2.296875, -1.671875, -1.046875, -0.421875, 0.203125, 0.828125, 1.453125, 2.078125, 2.703125, 3.328125, 3.953125, 4.578125, 5.203125, 5.828125, 6.453125, 7.078125, 7.703125, 8.328125, 8.953125, 9.578125, 10.203125, 10.828125, 11.453125, 12.078125, 12.703125, 13.328125, 13.953125, 14.578125, 15.203125, 15.828125, 16.453125, 17.078125, 17.703125, 18.328125, 18.953125, 19.578125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 9.0, 11.0, 20.0, 7.0, 12.0, 13.0, 23.0, 28.0, 26.0, 26.0, 30.0, 31.0, 38.0, 58.0, 30.0, 31.0, 45.0, 42.0, 42.0, 34.0, 48.0, 40.0, 33.0, 44.0, 40.0, 23.0, 30.0, 30.0, 24.0, 17.0, 28.0, 15.0, 16.0, 11.0, 8.0, 10.0, 9.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.1171875, -6.89892578125, -6.6806640625, -6.46240234375, -6.244140625, -6.02587890625, -5.8076171875, -5.58935546875, -5.37109375, -5.15283203125, -4.9345703125, -4.71630859375, -4.498046875, -4.27978515625, -4.0615234375, -3.84326171875, -3.625, -3.40673828125, -3.1884765625, -2.97021484375, -2.751953125, -2.53369140625, -2.3154296875, -2.09716796875, -1.87890625, -1.66064453125, -1.4423828125, -1.22412109375, -1.005859375, -0.78759765625, -0.5693359375, -0.35107421875, -0.1328125, 0.08544921875, 0.3037109375, 0.52197265625, 0.740234375, 0.95849609375, 1.1767578125, 1.39501953125, 1.61328125, 1.83154296875, 2.0498046875, 2.26806640625, 2.486328125, 2.70458984375, 2.9228515625, 3.14111328125, 3.359375, 3.57763671875, 3.7958984375, 4.01416015625, 4.232421875, 4.45068359375, 4.6689453125, 4.88720703125, 5.10546875, 5.32373046875, 5.5419921875, 5.76025390625, 5.978515625, 6.19677734375, 6.4150390625, 6.63330078125, 6.8515625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 7.0, 3.0, 15.0, 12.0, 23.0, 21.0, 41.0, 72.0, 110.0, 144.0, 269.0, 462.0, 879.0, 1779.0, 3947.0, 8599.0, 21817.0, 59921.0, 182656.0, 409839.0, 234512.0, 77137.0, 26985.0, 10443.0, 4447.0, 2001.0, 1053.0, 548.0, 310.0, 162.0, 113.0, 65.0, 51.0, 35.0, 18.0, 17.0, 11.0, 7.0, 4.0, 6.0, 3.0, 2.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.0390625, -13.594970703125, -13.15087890625, -12.706787109375, -12.2626953125, -11.818603515625, -11.37451171875, -10.930419921875, -10.486328125, -10.042236328125, -9.59814453125, -9.154052734375, -8.7099609375, -8.265869140625, -7.82177734375, -7.377685546875, -6.93359375, -6.489501953125, -6.04541015625, -5.601318359375, -5.1572265625, -4.713134765625, -4.26904296875, -3.824951171875, -3.380859375, -2.936767578125, -2.49267578125, -2.048583984375, -1.6044921875, -1.160400390625, -0.71630859375, -0.272216796875, 0.171875, 0.615966796875, 1.06005859375, 1.504150390625, 1.9482421875, 2.392333984375, 2.83642578125, 3.280517578125, 3.724609375, 4.168701171875, 4.61279296875, 5.056884765625, 5.5009765625, 5.945068359375, 6.38916015625, 6.833251953125, 7.27734375, 7.721435546875, 8.16552734375, 8.609619140625, 9.0537109375, 9.497802734375, 9.94189453125, 10.385986328125, 10.830078125, 11.274169921875, 11.71826171875, 12.162353515625, 12.6064453125, 13.050537109375, 13.49462890625, 13.938720703125, 14.3828125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 10.0, 16.0, 14.0, 20.0, 32.0, 41.0, 40.0, 66.0, 85.0, 84.0, 93.0, 104.0, 86.0, 70.0, 46.0, 43.0, 29.0, 25.0, 13.0, 15.0, 13.0, 11.0, 3.0, 4.0, 10.0, 7.0, 1.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006146430969238281, -0.0005947276949882507, -0.0005748122930526733, -0.000554896891117096, -0.0005349814891815186, -0.0005150660872459412, -0.0004951506853103638, -0.0004752352833747864, -0.000455319881439209, -0.0004354044795036316, -0.0004154890775680542, -0.0003955736756324768, -0.0003756582736968994, -0.000355742871761322, -0.00033582746982574463, -0.00031591206789016724, -0.00029599666595458984, -0.00027608126401901245, -0.00025616586208343506, -0.00023625046014785767, -0.00021633505821228027, -0.00019641965627670288, -0.0001765042543411255, -0.0001565888524055481, -0.0001366734504699707, -0.00011675804853439331, -9.684264659881592e-05, -7.692724466323853e-05, -5.701184272766113e-05, -3.709644079208374e-05, -1.7181038856506348e-05, 2.734363079071045e-06, 2.2649765014648438e-05, 4.256516695022583e-05, 6.248056888580322e-05, 8.239597082138062e-05, 0.00010231137275695801, 0.0001222267746925354, 0.0001421421766281128, 0.00016205757856369019, 0.00018197298049926758, 0.00020188838243484497, 0.00022180378437042236, 0.00024171918630599976, 0.00026163458824157715, 0.00028154999017715454, 0.00030146539211273193, 0.0003213807940483093, 0.0003412961959838867, 0.0003612115979194641, 0.0003811269998550415, 0.0004010424017906189, 0.0004209578037261963, 0.0004408732056617737, 0.0004607886075973511, 0.00048070400953292847, 0.0005006194114685059, 0.0005205348134040833, 0.0005404502153396606, 0.000560365617275238, 0.0005802810192108154, 0.0006001964211463928, 0.0006201118230819702, 0.0006400272250175476, 0.000659942626953125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 10.0, 15.0, 13.0, 22.0, 45.0, 58.0, 77.0, 108.0, 161.0, 257.0, 370.0, 533.0, 785.0, 1240.0, 2007.0, 3337.0, 5263.0, 8777.0, 14567.0, 25191.0, 43964.0, 74912.0, 122044.0, 170988.0, 184085.0, 149997.0, 97944.0, 58572.0, 33782.0, 19376.0, 11586.0, 6874.0, 4254.0, 2568.0, 1652.0, 1079.0, 717.0, 423.0, 281.0, 196.0, 143.0, 84.0, 60.0, 49.0, 20.0, 24.0, 22.0, 11.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.63671875, -6.4310302734375, -6.225341796875, -6.0196533203125, -5.81396484375, -5.6082763671875, -5.402587890625, -5.1968994140625, -4.9912109375, -4.7855224609375, -4.579833984375, -4.3741455078125, -4.16845703125, -3.9627685546875, -3.757080078125, -3.5513916015625, -3.345703125, -3.1400146484375, -2.934326171875, -2.7286376953125, -2.52294921875, -2.3172607421875, -2.111572265625, -1.9058837890625, -1.7001953125, -1.4945068359375, -1.288818359375, -1.0831298828125, -0.87744140625, -0.6717529296875, -0.466064453125, -0.2603759765625, -0.0546875, 0.1510009765625, 0.356689453125, 0.5623779296875, 0.76806640625, 0.9737548828125, 1.179443359375, 1.3851318359375, 1.5908203125, 1.7965087890625, 2.002197265625, 2.2078857421875, 2.41357421875, 2.6192626953125, 2.824951171875, 3.0306396484375, 3.236328125, 3.4420166015625, 3.647705078125, 3.8533935546875, 4.05908203125, 4.2647705078125, 4.470458984375, 4.6761474609375, 4.8818359375, 5.0875244140625, 5.293212890625, 5.4989013671875, 5.70458984375, 5.9102783203125, 6.115966796875, 6.3216552734375, 6.52734375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 14.0, 10.0, 15.0, 21.0, 36.0, 29.0, 54.0, 70.0, 73.0, 65.0, 68.0, 74.0, 71.0, 82.0, 67.0, 56.0, 39.0, 34.0, 25.0, 31.0, 12.0, 16.0, 6.0, 5.0, 3.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.671875, -3.55828857421875, -3.4447021484375, -3.33111572265625, -3.217529296875, -3.10394287109375, -2.9903564453125, -2.87677001953125, -2.76318359375, -2.64959716796875, -2.5360107421875, -2.42242431640625, -2.308837890625, -2.19525146484375, -2.0816650390625, -1.96807861328125, -1.8544921875, -1.74090576171875, -1.6273193359375, -1.51373291015625, -1.400146484375, -1.28656005859375, -1.1729736328125, -1.05938720703125, -0.94580078125, -0.83221435546875, -0.7186279296875, -0.60504150390625, -0.491455078125, -0.37786865234375, -0.2642822265625, -0.15069580078125, -0.037109375, 0.07647705078125, 0.1900634765625, 0.30364990234375, 0.417236328125, 0.53082275390625, 0.6444091796875, 0.75799560546875, 0.87158203125, 0.98516845703125, 1.0987548828125, 1.21234130859375, 1.325927734375, 1.43951416015625, 1.5531005859375, 1.66668701171875, 1.7802734375, 1.89385986328125, 2.0074462890625, 2.12103271484375, 2.234619140625, 2.34820556640625, 2.4617919921875, 2.57537841796875, 2.68896484375, 2.80255126953125, 2.9161376953125, 3.02972412109375, 3.143310546875, 3.25689697265625, 3.3704833984375, 3.48406982421875, 3.59765625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 4.0, 7.0, 8.0, 13.0, 9.0, 12.0, 27.0, 14.0, 31.0, 27.0, 32.0, 35.0, 39.0, 47.0, 32.0, 45.0, 52.0, 51.0, 57.0, 50.0, 40.0, 49.0, 53.0, 41.0, 44.0, 19.0, 25.0, 18.0, 16.0, 13.0, 19.0, 17.0, 11.0, 9.0, 5.0, 7.0, 8.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.239821434020996, -9.9097261428833, -9.579631805419922, -9.249536514282227, -8.919442176818848, -8.589346885681152, -8.259252548217773, -7.929157257080078, -7.599062442779541, -7.268967628479004, -6.938872814178467, -6.60877799987793, -6.278682708740234, -5.9485883712768555, -5.61849308013916, -5.288398265838623, -4.958303451538086, -4.628208637237549, -4.298113822937012, -3.9680187702178955, -3.6379239559173584, -3.3078291416168213, -2.977734088897705, -2.647639274597168, -2.317544460296631, -1.9874496459960938, -1.657354712486267, -1.3272597789764404, -0.9971649646759033, -0.6670701503753662, -0.33697521686553955, -0.006880283355712891, 0.3232154846191406, 0.6533103585243225, 0.9834052324295044, 1.313500165939331, 1.6435949802398682, 1.9736897945404053, 2.3037848472595215, 2.6338796615600586, 2.9639744758605957, 3.294069290161133, 3.62416410446167, 3.954259157180786, 4.284354209899902, 4.614448547363281, 4.944543838500977, 5.274638652801514, 5.604733467102051, 5.934828281402588, 6.264923095703125, 6.595017910003662, 6.925112724304199, 7.2552080154418945, 7.585302829742432, 7.915397644042969, 8.245492935180664, 8.57558822631836, 8.905682563781738, 9.235777854919434, 9.565872192382812, 9.895967483520508, 10.226061820983887, 10.556157112121582, 10.886251449584961]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 3.0, 5.0, 6.0, 8.0, 15.0, 14.0, 12.0, 19.0, 20.0, 27.0, 29.0, 33.0, 25.0, 36.0, 35.0, 50.0, 35.0, 40.0, 40.0, 38.0, 43.0, 41.0, 46.0, 41.0, 41.0, 34.0, 30.0, 42.0, 22.0, 29.0, 20.0, 18.0, 19.0, 17.0, 14.0, 14.0, 8.0, 3.0, 5.0, 5.0, 4.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.418608665466309, -10.10146427154541, -9.784318923950195, -9.467174530029297, -9.150030136108398, -8.8328857421875, -8.515740394592285, -8.198596000671387, -7.88145112991333, -7.564306259155273, -7.247161865234375, -6.930016994476318, -6.612872123718262, -6.295727729797363, -5.978582859039307, -5.66143798828125, -5.344293594360352, -5.027148723602295, -4.7100043296813965, -4.39285945892334, -4.075715065002441, -3.7585701942443848, -3.441425323486328, -3.1242806911468506, -2.807136058807373, -2.4899914264678955, -2.172846794128418, -1.8557019233703613, -1.5385572910308838, -1.2214126586914062, -0.9042679071426392, -0.5871231555938721, -0.2699775695800781, 0.04716712236404419, 0.3643118143081665, 0.6814565062522888, 0.9986011981964111, 1.3157458305358887, 1.6328905820846558, 1.9500353336334229, 2.2671799659729004, 2.584324598312378, 2.9014692306518555, 3.218614101409912, 3.5357587337493896, 3.852903366088867, 4.170048236846924, 4.4871931076049805, 4.804337501525879, 5.1214823722839355, 5.438626766204834, 5.755771636962891, 6.072916030883789, 6.390060901641846, 6.707205772399902, 7.024350166320801, 7.341495037078857, 7.658639907836914, 7.9757843017578125, 8.292928695678711, 8.610074043273926, 8.927218437194824, 9.244362831115723, 9.561508178710938, 9.878652572631836]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 8.0, 6.0, 8.0, 19.0, 35.0, 35.0, 62.0, 110.0, 182.0, 250.0, 423.0, 662.0, 961.0, 1592.0, 2441.0, 3735.0, 5823.0, 8993.0, 13921.0, 21888.0, 33646.0, 50021.0, 72179.0, 97642.0, 121185.0, 133872.0, 126920.0, 106555.0, 79921.0, 56601.0, 38230.0, 24994.0, 16292.0, 10499.0, 6819.0, 4282.0, 2781.0, 1798.0, 1142.0, 695.0, 501.0, 305.0, 185.0, 120.0, 74.0, 60.0, 25.0, 23.0, 16.0, 9.0, 7.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-9.2421875, -8.959228515625, -8.67626953125, -8.393310546875, -8.1103515625, -7.827392578125, -7.54443359375, -7.261474609375, -6.978515625, -6.695556640625, -6.41259765625, -6.129638671875, -5.8466796875, -5.563720703125, -5.28076171875, -4.997802734375, -4.71484375, -4.431884765625, -4.14892578125, -3.865966796875, -3.5830078125, -3.300048828125, -3.01708984375, -2.734130859375, -2.451171875, -2.168212890625, -1.88525390625, -1.602294921875, -1.3193359375, -1.036376953125, -0.75341796875, -0.470458984375, -0.1875, 0.095458984375, 0.37841796875, 0.661376953125, 0.9443359375, 1.227294921875, 1.51025390625, 1.793212890625, 2.076171875, 2.359130859375, 2.64208984375, 2.925048828125, 3.2080078125, 3.490966796875, 3.77392578125, 4.056884765625, 4.33984375, 4.622802734375, 4.90576171875, 5.188720703125, 5.4716796875, 5.754638671875, 6.03759765625, 6.320556640625, 6.603515625, 6.886474609375, 7.16943359375, 7.452392578125, 7.7353515625, 8.018310546875, 8.30126953125, 8.584228515625, 8.8671875]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 6.0, 5.0, 3.0, 4.0, 4.0, 11.0, 14.0, 9.0, 10.0, 16.0, 16.0, 18.0, 26.0, 32.0, 30.0, 34.0, 35.0, 33.0, 33.0, 45.0, 39.0, 28.0, 45.0, 36.0, 38.0, 48.0, 32.0, 32.0, 39.0, 37.0, 35.0, 25.0, 31.0, 27.0, 23.0, 16.0, 9.0, 17.0, 21.0, 7.0, 5.0, 7.0, 10.0, 5.0, 5.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.78125, -8.4896240234375, -8.197998046875, -7.9063720703125, -7.61474609375, -7.3231201171875, -7.031494140625, -6.7398681640625, -6.4482421875, -6.1566162109375, -5.864990234375, -5.5733642578125, -5.28173828125, -4.9901123046875, -4.698486328125, -4.4068603515625, -4.115234375, -3.8236083984375, -3.531982421875, -3.2403564453125, -2.94873046875, -2.6571044921875, -2.365478515625, -2.0738525390625, -1.7822265625, -1.4906005859375, -1.198974609375, -0.9073486328125, -0.61572265625, -0.3240966796875, -0.032470703125, 0.2591552734375, 0.55078125, 0.8424072265625, 1.134033203125, 1.4256591796875, 1.71728515625, 2.0089111328125, 2.300537109375, 2.5921630859375, 2.8837890625, 3.1754150390625, 3.467041015625, 3.7586669921875, 4.05029296875, 4.3419189453125, 4.633544921875, 4.9251708984375, 5.216796875, 5.5084228515625, 5.800048828125, 6.0916748046875, 6.38330078125, 6.6749267578125, 6.966552734375, 7.2581787109375, 7.5498046875, 7.8414306640625, 8.133056640625, 8.4246826171875, 8.71630859375, 9.0079345703125, 9.299560546875, 9.5911865234375, 9.8828125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 7.0, 12.0, 16.0, 22.0, 34.0, 36.0, 58.0, 89.0, 121.0, 202.0, 275.0, 409.0, 662.0, 1031.0, 1431.0, 2301.0, 3449.0, 5294.0, 8079.0, 12488.0, 19132.0, 29676.0, 43812.0, 63608.0, 86665.0, 111966.0, 128151.0, 128587.0, 112715.0, 89528.0, 65518.0, 45277.0, 30475.0, 20101.0, 12969.0, 8360.0, 5526.0, 3514.0, 2370.0, 1589.0, 985.0, 680.0, 441.0, 270.0, 222.0, 121.0, 83.0, 69.0, 46.0, 32.0, 18.0, 11.0, 9.0, 6.0, 4.0, 3.0, 4.0], "bins": [-8.53125, -8.2806396484375, -8.030029296875, -7.7794189453125, -7.52880859375, -7.2781982421875, -7.027587890625, -6.7769775390625, -6.5263671875, -6.2757568359375, -6.025146484375, -5.7745361328125, -5.52392578125, -5.2733154296875, -5.022705078125, -4.7720947265625, -4.521484375, -4.2708740234375, -4.020263671875, -3.7696533203125, -3.51904296875, -3.2684326171875, -3.017822265625, -2.7672119140625, -2.5166015625, -2.2659912109375, -2.015380859375, -1.7647705078125, -1.51416015625, -1.2635498046875, -1.012939453125, -0.7623291015625, -0.51171875, -0.2611083984375, -0.010498046875, 0.2401123046875, 0.49072265625, 0.7413330078125, 0.991943359375, 1.2425537109375, 1.4931640625, 1.7437744140625, 1.994384765625, 2.2449951171875, 2.49560546875, 2.7462158203125, 2.996826171875, 3.2474365234375, 3.498046875, 3.7486572265625, 3.999267578125, 4.2498779296875, 4.50048828125, 4.7510986328125, 5.001708984375, 5.2523193359375, 5.5029296875, 5.7535400390625, 6.004150390625, 6.2547607421875, 6.50537109375, 6.7559814453125, 7.006591796875, 7.2572021484375, 7.5078125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 7.0, 1.0, 4.0, 6.0, 14.0, 11.0, 12.0, 13.0, 16.0, 13.0, 16.0, 19.0, 33.0, 33.0, 32.0, 40.0, 33.0, 40.0, 34.0, 40.0, 46.0, 50.0, 36.0, 32.0, 32.0, 32.0, 33.0, 38.0, 40.0, 26.0, 34.0, 24.0, 25.0, 26.0, 16.0, 19.0, 15.0, 14.0, 10.0, 3.0, 5.0, 5.0, 8.0, 6.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.23046875, -5.04217529296875, -4.8538818359375, -4.66558837890625, -4.477294921875, -4.28900146484375, -4.1007080078125, -3.91241455078125, -3.72412109375, -3.53582763671875, -3.3475341796875, -3.15924072265625, -2.970947265625, -2.78265380859375, -2.5943603515625, -2.40606689453125, -2.2177734375, -2.02947998046875, -1.8411865234375, -1.65289306640625, -1.464599609375, -1.27630615234375, -1.0880126953125, -0.89971923828125, -0.71142578125, -0.52313232421875, -0.3348388671875, -0.14654541015625, 0.041748046875, 0.23004150390625, 0.4183349609375, 0.60662841796875, 0.794921875, 0.98321533203125, 1.1715087890625, 1.35980224609375, 1.548095703125, 1.73638916015625, 1.9246826171875, 2.11297607421875, 2.30126953125, 2.48956298828125, 2.6778564453125, 2.86614990234375, 3.054443359375, 3.24273681640625, 3.4310302734375, 3.61932373046875, 3.8076171875, 3.99591064453125, 4.1842041015625, 4.37249755859375, 4.560791015625, 4.74908447265625, 4.9373779296875, 5.12567138671875, 5.31396484375, 5.50225830078125, 5.6905517578125, 5.87884521484375, 6.067138671875, 6.25543212890625, 6.4437255859375, 6.63201904296875, 6.8203125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 10.0, 13.0, 22.0, 34.0, 57.0, 68.0, 123.0, 155.0, 246.0, 384.0, 624.0, 957.0, 1582.0, 2530.0, 4354.0, 7638.0, 13975.0, 26162.0, 49621.0, 96548.0, 171746.0, 229258.0, 194631.0, 116454.0, 61012.0, 31737.0, 16468.0, 9128.0, 5062.0, 3082.0, 1777.0, 1144.0, 653.0, 441.0, 281.0, 188.0, 129.0, 82.0, 56.0, 38.0, 26.0, 24.0, 8.0, 14.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-8.890625, -8.634033203125, -8.37744140625, -8.120849609375, -7.8642578125, -7.607666015625, -7.35107421875, -7.094482421875, -6.837890625, -6.581298828125, -6.32470703125, -6.068115234375, -5.8115234375, -5.554931640625, -5.29833984375, -5.041748046875, -4.78515625, -4.528564453125, -4.27197265625, -4.015380859375, -3.7587890625, -3.502197265625, -3.24560546875, -2.989013671875, -2.732421875, -2.475830078125, -2.21923828125, -1.962646484375, -1.7060546875, -1.449462890625, -1.19287109375, -0.936279296875, -0.6796875, -0.423095703125, -0.16650390625, 0.090087890625, 0.3466796875, 0.603271484375, 0.85986328125, 1.116455078125, 1.373046875, 1.629638671875, 1.88623046875, 2.142822265625, 2.3994140625, 2.656005859375, 2.91259765625, 3.169189453125, 3.42578125, 3.682373046875, 3.93896484375, 4.195556640625, 4.4521484375, 4.708740234375, 4.96533203125, 5.221923828125, 5.478515625, 5.735107421875, 5.99169921875, 6.248291015625, 6.5048828125, 6.761474609375, 7.01806640625, 7.274658203125, 7.53125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 10.0, 7.0, 8.0, 7.0, 15.0, 18.0, 37.0, 34.0, 52.0, 70.0, 54.0, 90.0, 83.0, 86.0, 88.0, 82.0, 61.0, 44.0, 38.0, 26.0, 21.0, 20.0, 12.0, 6.0, 4.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0010852813720703125, -0.001055017113685608, -0.0010247528553009033, -0.0009944885969161987, -0.0009642243385314941, -0.0009339600801467896, -0.000903695821762085, -0.0008734315633773804, -0.0008431673049926758, -0.0008129030466079712, -0.0007826387882232666, -0.000752374529838562, -0.0007221102714538574, -0.0006918460130691528, -0.0006615817546844482, -0.0006313174962997437, -0.0006010532379150391, -0.0005707889795303345, -0.0005405247211456299, -0.0005102604627609253, -0.0004799962043762207, -0.0004497319459915161, -0.0004194676876068115, -0.00038920342922210693, -0.00035893917083740234, -0.00032867491245269775, -0.00029841065406799316, -0.0002681463956832886, -0.00023788213729858398, -0.0002076178789138794, -0.0001773536205291748, -0.00014708936214447021, -0.00011682510375976562, -8.656084537506104e-05, -5.6296586990356445e-05, -2.6032328605651855e-05, 4.231929779052734e-06, 3.4496188163757324e-05, 6.476044654846191e-05, 9.50247049331665e-05, 0.0001252889633178711, 0.00015555322170257568, 0.00018581748008728027, 0.00021608173847198486, 0.00024634599685668945, 0.00027661025524139404, 0.00030687451362609863, 0.0003371387720108032, 0.0003674030303955078, 0.0003976672887802124, 0.000427931547164917, 0.0004581958055496216, 0.0004884600639343262, 0.0005187243223190308, 0.0005489885807037354, 0.0005792528390884399, 0.0006095170974731445, 0.0006397813558578491, 0.0006700456142425537, 0.0007003098726272583, 0.0007305741310119629, 0.0007608383893966675, 0.0007911026477813721, 0.0008213669061660767, 0.0008516311645507812]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 3.0, 2.0, 5.0, 10.0, 21.0, 11.0, 35.0, 49.0, 64.0, 96.0, 146.0, 225.0, 357.0, 523.0, 900.0, 1388.0, 2291.0, 3667.0, 6571.0, 10770.0, 18799.0, 32708.0, 56964.0, 93410.0, 142855.0, 180411.0, 172318.0, 127256.0, 81352.0, 48207.0, 27849.0, 16176.0, 9161.0, 5407.0, 3147.0, 1935.0, 1268.0, 738.0, 525.0, 332.0, 208.0, 127.0, 91.0, 48.0, 42.0, 27.0, 22.0, 19.0, 11.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.63671875, -5.44134521484375, -5.2459716796875, -5.05059814453125, -4.855224609375, -4.65985107421875, -4.4644775390625, -4.26910400390625, -4.07373046875, -3.87835693359375, -3.6829833984375, -3.48760986328125, -3.292236328125, -3.09686279296875, -2.9014892578125, -2.70611572265625, -2.5107421875, -2.31536865234375, -2.1199951171875, -1.92462158203125, -1.729248046875, -1.53387451171875, -1.3385009765625, -1.14312744140625, -0.94775390625, -0.75238037109375, -0.5570068359375, -0.36163330078125, -0.166259765625, 0.02911376953125, 0.2244873046875, 0.41986083984375, 0.615234375, 0.81060791015625, 1.0059814453125, 1.20135498046875, 1.396728515625, 1.59210205078125, 1.7874755859375, 1.98284912109375, 2.17822265625, 2.37359619140625, 2.5689697265625, 2.76434326171875, 2.959716796875, 3.15509033203125, 3.3504638671875, 3.54583740234375, 3.7412109375, 3.93658447265625, 4.1319580078125, 4.32733154296875, 4.522705078125, 4.71807861328125, 4.9134521484375, 5.10882568359375, 5.30419921875, 5.49957275390625, 5.6949462890625, 5.89031982421875, 6.085693359375, 6.28106689453125, 6.4764404296875, 6.67181396484375, 6.8671875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 1.0, 1.0, 3.0, 6.0, 8.0, 9.0, 12.0, 9.0, 14.0, 13.0, 19.0, 18.0, 23.0, 22.0, 38.0, 36.0, 44.0, 61.0, 62.0, 69.0, 55.0, 53.0, 51.0, 62.0, 44.0, 45.0, 34.0, 39.0, 17.0, 19.0, 19.0, 16.0, 13.0, 13.0, 9.0, 6.0, 4.0, 7.0, 5.0, 3.0, 7.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.099609375, -2.037750244140625, -1.97589111328125, -1.914031982421875, -1.8521728515625, -1.790313720703125, -1.72845458984375, -1.666595458984375, -1.604736328125, -1.542877197265625, -1.48101806640625, -1.419158935546875, -1.3572998046875, -1.295440673828125, -1.23358154296875, -1.171722412109375, -1.10986328125, -1.048004150390625, -0.98614501953125, -0.924285888671875, -0.8624267578125, -0.800567626953125, -0.73870849609375, -0.676849365234375, -0.614990234375, -0.553131103515625, -0.49127197265625, -0.429412841796875, -0.3675537109375, -0.305694580078125, -0.24383544921875, -0.181976318359375, -0.1201171875, -0.058258056640625, 0.00360107421875, 0.065460205078125, 0.1273193359375, 0.189178466796875, 0.25103759765625, 0.312896728515625, 0.374755859375, 0.436614990234375, 0.49847412109375, 0.560333251953125, 0.6221923828125, 0.684051513671875, 0.74591064453125, 0.807769775390625, 0.86962890625, 0.931488037109375, 0.99334716796875, 1.055206298828125, 1.1170654296875, 1.178924560546875, 1.24078369140625, 1.302642822265625, 1.364501953125, 1.426361083984375, 1.48822021484375, 1.550079345703125, 1.6119384765625, 1.673797607421875, 1.73565673828125, 1.797515869140625, 1.859375]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 6.0, 7.0, 9.0, 8.0, 5.0, 9.0, 15.0, 16.0, 19.0, 30.0, 35.0, 27.0, 43.0, 27.0, 35.0, 50.0, 51.0, 59.0, 57.0, 52.0, 55.0, 59.0, 63.0, 38.0, 27.0, 30.0, 30.0, 15.0, 20.0, 22.0, 13.0, 21.0, 13.0, 13.0, 6.0, 4.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.8006591796875, -10.46111011505127, -10.121562004089355, -9.782012939453125, -9.442464828491211, -9.10291576385498, -8.76336669921875, -8.423818588256836, -8.084270477294922, -7.74472188949585, -7.405173301696777, -7.065624237060547, -6.726076126098633, -6.386527061462402, -6.04697847366333, -5.707429885864258, -5.367880821228027, -5.028332233428955, -4.688783645629883, -4.349234580993652, -4.009686470031738, -3.670137643814087, -3.3305888175964355, -2.9910402297973633, -2.651491641998291, -2.3119430541992188, -1.972394347190857, -1.6328456401824951, -1.2932970523834229, -0.9537484645843506, -0.6141996383666992, -0.27465105056762695, 0.0648965835571289, 0.40444523096084595, 0.743993878364563, 1.0835425853729248, 1.423091173171997, 1.7626397609710693, 2.1021885871887207, 2.441737174987793, 2.7812857627868652, 3.1208343505859375, 3.4603829383850098, 3.799931764602661, 4.1394805908203125, 4.479028701782227, 4.818577766418457, 5.158126354217529, 5.497674942016602, 5.837223529815674, 6.176772117614746, 6.516321182250977, 6.855869293212891, 7.195418357849121, 7.534966945648193, 7.874515533447266, 8.21406364440918, 8.55361270904541, 8.893160820007324, 9.232709884643555, 9.572257995605469, 9.9118070602417, 10.25135612487793, 10.590904235839844, 10.930453300476074]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 2.0, 11.0, 4.0, 7.0, 7.0, 5.0, 22.0, 19.0, 18.0, 18.0, 29.0, 30.0, 22.0, 41.0, 32.0, 32.0, 37.0, 46.0, 43.0, 43.0, 57.0, 47.0, 42.0, 41.0, 39.0, 42.0, 50.0, 25.0, 25.0, 30.0, 21.0, 20.0, 15.0, 14.0, 13.0, 12.0, 6.0, 14.0, 13.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.268064498901367, -11.931300163269043, -11.594535827636719, -11.257771492004395, -10.92100715637207, -10.58424186706543, -10.247477531433105, -9.910713195800781, -9.573948860168457, -9.237184524536133, -8.900420188903809, -8.563655853271484, -8.226890563964844, -7.890126705169678, -7.553361892700195, -7.216597557067871, -6.879833221435547, -6.543068885803223, -6.206304550170898, -5.869539737701416, -5.532775402069092, -5.196011066436768, -4.859246253967285, -4.522481918334961, -4.185717582702637, -3.8489532470703125, -3.512188673019409, -3.175424098968506, -2.8386597633361816, -2.5018954277038574, -2.165130853652954, -1.8283662796020508, -1.4916009902954102, -1.1548365354537964, -0.8180720806121826, -0.48130762577056885, -0.14454317092895508, 0.1922212839126587, 0.5289857387542725, 0.8657503128051758, 1.2025146484375, 1.5392791032791138, 1.8760435581207275, 2.212808132171631, 2.549572467803955, 2.8863368034362793, 3.2231013774871826, 3.559865951538086, 3.89663028717041, 4.233394622802734, 4.570158958435059, 4.906923770904541, 5.243688106536865, 5.5804524421691895, 5.917217254638672, 6.253981590270996, 6.59074592590332, 6.9275102615356445, 7.264274597167969, 7.601039409637451, 7.937803745269775, 8.274568557739258, 8.611332893371582, 8.948097229003906, 9.28486156463623]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 8.0, 11.0, 17.0, 22.0, 21.0, 41.0, 77.0, 91.0, 121.0, 218.0, 316.0, 478.0, 824.0, 1276.0, 2062.0, 3310.0, 5614.0, 9646.0, 17168.0, 31603.0, 60088.0, 124412.0, 277687.0, 632249.0, 1075374.0, 988782.0, 520217.0, 225755.0, 102809.0, 50870.0, 27109.0, 14856.0, 8553.0, 4830.0, 2987.0, 1799.0, 1101.0, 683.0, 399.0, 272.0, 175.0, 111.0, 71.0, 57.0, 31.0, 22.0, 16.0, 9.0, 14.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0], "bins": [-11.6484375, -11.3045654296875, -10.960693359375, -10.6168212890625, -10.27294921875, -9.9290771484375, -9.585205078125, -9.2413330078125, -8.8974609375, -8.5535888671875, -8.209716796875, -7.8658447265625, -7.52197265625, -7.1781005859375, -6.834228515625, -6.4903564453125, -6.146484375, -5.8026123046875, -5.458740234375, -5.1148681640625, -4.77099609375, -4.4271240234375, -4.083251953125, -3.7393798828125, -3.3955078125, -3.0516357421875, -2.707763671875, -2.3638916015625, -2.02001953125, -1.6761474609375, -1.332275390625, -0.9884033203125, -0.64453125, -0.3006591796875, 0.043212890625, 0.3870849609375, 0.73095703125, 1.0748291015625, 1.418701171875, 1.7625732421875, 2.1064453125, 2.4503173828125, 2.794189453125, 3.1380615234375, 3.48193359375, 3.8258056640625, 4.169677734375, 4.5135498046875, 4.857421875, 5.2012939453125, 5.545166015625, 5.8890380859375, 6.23291015625, 6.5767822265625, 6.920654296875, 7.2645263671875, 7.6083984375, 7.9522705078125, 8.296142578125, 8.6400146484375, 8.98388671875, 9.3277587890625, 9.671630859375, 10.0155029296875, 10.359375]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 4.0, 11.0, 7.0, 6.0, 10.0, 11.0, 20.0, 15.0, 18.0, 28.0, 23.0, 37.0, 34.0, 37.0, 27.0, 37.0, 33.0, 50.0, 46.0, 54.0, 58.0, 52.0, 39.0, 48.0, 46.0, 32.0, 39.0, 17.0, 29.0, 15.0, 21.0, 16.0, 16.0, 18.0, 14.0, 9.0, 3.0, 9.0, 3.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.6484375, -8.41119384765625, -8.1739501953125, -7.93670654296875, -7.699462890625, -7.46221923828125, -7.2249755859375, -6.98773193359375, -6.75048828125, -6.51324462890625, -6.2760009765625, -6.03875732421875, -5.801513671875, -5.56427001953125, -5.3270263671875, -5.08978271484375, -4.8525390625, -4.61529541015625, -4.3780517578125, -4.14080810546875, -3.903564453125, -3.66632080078125, -3.4290771484375, -3.19183349609375, -2.95458984375, -2.71734619140625, -2.4801025390625, -2.24285888671875, -2.005615234375, -1.76837158203125, -1.5311279296875, -1.29388427734375, -1.056640625, -0.81939697265625, -0.5821533203125, -0.34490966796875, -0.107666015625, 0.12957763671875, 0.3668212890625, 0.60406494140625, 0.84130859375, 1.07855224609375, 1.3157958984375, 1.55303955078125, 1.790283203125, 2.02752685546875, 2.2647705078125, 2.50201416015625, 2.7392578125, 2.97650146484375, 3.2137451171875, 3.45098876953125, 3.688232421875, 3.92547607421875, 4.1627197265625, 4.39996337890625, 4.63720703125, 4.87445068359375, 5.1116943359375, 5.34893798828125, 5.586181640625, 5.82342529296875, 6.0606689453125, 6.29791259765625, 6.53515625]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 2.0, 10.0, 7.0, 17.0, 33.0, 46.0, 64.0, 105.0, 159.0, 263.0, 398.0, 602.0, 986.0, 1540.0, 2371.0, 3925.0, 6503.0, 10916.0, 18999.0, 32902.0, 58653.0, 107317.0, 199822.0, 370548.0, 654602.0, 926608.0, 776236.0, 461904.0, 252151.0, 134907.0, 73940.0, 40775.0, 23056.0, 13468.0, 8070.0, 4720.0, 2927.0, 1754.0, 1072.0, 682.0, 449.0, 276.0, 175.0, 131.0, 67.0, 41.0, 38.0, 26.0, 9.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.4453125, -9.147216796875, -8.84912109375, -8.551025390625, -8.2529296875, -7.954833984375, -7.65673828125, -7.358642578125, -7.060546875, -6.762451171875, -6.46435546875, -6.166259765625, -5.8681640625, -5.570068359375, -5.27197265625, -4.973876953125, -4.67578125, -4.377685546875, -4.07958984375, -3.781494140625, -3.4833984375, -3.185302734375, -2.88720703125, -2.589111328125, -2.291015625, -1.992919921875, -1.69482421875, -1.396728515625, -1.0986328125, -0.800537109375, -0.50244140625, -0.204345703125, 0.09375, 0.391845703125, 0.68994140625, 0.988037109375, 1.2861328125, 1.584228515625, 1.88232421875, 2.180419921875, 2.478515625, 2.776611328125, 3.07470703125, 3.372802734375, 3.6708984375, 3.968994140625, 4.26708984375, 4.565185546875, 4.86328125, 5.161376953125, 5.45947265625, 5.757568359375, 6.0556640625, 6.353759765625, 6.65185546875, 6.949951171875, 7.248046875, 7.546142578125, 7.84423828125, 8.142333984375, 8.4404296875, 8.738525390625, 9.03662109375, 9.334716796875, 9.6328125]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 12.0, 14.0, 16.0, 21.0, 27.0, 44.0, 51.0, 69.0, 70.0, 78.0, 113.0, 159.0, 162.0, 202.0, 257.0, 258.0, 260.0, 323.0, 283.0, 272.0, 243.0, 195.0, 162.0, 147.0, 112.0, 113.0, 83.0, 75.0, 53.0, 39.0, 36.0, 31.0, 23.0, 21.0, 13.0, 8.0, 5.0, 7.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.6328125, -3.51702880859375, -3.4012451171875, -3.28546142578125, -3.169677734375, -3.05389404296875, -2.9381103515625, -2.82232666015625, -2.70654296875, -2.59075927734375, -2.4749755859375, -2.35919189453125, -2.243408203125, -2.12762451171875, -2.0118408203125, -1.89605712890625, -1.7802734375, -1.66448974609375, -1.5487060546875, -1.43292236328125, -1.317138671875, -1.20135498046875, -1.0855712890625, -0.96978759765625, -0.85400390625, -0.73822021484375, -0.6224365234375, -0.50665283203125, -0.390869140625, -0.27508544921875, -0.1593017578125, -0.04351806640625, 0.072265625, 0.18804931640625, 0.3038330078125, 0.41961669921875, 0.535400390625, 0.65118408203125, 0.7669677734375, 0.88275146484375, 0.99853515625, 1.11431884765625, 1.2301025390625, 1.34588623046875, 1.461669921875, 1.57745361328125, 1.6932373046875, 1.80902099609375, 1.9248046875, 2.04058837890625, 2.1563720703125, 2.27215576171875, 2.387939453125, 2.50372314453125, 2.6195068359375, 2.73529052734375, 2.85107421875, 2.96685791015625, 3.0826416015625, 3.19842529296875, 3.314208984375, 3.42999267578125, 3.5457763671875, 3.66156005859375, 3.77734375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 0.0, 6.0, 6.0, 12.0, 10.0, 18.0, 12.0, 16.0, 19.0, 33.0, 28.0, 28.0, 34.0, 34.0, 44.0, 48.0, 45.0, 47.0, 49.0, 54.0, 63.0, 53.0, 34.0, 39.0, 42.0, 35.0, 28.0, 25.0, 19.0, 17.0, 21.0, 12.0, 14.0, 8.0, 7.0, 8.0, 5.0, 8.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.11755084991455, -7.827308177947998, -7.537065505981445, -7.246822834014893, -6.95658016204834, -6.666337966918945, -6.376095294952393, -6.08585262298584, -5.795609951019287, -5.505367279052734, -5.215124607086182, -4.924881935119629, -4.634639739990234, -4.344396591186523, -4.054154396057129, -3.763911724090576, -3.4736690521240234, -3.1834263801574707, -2.893183708190918, -2.6029412746429443, -2.3126986026763916, -2.022455930709839, -1.7322133779525757, -1.4419708251953125, -1.1517281532287598, -0.8614855408668518, -0.5712429285049438, -0.2810003161430359, 0.00924229621887207, 0.2994849681854248, 0.589727520942688, 0.8799700736999512, 1.170212745666504, 1.4604554176330566, 1.7506979703903198, 2.040940523147583, 2.3311831951141357, 2.6214258670806885, 2.911668300628662, 3.201910972595215, 3.4921536445617676, 3.7823963165283203, 4.072638988494873, 4.362881660461426, 4.65312385559082, 4.943367004394531, 5.233609199523926, 5.5238518714904785, 5.814094543457031, 6.104337215423584, 6.394579887390137, 6.6848225593566895, 6.975065231323242, 7.265307426452637, 7.5555500984191895, 7.845792770385742, 8.136035919189453, 8.426278114318848, 8.716521263122559, 9.006763458251953, 9.297006607055664, 9.587248802185059, 9.87749195098877, 10.167734146118164, 10.457976341247559]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 4.0, 9.0, 5.0, 11.0, 19.0, 18.0, 14.0, 22.0, 17.0, 22.0, 33.0, 30.0, 27.0, 26.0, 37.0, 34.0, 37.0, 42.0, 34.0, 38.0, 37.0, 48.0, 44.0, 41.0, 38.0, 29.0, 38.0, 31.0, 31.0, 22.0, 23.0, 26.0, 22.0, 17.0, 13.0, 9.0, 4.0, 9.0, 12.0, 8.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-9.299307823181152, -9.035682678222656, -8.77205753326416, -8.508432388305664, -8.244807243347168, -7.981182098388672, -7.717556953430176, -7.45393180847168, -7.190306663513184, -6.9266815185546875, -6.663056373596191, -6.399431228637695, -6.135806083679199, -5.872180938720703, -5.608555793762207, -5.344930648803711, -5.081305503845215, -4.817680358886719, -4.554055213928223, -4.290430068969727, -4.0268049240112305, -3.7631797790527344, -3.4995546340942383, -3.235929489135742, -2.972304344177246, -2.70867919921875, -2.445054054260254, -2.181428909301758, -1.9178037643432617, -1.6541786193847656, -1.3905534744262695, -1.1269283294677734, -0.8633027076721191, -0.599677562713623, -0.33605241775512695, -0.07242727279663086, 0.19119787216186523, 0.45482301712036133, 0.7184481620788574, 0.9820733070373535, 1.2456984519958496, 1.5093235969543457, 1.7729487419128418, 2.036573886871338, 2.300199031829834, 2.56382417678833, 2.827449321746826, 3.0910744667053223, 3.3546996116638184, 3.6183247566223145, 3.8819499015808105, 4.145575046539307, 4.409200191497803, 4.672825336456299, 4.936450481414795, 5.200075626373291, 5.463700771331787, 5.727325916290283, 5.990951061248779, 6.254576206207275, 6.5182013511657715, 6.781826496124268, 7.045451641082764, 7.30907678604126, 7.572701930999756]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 6.0, 7.0, 12.0, 20.0, 21.0, 44.0, 57.0, 77.0, 130.0, 192.0, 328.0, 585.0, 896.0, 1584.0, 2774.0, 5339.0, 10190.0, 21926.0, 50461.0, 119766.0, 249268.0, 289674.0, 166022.0, 70617.0, 29736.0, 13641.0, 6595.0, 3606.0, 1978.0, 1183.0, 687.0, 422.0, 234.0, 169.0, 115.0, 71.0, 47.0, 25.0, 19.0, 18.0, 4.0, 5.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.828125, -14.352783203125, -13.87744140625, -13.402099609375, -12.9267578125, -12.451416015625, -11.97607421875, -11.500732421875, -11.025390625, -10.550048828125, -10.07470703125, -9.599365234375, -9.1240234375, -8.648681640625, -8.17333984375, -7.697998046875, -7.22265625, -6.747314453125, -6.27197265625, -5.796630859375, -5.3212890625, -4.845947265625, -4.37060546875, -3.895263671875, -3.419921875, -2.944580078125, -2.46923828125, -1.993896484375, -1.5185546875, -1.043212890625, -0.56787109375, -0.092529296875, 0.3828125, 0.858154296875, 1.33349609375, 1.808837890625, 2.2841796875, 2.759521484375, 3.23486328125, 3.710205078125, 4.185546875, 4.660888671875, 5.13623046875, 5.611572265625, 6.0869140625, 6.562255859375, 7.03759765625, 7.512939453125, 7.98828125, 8.463623046875, 8.93896484375, 9.414306640625, 9.8896484375, 10.364990234375, 10.84033203125, 11.315673828125, 11.791015625, 12.266357421875, 12.74169921875, 13.217041015625, 13.6923828125, 14.167724609375, 14.64306640625, 15.118408203125, 15.59375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 4.0, 9.0, 5.0, 6.0, 8.0, 21.0, 14.0, 14.0, 17.0, 18.0, 23.0, 27.0, 22.0, 29.0, 22.0, 44.0, 31.0, 26.0, 30.0, 41.0, 38.0, 35.0, 46.0, 40.0, 43.0, 33.0, 34.0, 23.0, 24.0, 33.0, 34.0, 28.0, 23.0, 25.0, 22.0, 15.0, 12.0, 11.0, 13.0, 8.0, 14.0, 7.0, 8.0, 5.0, 5.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.45703125, -7.20892333984375, -6.9608154296875, -6.71270751953125, -6.464599609375, -6.21649169921875, -5.9683837890625, -5.72027587890625, -5.47216796875, -5.22406005859375, -4.9759521484375, -4.72784423828125, -4.479736328125, -4.23162841796875, -3.9835205078125, -3.73541259765625, -3.4873046875, -3.23919677734375, -2.9910888671875, -2.74298095703125, -2.494873046875, -2.24676513671875, -1.9986572265625, -1.75054931640625, -1.50244140625, -1.25433349609375, -1.0062255859375, -0.75811767578125, -0.510009765625, -0.26190185546875, -0.0137939453125, 0.23431396484375, 0.482421875, 0.73052978515625, 0.9786376953125, 1.22674560546875, 1.474853515625, 1.72296142578125, 1.9710693359375, 2.21917724609375, 2.46728515625, 2.71539306640625, 2.9635009765625, 3.21160888671875, 3.459716796875, 3.70782470703125, 3.9559326171875, 4.20404052734375, 4.4521484375, 4.70025634765625, 4.9483642578125, 5.19647216796875, 5.444580078125, 5.69268798828125, 5.9407958984375, 6.18890380859375, 6.43701171875, 6.68511962890625, 6.9332275390625, 7.18133544921875, 7.429443359375, 7.67755126953125, 7.9256591796875, 8.17376708984375, 8.421875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 13.0, 6.0, 15.0, 23.0, 23.0, 23.0, 36.0, 70.0, 69.0, 98.0, 151.0, 247.0, 308.0, 434.0, 692.0, 1018.0, 1587.0, 2460.0, 4074.0, 6903.0, 12094.0, 23674.0, 47711.0, 105733.0, 224292.0, 292118.0, 170421.0, 76708.0, 35422.0, 17595.0, 9592.0, 5523.0, 3340.0, 2012.0, 1280.0, 864.0, 573.0, 398.0, 272.0, 202.0, 133.0, 121.0, 59.0, 51.0, 42.0, 24.0, 11.0, 9.0, 14.0, 9.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0], "bins": [-14.3359375, -13.89208984375, -13.4482421875, -13.00439453125, -12.560546875, -12.11669921875, -11.6728515625, -11.22900390625, -10.78515625, -10.34130859375, -9.8974609375, -9.45361328125, -9.009765625, -8.56591796875, -8.1220703125, -7.67822265625, -7.234375, -6.79052734375, -6.3466796875, -5.90283203125, -5.458984375, -5.01513671875, -4.5712890625, -4.12744140625, -3.68359375, -3.23974609375, -2.7958984375, -2.35205078125, -1.908203125, -1.46435546875, -1.0205078125, -0.57666015625, -0.1328125, 0.31103515625, 0.7548828125, 1.19873046875, 1.642578125, 2.08642578125, 2.5302734375, 2.97412109375, 3.41796875, 3.86181640625, 4.3056640625, 4.74951171875, 5.193359375, 5.63720703125, 6.0810546875, 6.52490234375, 6.96875, 7.41259765625, 7.8564453125, 8.30029296875, 8.744140625, 9.18798828125, 9.6318359375, 10.07568359375, 10.51953125, 10.96337890625, 11.4072265625, 11.85107421875, 12.294921875, 12.73876953125, 13.1826171875, 13.62646484375, 14.0703125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 1.0, 2.0, 4.0, 3.0, 8.0, 12.0, 12.0, 14.0, 12.0, 19.0, 19.0, 13.0, 19.0, 19.0, 23.0, 33.0, 33.0, 31.0, 39.0, 37.0, 31.0, 37.0, 27.0, 48.0, 41.0, 32.0, 38.0, 43.0, 45.0, 36.0, 32.0, 25.0, 25.0, 26.0, 26.0, 23.0, 22.0, 14.0, 3.0, 13.0, 16.0, 7.0, 10.0, 2.0, 8.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-5.11328125, -4.95416259765625, -4.7950439453125, -4.63592529296875, -4.476806640625, -4.31768798828125, -4.1585693359375, -3.99945068359375, -3.84033203125, -3.68121337890625, -3.5220947265625, -3.36297607421875, -3.203857421875, -3.04473876953125, -2.8856201171875, -2.72650146484375, -2.5673828125, -2.40826416015625, -2.2491455078125, -2.09002685546875, -1.930908203125, -1.77178955078125, -1.6126708984375, -1.45355224609375, -1.29443359375, -1.13531494140625, -0.9761962890625, -0.81707763671875, -0.657958984375, -0.49884033203125, -0.3397216796875, -0.18060302734375, -0.021484375, 0.13763427734375, 0.2967529296875, 0.45587158203125, 0.614990234375, 0.77410888671875, 0.9332275390625, 1.09234619140625, 1.25146484375, 1.41058349609375, 1.5697021484375, 1.72882080078125, 1.887939453125, 2.04705810546875, 2.2061767578125, 2.36529541015625, 2.5244140625, 2.68353271484375, 2.8426513671875, 3.00177001953125, 3.160888671875, 3.32000732421875, 3.4791259765625, 3.63824462890625, 3.79736328125, 3.95648193359375, 4.1156005859375, 4.27471923828125, 4.433837890625, 4.59295654296875, 4.7520751953125, 4.91119384765625, 5.0703125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 5.0, 3.0, 9.0, 5.0, 10.0, 17.0, 22.0, 45.0, 40.0, 52.0, 93.0, 153.0, 243.0, 344.0, 570.0, 1019.0, 1755.0, 3206.0, 6234.0, 13189.0, 30150.0, 77326.0, 212385.0, 376333.0, 198360.0, 72801.0, 28520.0, 12586.0, 5895.0, 3054.0, 1616.0, 918.0, 563.0, 360.0, 207.0, 153.0, 90.0, 66.0, 49.0, 36.0, 26.0, 11.0, 14.0, 5.0, 10.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.4453125, -9.1630859375, -8.880859375, -8.5986328125, -8.31640625, -8.0341796875, -7.751953125, -7.4697265625, -7.1875, -6.9052734375, -6.623046875, -6.3408203125, -6.05859375, -5.7763671875, -5.494140625, -5.2119140625, -4.9296875, -4.6474609375, -4.365234375, -4.0830078125, -3.80078125, -3.5185546875, -3.236328125, -2.9541015625, -2.671875, -2.3896484375, -2.107421875, -1.8251953125, -1.54296875, -1.2607421875, -0.978515625, -0.6962890625, -0.4140625, -0.1318359375, 0.150390625, 0.4326171875, 0.71484375, 0.9970703125, 1.279296875, 1.5615234375, 1.84375, 2.1259765625, 2.408203125, 2.6904296875, 2.97265625, 3.2548828125, 3.537109375, 3.8193359375, 4.1015625, 4.3837890625, 4.666015625, 4.9482421875, 5.23046875, 5.5126953125, 5.794921875, 6.0771484375, 6.359375, 6.6416015625, 6.923828125, 7.2060546875, 7.48828125, 7.7705078125, 8.052734375, 8.3349609375, 8.6171875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 10.0, 5.0, 9.0, 19.0, 20.0, 31.0, 67.0, 71.0, 99.0, 122.0, 112.0, 114.0, 85.0, 65.0, 49.0, 34.0, 28.0, 13.0, 7.0, 11.0, 9.0, 3.0, 2.0, 1.0, 0.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0006365776062011719, -0.000620424747467041, -0.0006042718887329102, -0.0005881190299987793, -0.0005719661712646484, -0.0005558133125305176, -0.0005396604537963867, -0.0005235075950622559, -0.000507354736328125, -0.0004912018775939941, -0.0004750490188598633, -0.0004588961601257324, -0.00044274330139160156, -0.0004265904426574707, -0.00041043758392333984, -0.000394284725189209, -0.0003781318664550781, -0.00036197900772094727, -0.0003458261489868164, -0.00032967329025268555, -0.0003135204315185547, -0.00029736757278442383, -0.00028121471405029297, -0.0002650618553161621, -0.00024890899658203125, -0.0002327561378479004, -0.00021660327911376953, -0.00020045042037963867, -0.0001842975616455078, -0.00016814470291137695, -0.0001519918441772461, -0.00013583898544311523, -0.00011968612670898438, -0.00010353326797485352, -8.738040924072266e-05, -7.12275505065918e-05, -5.507469177246094e-05, -3.892183303833008e-05, -2.276897430419922e-05, -6.616115570068359e-06, 9.5367431640625e-06, 2.568960189819336e-05, 4.184246063232422e-05, 5.799531936645508e-05, 7.414817810058594e-05, 9.03010368347168e-05, 0.00010645389556884766, 0.00012260675430297852, 0.00013875961303710938, 0.00015491247177124023, 0.0001710653305053711, 0.00018721818923950195, 0.0002033710479736328, 0.00021952390670776367, 0.00023567676544189453, 0.0002518296241760254, 0.00026798248291015625, 0.0002841353416442871, 0.00030028820037841797, 0.00031644105911254883, 0.0003325939178466797, 0.00034874677658081055, 0.0003648996353149414, 0.00038105249404907227, 0.0003972053527832031]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 5.0, 18.0, 18.0, 21.0, 32.0, 52.0, 95.0, 91.0, 153.0, 237.0, 310.0, 475.0, 717.0, 1003.0, 1589.0, 2434.0, 3913.0, 6300.0, 10331.0, 18282.0, 32711.0, 59126.0, 103962.0, 163185.0, 200628.0, 174180.0, 114559.0, 66198.0, 36686.0, 20475.0, 11675.0, 6891.0, 4305.0, 2662.0, 1715.0, 1109.0, 768.0, 526.0, 366.0, 219.0, 170.0, 120.0, 80.0, 57.0, 37.0, 23.0, 15.0, 13.0, 7.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-5.22265625, -5.06243896484375, -4.9022216796875, -4.74200439453125, -4.581787109375, -4.42156982421875, -4.2613525390625, -4.10113525390625, -3.94091796875, -3.78070068359375, -3.6204833984375, -3.46026611328125, -3.300048828125, -3.13983154296875, -2.9796142578125, -2.81939697265625, -2.6591796875, -2.49896240234375, -2.3387451171875, -2.17852783203125, -2.018310546875, -1.85809326171875, -1.6978759765625, -1.53765869140625, -1.37744140625, -1.21722412109375, -1.0570068359375, -0.89678955078125, -0.736572265625, -0.57635498046875, -0.4161376953125, -0.25592041015625, -0.095703125, 0.06451416015625, 0.2247314453125, 0.38494873046875, 0.545166015625, 0.70538330078125, 0.8656005859375, 1.02581787109375, 1.18603515625, 1.34625244140625, 1.5064697265625, 1.66668701171875, 1.826904296875, 1.98712158203125, 2.1473388671875, 2.30755615234375, 2.4677734375, 2.62799072265625, 2.7882080078125, 2.94842529296875, 3.108642578125, 3.26885986328125, 3.4290771484375, 3.58929443359375, 3.74951171875, 3.90972900390625, 4.0699462890625, 4.23016357421875, 4.390380859375, 4.55059814453125, 4.7108154296875, 4.87103271484375, 5.03125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 7.0, 5.0, 4.0, 8.0, 6.0, 11.0, 15.0, 14.0, 19.0, 20.0, 37.0, 50.0, 57.0, 52.0, 56.0, 68.0, 86.0, 79.0, 67.0, 56.0, 63.0, 44.0, 40.0, 42.0, 30.0, 19.0, 14.0, 9.0, 8.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8837890625, -1.8101654052734375, -1.736541748046875, -1.6629180908203125, -1.58929443359375, -1.5156707763671875, -1.442047119140625, -1.3684234619140625, -1.2947998046875, -1.2211761474609375, -1.147552490234375, -1.0739288330078125, -1.00030517578125, -0.9266815185546875, -0.853057861328125, -0.7794342041015625, -0.705810546875, -0.6321868896484375, -0.558563232421875, -0.4849395751953125, -0.41131591796875, -0.3376922607421875, -0.264068603515625, -0.1904449462890625, -0.1168212890625, -0.0431976318359375, 0.030426025390625, 0.1040496826171875, 0.17767333984375, 0.2512969970703125, 0.324920654296875, 0.3985443115234375, 0.47216796875, 0.5457916259765625, 0.619415283203125, 0.6930389404296875, 0.76666259765625, 0.8402862548828125, 0.913909912109375, 0.9875335693359375, 1.0611572265625, 1.1347808837890625, 1.208404541015625, 1.2820281982421875, 1.35565185546875, 1.4292755126953125, 1.502899169921875, 1.5765228271484375, 1.650146484375, 1.7237701416015625, 1.797393798828125, 1.8710174560546875, 1.94464111328125, 2.0182647705078125, 2.091888427734375, 2.1655120849609375, 2.2391357421875, 2.3127593994140625, 2.386383056640625, 2.4600067138671875, 2.53363037109375, 2.6072540283203125, 2.680877685546875, 2.7545013427734375, 2.828125]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 3.0, 9.0, 3.0, 6.0, 6.0, 16.0, 11.0, 18.0, 15.0, 22.0, 24.0, 35.0, 32.0, 40.0, 45.0, 41.0, 57.0, 47.0, 58.0, 63.0, 47.0, 62.0, 48.0, 39.0, 40.0, 38.0, 35.0, 38.0, 16.0, 15.0, 13.0, 12.0, 10.0, 10.0, 11.0, 3.0, 1.0, 4.0, 7.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.010624885559082, -8.702438354492188, -8.394251823425293, -8.086066246032715, -7.77787971496582, -7.469693183898926, -7.161506652832031, -6.853320121765137, -6.5451340675354, -6.236947536468506, -5.9287614822387695, -5.620574951171875, -5.3123884201049805, -5.004202365875244, -4.69601583480835, -4.387829780578613, -4.079643249511719, -3.7714569568634033, -3.463270664215088, -3.1550841331481934, -2.846897840499878, -2.5387115478515625, -2.230525016784668, -1.9223387241363525, -1.614152431488037, -1.3059661388397217, -0.9977797269821167, -0.6895933747291565, -0.3814070224761963, -0.07322072982788086, 0.23496568202972412, 0.5431520938873291, 0.8513393402099609, 1.1595256328582764, 1.4677120447158813, 1.7758984565734863, 2.0840847492218018, 2.392271041870117, 2.7004575729370117, 3.008643865585327, 3.3168301582336426, 3.625016450881958, 3.9332027435302734, 4.241389274597168, 4.5495758056640625, 4.857761859893799, 5.165948390960693, 5.47413444519043, 5.782320976257324, 6.090507507324219, 6.398693561553955, 6.70688009262085, 7.015066146850586, 7.3232526779174805, 7.631439208984375, 7.9396257400512695, 8.247812271118164, 8.555998802185059, 8.864185333251953, 9.172370910644531, 9.480557441711426, 9.78874397277832, 10.096930503845215, 10.40511703491211, 10.713302612304688]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 2.0, 10.0, 9.0, 13.0, 9.0, 12.0, 25.0, 15.0, 14.0, 15.0, 29.0, 40.0, 29.0, 36.0, 29.0, 29.0, 44.0, 35.0, 45.0, 33.0, 37.0, 40.0, 39.0, 42.0, 42.0, 37.0, 33.0, 26.0, 24.0, 24.0, 29.0, 26.0, 24.0, 13.0, 17.0, 16.0, 17.0, 5.0, 2.0, 8.0, 8.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-8.665674209594727, -8.413859367370605, -8.162044525146484, -7.910229206085205, -7.658413887023926, -7.406599044799805, -7.154784202575684, -6.9029693603515625, -6.651154041290283, -6.399339199066162, -6.147523880004883, -5.895709037780762, -5.643894195556641, -5.392078876495361, -5.14026403427124, -4.888448715209961, -4.63663387298584, -4.384819030761719, -4.1330037117004395, -3.8811888694763184, -3.629373788833618, -3.377558708190918, -3.125743865966797, -2.8739287853240967, -2.6221137046813965, -2.3702986240386963, -2.118483543395996, -1.866668701171875, -1.6148536205291748, -1.3630385398864746, -1.111223578453064, -0.8594086170196533, -0.6075940132141113, -0.3557789921760559, -0.10396397113800049, 0.14785104990005493, 0.39966607093811035, 0.6514811515808105, 0.9032961130142212, 1.1551110744476318, 1.406926155090332, 1.6587412357330322, 1.9105561971664429, 2.1623711585998535, 2.4141862392425537, 2.666001319885254, 2.917816162109375, 3.169631242752075, 3.4214463233947754, 3.6732614040374756, 3.925076484680176, 4.176891326904297, 4.428706169128418, 4.680521488189697, 4.932336330413818, 5.184151649475098, 5.435966491699219, 5.68778133392334, 5.939596652984619, 6.19141149520874, 6.4432268142700195, 6.695041656494141, 6.946856498718262, 7.198671340942383, 7.450486660003662]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 6.0, 9.0, 12.0, 18.0, 30.0, 39.0, 52.0, 73.0, 109.0, 176.0, 281.0, 443.0, 720.0, 1193.0, 1974.0, 3288.0, 5630.0, 9326.0, 15531.0, 26110.0, 42995.0, 67321.0, 101188.0, 135950.0, 154823.0, 147126.0, 117176.0, 82002.0, 53437.0, 32730.0, 19465.0, 11689.0, 6887.0, 4174.0, 2515.0, 1536.0, 922.0, 578.0, 351.0, 207.0, 166.0, 89.0, 63.0, 42.0, 30.0, 23.0, 12.0, 12.0, 11.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0], "bins": [-9.3515625, -9.0657958984375, -8.780029296875, -8.4942626953125, -8.20849609375, -7.9227294921875, -7.636962890625, -7.3511962890625, -7.0654296875, -6.7796630859375, -6.493896484375, -6.2081298828125, -5.92236328125, -5.6365966796875, -5.350830078125, -5.0650634765625, -4.779296875, -4.4935302734375, -4.207763671875, -3.9219970703125, -3.63623046875, -3.3504638671875, -3.064697265625, -2.7789306640625, -2.4931640625, -2.2073974609375, -1.921630859375, -1.6358642578125, -1.35009765625, -1.0643310546875, -0.778564453125, -0.4927978515625, -0.20703125, 0.0787353515625, 0.364501953125, 0.6502685546875, 0.93603515625, 1.2218017578125, 1.507568359375, 1.7933349609375, 2.0791015625, 2.3648681640625, 2.650634765625, 2.9364013671875, 3.22216796875, 3.5079345703125, 3.793701171875, 4.0794677734375, 4.365234375, 4.6510009765625, 4.936767578125, 5.2225341796875, 5.50830078125, 5.7940673828125, 6.079833984375, 6.3656005859375, 6.6513671875, 6.9371337890625, 7.222900390625, 7.5086669921875, 7.79443359375, 8.0802001953125, 8.365966796875, 8.6517333984375, 8.9375]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 0.0, 2.0, 4.0, 8.0, 4.0, 8.0, 2.0, 10.0, 9.0, 9.0, 13.0, 14.0, 14.0, 18.0, 17.0, 18.0, 27.0, 30.0, 25.0, 35.0, 29.0, 33.0, 31.0, 31.0, 35.0, 38.0, 41.0, 36.0, 35.0, 35.0, 30.0, 29.0, 33.0, 21.0, 30.0, 25.0, 23.0, 35.0, 14.0, 20.0, 24.0, 12.0, 14.0, 22.0, 10.0, 15.0, 7.0, 6.0, 10.0, 4.0, 4.0, 2.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.87890625, -6.653564453125, -6.42822265625, -6.202880859375, -5.9775390625, -5.752197265625, -5.52685546875, -5.301513671875, -5.076171875, -4.850830078125, -4.62548828125, -4.400146484375, -4.1748046875, -3.949462890625, -3.72412109375, -3.498779296875, -3.2734375, -3.048095703125, -2.82275390625, -2.597412109375, -2.3720703125, -2.146728515625, -1.92138671875, -1.696044921875, -1.470703125, -1.245361328125, -1.02001953125, -0.794677734375, -0.5693359375, -0.343994140625, -0.11865234375, 0.106689453125, 0.33203125, 0.557373046875, 0.78271484375, 1.008056640625, 1.2333984375, 1.458740234375, 1.68408203125, 1.909423828125, 2.134765625, 2.360107421875, 2.58544921875, 2.810791015625, 3.0361328125, 3.261474609375, 3.48681640625, 3.712158203125, 3.9375, 4.162841796875, 4.38818359375, 4.613525390625, 4.8388671875, 5.064208984375, 5.28955078125, 5.514892578125, 5.740234375, 5.965576171875, 6.19091796875, 6.416259765625, 6.6416015625, 6.866943359375, 7.09228515625, 7.317626953125, 7.54296875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 6.0, 5.0, 8.0, 11.0, 22.0, 27.0, 33.0, 54.0, 91.0, 119.0, 214.0, 286.0, 446.0, 687.0, 1030.0, 1700.0, 2657.0, 3910.0, 5970.0, 9360.0, 14171.0, 21582.0, 32463.0, 47757.0, 68149.0, 91514.0, 113580.0, 127454.0, 125147.0, 108459.0, 83984.0, 61314.0, 42701.0, 28864.0, 19078.0, 12480.0, 8138.0, 5150.0, 3551.0, 2257.0, 1422.0, 968.0, 596.0, 374.0, 264.0, 170.0, 130.0, 75.0, 44.0, 35.0, 23.0, 16.0, 6.0, 4.0, 2.0, 7.0, 3.0, 1.0], "bins": [-7.15234375, -6.9410400390625, -6.729736328125, -6.5184326171875, -6.30712890625, -6.0958251953125, -5.884521484375, -5.6732177734375, -5.4619140625, -5.2506103515625, -5.039306640625, -4.8280029296875, -4.61669921875, -4.4053955078125, -4.194091796875, -3.9827880859375, -3.771484375, -3.5601806640625, -3.348876953125, -3.1375732421875, -2.92626953125, -2.7149658203125, -2.503662109375, -2.2923583984375, -2.0810546875, -1.8697509765625, -1.658447265625, -1.4471435546875, -1.23583984375, -1.0245361328125, -0.813232421875, -0.6019287109375, -0.390625, -0.1793212890625, 0.031982421875, 0.2432861328125, 0.45458984375, 0.6658935546875, 0.877197265625, 1.0885009765625, 1.2998046875, 1.5111083984375, 1.722412109375, 1.9337158203125, 2.14501953125, 2.3563232421875, 2.567626953125, 2.7789306640625, 2.990234375, 3.2015380859375, 3.412841796875, 3.6241455078125, 3.83544921875, 4.0467529296875, 4.258056640625, 4.4693603515625, 4.6806640625, 4.8919677734375, 5.103271484375, 5.3145751953125, 5.52587890625, 5.7371826171875, 5.948486328125, 6.1597900390625, 6.37109375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 6.0, 7.0, 3.0, 10.0, 11.0, 17.0, 25.0, 24.0, 33.0, 26.0, 43.0, 35.0, 40.0, 28.0, 47.0, 41.0, 51.0, 44.0, 38.0, 48.0, 48.0, 38.0, 51.0, 32.0, 35.0, 39.0, 32.0, 31.0, 18.0, 19.0, 20.0, 14.0, 7.0, 8.0, 7.0, 2.0, 9.0, 2.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5546875, -5.36761474609375, -5.1805419921875, -4.99346923828125, -4.806396484375, -4.61932373046875, -4.4322509765625, -4.24517822265625, -4.05810546875, -3.87103271484375, -3.6839599609375, -3.49688720703125, -3.309814453125, -3.12274169921875, -2.9356689453125, -2.74859619140625, -2.5615234375, -2.37445068359375, -2.1873779296875, -2.00030517578125, -1.813232421875, -1.62615966796875, -1.4390869140625, -1.25201416015625, -1.06494140625, -0.87786865234375, -0.6907958984375, -0.50372314453125, -0.316650390625, -0.12957763671875, 0.0574951171875, 0.24456787109375, 0.431640625, 0.61871337890625, 0.8057861328125, 0.99285888671875, 1.179931640625, 1.36700439453125, 1.5540771484375, 1.74114990234375, 1.92822265625, 2.11529541015625, 2.3023681640625, 2.48944091796875, 2.676513671875, 2.86358642578125, 3.0506591796875, 3.23773193359375, 3.4248046875, 3.61187744140625, 3.7989501953125, 3.98602294921875, 4.173095703125, 4.36016845703125, 4.5472412109375, 4.73431396484375, 4.92138671875, 5.10845947265625, 5.2955322265625, 5.48260498046875, 5.669677734375, 5.85675048828125, 6.0438232421875, 6.23089599609375, 6.41796875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 8.0, 11.0, 16.0, 20.0, 37.0, 44.0, 73.0, 101.0, 158.0, 257.0, 401.0, 602.0, 1000.0, 1670.0, 2692.0, 4770.0, 8815.0, 16704.0, 34548.0, 74534.0, 155945.0, 256776.0, 236743.0, 130563.0, 61501.0, 28654.0, 13913.0, 7541.0, 4065.0, 2393.0, 1515.0, 911.0, 559.0, 319.0, 252.0, 164.0, 90.0, 58.0, 42.0, 23.0, 18.0, 14.0, 5.0, 10.0, 5.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5625, -8.27587890625, -7.9892578125, -7.70263671875, -7.416015625, -7.12939453125, -6.8427734375, -6.55615234375, -6.26953125, -5.98291015625, -5.6962890625, -5.40966796875, -5.123046875, -4.83642578125, -4.5498046875, -4.26318359375, -3.9765625, -3.68994140625, -3.4033203125, -3.11669921875, -2.830078125, -2.54345703125, -2.2568359375, -1.97021484375, -1.68359375, -1.39697265625, -1.1103515625, -0.82373046875, -0.537109375, -0.25048828125, 0.0361328125, 0.32275390625, 0.609375, 0.89599609375, 1.1826171875, 1.46923828125, 1.755859375, 2.04248046875, 2.3291015625, 2.61572265625, 2.90234375, 3.18896484375, 3.4755859375, 3.76220703125, 4.048828125, 4.33544921875, 4.6220703125, 4.90869140625, 5.1953125, 5.48193359375, 5.7685546875, 6.05517578125, 6.341796875, 6.62841796875, 6.9150390625, 7.20166015625, 7.48828125, 7.77490234375, 8.0615234375, 8.34814453125, 8.634765625, 8.92138671875, 9.2080078125, 9.49462890625, 9.78125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 10.0, 17.0, 13.0, 19.0, 21.0, 33.0, 61.0, 68.0, 91.0, 102.0, 120.0, 95.0, 97.0, 57.0, 48.0, 40.0, 32.0, 18.0, 22.0, 10.0, 10.0, 8.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0012416839599609375, -0.0012094229459762573, -0.0011771619319915771, -0.001144900918006897, -0.0011126399040222168, -0.0010803788900375366, -0.0010481178760528564, -0.0010158568620681763, -0.000983595848083496, -0.0009513348340988159, -0.0009190738201141357, -0.0008868128061294556, -0.0008545517921447754, -0.0008222907781600952, -0.000790029764175415, -0.0007577687501907349, -0.0007255077362060547, -0.0006932467222213745, -0.0006609857082366943, -0.0006287246942520142, -0.000596463680267334, -0.0005642026662826538, -0.0005319416522979736, -0.0004996806383132935, -0.0004674196243286133, -0.0004351586103439331, -0.00040289759635925293, -0.00037063658237457275, -0.0003383755683898926, -0.0003061145544052124, -0.0002738535404205322, -0.00024159252643585205, -0.00020933151245117188, -0.0001770704984664917, -0.00014480948448181152, -0.00011254847049713135, -8.028745651245117e-05, -4.8026442527770996e-05, -1.576542854309082e-05, 1.6495585441589355e-05, 4.875659942626953e-05, 8.101761341094971e-05, 0.00011327862739562988, 0.00014553964138031006, 0.00017780065536499023, 0.0002100616693496704, 0.00024232268333435059, 0.00027458369731903076, 0.00030684471130371094, 0.0003391057252883911, 0.0003713667392730713, 0.00040362775325775146, 0.00043588876724243164, 0.0004681497812271118, 0.000500410795211792, 0.0005326718091964722, 0.0005649328231811523, 0.0005971938371658325, 0.0006294548511505127, 0.0006617158651351929, 0.000693976879119873, 0.0007262378931045532, 0.0007584989070892334, 0.0007907599210739136, 0.0008230209350585938]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 2.0, 12.0, 20.0, 13.0, 27.0, 39.0, 64.0, 57.0, 111.0, 189.0, 245.0, 391.0, 569.0, 1039.0, 1679.0, 2733.0, 4863.0, 8579.0, 15785.0, 30056.0, 58159.0, 108594.0, 176748.0, 215984.0, 180739.0, 112454.0, 60435.0, 31173.0, 16351.0, 8855.0, 5034.0, 2922.0, 1713.0, 1002.0, 666.0, 417.0, 266.0, 178.0, 119.0, 88.0, 63.0, 38.0, 22.0, 14.0, 13.0, 8.0, 10.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.41015625, -6.2001953125, -5.990234375, -5.7802734375, -5.5703125, -5.3603515625, -5.150390625, -4.9404296875, -4.73046875, -4.5205078125, -4.310546875, -4.1005859375, -3.890625, -3.6806640625, -3.470703125, -3.2607421875, -3.05078125, -2.8408203125, -2.630859375, -2.4208984375, -2.2109375, -2.0009765625, -1.791015625, -1.5810546875, -1.37109375, -1.1611328125, -0.951171875, -0.7412109375, -0.53125, -0.3212890625, -0.111328125, 0.0986328125, 0.30859375, 0.5185546875, 0.728515625, 0.9384765625, 1.1484375, 1.3583984375, 1.568359375, 1.7783203125, 1.98828125, 2.1982421875, 2.408203125, 2.6181640625, 2.828125, 3.0380859375, 3.248046875, 3.4580078125, 3.66796875, 3.8779296875, 4.087890625, 4.2978515625, 4.5078125, 4.7177734375, 4.927734375, 5.1376953125, 5.34765625, 5.5576171875, 5.767578125, 5.9775390625, 6.1875, 6.3974609375, 6.607421875, 6.8173828125, 7.02734375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 6.0, 11.0, 5.0, 11.0, 4.0, 15.0, 26.0, 22.0, 37.0, 45.0, 59.0, 64.0, 74.0, 76.0, 75.0, 84.0, 58.0, 63.0, 57.0, 44.0, 46.0, 26.0, 31.0, 12.0, 11.0, 8.0, 4.0, 9.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.30859375, -3.215850830078125, -3.12310791015625, -3.030364990234375, -2.9376220703125, -2.844879150390625, -2.75213623046875, -2.659393310546875, -2.566650390625, -2.473907470703125, -2.38116455078125, -2.288421630859375, -2.1956787109375, -2.102935791015625, -2.01019287109375, -1.917449951171875, -1.82470703125, -1.731964111328125, -1.63922119140625, -1.546478271484375, -1.4537353515625, -1.360992431640625, -1.26824951171875, -1.175506591796875, -1.082763671875, -0.990020751953125, -0.89727783203125, -0.804534912109375, -0.7117919921875, -0.619049072265625, -0.52630615234375, -0.433563232421875, -0.3408203125, -0.248077392578125, -0.15533447265625, -0.062591552734375, 0.0301513671875, 0.122894287109375, 0.21563720703125, 0.308380126953125, 0.401123046875, 0.493865966796875, 0.58660888671875, 0.679351806640625, 0.7720947265625, 0.864837646484375, 0.95758056640625, 1.050323486328125, 1.14306640625, 1.235809326171875, 1.32855224609375, 1.421295166015625, 1.5140380859375, 1.606781005859375, 1.69952392578125, 1.792266845703125, 1.885009765625, 1.977752685546875, 2.07049560546875, 2.163238525390625, 2.2559814453125, 2.348724365234375, 2.44146728515625, 2.534210205078125, 2.626953125]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 3.0, 8.0, 6.0, 11.0, 10.0, 22.0, 23.0, 18.0, 29.0, 25.0, 32.0, 39.0, 43.0, 51.0, 49.0, 55.0, 59.0, 50.0, 65.0, 62.0, 53.0, 37.0, 38.0, 41.0, 45.0, 25.0, 28.0, 19.0, 12.0, 9.0, 9.0, 4.0, 4.0, 2.0, 3.0, 7.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.412333488464355, -8.092952728271484, -7.773571968078613, -7.454191207885742, -7.134810447692871, -6.8154296875, -6.496048450469971, -6.1766676902771, -5.8572869300842285, -5.537906169891357, -5.218525409698486, -4.899144649505615, -4.579763412475586, -4.260382652282715, -3.9410018920898438, -3.6216211318969727, -3.3022403717041016, -2.9828596115112305, -2.6634788513183594, -2.344097852706909, -2.024717092514038, -1.705336332321167, -1.3859554529190063, -1.0665745735168457, -0.7471938133239746, -0.42781299352645874, -0.10843217372894287, 0.210948646068573, 0.5303294658660889, 0.84971022605896, 1.1690911054611206, 1.4884719848632812, 1.8078536987304688, 2.12723445892334, 2.446615219116211, 2.765996217727661, 3.0853769779205322, 3.4047577381134033, 3.7241387367248535, 4.043519496917725, 4.362900257110596, 4.682281017303467, 5.001661777496338, 5.321042537689209, 5.640423774719238, 5.959804534912109, 6.2791852951049805, 6.598566055297852, 6.917946815490723, 7.237327575683594, 7.556708335876465, 7.876089096069336, 8.195469856262207, 8.514850616455078, 8.83423137664795, 9.15361213684082, 9.472993850708008, 9.792374610900879, 10.11175537109375, 10.431136131286621, 10.750516891479492, 11.069897651672363, 11.389278411865234, 11.708660125732422, 12.028039932250977]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 4.0, 8.0, 9.0, 15.0, 12.0, 18.0, 17.0, 14.0, 23.0, 24.0, 27.0, 29.0, 33.0, 28.0, 37.0, 31.0, 44.0, 37.0, 48.0, 46.0, 46.0, 44.0, 40.0, 41.0, 29.0, 26.0, 38.0, 35.0, 28.0, 22.0, 16.0, 21.0, 19.0, 18.0, 13.0, 14.0, 8.0, 9.0, 8.0, 7.0, 1.0, 6.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0], "bins": [-9.691641807556152, -9.422221183776855, -9.152799606323242, -8.883378982543945, -8.613957405090332, -8.344536781311035, -8.075115203857422, -7.805694580078125, -7.536273002624512, -7.266851902008057, -6.997430801391602, -6.7280097007751465, -6.458588600158691, -6.189167499542236, -5.919746398925781, -5.650325775146484, -5.380904674530029, -5.111483573913574, -4.842062473297119, -4.572641372680664, -4.303220272064209, -4.033799171447754, -3.764378309249878, -3.494957208633423, -3.2255361080169678, -2.9561150074005127, -2.6866939067840576, -2.4172730445861816, -2.1478519439697266, -1.878430724143982, -1.6090097427368164, -1.3395886421203613, -1.070167064666748, -0.800745964050293, -0.5313249230384827, -0.26190388202667236, 0.007517218589782715, 0.2769383192062378, 0.5463593006134033, 0.8157804012298584, 1.0852015018463135, 1.3546226024627686, 1.6240437030792236, 1.8934646844863892, 2.1628856658935547, 2.4323067665100098, 2.701727867126465, 2.97114896774292, 3.240570068359375, 3.50999116897583, 3.779412269592285, 4.04883337020874, 4.318254470825195, 4.58767557144165, 4.8570966720581055, 5.126517295837402, 5.395938873291016, 5.665359973907471, 5.934781074523926, 6.204202175140381, 6.473623275756836, 6.743044376373291, 7.012465476989746, 7.281886100769043, 7.551307201385498]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 5.0, 6.0, 8.0, 9.0, 15.0, 33.0, 52.0, 63.0, 79.0, 131.0, 198.0, 262.0, 400.0, 555.0, 882.0, 1403.0, 2204.0, 3425.0, 5551.0, 9113.0, 15598.0, 26807.0, 49146.0, 94682.0, 197171.0, 430146.0, 815170.0, 1029720.0, 755643.0, 379749.0, 175733.0, 86202.0, 46235.0, 26099.0, 15258.0, 9420.0, 5809.0, 3765.0, 2476.0, 1637.0, 1087.0, 742.0, 500.0, 344.0, 231.0, 162.0, 123.0, 72.0, 61.0, 38.0, 31.0, 14.0, 8.0, 8.0, 4.0, 4.0, 3.0, 2.0], "bins": [-8.734375, -8.47314453125, -8.2119140625, -7.95068359375, -7.689453125, -7.42822265625, -7.1669921875, -6.90576171875, -6.64453125, -6.38330078125, -6.1220703125, -5.86083984375, -5.599609375, -5.33837890625, -5.0771484375, -4.81591796875, -4.5546875, -4.29345703125, -4.0322265625, -3.77099609375, -3.509765625, -3.24853515625, -2.9873046875, -2.72607421875, -2.46484375, -2.20361328125, -1.9423828125, -1.68115234375, -1.419921875, -1.15869140625, -0.8974609375, -0.63623046875, -0.375, -0.11376953125, 0.1474609375, 0.40869140625, 0.669921875, 0.93115234375, 1.1923828125, 1.45361328125, 1.71484375, 1.97607421875, 2.2373046875, 2.49853515625, 2.759765625, 3.02099609375, 3.2822265625, 3.54345703125, 3.8046875, 4.06591796875, 4.3271484375, 4.58837890625, 4.849609375, 5.11083984375, 5.3720703125, 5.63330078125, 5.89453125, 6.15576171875, 6.4169921875, 6.67822265625, 6.939453125, 7.20068359375, 7.4619140625, 7.72314453125, 7.984375]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 4.0, 8.0, 13.0, 9.0, 18.0, 15.0, 21.0, 11.0, 24.0, 31.0, 23.0, 34.0, 32.0, 31.0, 36.0, 36.0, 50.0, 43.0, 48.0, 49.0, 39.0, 34.0, 29.0, 37.0, 46.0, 24.0, 24.0, 32.0, 19.0, 27.0, 22.0, 19.0, 23.0, 11.0, 14.0, 10.0, 13.0, 10.0, 4.0, 7.0, 9.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.921875, -5.73876953125, -5.5556640625, -5.37255859375, -5.189453125, -5.00634765625, -4.8232421875, -4.64013671875, -4.45703125, -4.27392578125, -4.0908203125, -3.90771484375, -3.724609375, -3.54150390625, -3.3583984375, -3.17529296875, -2.9921875, -2.80908203125, -2.6259765625, -2.44287109375, -2.259765625, -2.07666015625, -1.8935546875, -1.71044921875, -1.52734375, -1.34423828125, -1.1611328125, -0.97802734375, -0.794921875, -0.61181640625, -0.4287109375, -0.24560546875, -0.0625, 0.12060546875, 0.3037109375, 0.48681640625, 0.669921875, 0.85302734375, 1.0361328125, 1.21923828125, 1.40234375, 1.58544921875, 1.7685546875, 1.95166015625, 2.134765625, 2.31787109375, 2.5009765625, 2.68408203125, 2.8671875, 3.05029296875, 3.2333984375, 3.41650390625, 3.599609375, 3.78271484375, 3.9658203125, 4.14892578125, 4.33203125, 4.51513671875, 4.6982421875, 4.88134765625, 5.064453125, 5.24755859375, 5.4306640625, 5.61376953125, 5.796875]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 8.0, 14.0, 15.0, 21.0, 33.0, 63.0, 82.0, 127.0, 185.0, 312.0, 511.0, 829.0, 1396.0, 2371.0, 3907.0, 6757.0, 11809.0, 20883.0, 38197.0, 72521.0, 141952.0, 290136.0, 587033.0, 997201.0, 947898.0, 531914.0, 262511.0, 129056.0, 65925.0, 34974.0, 19134.0, 10830.0, 6366.0, 3777.0, 2185.0, 1289.0, 790.0, 483.0, 303.0, 188.0, 125.0, 61.0, 41.0, 31.0, 20.0, 8.0, 5.0, 5.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.5234375, -8.2386474609375, -7.953857421875, -7.6690673828125, -7.38427734375, -7.0994873046875, -6.814697265625, -6.5299072265625, -6.2451171875, -5.9603271484375, -5.675537109375, -5.3907470703125, -5.10595703125, -4.8211669921875, -4.536376953125, -4.2515869140625, -3.966796875, -3.6820068359375, -3.397216796875, -3.1124267578125, -2.82763671875, -2.5428466796875, -2.258056640625, -1.9732666015625, -1.6884765625, -1.4036865234375, -1.118896484375, -0.8341064453125, -0.54931640625, -0.2645263671875, 0.020263671875, 0.3050537109375, 0.58984375, 0.8746337890625, 1.159423828125, 1.4442138671875, 1.72900390625, 2.0137939453125, 2.298583984375, 2.5833740234375, 2.8681640625, 3.1529541015625, 3.437744140625, 3.7225341796875, 4.00732421875, 4.2921142578125, 4.576904296875, 4.8616943359375, 5.146484375, 5.4312744140625, 5.716064453125, 6.0008544921875, 6.28564453125, 6.5704345703125, 6.855224609375, 7.1400146484375, 7.4248046875, 7.7095947265625, 7.994384765625, 8.2791748046875, 8.56396484375, 8.8487548828125, 9.133544921875, 9.4183349609375, 9.703125]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 4.0, 6.0, 4.0, 11.0, 18.0, 18.0, 32.0, 38.0, 24.0, 41.0, 61.0, 82.0, 84.0, 123.0, 164.0, 165.0, 186.0, 241.0, 327.0, 291.0, 299.0, 310.0, 248.0, 247.0, 197.0, 170.0, 152.0, 96.0, 81.0, 82.0, 47.0, 57.0, 41.0, 18.0, 30.0, 21.0, 17.0, 12.0, 10.0, 5.0, 6.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.306640625, -3.20794677734375, -3.1092529296875, -3.01055908203125, -2.911865234375, -2.81317138671875, -2.7144775390625, -2.61578369140625, -2.51708984375, -2.41839599609375, -2.3197021484375, -2.22100830078125, -2.122314453125, -2.02362060546875, -1.9249267578125, -1.82623291015625, -1.7275390625, -1.62884521484375, -1.5301513671875, -1.43145751953125, -1.332763671875, -1.23406982421875, -1.1353759765625, -1.03668212890625, -0.93798828125, -0.83929443359375, -0.7406005859375, -0.64190673828125, -0.543212890625, -0.44451904296875, -0.3458251953125, -0.24713134765625, -0.1484375, -0.04974365234375, 0.0489501953125, 0.14764404296875, 0.246337890625, 0.34503173828125, 0.4437255859375, 0.54241943359375, 0.64111328125, 0.73980712890625, 0.8385009765625, 0.93719482421875, 1.035888671875, 1.13458251953125, 1.2332763671875, 1.33197021484375, 1.4306640625, 1.52935791015625, 1.6280517578125, 1.72674560546875, 1.825439453125, 1.92413330078125, 2.0228271484375, 2.12152099609375, 2.22021484375, 2.31890869140625, 2.4176025390625, 2.51629638671875, 2.614990234375, 2.71368408203125, 2.8123779296875, 2.91107177734375, 3.009765625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 6.0, 6.0, 6.0, 7.0, 9.0, 11.0, 14.0, 20.0, 30.0, 21.0, 25.0, 46.0, 42.0, 65.0, 60.0, 48.0, 58.0, 49.0, 68.0, 49.0, 42.0, 46.0, 53.0, 45.0, 23.0, 32.0, 20.0, 18.0, 12.0, 17.0, 11.0, 6.0, 7.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.733976364135742, -7.454599380493164, -7.175222873687744, -6.895845890045166, -6.616469383239746, -6.337092399597168, -6.05771541595459, -5.778338432312012, -5.498961925506592, -5.219584941864014, -4.940208435058594, -4.660831451416016, -4.3814544677734375, -4.102077960968018, -3.8227009773254395, -3.5433242321014404, -3.2639474868774414, -2.9845707416534424, -2.7051939964294434, -2.4258170127868652, -2.146440267562866, -1.8670635223388672, -1.5876866579055786, -1.30830979347229, -1.028933048248291, -0.7495562434196472, -0.4701794385910034, -0.19080263376235962, 0.08857417106628418, 0.3679509162902832, 0.6473277807235718, 0.9267046451568604, 1.2060813903808594, 1.4854581356048584, 1.764835000038147, 2.0442118644714355, 2.3235886096954346, 2.6029653549194336, 2.8823423385620117, 3.1617190837860107, 3.4410958290100098, 3.720472574234009, 3.999849319458008, 4.279226303100586, 4.558603286743164, 4.837979793548584, 5.117356777191162, 5.396733283996582, 5.67611026763916, 5.955487251281738, 6.234863758087158, 6.514240741729736, 6.793617248535156, 7.072994232177734, 7.3523712158203125, 7.631748199462891, 7.9111247062683105, 8.19050121307373, 8.469878196716309, 8.749255180358887, 9.028632164001465, 9.308008193969727, 9.587385177612305, 9.866762161254883, 10.146139144897461]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 9.0, 11.0, 8.0, 4.0, 11.0, 10.0, 16.0, 30.0, 21.0, 25.0, 26.0, 42.0, 31.0, 33.0, 30.0, 33.0, 41.0, 44.0, 50.0, 41.0, 24.0, 42.0, 40.0, 40.0, 39.0, 37.0, 36.0, 36.0, 27.0, 17.0, 20.0, 20.0, 14.0, 14.0, 19.0, 12.0, 6.0, 4.0, 9.0, 8.0, 2.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.681656837463379, -7.452150821685791, -7.222645282745361, -6.993139266967773, -6.7636332511901855, -6.534127235412598, -6.304621696472168, -6.07511568069458, -5.845609664916992, -5.616103649139404, -5.386598110198975, -5.157092094421387, -4.927586078643799, -4.698080062866211, -4.468574523925781, -4.239068508148193, -4.0095624923706055, -3.7800567150115967, -3.550550699234009, -3.321044921875, -3.091538906097412, -2.8620331287384033, -2.6325273513793945, -2.4030213356018066, -2.173515796661377, -1.9440099000930786, -1.7145040035247803, -1.4849982261657715, -1.2554922103881836, -1.0259864330291748, -0.7964805364608765, -0.5669746398925781, -0.33746862411499023, -0.10796274244785309, 0.12154313921928406, 0.35104900598526, 0.5805549025535583, 0.8100607395172119, 1.0395666360855103, 1.2690725326538086, 1.498578429222107, 1.7280843257904053, 1.9575902223587036, 2.187096118927002, 2.4166018962860107, 2.6461076736450195, 2.8756136894226074, 3.1051197052001953, 3.334625482559204, 3.564131259918213, 3.793637275695801, 4.023143291473389, 4.252648830413818, 4.482154846191406, 4.711660861968994, 4.941166877746582, 5.170672416687012, 5.4001784324646, 5.629683971405029, 5.859189987182617, 6.088696002960205, 6.318202018737793, 6.547707557678223, 6.7772135734558105, 7.006719589233398]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 5.0, 18.0, 13.0, 29.0, 27.0, 52.0, 72.0, 129.0, 201.0, 283.0, 435.0, 690.0, 1049.0, 1664.0, 2794.0, 4524.0, 7591.0, 12918.0, 22226.0, 38997.0, 66864.0, 109370.0, 163683.0, 191177.0, 160623.0, 108132.0, 64615.0, 37503.0, 21291.0, 12594.0, 7442.0, 4495.0, 2512.0, 1669.0, 1062.0, 626.0, 404.0, 273.0, 165.0, 108.0, 75.0, 46.0, 38.0, 23.0, 13.0, 11.0, 10.0, 6.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.4140625, -7.18572998046875, -6.9573974609375, -6.72906494140625, -6.500732421875, -6.27239990234375, -6.0440673828125, -5.81573486328125, -5.58740234375, -5.35906982421875, -5.1307373046875, -4.90240478515625, -4.674072265625, -4.44573974609375, -4.2174072265625, -3.98907470703125, -3.7607421875, -3.53240966796875, -3.3040771484375, -3.07574462890625, -2.847412109375, -2.61907958984375, -2.3907470703125, -2.16241455078125, -1.93408203125, -1.70574951171875, -1.4774169921875, -1.24908447265625, -1.020751953125, -0.79241943359375, -0.5640869140625, -0.33575439453125, -0.107421875, 0.12091064453125, 0.3492431640625, 0.57757568359375, 0.805908203125, 1.03424072265625, 1.2625732421875, 1.49090576171875, 1.71923828125, 1.94757080078125, 2.1759033203125, 2.40423583984375, 2.632568359375, 2.86090087890625, 3.0892333984375, 3.31756591796875, 3.5458984375, 3.77423095703125, 4.0025634765625, 4.23089599609375, 4.459228515625, 4.68756103515625, 4.9158935546875, 5.14422607421875, 5.37255859375, 5.60089111328125, 5.8292236328125, 6.05755615234375, 6.285888671875, 6.51422119140625, 6.7425537109375, 6.97088623046875, 7.19921875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 9.0, 5.0, 9.0, 10.0, 9.0, 13.0, 22.0, 24.0, 23.0, 16.0, 25.0, 32.0, 36.0, 48.0, 29.0, 29.0, 44.0, 49.0, 46.0, 52.0, 36.0, 49.0, 36.0, 41.0, 35.0, 35.0, 37.0, 25.0, 33.0, 16.0, 20.0, 18.0, 13.0, 17.0, 9.0, 10.0, 10.0, 4.0, 6.0, 5.0, 2.0, 4.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.54296875, -7.3011474609375, -7.059326171875, -6.8175048828125, -6.57568359375, -6.3338623046875, -6.092041015625, -5.8502197265625, -5.6083984375, -5.3665771484375, -5.124755859375, -4.8829345703125, -4.64111328125, -4.3992919921875, -4.157470703125, -3.9156494140625, -3.673828125, -3.4320068359375, -3.190185546875, -2.9483642578125, -2.70654296875, -2.4647216796875, -2.222900390625, -1.9810791015625, -1.7392578125, -1.4974365234375, -1.255615234375, -1.0137939453125, -0.77197265625, -0.5301513671875, -0.288330078125, -0.0465087890625, 0.1953125, 0.4371337890625, 0.678955078125, 0.9207763671875, 1.16259765625, 1.4044189453125, 1.646240234375, 1.8880615234375, 2.1298828125, 2.3717041015625, 2.613525390625, 2.8553466796875, 3.09716796875, 3.3389892578125, 3.580810546875, 3.8226318359375, 4.064453125, 4.3062744140625, 4.548095703125, 4.7899169921875, 5.03173828125, 5.2735595703125, 5.515380859375, 5.7572021484375, 5.9990234375, 6.2408447265625, 6.482666015625, 6.7244873046875, 6.96630859375, 7.2081298828125, 7.449951171875, 7.6917724609375, 7.93359375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 7.0, 5.0, 11.0, 8.0, 21.0, 26.0, 29.0, 48.0, 75.0, 91.0, 117.0, 160.0, 223.0, 352.0, 541.0, 825.0, 1310.0, 2185.0, 3876.0, 7299.0, 15025.0, 31988.0, 76720.0, 181123.0, 319365.0, 227762.0, 99179.0, 41130.0, 18485.0, 8989.0, 4715.0, 2483.0, 1489.0, 972.0, 591.0, 379.0, 242.0, 205.0, 123.0, 99.0, 79.0, 48.0, 55.0, 28.0, 24.0, 21.0, 7.0, 5.0, 8.0, 5.0, 4.0, 1.0, 2.0, 4.0], "bins": [-13.859375, -13.4593505859375, -13.059326171875, -12.6593017578125, -12.25927734375, -11.8592529296875, -11.459228515625, -11.0592041015625, -10.6591796875, -10.2591552734375, -9.859130859375, -9.4591064453125, -9.05908203125, -8.6590576171875, -8.259033203125, -7.8590087890625, -7.458984375, -7.0589599609375, -6.658935546875, -6.2589111328125, -5.85888671875, -5.4588623046875, -5.058837890625, -4.6588134765625, -4.2587890625, -3.8587646484375, -3.458740234375, -3.0587158203125, -2.65869140625, -2.2586669921875, -1.858642578125, -1.4586181640625, -1.05859375, -0.6585693359375, -0.258544921875, 0.1414794921875, 0.54150390625, 0.9415283203125, 1.341552734375, 1.7415771484375, 2.1416015625, 2.5416259765625, 2.941650390625, 3.3416748046875, 3.74169921875, 4.1417236328125, 4.541748046875, 4.9417724609375, 5.341796875, 5.7418212890625, 6.141845703125, 6.5418701171875, 6.94189453125, 7.3419189453125, 7.741943359375, 8.1419677734375, 8.5419921875, 8.9420166015625, 9.342041015625, 9.7420654296875, 10.14208984375, 10.5421142578125, 10.942138671875, 11.3421630859375, 11.7421875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 9.0, 10.0, 13.0, 19.0, 28.0, 11.0, 19.0, 21.0, 30.0, 38.0, 34.0, 25.0, 40.0, 35.0, 46.0, 47.0, 41.0, 47.0, 39.0, 53.0, 41.0, 43.0, 40.0, 33.0, 39.0, 29.0, 33.0, 21.0, 22.0, 23.0, 12.0, 19.0, 6.0, 9.0, 5.0, 9.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.875, -4.712158203125, -4.54931640625, -4.386474609375, -4.2236328125, -4.060791015625, -3.89794921875, -3.735107421875, -3.572265625, -3.409423828125, -3.24658203125, -3.083740234375, -2.9208984375, -2.758056640625, -2.59521484375, -2.432373046875, -2.26953125, -2.106689453125, -1.94384765625, -1.781005859375, -1.6181640625, -1.455322265625, -1.29248046875, -1.129638671875, -0.966796875, -0.803955078125, -0.64111328125, -0.478271484375, -0.3154296875, -0.152587890625, 0.01025390625, 0.173095703125, 0.3359375, 0.498779296875, 0.66162109375, 0.824462890625, 0.9873046875, 1.150146484375, 1.31298828125, 1.475830078125, 1.638671875, 1.801513671875, 1.96435546875, 2.127197265625, 2.2900390625, 2.452880859375, 2.61572265625, 2.778564453125, 2.94140625, 3.104248046875, 3.26708984375, 3.429931640625, 3.5927734375, 3.755615234375, 3.91845703125, 4.081298828125, 4.244140625, 4.406982421875, 4.56982421875, 4.732666015625, 4.8955078125, 5.058349609375, 5.22119140625, 5.384033203125, 5.546875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 10.0, 5.0, 17.0, 20.0, 23.0, 27.0, 62.0, 85.0, 101.0, 180.0, 223.0, 384.0, 516.0, 856.0, 1306.0, 2155.0, 3672.0, 6552.0, 12387.0, 25074.0, 54565.0, 125007.0, 266034.0, 285703.0, 142542.0, 61476.0, 28270.0, 13755.0, 7170.0, 3959.0, 2379.0, 1396.0, 917.0, 567.0, 376.0, 250.0, 162.0, 106.0, 85.0, 59.0, 43.0, 25.0, 16.0, 11.0, 10.0, 6.0, 4.0, 9.0, 4.0, 0.0, 1.0], "bins": [-6.1015625, -5.93243408203125, -5.7633056640625, -5.59417724609375, -5.425048828125, -5.25592041015625, -5.0867919921875, -4.91766357421875, -4.74853515625, -4.57940673828125, -4.4102783203125, -4.24114990234375, -4.072021484375, -3.90289306640625, -3.7337646484375, -3.56463623046875, -3.3955078125, -3.22637939453125, -3.0572509765625, -2.88812255859375, -2.718994140625, -2.54986572265625, -2.3807373046875, -2.21160888671875, -2.04248046875, -1.87335205078125, -1.7042236328125, -1.53509521484375, -1.365966796875, -1.19683837890625, -1.0277099609375, -0.85858154296875, -0.689453125, -0.52032470703125, -0.3511962890625, -0.18206787109375, -0.012939453125, 0.15618896484375, 0.3253173828125, 0.49444580078125, 0.66357421875, 0.83270263671875, 1.0018310546875, 1.17095947265625, 1.340087890625, 1.50921630859375, 1.6783447265625, 1.84747314453125, 2.0166015625, 2.18572998046875, 2.3548583984375, 2.52398681640625, 2.693115234375, 2.86224365234375, 3.0313720703125, 3.20050048828125, 3.36962890625, 3.53875732421875, 3.7078857421875, 3.87701416015625, 4.046142578125, 4.21527099609375, 4.3843994140625, 4.55352783203125, 4.72265625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 3.0, 8.0, 15.0, 14.0, 23.0, 22.0, 40.0, 51.0, 69.0, 80.0, 105.0, 117.0, 105.0, 81.0, 71.0, 48.0, 48.0, 21.0, 14.0, 11.0, 14.0, 9.0, 5.0, 4.0, 13.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0003571510314941406, -0.00034651532769203186, -0.0003358796238899231, -0.00032524392008781433, -0.00031460821628570557, -0.0003039725124835968, -0.00029333680868148804, -0.00028270110487937927, -0.0002720654010772705, -0.00026142969727516174, -0.000250793993473053, -0.00024015828967094421, -0.00022952258586883545, -0.00021888688206672668, -0.00020825117826461792, -0.00019761547446250916, -0.0001869797706604004, -0.00017634406685829163, -0.00016570836305618286, -0.0001550726592540741, -0.00014443695545196533, -0.00013380125164985657, -0.0001231655478477478, -0.00011252984404563904, -0.00010189414024353027, -9.125843644142151e-05, -8.062273263931274e-05, -6.998702883720398e-05, -5.9351325035095215e-05, -4.871562123298645e-05, -3.8079917430877686e-05, -2.744421362876892e-05, -1.6808509826660156e-05, -6.172806024551392e-06, 4.462897777557373e-06, 1.5098601579666138e-05, 2.5734305381774902e-05, 3.637000918388367e-05, 4.700571298599243e-05, 5.7641416788101196e-05, 6.827712059020996e-05, 7.891282439231873e-05, 8.954852819442749e-05, 0.00010018423199653625, 0.00011081993579864502, 0.00012145563960075378, 0.00013209134340286255, 0.0001427270472049713, 0.00015336275100708008, 0.00016399845480918884, 0.0001746341586112976, 0.00018526986241340637, 0.00019590556621551514, 0.0002065412700176239, 0.00021717697381973267, 0.00022781267762184143, 0.0002384483814239502, 0.00024908408522605896, 0.0002597197890281677, 0.0002703554928302765, 0.00028099119663238525, 0.000291626900434494, 0.0003022626042366028, 0.00031289830803871155, 0.0003235340118408203]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 14.0, 17.0, 21.0, 20.0, 36.0, 44.0, 47.0, 73.0, 98.0, 181.0, 243.0, 394.0, 573.0, 910.0, 1454.0, 2318.0, 3771.0, 6674.0, 12107.0, 23892.0, 48988.0, 103099.0, 197215.0, 258012.0, 190718.0, 99392.0, 47025.0, 22994.0, 11659.0, 6563.0, 3716.0, 2245.0, 1372.0, 886.0, 593.0, 361.0, 228.0, 186.0, 128.0, 76.0, 70.0, 40.0, 22.0, 28.0, 20.0, 7.0, 13.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0], "bins": [-4.69140625, -4.54693603515625, -4.4024658203125, -4.25799560546875, -4.113525390625, -3.96905517578125, -3.8245849609375, -3.68011474609375, -3.53564453125, -3.39117431640625, -3.2467041015625, -3.10223388671875, -2.957763671875, -2.81329345703125, -2.6688232421875, -2.52435302734375, -2.3798828125, -2.23541259765625, -2.0909423828125, -1.94647216796875, -1.802001953125, -1.65753173828125, -1.5130615234375, -1.36859130859375, -1.22412109375, -1.07965087890625, -0.9351806640625, -0.79071044921875, -0.646240234375, -0.50177001953125, -0.3572998046875, -0.21282958984375, -0.068359375, 0.07611083984375, 0.2205810546875, 0.36505126953125, 0.509521484375, 0.65399169921875, 0.7984619140625, 0.94293212890625, 1.08740234375, 1.23187255859375, 1.3763427734375, 1.52081298828125, 1.665283203125, 1.80975341796875, 1.9542236328125, 2.09869384765625, 2.2431640625, 2.38763427734375, 2.5321044921875, 2.67657470703125, 2.821044921875, 2.96551513671875, 3.1099853515625, 3.25445556640625, 3.39892578125, 3.54339599609375, 3.6878662109375, 3.83233642578125, 3.976806640625, 4.12127685546875, 4.2657470703125, 4.41021728515625, 4.5546875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 7.0, 4.0, 10.0, 10.0, 17.0, 19.0, 21.0, 36.0, 31.0, 45.0, 59.0, 63.0, 55.0, 85.0, 75.0, 66.0, 72.0, 66.0, 50.0, 41.0, 35.0, 22.0, 20.0, 22.0, 16.0, 9.0, 9.0, 6.0, 5.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6279296875, -1.5830841064453125, -1.538238525390625, -1.4933929443359375, -1.44854736328125, -1.4037017822265625, -1.358856201171875, -1.3140106201171875, -1.2691650390625, -1.2243194580078125, -1.179473876953125, -1.1346282958984375, -1.08978271484375, -1.0449371337890625, -1.000091552734375, -0.9552459716796875, -0.910400390625, -0.8655548095703125, -0.820709228515625, -0.7758636474609375, -0.73101806640625, -0.6861724853515625, -0.641326904296875, -0.5964813232421875, -0.5516357421875, -0.5067901611328125, -0.461944580078125, -0.4170989990234375, -0.37225341796875, -0.3274078369140625, -0.282562255859375, -0.2377166748046875, -0.19287109375, -0.1480255126953125, -0.103179931640625, -0.0583343505859375, -0.01348876953125, 0.0313568115234375, 0.076202392578125, 0.1210479736328125, 0.1658935546875, 0.2107391357421875, 0.255584716796875, 0.3004302978515625, 0.34527587890625, 0.3901214599609375, 0.434967041015625, 0.4798126220703125, 0.524658203125, 0.5695037841796875, 0.614349365234375, 0.6591949462890625, 0.70404052734375, 0.7488861083984375, 0.793731689453125, 0.8385772705078125, 0.8834228515625, 0.9282684326171875, 0.973114013671875, 1.0179595947265625, 1.06280517578125, 1.1076507568359375, 1.152496337890625, 1.1973419189453125, 1.2421875]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 2.0, 7.0, 5.0, 8.0, 14.0, 7.0, 10.0, 17.0, 11.0, 19.0, 30.0, 22.0, 42.0, 43.0, 45.0, 59.0, 58.0, 65.0, 52.0, 65.0, 41.0, 50.0, 55.0, 38.0, 32.0, 34.0, 34.0, 31.0, 24.0, 14.0, 12.0, 12.0, 8.0, 9.0, 3.0, 4.0, 3.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.885694980621338, -6.6188063621521, -6.351917743682861, -6.085029125213623, -5.818140506744385, -5.5512518882751465, -5.284363746643066, -5.017475128173828, -4.75058650970459, -4.483697891235352, -4.216809272766113, -3.949920654296875, -3.6830320358276367, -3.4161434173583984, -3.1492550373077393, -2.882366418838501, -2.6154775619506836, -2.3485889434814453, -2.081700325012207, -1.8148118257522583, -1.54792320728302, -1.2810345888137817, -1.014146089553833, -0.7472574710845947, -0.48036885261535645, -0.21348026394844055, 0.05340832471847534, 0.32029688358306885, 0.5871855020523071, 0.8540741205215454, 1.1209626197814941, 1.3878512382507324, 1.654740333557129, 1.9216289520263672, 2.1885175704956055, 2.4554061889648438, 2.722294807434082, 2.9891834259033203, 3.2560718059539795, 3.5229604244232178, 3.789849042892456, 4.056737422943115, 4.3236260414123535, 4.590514659881592, 4.85740327835083, 5.124291896820068, 5.391180515289307, 5.658069133758545, 5.924957752227783, 6.1918463706970215, 6.45873498916626, 6.725623607635498, 6.992512226104736, 7.259400844573975, 7.526288986206055, 7.793177604675293, 8.060066223144531, 8.32695484161377, 8.593843460083008, 8.860732078552246, 9.127620697021484, 9.394509315490723, 9.661397933959961, 9.9282865524292, 10.195175170898438]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 3.0, 5.0, 8.0, 7.0, 8.0, 10.0, 11.0, 10.0, 12.0, 26.0, 24.0, 23.0, 16.0, 33.0, 32.0, 38.0, 38.0, 24.0, 45.0, 32.0, 42.0, 43.0, 34.0, 37.0, 36.0, 39.0, 36.0, 35.0, 33.0, 42.0, 29.0, 26.0, 20.0, 22.0, 12.0, 15.0, 25.0, 16.0, 7.0, 9.0, 10.0, 5.0, 4.0, 4.0, 6.0, 5.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.1655449867248535, -6.950623989105225, -6.735702991485596, -6.520781993865967, -6.305860996246338, -6.090939998626709, -5.876018524169922, -5.661097526550293, -5.446176528930664, -5.231255531311035, -5.016334533691406, -4.801413536071777, -4.586492538452148, -4.3715715408325195, -4.156650543212891, -3.9417293071746826, -3.726808547973633, -3.511887550354004, -3.296966552734375, -3.082045555114746, -2.867124557495117, -2.6522035598754883, -2.4372823238372803, -2.2223613262176514, -2.0074403285980225, -1.7925193309783936, -1.5775983333587646, -1.3626772165298462, -1.1477562189102173, -0.9328352212905884, -0.7179141044616699, -0.502993106842041, -0.2880721092224121, -0.07315108180046082, 0.14176994562149048, 0.35669100284576416, 0.5716120004653931, 0.786532998085022, 1.0014541149139404, 1.2163751125335693, 1.4312961101531982, 1.6462171077728271, 1.861138105392456, 2.076059341430664, 2.290980339050293, 2.505901336669922, 2.720822334289551, 2.9357433319091797, 3.1506643295288086, 3.3655853271484375, 3.5805063247680664, 3.7954273223876953, 4.010348320007324, 4.225269317626953, 4.440190315246582, 4.655111312866211, 4.87003231048584, 5.084953308105469, 5.299874305725098, 5.514795303344727, 5.7297163009643555, 5.944637298583984, 6.159558296203613, 6.374479293823242, 6.589400768280029]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 7.0, 10.0, 13.0, 14.0, 20.0, 59.0, 81.0, 148.0, 213.0, 382.0, 601.0, 992.0, 1608.0, 2738.0, 4449.0, 7430.0, 12477.0, 20704.0, 33686.0, 55469.0, 87031.0, 124376.0, 156408.0, 159675.0, 131610.0, 93800.0, 60237.0, 37511.0, 22523.0, 13613.0, 8193.0, 5009.0, 2962.0, 1787.0, 1073.0, 646.0, 378.0, 243.0, 168.0, 85.0, 59.0, 32.0, 11.0, 17.0, 1.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.75, -6.52569580078125, -6.3013916015625, -6.07708740234375, -5.852783203125, -5.62847900390625, -5.4041748046875, -5.17987060546875, -4.95556640625, -4.73126220703125, -4.5069580078125, -4.28265380859375, -4.058349609375, -3.83404541015625, -3.6097412109375, -3.38543701171875, -3.1611328125, -2.93682861328125, -2.7125244140625, -2.48822021484375, -2.263916015625, -2.03961181640625, -1.8153076171875, -1.59100341796875, -1.36669921875, -1.14239501953125, -0.9180908203125, -0.69378662109375, -0.469482421875, -0.24517822265625, -0.0208740234375, 0.20343017578125, 0.427734375, 0.65203857421875, 0.8763427734375, 1.10064697265625, 1.324951171875, 1.54925537109375, 1.7735595703125, 1.99786376953125, 2.22216796875, 2.44647216796875, 2.6707763671875, 2.89508056640625, 3.119384765625, 3.34368896484375, 3.5679931640625, 3.79229736328125, 4.0166015625, 4.24090576171875, 4.4652099609375, 4.68951416015625, 4.913818359375, 5.13812255859375, 5.3624267578125, 5.58673095703125, 5.81103515625, 6.03533935546875, 6.2596435546875, 6.48394775390625, 6.708251953125, 6.93255615234375, 7.1568603515625, 7.38116455078125, 7.60546875]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 5.0, 3.0, 7.0, 8.0, 4.0, 9.0, 14.0, 18.0, 12.0, 16.0, 15.0, 31.0, 26.0, 22.0, 33.0, 32.0, 28.0, 53.0, 34.0, 36.0, 48.0, 39.0, 42.0, 42.0, 28.0, 42.0, 23.0, 42.0, 33.0, 35.0, 27.0, 33.0, 21.0, 20.0, 21.0, 18.0, 14.0, 11.0, 15.0, 13.0, 8.0, 5.0, 2.0, 4.0, 4.0, 6.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-7.30859375, -7.09014892578125, -6.8717041015625, -6.65325927734375, -6.434814453125, -6.21636962890625, -5.9979248046875, -5.77947998046875, -5.56103515625, -5.34259033203125, -5.1241455078125, -4.90570068359375, -4.687255859375, -4.46881103515625, -4.2503662109375, -4.03192138671875, -3.8134765625, -3.59503173828125, -3.3765869140625, -3.15814208984375, -2.939697265625, -2.72125244140625, -2.5028076171875, -2.28436279296875, -2.06591796875, -1.84747314453125, -1.6290283203125, -1.41058349609375, -1.192138671875, -0.97369384765625, -0.7552490234375, -0.53680419921875, -0.318359375, -0.09991455078125, 0.1185302734375, 0.33697509765625, 0.555419921875, 0.77386474609375, 0.9923095703125, 1.21075439453125, 1.42919921875, 1.64764404296875, 1.8660888671875, 2.08453369140625, 2.302978515625, 2.52142333984375, 2.7398681640625, 2.95831298828125, 3.1767578125, 3.39520263671875, 3.6136474609375, 3.83209228515625, 4.050537109375, 4.26898193359375, 4.4874267578125, 4.70587158203125, 4.92431640625, 5.14276123046875, 5.3612060546875, 5.57965087890625, 5.798095703125, 6.01654052734375, 6.2349853515625, 6.45343017578125, 6.671875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [4.0, 4.0, 4.0, 5.0, 11.0, 11.0, 20.0, 30.0, 52.0, 65.0, 90.0, 110.0, 206.0, 282.0, 432.0, 656.0, 932.0, 1437.0, 2200.0, 3302.0, 5184.0, 7866.0, 12227.0, 19250.0, 29949.0, 46050.0, 68624.0, 98431.0, 128239.0, 145103.0, 136508.0, 109619.0, 79156.0, 53735.0, 35082.0, 22505.0, 14467.0, 9318.0, 5921.0, 3951.0, 2463.0, 1700.0, 1086.0, 735.0, 479.0, 341.0, 248.0, 167.0, 100.0, 85.0, 40.0, 24.0, 18.0, 11.0, 14.0, 10.0, 10.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.328125, -5.14862060546875, -4.9691162109375, -4.78961181640625, -4.610107421875, -4.43060302734375, -4.2510986328125, -4.07159423828125, -3.89208984375, -3.71258544921875, -3.5330810546875, -3.35357666015625, -3.174072265625, -2.99456787109375, -2.8150634765625, -2.63555908203125, -2.4560546875, -2.27655029296875, -2.0970458984375, -1.91754150390625, -1.738037109375, -1.55853271484375, -1.3790283203125, -1.19952392578125, -1.02001953125, -0.84051513671875, -0.6610107421875, -0.48150634765625, -0.302001953125, -0.12249755859375, 0.0570068359375, 0.23651123046875, 0.416015625, 0.59552001953125, 0.7750244140625, 0.95452880859375, 1.134033203125, 1.31353759765625, 1.4930419921875, 1.67254638671875, 1.85205078125, 2.03155517578125, 2.2110595703125, 2.39056396484375, 2.570068359375, 2.74957275390625, 2.9290771484375, 3.10858154296875, 3.2880859375, 3.46759033203125, 3.6470947265625, 3.82659912109375, 4.006103515625, 4.18560791015625, 4.3651123046875, 4.54461669921875, 4.72412109375, 4.90362548828125, 5.0831298828125, 5.26263427734375, 5.442138671875, 5.62164306640625, 5.8011474609375, 5.98065185546875, 6.16015625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 0.0, 5.0, 8.0, 8.0, 6.0, 10.0, 7.0, 12.0, 18.0, 18.0, 19.0, 17.0, 26.0, 29.0, 41.0, 34.0, 31.0, 35.0, 36.0, 42.0, 39.0, 41.0, 36.0, 51.0, 34.0, 36.0, 35.0, 43.0, 33.0, 30.0, 24.0, 38.0, 19.0, 17.0, 25.0, 17.0, 14.0, 15.0, 12.0, 11.0, 5.0, 6.0, 5.0, 4.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.47265625, -4.3323974609375, -4.192138671875, -4.0518798828125, -3.91162109375, -3.7713623046875, -3.631103515625, -3.4908447265625, -3.3505859375, -3.2103271484375, -3.070068359375, -2.9298095703125, -2.78955078125, -2.6492919921875, -2.509033203125, -2.3687744140625, -2.228515625, -2.0882568359375, -1.947998046875, -1.8077392578125, -1.66748046875, -1.5272216796875, -1.386962890625, -1.2467041015625, -1.1064453125, -0.9661865234375, -0.825927734375, -0.6856689453125, -0.54541015625, -0.4051513671875, -0.264892578125, -0.1246337890625, 0.015625, 0.1558837890625, 0.296142578125, 0.4364013671875, 0.57666015625, 0.7169189453125, 0.857177734375, 0.9974365234375, 1.1376953125, 1.2779541015625, 1.418212890625, 1.5584716796875, 1.69873046875, 1.8389892578125, 1.979248046875, 2.1195068359375, 2.259765625, 2.4000244140625, 2.540283203125, 2.6805419921875, 2.82080078125, 2.9610595703125, 3.101318359375, 3.2415771484375, 3.3818359375, 3.5220947265625, 3.662353515625, 3.8026123046875, 3.94287109375, 4.0831298828125, 4.223388671875, 4.3636474609375, 4.50390625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 4.0, 5.0, 3.0, 10.0, 12.0, 18.0, 28.0, 28.0, 39.0, 65.0, 79.0, 110.0, 161.0, 235.0, 338.0, 537.0, 653.0, 973.0, 1398.0, 2070.0, 3149.0, 4784.0, 7725.0, 12581.0, 21090.0, 36836.0, 64199.0, 110624.0, 169812.0, 200953.0, 161962.0, 102158.0, 59540.0, 33901.0, 19669.0, 11783.0, 7211.0, 4509.0, 2941.0, 1916.0, 1345.0, 917.0, 644.0, 442.0, 313.0, 217.0, 165.0, 113.0, 74.0, 61.0, 45.0, 42.0, 16.0, 22.0, 19.0, 7.0, 7.0, 3.0, 3.0, 2.0, 3.0], "bins": [-4.87890625, -4.72845458984375, -4.5780029296875, -4.42755126953125, -4.277099609375, -4.12664794921875, -3.9761962890625, -3.82574462890625, -3.67529296875, -3.52484130859375, -3.3743896484375, -3.22393798828125, -3.073486328125, -2.92303466796875, -2.7725830078125, -2.62213134765625, -2.4716796875, -2.32122802734375, -2.1707763671875, -2.02032470703125, -1.869873046875, -1.71942138671875, -1.5689697265625, -1.41851806640625, -1.26806640625, -1.11761474609375, -0.9671630859375, -0.81671142578125, -0.666259765625, -0.51580810546875, -0.3653564453125, -0.21490478515625, -0.064453125, 0.08599853515625, 0.2364501953125, 0.38690185546875, 0.537353515625, 0.68780517578125, 0.8382568359375, 0.98870849609375, 1.13916015625, 1.28961181640625, 1.4400634765625, 1.59051513671875, 1.740966796875, 1.89141845703125, 2.0418701171875, 2.19232177734375, 2.3427734375, 2.49322509765625, 2.6436767578125, 2.79412841796875, 2.944580078125, 3.09503173828125, 3.2454833984375, 3.39593505859375, 3.54638671875, 3.69683837890625, 3.8472900390625, 3.99774169921875, 4.148193359375, 4.29864501953125, 4.4490966796875, 4.59954833984375, 4.75]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 8.0, 8.0, 8.0, 8.0, 13.0, 15.0, 18.0, 18.0, 22.0, 23.0, 35.0, 25.0, 37.0, 43.0, 47.0, 57.0, 58.0, 68.0, 64.0, 54.0, 53.0, 50.0, 37.0, 36.0, 28.0, 25.0, 21.0, 23.0, 23.0, 9.0, 7.0, 10.0, 8.0, 5.0, 6.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003960132598876953, -0.0003835149109363556, -0.00037101656198501587, -0.00035851821303367615, -0.0003460198640823364, -0.0003335215151309967, -0.000321023166179657, -0.00030852481722831726, -0.00029602646827697754, -0.0002835281193256378, -0.0002710297703742981, -0.0002585314214229584, -0.00024603307247161865, -0.00023353472352027893, -0.0002210363745689392, -0.0002085380256175995, -0.00019603967666625977, -0.00018354132771492004, -0.00017104297876358032, -0.0001585446298122406, -0.00014604628086090088, -0.00013354793190956116, -0.00012104958295822144, -0.00010855123400688171, -9.605288505554199e-05, -8.355453610420227e-05, -7.105618715286255e-05, -5.855783820152283e-05, -4.6059489250183105e-05, -3.3561140298843384e-05, -2.1062791347503662e-05, -8.56444239616394e-06, 3.933906555175781e-06, 1.6432255506515503e-05, 2.8930604457855225e-05, 4.1428953409194946e-05, 5.392730236053467e-05, 6.642565131187439e-05, 7.892400026321411e-05, 9.142234921455383e-05, 0.00010392069816589355, 0.00011641904711723328, 0.000128917396068573, 0.00014141574501991272, 0.00015391409397125244, 0.00016641244292259216, 0.00017891079187393188, 0.0001914091408252716, 0.00020390748977661133, 0.00021640583872795105, 0.00022890418767929077, 0.0002414025366306305, 0.0002539008855819702, 0.00026639923453330994, 0.00027889758348464966, 0.0002913959324359894, 0.0003038942813873291, 0.0003163926303386688, 0.00032889097929000854, 0.00034138932824134827, 0.000353887677192688, 0.0003663860261440277, 0.00037888437509536743, 0.00039138272404670715, 0.0004038810729980469]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 9.0, 14.0, 9.0, 16.0, 27.0, 52.0, 49.0, 109.0, 162.0, 247.0, 416.0, 613.0, 959.0, 1587.0, 2757.0, 4683.0, 8157.0, 14526.0, 26184.0, 47364.0, 83781.0, 136577.0, 186301.0, 189288.0, 142305.0, 88481.0, 50250.0, 27656.0, 15152.0, 8515.0, 4955.0, 2844.0, 1674.0, 1064.0, 619.0, 387.0, 245.0, 161.0, 117.0, 69.0, 52.0, 41.0, 28.0, 21.0, 13.0, 12.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.7734375, -4.63323974609375, -4.4930419921875, -4.35284423828125, -4.212646484375, -4.07244873046875, -3.9322509765625, -3.79205322265625, -3.65185546875, -3.51165771484375, -3.3714599609375, -3.23126220703125, -3.091064453125, -2.95086669921875, -2.8106689453125, -2.67047119140625, -2.5302734375, -2.39007568359375, -2.2498779296875, -2.10968017578125, -1.969482421875, -1.82928466796875, -1.6890869140625, -1.54888916015625, -1.40869140625, -1.26849365234375, -1.1282958984375, -0.98809814453125, -0.847900390625, -0.70770263671875, -0.5675048828125, -0.42730712890625, -0.287109375, -0.14691162109375, -0.0067138671875, 0.13348388671875, 0.273681640625, 0.41387939453125, 0.5540771484375, 0.69427490234375, 0.83447265625, 0.97467041015625, 1.1148681640625, 1.25506591796875, 1.395263671875, 1.53546142578125, 1.6756591796875, 1.81585693359375, 1.9560546875, 2.09625244140625, 2.2364501953125, 2.37664794921875, 2.516845703125, 2.65704345703125, 2.7972412109375, 2.93743896484375, 3.07763671875, 3.21783447265625, 3.3580322265625, 3.49822998046875, 3.638427734375, 3.77862548828125, 3.9188232421875, 4.05902099609375, 4.19921875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 6.0, 6.0, 5.0, 9.0, 9.0, 18.0, 23.0, 22.0, 27.0, 18.0, 27.0, 31.0, 34.0, 37.0, 48.0, 49.0, 69.0, 59.0, 63.0, 53.0, 47.0, 49.0, 38.0, 39.0, 37.0, 28.0, 21.0, 24.0, 21.0, 12.0, 14.0, 10.0, 8.0, 8.0, 7.0, 4.0, 3.0, 9.0, 1.0, 0.0, 8.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.380859375, -1.335662841796875, -1.29046630859375, -1.245269775390625, -1.2000732421875, -1.154876708984375, -1.10968017578125, -1.064483642578125, -1.019287109375, -0.974090576171875, -0.92889404296875, -0.883697509765625, -0.8385009765625, -0.793304443359375, -0.74810791015625, -0.702911376953125, -0.65771484375, -0.612518310546875, -0.56732177734375, -0.522125244140625, -0.4769287109375, -0.431732177734375, -0.38653564453125, -0.341339111328125, -0.296142578125, -0.250946044921875, -0.20574951171875, -0.160552978515625, -0.1153564453125, -0.070159912109375, -0.02496337890625, 0.020233154296875, 0.0654296875, 0.110626220703125, 0.15582275390625, 0.201019287109375, 0.2462158203125, 0.291412353515625, 0.33660888671875, 0.381805419921875, 0.427001953125, 0.472198486328125, 0.51739501953125, 0.562591552734375, 0.6077880859375, 0.652984619140625, 0.69818115234375, 0.743377685546875, 0.78857421875, 0.833770751953125, 0.87896728515625, 0.924163818359375, 0.9693603515625, 1.014556884765625, 1.05975341796875, 1.104949951171875, 1.150146484375, 1.195343017578125, 1.24053955078125, 1.285736083984375, 1.3309326171875, 1.376129150390625, 1.42132568359375, 1.466522216796875, 1.51171875]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 2.0, 6.0, 6.0, 5.0, 8.0, 7.0, 16.0, 12.0, 19.0, 23.0, 22.0, 33.0, 39.0, 37.0, 51.0, 57.0, 64.0, 62.0, 68.0, 74.0, 50.0, 43.0, 46.0, 43.0, 38.0, 34.0, 22.0, 33.0, 18.0, 15.0, 18.0, 8.0, 5.0, 6.0, 5.0, 1.0, 4.0, 3.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.26020622253418, -5.975907325744629, -5.691608428955078, -5.407309532165527, -5.123010158538818, -4.838711261749268, -4.554412364959717, -4.270113468170166, -3.985814332962036, -3.7015154361724854, -3.4172163009643555, -3.1329174041748047, -2.848618507385254, -2.564319372177124, -2.2800204753875732, -1.995721459388733, -1.7114224433898926, -1.4271234273910522, -1.142824411392212, -0.8585255146026611, -0.5742264986038208, -0.28992748260498047, -0.0056285858154296875, 0.27867043018341064, 0.562969446182251, 0.8472684621810913, 1.1315674781799316, 1.4158663749694824, 1.7001653909683228, 1.984464406967163, 2.268763303756714, 2.5530624389648438, 2.8373613357543945, 3.1216602325439453, 3.405959367752075, 3.690258264541626, 3.974557399749756, 4.258856296539307, 4.543155193328857, 4.827454090118408, 5.111753463745117, 5.396052360534668, 5.680351257324219, 5.9646501541137695, 6.2489495277404785, 6.533248424530029, 6.81754732131958, 7.101846218109131, 7.386145114898682, 7.670444011688232, 7.954742908477783, 8.239042282104492, 8.523341178894043, 8.807640075683594, 9.091938972473145, 9.376237869262695, 9.660536766052246, 9.944835662841797, 10.229134559631348, 10.513433456420898, 10.79773235321045, 11.08203125, 11.366331100463867, 11.650629997253418, 11.934928894042969]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 3.0, 7.0, 9.0, 13.0, 13.0, 14.0, 17.0, 21.0, 15.0, 24.0, 32.0, 33.0, 18.0, 30.0, 32.0, 27.0, 41.0, 45.0, 47.0, 43.0, 40.0, 46.0, 36.0, 51.0, 30.0, 23.0, 37.0, 29.0, 30.0, 25.0, 21.0, 24.0, 25.0, 14.0, 14.0, 10.0, 8.0, 7.0, 10.0, 7.0, 8.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.785921096801758, -6.569186687469482, -6.352452754974365, -6.13571834564209, -5.918984413146973, -5.702250003814697, -5.485515594482422, -5.268781661987305, -5.052047252655029, -4.835312843322754, -4.618578910827637, -4.401844501495361, -4.185110092163086, -3.9683761596679688, -3.7516417503356934, -3.534907579421997, -3.318173408508301, -3.1014392375946045, -2.884705066680908, -2.667970657348633, -2.4512364864349365, -2.2345023155212402, -2.017767906188965, -1.8010337352752686, -1.5842995643615723, -1.367565393447876, -1.1508311033248901, -0.9340968728065491, -0.717362642288208, -0.5006284713745117, -0.2838941812515259, -0.06715989112854004, 0.14957427978515625, 0.3663085103034973, 0.5830427408218384, 0.7997769713401794, 1.0165112018585205, 1.2332453727722168, 1.4499796628952026, 1.6667139530181885, 1.8834481239318848, 2.100182294845581, 2.3169164657592773, 2.5336508750915527, 2.750385046005249, 2.9671192169189453, 3.1838536262512207, 3.400587797164917, 3.6173219680786133, 3.8340561389923096, 4.050790309906006, 4.267524719238281, 4.484258651733398, 4.700993061065674, 4.917727470397949, 5.134461402893066, 5.351195812225342, 5.567930221557617, 5.784664154052734, 6.00139856338501, 6.218132972717285, 6.434866905212402, 6.651601314544678, 6.868335723876953, 7.08506965637207]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 7.0, 7.0, 9.0, 9.0, 15.0, 26.0, 53.0, 59.0, 127.0, 175.0, 316.0, 533.0, 1062.0, 1954.0, 3741.0, 7660.0, 16261.0, 37905.0, 96872.0, 290774.0, 920702.0, 1561171.0, 840570.0, 258946.0, 88447.0, 35426.0, 15913.0, 7497.0, 3824.0, 1929.0, 1033.0, 537.0, 318.0, 160.0, 111.0, 60.0, 26.0, 18.0, 11.0, 10.0, 8.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.46875, -13.1185302734375, -12.768310546875, -12.4180908203125, -12.06787109375, -11.7176513671875, -11.367431640625, -11.0172119140625, -10.6669921875, -10.3167724609375, -9.966552734375, -9.6163330078125, -9.26611328125, -8.9158935546875, -8.565673828125, -8.2154541015625, -7.865234375, -7.5150146484375, -7.164794921875, -6.8145751953125, -6.46435546875, -6.1141357421875, -5.763916015625, -5.4136962890625, -5.0634765625, -4.7132568359375, -4.363037109375, -4.0128173828125, -3.66259765625, -3.3123779296875, -2.962158203125, -2.6119384765625, -2.26171875, -1.9114990234375, -1.561279296875, -1.2110595703125, -0.86083984375, -0.5106201171875, -0.160400390625, 0.1898193359375, 0.5400390625, 0.8902587890625, 1.240478515625, 1.5906982421875, 1.94091796875, 2.2911376953125, 2.641357421875, 2.9915771484375, 3.341796875, 3.6920166015625, 4.042236328125, 4.3924560546875, 4.74267578125, 5.0928955078125, 5.443115234375, 5.7933349609375, 6.1435546875, 6.4937744140625, 6.843994140625, 7.1942138671875, 7.54443359375, 7.8946533203125, 8.244873046875, 8.5950927734375, 8.9453125]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 6.0, 9.0, 8.0, 7.0, 13.0, 19.0, 22.0, 28.0, 27.0, 25.0, 40.0, 31.0, 33.0, 42.0, 37.0, 45.0, 52.0, 50.0, 47.0, 34.0, 55.0, 38.0, 39.0, 29.0, 29.0, 44.0, 27.0, 27.0, 24.0, 20.0, 14.0, 17.0, 13.0, 10.0, 7.0, 4.0, 6.0, 8.0, 7.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.6796875, -5.51416015625, -5.3486328125, -5.18310546875, -5.017578125, -4.85205078125, -4.6865234375, -4.52099609375, -4.35546875, -4.18994140625, -4.0244140625, -3.85888671875, -3.693359375, -3.52783203125, -3.3623046875, -3.19677734375, -3.03125, -2.86572265625, -2.7001953125, -2.53466796875, -2.369140625, -2.20361328125, -2.0380859375, -1.87255859375, -1.70703125, -1.54150390625, -1.3759765625, -1.21044921875, -1.044921875, -0.87939453125, -0.7138671875, -0.54833984375, -0.3828125, -0.21728515625, -0.0517578125, 0.11376953125, 0.279296875, 0.44482421875, 0.6103515625, 0.77587890625, 0.94140625, 1.10693359375, 1.2724609375, 1.43798828125, 1.603515625, 1.76904296875, 1.9345703125, 2.10009765625, 2.265625, 2.43115234375, 2.5966796875, 2.76220703125, 2.927734375, 3.09326171875, 3.2587890625, 3.42431640625, 3.58984375, 3.75537109375, 3.9208984375, 4.08642578125, 4.251953125, 4.41748046875, 4.5830078125, 4.74853515625, 4.9140625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 6.0, 13.0, 19.0, 21.0, 47.0, 44.0, 97.0, 130.0, 199.0, 269.0, 392.0, 556.0, 905.0, 1334.0, 2121.0, 3252.0, 5131.0, 8299.0, 13392.0, 21868.0, 36958.0, 64008.0, 114200.0, 211567.0, 395823.0, 698741.0, 928098.0, 738724.0, 426639.0, 228475.0, 123953.0, 68368.0, 39149.0, 23319.0, 14027.0, 8777.0, 5388.0, 3359.0, 2238.0, 1491.0, 948.0, 656.0, 419.0, 290.0, 200.0, 140.0, 72.0, 47.0, 37.0, 24.0, 24.0, 13.0, 12.0, 4.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-6.296875, -6.0838623046875, -5.870849609375, -5.6578369140625, -5.44482421875, -5.2318115234375, -5.018798828125, -4.8057861328125, -4.5927734375, -4.3797607421875, -4.166748046875, -3.9537353515625, -3.74072265625, -3.5277099609375, -3.314697265625, -3.1016845703125, -2.888671875, -2.6756591796875, -2.462646484375, -2.2496337890625, -2.03662109375, -1.8236083984375, -1.610595703125, -1.3975830078125, -1.1845703125, -0.9715576171875, -0.758544921875, -0.5455322265625, -0.33251953125, -0.1195068359375, 0.093505859375, 0.3065185546875, 0.51953125, 0.7325439453125, 0.945556640625, 1.1585693359375, 1.37158203125, 1.5845947265625, 1.797607421875, 2.0106201171875, 2.2236328125, 2.4366455078125, 2.649658203125, 2.8626708984375, 3.07568359375, 3.2886962890625, 3.501708984375, 3.7147216796875, 3.927734375, 4.1407470703125, 4.353759765625, 4.5667724609375, 4.77978515625, 4.9927978515625, 5.205810546875, 5.4188232421875, 5.6318359375, 5.8448486328125, 6.057861328125, 6.2708740234375, 6.48388671875, 6.6968994140625, 6.909912109375, 7.1229248046875, 7.3359375]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 3.0, 2.0, 5.0, 7.0, 11.0, 8.0, 12.0, 15.0, 18.0, 28.0, 31.0, 25.0, 48.0, 47.0, 61.0, 87.0, 108.0, 131.0, 161.0, 176.0, 233.0, 258.0, 290.0, 296.0, 296.0, 293.0, 201.0, 236.0, 166.0, 148.0, 123.0, 113.0, 101.0, 78.0, 59.0, 33.0, 38.0, 25.0, 30.0, 24.0, 14.0, 9.0, 8.0, 9.0, 5.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.564453125, -2.4840087890625, -2.403564453125, -2.3231201171875, -2.24267578125, -2.1622314453125, -2.081787109375, -2.0013427734375, -1.9208984375, -1.8404541015625, -1.760009765625, -1.6795654296875, -1.59912109375, -1.5186767578125, -1.438232421875, -1.3577880859375, -1.27734375, -1.1968994140625, -1.116455078125, -1.0360107421875, -0.95556640625, -0.8751220703125, -0.794677734375, -0.7142333984375, -0.6337890625, -0.5533447265625, -0.472900390625, -0.3924560546875, -0.31201171875, -0.2315673828125, -0.151123046875, -0.0706787109375, 0.009765625, 0.0902099609375, 0.170654296875, 0.2510986328125, 0.33154296875, 0.4119873046875, 0.492431640625, 0.5728759765625, 0.6533203125, 0.7337646484375, 0.814208984375, 0.8946533203125, 0.97509765625, 1.0555419921875, 1.135986328125, 1.2164306640625, 1.296875, 1.3773193359375, 1.457763671875, 1.5382080078125, 1.61865234375, 1.6990966796875, 1.779541015625, 1.8599853515625, 1.9404296875, 2.0208740234375, 2.101318359375, 2.1817626953125, 2.26220703125, 2.3426513671875, 2.423095703125, 2.5035400390625, 2.583984375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 7.0, 7.0, 12.0, 11.0, 20.0, 23.0, 20.0, 32.0, 35.0, 49.0, 65.0, 48.0, 79.0, 72.0, 75.0, 73.0, 58.0, 52.0, 47.0, 44.0, 34.0, 29.0, 24.0, 14.0, 14.0, 7.0, 15.0, 3.0, 6.0, 6.0, 2.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.479434013366699, -7.182035446166992, -6.884636878967285, -6.587238311767578, -6.289839267730713, -5.992440700531006, -5.695042133331299, -5.397643089294434, -5.100244522094727, -4.8028459548950195, -4.5054473876953125, -4.2080488204956055, -3.9106497764587402, -3.613251209259033, -3.315852642059326, -3.01845383644104, -2.721055507659912, -2.423656940460205, -2.126258134841919, -1.828859567642212, -1.5314608812332153, -1.2340621948242188, -0.9366636276245117, -0.6392648220062256, -0.34186625480651855, -0.04446759819984436, 0.25293105840682983, 0.5503296852111816, 0.8477283716201782, 1.1451270580291748, 1.4425256252288818, 1.739924430847168, 2.037322998046875, 2.334721565246582, 2.632120370864868, 2.929518938064575, 3.2269177436828613, 3.5243163108825684, 3.8217148780822754, 4.119113922119141, 4.416512489318848, 4.713911056518555, 5.011309623718262, 5.308708190917969, 5.606107234954834, 5.903505802154541, 6.200904369354248, 6.498303413391113, 6.795701503753662, 7.093100070953369, 7.390498638153076, 7.687897682189941, 7.985296249389648, 8.282694816589355, 8.580093383789062, 8.87749195098877, 9.174890518188477, 9.472289085388184, 9.76968765258789, 10.067086219787598, 10.364484786987305, 10.661884307861328, 10.959281921386719, 11.256681442260742, 11.55408000946045]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 5.0, 5.0, 8.0, 10.0, 8.0, 11.0, 12.0, 19.0, 19.0, 23.0, 25.0, 30.0, 27.0, 27.0, 39.0, 39.0, 42.0, 35.0, 38.0, 35.0, 39.0, 35.0, 32.0, 40.0, 33.0, 37.0, 31.0, 43.0, 39.0, 24.0, 22.0, 25.0, 13.0, 21.0, 11.0, 14.0, 15.0, 10.0, 9.0, 12.0, 5.0, 4.0, 8.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0], "bins": [-5.8547821044921875, -5.6723103523254395, -5.489838600158691, -5.307366847991943, -5.124895095825195, -4.942423343658447, -4.759951591491699, -4.577480316162109, -4.395008087158203, -4.212536334991455, -4.030064582824707, -3.847592830657959, -3.665121078491211, -3.482649326324463, -3.300177812576294, -3.117706060409546, -2.935234546661377, -2.752762794494629, -2.570291042327881, -2.387819290161133, -2.2053475379943848, -2.0228757858276367, -1.8404042720794678, -1.6579325199127197, -1.4754607677459717, -1.2929890155792236, -1.1105172634124756, -0.9280456304550171, -0.745573878288269, -0.563102126121521, -0.3806304931640625, -0.19815874099731445, -0.01568746566772461, 0.16678425669670105, 0.3492559790611267, 0.53172767162323, 0.714199423789978, 0.8966711759567261, 1.0791428089141846, 1.2616145610809326, 1.4440863132476807, 1.6265580654144287, 1.8090298175811768, 1.9915014505386353, 2.1739730834960938, 2.356444835662842, 2.53891658782959, 2.721388339996338, 2.903860092163086, 3.086331844329834, 3.268803596496582, 3.45127534866333, 3.633747100830078, 3.816218852996826, 3.998690366744995, 4.181161880493164, 4.36363410949707, 4.546105861663818, 4.728577613830566, 4.9110493659973145, 5.0935211181640625, 5.2759928703308105, 5.458464622497559, 5.640935897827148, 5.8234076499938965]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 6.0, 14.0, 11.0, 20.0, 27.0, 48.0, 59.0, 106.0, 196.0, 304.0, 588.0, 956.0, 1676.0, 3083.0, 5876.0, 11240.0, 22308.0, 45656.0, 89605.0, 161325.0, 225680.0, 207241.0, 131084.0, 70094.0, 35232.0, 17351.0, 8687.0, 4442.0, 2380.0, 1402.0, 709.0, 455.0, 241.0, 170.0, 107.0, 65.0, 46.0, 23.0, 10.0, 9.0, 8.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.984375, -5.78363037109375, -5.5828857421875, -5.38214111328125, -5.181396484375, -4.98065185546875, -4.7799072265625, -4.57916259765625, -4.37841796875, -4.17767333984375, -3.9769287109375, -3.77618408203125, -3.575439453125, -3.37469482421875, -3.1739501953125, -2.97320556640625, -2.7724609375, -2.57171630859375, -2.3709716796875, -2.17022705078125, -1.969482421875, -1.76873779296875, -1.5679931640625, -1.36724853515625, -1.16650390625, -0.96575927734375, -0.7650146484375, -0.56427001953125, -0.363525390625, -0.16278076171875, 0.0379638671875, 0.23870849609375, 0.439453125, 0.64019775390625, 0.8409423828125, 1.04168701171875, 1.242431640625, 1.44317626953125, 1.6439208984375, 1.84466552734375, 2.04541015625, 2.24615478515625, 2.4468994140625, 2.64764404296875, 2.848388671875, 3.04913330078125, 3.2498779296875, 3.45062255859375, 3.6513671875, 3.85211181640625, 4.0528564453125, 4.25360107421875, 4.454345703125, 4.65509033203125, 4.8558349609375, 5.05657958984375, 5.25732421875, 5.45806884765625, 5.6588134765625, 5.85955810546875, 6.060302734375, 6.26104736328125, 6.4617919921875, 6.66253662109375, 6.86328125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 6.0, 6.0, 7.0, 9.0, 13.0, 11.0, 13.0, 20.0, 23.0, 25.0, 24.0, 35.0, 25.0, 31.0, 37.0, 36.0, 38.0, 40.0, 36.0, 33.0, 39.0, 48.0, 50.0, 38.0, 32.0, 47.0, 36.0, 20.0, 29.0, 26.0, 27.0, 20.0, 16.0, 14.0, 14.0, 12.0, 13.0, 11.0, 10.0, 5.0, 5.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-6.30859375, -6.1151123046875, -5.921630859375, -5.7281494140625, -5.53466796875, -5.3411865234375, -5.147705078125, -4.9542236328125, -4.7607421875, -4.5672607421875, -4.373779296875, -4.1802978515625, -3.98681640625, -3.7933349609375, -3.599853515625, -3.4063720703125, -3.212890625, -3.0194091796875, -2.825927734375, -2.6324462890625, -2.43896484375, -2.2454833984375, -2.052001953125, -1.8585205078125, -1.6650390625, -1.4715576171875, -1.278076171875, -1.0845947265625, -0.89111328125, -0.6976318359375, -0.504150390625, -0.3106689453125, -0.1171875, 0.0762939453125, 0.269775390625, 0.4632568359375, 0.65673828125, 0.8502197265625, 1.043701171875, 1.2371826171875, 1.4306640625, 1.6241455078125, 1.817626953125, 2.0111083984375, 2.20458984375, 2.3980712890625, 2.591552734375, 2.7850341796875, 2.978515625, 3.1719970703125, 3.365478515625, 3.5589599609375, 3.75244140625, 3.9459228515625, 4.139404296875, 4.3328857421875, 4.5263671875, 4.7198486328125, 4.913330078125, 5.1068115234375, 5.30029296875, 5.4937744140625, 5.687255859375, 5.8807373046875, 6.07421875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 2.0, 14.0, 8.0, 19.0, 20.0, 28.0, 62.0, 78.0, 114.0, 158.0, 263.0, 404.0, 638.0, 983.0, 1679.0, 2887.0, 5251.0, 9801.0, 19160.0, 38799.0, 80136.0, 159174.0, 257868.0, 224914.0, 123679.0, 60283.0, 29338.0, 14796.0, 7572.0, 4255.0, 2303.0, 1455.0, 873.0, 513.0, 316.0, 240.0, 141.0, 116.0, 75.0, 31.0, 27.0, 30.0, 17.0, 10.0, 6.0, 7.0, 8.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.515625, -6.2894287109375, -6.063232421875, -5.8370361328125, -5.61083984375, -5.3846435546875, -5.158447265625, -4.9322509765625, -4.7060546875, -4.4798583984375, -4.253662109375, -4.0274658203125, -3.80126953125, -3.5750732421875, -3.348876953125, -3.1226806640625, -2.896484375, -2.6702880859375, -2.444091796875, -2.2178955078125, -1.99169921875, -1.7655029296875, -1.539306640625, -1.3131103515625, -1.0869140625, -0.8607177734375, -0.634521484375, -0.4083251953125, -0.18212890625, 0.0440673828125, 0.270263671875, 0.4964599609375, 0.72265625, 0.9488525390625, 1.175048828125, 1.4012451171875, 1.62744140625, 1.8536376953125, 2.079833984375, 2.3060302734375, 2.5322265625, 2.7584228515625, 2.984619140625, 3.2108154296875, 3.43701171875, 3.6632080078125, 3.889404296875, 4.1156005859375, 4.341796875, 4.5679931640625, 4.794189453125, 5.0203857421875, 5.24658203125, 5.4727783203125, 5.698974609375, 5.9251708984375, 6.1513671875, 6.3775634765625, 6.603759765625, 6.8299560546875, 7.05615234375, 7.2823486328125, 7.508544921875, 7.7347412109375, 7.9609375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 7.0, 7.0, 14.0, 16.0, 10.0, 13.0, 16.0, 19.0, 23.0, 27.0, 24.0, 27.0, 28.0, 40.0, 42.0, 24.0, 42.0, 41.0, 53.0, 43.0, 28.0, 45.0, 50.0, 35.0, 37.0, 42.0, 22.0, 28.0, 26.0, 24.0, 23.0, 23.0, 15.0, 17.0, 13.0, 13.0, 9.0, 6.0, 8.0, 6.0, 4.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0], "bins": [-4.1640625, -4.0474853515625, -3.930908203125, -3.8143310546875, -3.69775390625, -3.5811767578125, -3.464599609375, -3.3480224609375, -3.2314453125, -3.1148681640625, -2.998291015625, -2.8817138671875, -2.76513671875, -2.6485595703125, -2.531982421875, -2.4154052734375, -2.298828125, -2.1822509765625, -2.065673828125, -1.9490966796875, -1.83251953125, -1.7159423828125, -1.599365234375, -1.4827880859375, -1.3662109375, -1.2496337890625, -1.133056640625, -1.0164794921875, -0.89990234375, -0.7833251953125, -0.666748046875, -0.5501708984375, -0.43359375, -0.3170166015625, -0.200439453125, -0.0838623046875, 0.03271484375, 0.1492919921875, 0.265869140625, 0.3824462890625, 0.4990234375, 0.6156005859375, 0.732177734375, 0.8487548828125, 0.96533203125, 1.0819091796875, 1.198486328125, 1.3150634765625, 1.431640625, 1.5482177734375, 1.664794921875, 1.7813720703125, 1.89794921875, 2.0145263671875, 2.131103515625, 2.2476806640625, 2.3642578125, 2.4808349609375, 2.597412109375, 2.7139892578125, 2.83056640625, 2.9471435546875, 3.063720703125, 3.1802978515625, 3.296875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 7.0, 4.0, 14.0, 14.0, 13.0, 18.0, 29.0, 43.0, 45.0, 76.0, 104.0, 124.0, 192.0, 256.0, 385.0, 626.0, 972.0, 1701.0, 2796.0, 5186.0, 10172.0, 21018.0, 47832.0, 114257.0, 266461.0, 314793.0, 147540.0, 60591.0, 26449.0, 12318.0, 6088.0, 3251.0, 1866.0, 1077.0, 677.0, 484.0, 295.0, 229.0, 153.0, 106.0, 93.0, 56.0, 35.0, 26.0, 32.0, 10.0, 12.0, 11.0, 8.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0], "bins": [-4.98046875, -4.8345947265625, -4.688720703125, -4.5428466796875, -4.39697265625, -4.2510986328125, -4.105224609375, -3.9593505859375, -3.8134765625, -3.6676025390625, -3.521728515625, -3.3758544921875, -3.22998046875, -3.0841064453125, -2.938232421875, -2.7923583984375, -2.646484375, -2.5006103515625, -2.354736328125, -2.2088623046875, -2.06298828125, -1.9171142578125, -1.771240234375, -1.6253662109375, -1.4794921875, -1.3336181640625, -1.187744140625, -1.0418701171875, -0.89599609375, -0.7501220703125, -0.604248046875, -0.4583740234375, -0.3125, -0.1666259765625, -0.020751953125, 0.1251220703125, 0.27099609375, 0.4168701171875, 0.562744140625, 0.7086181640625, 0.8544921875, 1.0003662109375, 1.146240234375, 1.2921142578125, 1.43798828125, 1.5838623046875, 1.729736328125, 1.8756103515625, 2.021484375, 2.1673583984375, 2.313232421875, 2.4591064453125, 2.60498046875, 2.7508544921875, 2.896728515625, 3.0426025390625, 3.1884765625, 3.3343505859375, 3.480224609375, 3.6260986328125, 3.77197265625, 3.9178466796875, 4.063720703125, 4.2095947265625, 4.35546875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 7.0, 11.0, 13.0, 15.0, 18.0, 22.0, 28.0, 40.0, 43.0, 66.0, 52.0, 70.0, 65.0, 80.0, 76.0, 74.0, 71.0, 51.0, 52.0, 35.0, 20.0, 20.0, 11.0, 10.0, 9.0, 8.0, 11.0, 6.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017976760864257812, -0.00017384812235832214, -0.00016792863607406616, -0.00016200914978981018, -0.0001560896635055542, -0.00015017017722129822, -0.00014425069093704224, -0.00013833120465278625, -0.00013241171836853027, -0.0001264922320842743, -0.00012057274580001831, -0.00011465325951576233, -0.00010873377323150635, -0.00010281428694725037, -9.689480066299438e-05, -9.09753143787384e-05, -8.505582809448242e-05, -7.913634181022644e-05, -7.321685552597046e-05, -6.729736924171448e-05, -6.13778829574585e-05, -5.5458396673202515e-05, -4.953891038894653e-05, -4.361942410469055e-05, -3.769993782043457e-05, -3.178045153617859e-05, -2.5860965251922607e-05, -1.9941478967666626e-05, -1.4021992683410645e-05, -8.102506399154663e-06, -2.1830201148986816e-06, 3.7364661693573e-06, 9.655952453613281e-06, 1.5575438737869263e-05, 2.1494925022125244e-05, 2.7414411306381226e-05, 3.333389759063721e-05, 3.925338387489319e-05, 4.517287015914917e-05, 5.109235644340515e-05, 5.701184272766113e-05, 6.293132901191711e-05, 6.88508152961731e-05, 7.477030158042908e-05, 8.068978786468506e-05, 8.660927414894104e-05, 9.252876043319702e-05, 9.8448246717453e-05, 0.00010436773300170898, 0.00011028721928596497, 0.00011620670557022095, 0.00012212619185447693, 0.0001280456781387329, 0.0001339651644229889, 0.00013988465070724487, 0.00014580413699150085, 0.00015172362327575684, 0.00015764310956001282, 0.0001635625958442688, 0.00016948208212852478, 0.00017540156841278076, 0.00018132105469703674, 0.00018724054098129272, 0.0001931600272655487, 0.0001990795135498047]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 6.0, 4.0, 5.0, 9.0, 14.0, 13.0, 23.0, 35.0, 59.0, 64.0, 119.0, 153.0, 246.0, 321.0, 516.0, 758.0, 1160.0, 1980.0, 3472.0, 6167.0, 11455.0, 22056.0, 44227.0, 89037.0, 165569.0, 235190.0, 209041.0, 125437.0, 63443.0, 31701.0, 16227.0, 8357.0, 4686.0, 2684.0, 1549.0, 939.0, 598.0, 392.0, 257.0, 183.0, 113.0, 87.0, 62.0, 38.0, 36.0, 20.0, 13.0, 13.0, 13.0, 7.0, 5.0, 3.0, 1.0, 4.0, 1.0], "bins": [-3.3828125, -3.285491943359375, -3.18817138671875, -3.090850830078125, -2.9935302734375, -2.896209716796875, -2.79888916015625, -2.701568603515625, -2.604248046875, -2.506927490234375, -2.40960693359375, -2.312286376953125, -2.2149658203125, -2.117645263671875, -2.02032470703125, -1.923004150390625, -1.82568359375, -1.728363037109375, -1.63104248046875, -1.533721923828125, -1.4364013671875, -1.339080810546875, -1.24176025390625, -1.144439697265625, -1.047119140625, -0.949798583984375, -0.85247802734375, -0.755157470703125, -0.6578369140625, -0.560516357421875, -0.46319580078125, -0.365875244140625, -0.2685546875, -0.171234130859375, -0.07391357421875, 0.023406982421875, 0.1207275390625, 0.218048095703125, 0.31536865234375, 0.412689208984375, 0.510009765625, 0.607330322265625, 0.70465087890625, 0.801971435546875, 0.8992919921875, 0.996612548828125, 1.09393310546875, 1.191253662109375, 1.28857421875, 1.385894775390625, 1.48321533203125, 1.580535888671875, 1.6778564453125, 1.775177001953125, 1.87249755859375, 1.969818115234375, 2.067138671875, 2.164459228515625, 2.26177978515625, 2.359100341796875, 2.4564208984375, 2.553741455078125, 2.65106201171875, 2.748382568359375, 2.845703125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 8.0, 13.0, 8.0, 10.0, 12.0, 29.0, 36.0, 30.0, 45.0, 51.0, 60.0, 72.0, 71.0, 80.0, 70.0, 59.0, 60.0, 63.0, 40.0, 39.0, 29.0, 25.0, 17.0, 11.0, 15.0, 7.0, 7.0, 7.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0888671875, -1.055572509765625, -1.02227783203125, -0.988983154296875, -0.9556884765625, -0.922393798828125, -0.88909912109375, -0.855804443359375, -0.822509765625, -0.789215087890625, -0.75592041015625, -0.722625732421875, -0.6893310546875, -0.656036376953125, -0.62274169921875, -0.589447021484375, -0.55615234375, -0.522857666015625, -0.48956298828125, -0.456268310546875, -0.4229736328125, -0.389678955078125, -0.35638427734375, -0.323089599609375, -0.289794921875, -0.256500244140625, -0.22320556640625, -0.189910888671875, -0.1566162109375, -0.123321533203125, -0.09002685546875, -0.056732177734375, -0.0234375, 0.009857177734375, 0.04315185546875, 0.076446533203125, 0.1097412109375, 0.143035888671875, 0.17633056640625, 0.209625244140625, 0.242919921875, 0.276214599609375, 0.30950927734375, 0.342803955078125, 0.3760986328125, 0.409393310546875, 0.44268798828125, 0.475982666015625, 0.50927734375, 0.542572021484375, 0.57586669921875, 0.609161376953125, 0.6424560546875, 0.675750732421875, 0.70904541015625, 0.742340087890625, 0.775634765625, 0.808929443359375, 0.84222412109375, 0.875518798828125, 0.9088134765625, 0.942108154296875, 0.97540283203125, 1.008697509765625, 1.0419921875]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 7.0, 9.0, 9.0, 11.0, 12.0, 27.0, 15.0, 22.0, 28.0, 41.0, 60.0, 58.0, 62.0, 76.0, 60.0, 62.0, 71.0, 79.0, 52.0, 47.0, 32.0, 29.0, 30.0, 21.0, 14.0, 18.0, 3.0, 10.0, 9.0, 7.0, 7.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.090021133422852, -7.80002498626709, -7.510028839111328, -7.220032215118408, -6.9300360679626465, -6.640039920806885, -6.350043296813965, -6.060047149658203, -5.770051002502441, -5.48005485534668, -5.190058708190918, -4.900062084197998, -4.610065937042236, -4.320069789886475, -4.030073165893555, -3.740077018737793, -3.4500808715820312, -3.1600847244262695, -2.8700883388519287, -2.580091953277588, -2.290095806121826, -2.0000996589660645, -1.7101032733917236, -1.4201068878173828, -1.130110740661621, -0.8401144742965698, -0.5501182079315186, -0.2601219415664673, 0.029874324798583984, 0.31987059116363525, 0.6098668575286865, 0.8998632431030273, 1.189859390258789, 1.4798556566238403, 1.7698519229888916, 2.0598483085632324, 2.349844455718994, 2.639840602874756, 2.9298369884490967, 3.2198333740234375, 3.509829521179199, 3.799825668334961, 4.089821815490723, 4.379818439483643, 4.669814586639404, 4.959810733795166, 5.249807357788086, 5.539803504943848, 5.829799652099609, 6.119795799255371, 6.409791946411133, 6.699788570404053, 6.9897847175598145, 7.279780864715576, 7.569777488708496, 7.859773635864258, 8.14976978302002, 8.439765930175781, 8.729762077331543, 9.019758224487305, 9.309755325317383, 9.599751472473145, 9.889747619628906, 10.179743766784668, 10.46973991394043]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 3.0, 7.0, 8.0, 9.0, 11.0, 12.0, 16.0, 15.0, 23.0, 31.0, 20.0, 31.0, 26.0, 26.0, 41.0, 39.0, 41.0, 39.0, 43.0, 39.0, 36.0, 28.0, 38.0, 32.0, 37.0, 32.0, 45.0, 34.0, 29.0, 30.0, 21.0, 21.0, 17.0, 14.0, 11.0, 19.0, 11.0, 9.0, 7.0, 8.0, 10.0, 2.0, 3.0, 8.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0, 2.0], "bins": [-5.845791339874268, -5.666573524475098, -5.487356185913086, -5.308138370513916, -5.128920555114746, -4.949702739715576, -4.770484924316406, -4.5912675857543945, -4.412049770355225, -4.232831954956055, -4.053614616394043, -3.874396800994873, -3.695178985595703, -3.515961170196533, -3.3367435932159424, -3.1575260162353516, -2.9783082008361816, -2.7990903854370117, -2.619872808456421, -2.44065523147583, -2.26143741607666, -2.0822196006774902, -1.9030020236968994, -1.723784327507019, -1.5445666313171387, -1.3653489351272583, -1.186131238937378, -1.0069135427474976, -0.8276958465576172, -0.6484781503677368, -0.46926045417785645, -0.2900427579879761, -0.1108255386352539, 0.06839215755462646, 0.24760985374450684, 0.4268275499343872, 0.6060452461242676, 0.785262942314148, 0.9644806385040283, 1.1436983346939087, 1.322916030883789, 1.5021337270736694, 1.6813514232635498, 1.8605691194534302, 2.0397868156433105, 2.2190046310424805, 2.3982222080230713, 2.577439785003662, 2.756657600402832, 2.935875415802002, 3.1150929927825928, 3.2943105697631836, 3.4735283851623535, 3.6527462005615234, 3.8319637775421143, 4.011181354522705, 4.190399169921875, 4.369616985321045, 4.548834800720215, 4.728052139282227, 4.9072699546813965, 5.086487770080566, 5.265705108642578, 5.444922924041748, 5.624140739440918]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 1.0, 11.0, 13.0, 21.0, 28.0, 51.0, 86.0, 98.0, 159.0, 273.0, 436.0, 746.0, 1178.0, 2075.0, 3472.0, 6050.0, 10546.0, 17882.0, 31022.0, 52922.0, 87187.0, 130490.0, 167371.0, 169675.0, 136651.0, 92931.0, 56890.0, 33397.0, 19484.0, 11200.0, 6640.0, 3878.0, 2182.0, 1368.0, 806.0, 492.0, 301.0, 214.0, 117.0, 66.0, 40.0, 37.0, 25.0, 19.0, 10.0, 5.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.0234375, -5.84130859375, -5.6591796875, -5.47705078125, -5.294921875, -5.11279296875, -4.9306640625, -4.74853515625, -4.56640625, -4.38427734375, -4.2021484375, -4.02001953125, -3.837890625, -3.65576171875, -3.4736328125, -3.29150390625, -3.109375, -2.92724609375, -2.7451171875, -2.56298828125, -2.380859375, -2.19873046875, -2.0166015625, -1.83447265625, -1.65234375, -1.47021484375, -1.2880859375, -1.10595703125, -0.923828125, -0.74169921875, -0.5595703125, -0.37744140625, -0.1953125, -0.01318359375, 0.1689453125, 0.35107421875, 0.533203125, 0.71533203125, 0.8974609375, 1.07958984375, 1.26171875, 1.44384765625, 1.6259765625, 1.80810546875, 1.990234375, 2.17236328125, 2.3544921875, 2.53662109375, 2.71875, 2.90087890625, 3.0830078125, 3.26513671875, 3.447265625, 3.62939453125, 3.8115234375, 3.99365234375, 4.17578125, 4.35791015625, 4.5400390625, 4.72216796875, 4.904296875, 5.08642578125, 5.2685546875, 5.45068359375, 5.6328125]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 6.0, 9.0, 4.0, 11.0, 11.0, 15.0, 16.0, 26.0, 25.0, 36.0, 29.0, 33.0, 40.0, 46.0, 52.0, 53.0, 50.0, 51.0, 46.0, 40.0, 56.0, 36.0, 37.0, 39.0, 39.0, 31.0, 27.0, 20.0, 26.0, 15.0, 14.0, 16.0, 9.0, 12.0, 7.0, 5.0, 1.0, 3.0, 6.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 2.0], "bins": [-8.1015625, -7.87701416015625, -7.6524658203125, -7.42791748046875, -7.203369140625, -6.97882080078125, -6.7542724609375, -6.52972412109375, -6.30517578125, -6.08062744140625, -5.8560791015625, -5.63153076171875, -5.406982421875, -5.18243408203125, -4.9578857421875, -4.73333740234375, -4.5087890625, -4.28424072265625, -4.0596923828125, -3.83514404296875, -3.610595703125, -3.38604736328125, -3.1614990234375, -2.93695068359375, -2.71240234375, -2.48785400390625, -2.2633056640625, -2.03875732421875, -1.814208984375, -1.58966064453125, -1.3651123046875, -1.14056396484375, -0.916015625, -0.69146728515625, -0.4669189453125, -0.24237060546875, -0.017822265625, 0.20672607421875, 0.4312744140625, 0.65582275390625, 0.88037109375, 1.10491943359375, 1.3294677734375, 1.55401611328125, 1.778564453125, 2.00311279296875, 2.2276611328125, 2.45220947265625, 2.6767578125, 2.90130615234375, 3.1258544921875, 3.35040283203125, 3.574951171875, 3.79949951171875, 4.0240478515625, 4.24859619140625, 4.47314453125, 4.69769287109375, 4.9222412109375, 5.14678955078125, 5.371337890625, 5.59588623046875, 5.8204345703125, 6.04498291015625, 6.26953125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 2.0, 6.0, 5.0, 17.0, 10.0, 22.0, 33.0, 45.0, 64.0, 85.0, 141.0, 185.0, 243.0, 409.0, 560.0, 867.0, 1373.0, 2004.0, 3197.0, 5038.0, 8207.0, 12791.0, 21069.0, 33839.0, 54867.0, 84779.0, 122928.0, 153863.0, 156992.0, 130744.0, 92869.0, 60677.0, 38071.0, 23524.0, 14474.0, 8930.0, 5399.0, 3549.0, 2214.0, 1448.0, 980.0, 594.0, 461.0, 312.0, 178.0, 146.0, 92.0, 79.0, 51.0, 32.0, 28.0, 22.0, 18.0, 11.0, 9.0, 5.0, 3.0, 2.0, 1.0, 2.0], "bins": [-5.05859375, -4.90106201171875, -4.7435302734375, -4.58599853515625, -4.428466796875, -4.27093505859375, -4.1134033203125, -3.95587158203125, -3.79833984375, -3.64080810546875, -3.4832763671875, -3.32574462890625, -3.168212890625, -3.01068115234375, -2.8531494140625, -2.69561767578125, -2.5380859375, -2.38055419921875, -2.2230224609375, -2.06549072265625, -1.907958984375, -1.75042724609375, -1.5928955078125, -1.43536376953125, -1.27783203125, -1.12030029296875, -0.9627685546875, -0.80523681640625, -0.647705078125, -0.49017333984375, -0.3326416015625, -0.17510986328125, -0.017578125, 0.13995361328125, 0.2974853515625, 0.45501708984375, 0.612548828125, 0.77008056640625, 0.9276123046875, 1.08514404296875, 1.24267578125, 1.40020751953125, 1.5577392578125, 1.71527099609375, 1.872802734375, 2.03033447265625, 2.1878662109375, 2.34539794921875, 2.5029296875, 2.66046142578125, 2.8179931640625, 2.97552490234375, 3.133056640625, 3.29058837890625, 3.4481201171875, 3.60565185546875, 3.76318359375, 3.92071533203125, 4.0782470703125, 4.23577880859375, 4.393310546875, 4.55084228515625, 4.7083740234375, 4.86590576171875, 5.0234375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 5.0, 9.0, 7.0, 6.0, 14.0, 11.0, 12.0, 13.0, 12.0, 25.0, 26.0, 22.0, 28.0, 32.0, 32.0, 33.0, 28.0, 30.0, 35.0, 45.0, 43.0, 31.0, 35.0, 39.0, 44.0, 29.0, 29.0, 38.0, 35.0, 29.0, 27.0, 27.0, 27.0, 22.0, 20.0, 20.0, 14.0, 14.0, 7.0, 9.0, 7.0, 5.0, 10.0, 4.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.240234375, -3.129302978515625, -3.01837158203125, -2.907440185546875, -2.7965087890625, -2.685577392578125, -2.57464599609375, -2.463714599609375, -2.352783203125, -2.241851806640625, -2.13092041015625, -2.019989013671875, -1.9090576171875, -1.798126220703125, -1.68719482421875, -1.576263427734375, -1.46533203125, -1.354400634765625, -1.24346923828125, -1.132537841796875, -1.0216064453125, -0.910675048828125, -0.79974365234375, -0.688812255859375, -0.577880859375, -0.466949462890625, -0.35601806640625, -0.245086669921875, -0.1341552734375, -0.023223876953125, 0.08770751953125, 0.198638916015625, 0.3095703125, 0.420501708984375, 0.53143310546875, 0.642364501953125, 0.7532958984375, 0.864227294921875, 0.97515869140625, 1.086090087890625, 1.197021484375, 1.307952880859375, 1.41888427734375, 1.529815673828125, 1.6407470703125, 1.751678466796875, 1.86260986328125, 1.973541259765625, 2.08447265625, 2.195404052734375, 2.30633544921875, 2.417266845703125, 2.5281982421875, 2.639129638671875, 2.75006103515625, 2.860992431640625, 2.971923828125, 3.082855224609375, 3.19378662109375, 3.304718017578125, 3.4156494140625, 3.526580810546875, 3.63751220703125, 3.748443603515625, 3.859375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 7.0, 7.0, 10.0, 12.0, 22.0, 29.0, 63.0, 76.0, 118.0, 192.0, 244.0, 338.0, 608.0, 829.0, 1395.0, 2188.0, 3496.0, 5842.0, 10267.0, 18981.0, 36425.0, 71389.0, 135845.0, 215448.0, 225095.0, 149906.0, 79882.0, 40471.0, 21196.0, 11313.0, 6433.0, 3890.0, 2313.0, 1473.0, 929.0, 576.0, 407.0, 290.0, 191.0, 118.0, 85.0, 55.0, 43.0, 22.0, 17.0, 10.0, 10.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.37109375, -4.23046875, -4.08984375, -3.94921875, -3.80859375, -3.66796875, -3.52734375, -3.38671875, -3.24609375, -3.10546875, -2.96484375, -2.82421875, -2.68359375, -2.54296875, -2.40234375, -2.26171875, -2.12109375, -1.98046875, -1.83984375, -1.69921875, -1.55859375, -1.41796875, -1.27734375, -1.13671875, -0.99609375, -0.85546875, -0.71484375, -0.57421875, -0.43359375, -0.29296875, -0.15234375, -0.01171875, 0.12890625, 0.26953125, 0.41015625, 0.55078125, 0.69140625, 0.83203125, 0.97265625, 1.11328125, 1.25390625, 1.39453125, 1.53515625, 1.67578125, 1.81640625, 1.95703125, 2.09765625, 2.23828125, 2.37890625, 2.51953125, 2.66015625, 2.80078125, 2.94140625, 3.08203125, 3.22265625, 3.36328125, 3.50390625, 3.64453125, 3.78515625, 3.92578125, 4.06640625, 4.20703125, 4.34765625, 4.48828125, 4.62890625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 1.0, 6.0, 7.0, 12.0, 10.0, 11.0, 16.0, 20.0, 19.0, 28.0, 49.0, 47.0, 45.0, 60.0, 66.0, 75.0, 84.0, 82.0, 69.0, 54.0, 49.0, 47.0, 41.0, 25.0, 15.0, 14.0, 10.0, 12.0, 8.0, 5.0, 7.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003941059112548828, -0.00038155168294906616, -0.0003689974546432495, -0.00035644322633743286, -0.0003438889980316162, -0.00033133476972579956, -0.0003187805414199829, -0.00030622631311416626, -0.0002936720848083496, -0.00028111785650253296, -0.0002685636281967163, -0.00025600939989089966, -0.000243455171585083, -0.00023090094327926636, -0.0002183467149734497, -0.00020579248666763306, -0.0001932382583618164, -0.00018068403005599976, -0.0001681298017501831, -0.00015557557344436646, -0.0001430213451385498, -0.00013046711683273315, -0.0001179128885269165, -0.00010535866022109985, -9.28044319152832e-05, -8.025020360946655e-05, -6.76959753036499e-05, -5.514174699783325e-05, -4.25875186920166e-05, -3.003329038619995e-05, -1.74790620803833e-05, -4.92483377456665e-06, 7.62939453125e-06, 2.018362283706665e-05, 3.27378511428833e-05, 4.529207944869995e-05, 5.78463077545166e-05, 7.040053606033325e-05, 8.29547643661499e-05, 9.550899267196655e-05, 0.0001080632209777832, 0.00012061744928359985, 0.0001331716775894165, 0.00014572590589523315, 0.0001582801342010498, 0.00017083436250686646, 0.0001833885908126831, 0.00019594281911849976, 0.0002084970474243164, 0.00022105127573013306, 0.0002336055040359497, 0.00024615973234176636, 0.000258713960647583, 0.00027126818895339966, 0.0002838224172592163, 0.00029637664556503296, 0.0003089308738708496, 0.00032148510217666626, 0.0003340393304824829, 0.00034659355878829956, 0.0003591477870941162, 0.00037170201539993286, 0.0003842562437057495, 0.00039681047201156616, 0.0004093647003173828]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 5.0, 7.0, 10.0, 19.0, 37.0, 48.0, 77.0, 117.0, 165.0, 180.0, 289.0, 446.0, 612.0, 980.0, 1443.0, 2305.0, 3448.0, 5500.0, 8800.0, 14409.0, 24316.0, 40800.0, 68997.0, 111942.0, 162570.0, 183932.0, 154360.0, 103907.0, 63001.0, 37474.0, 22131.0, 13499.0, 8101.0, 5097.0, 3323.0, 2106.0, 1330.0, 907.0, 556.0, 415.0, 286.0, 186.0, 143.0, 94.0, 58.0, 37.0, 34.0, 21.0, 12.0, 10.0, 8.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.2578125, -3.15411376953125, -3.0504150390625, -2.94671630859375, -2.843017578125, -2.73931884765625, -2.6356201171875, -2.53192138671875, -2.42822265625, -2.32452392578125, -2.2208251953125, -2.11712646484375, -2.013427734375, -1.90972900390625, -1.8060302734375, -1.70233154296875, -1.5986328125, -1.49493408203125, -1.3912353515625, -1.28753662109375, -1.183837890625, -1.08013916015625, -0.9764404296875, -0.87274169921875, -0.76904296875, -0.66534423828125, -0.5616455078125, -0.45794677734375, -0.354248046875, -0.25054931640625, -0.1468505859375, -0.04315185546875, 0.060546875, 0.16424560546875, 0.2679443359375, 0.37164306640625, 0.475341796875, 0.57904052734375, 0.6827392578125, 0.78643798828125, 0.89013671875, 0.99383544921875, 1.0975341796875, 1.20123291015625, 1.304931640625, 1.40863037109375, 1.5123291015625, 1.61602783203125, 1.7197265625, 1.82342529296875, 1.9271240234375, 2.03082275390625, 2.134521484375, 2.23822021484375, 2.3419189453125, 2.44561767578125, 2.54931640625, 2.65301513671875, 2.7567138671875, 2.86041259765625, 2.964111328125, 3.06781005859375, 3.1715087890625, 3.27520751953125, 3.37890625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 6.0, 8.0, 18.0, 26.0, 26.0, 35.0, 37.0, 43.0, 46.0, 46.0, 62.0, 53.0, 51.0, 58.0, 59.0, 59.0, 70.0, 47.0, 57.0, 32.0, 26.0, 23.0, 34.0, 18.0, 11.0, 10.0, 3.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.42578125, -1.3802490234375, -1.334716796875, -1.2891845703125, -1.24365234375, -1.1981201171875, -1.152587890625, -1.1070556640625, -1.0615234375, -1.0159912109375, -0.970458984375, -0.9249267578125, -0.87939453125, -0.8338623046875, -0.788330078125, -0.7427978515625, -0.697265625, -0.6517333984375, -0.606201171875, -0.5606689453125, -0.51513671875, -0.4696044921875, -0.424072265625, -0.3785400390625, -0.3330078125, -0.2874755859375, -0.241943359375, -0.1964111328125, -0.15087890625, -0.1053466796875, -0.059814453125, -0.0142822265625, 0.03125, 0.0767822265625, 0.122314453125, 0.1678466796875, 0.21337890625, 0.2589111328125, 0.304443359375, 0.3499755859375, 0.3955078125, 0.4410400390625, 0.486572265625, 0.5321044921875, 0.57763671875, 0.6231689453125, 0.668701171875, 0.7142333984375, 0.759765625, 0.8052978515625, 0.850830078125, 0.8963623046875, 0.94189453125, 0.9874267578125, 1.032958984375, 1.0784912109375, 1.1240234375, 1.1695556640625, 1.215087890625, 1.2606201171875, 1.30615234375, 1.3516845703125, 1.397216796875, 1.4427490234375, 1.48828125]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 8.0, 5.0, 11.0, 15.0, 15.0, 19.0, 18.0, 37.0, 31.0, 46.0, 64.0, 71.0, 76.0, 76.0, 72.0, 77.0, 60.0, 66.0, 53.0, 31.0, 36.0, 24.0, 31.0, 13.0, 10.0, 6.0, 12.0, 9.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.653032302856445, -8.334821701049805, -8.016611099243164, -7.698400497436523, -7.380189895629883, -7.061979293823242, -6.74376916885376, -6.425558567047119, -6.1073479652404785, -5.789137363433838, -5.470926761627197, -5.152716159820557, -4.834506034851074, -4.516295433044434, -4.198084831237793, -3.8798742294311523, -3.5616636276245117, -3.243453025817871, -2.9252424240112305, -2.607032060623169, -2.2888214588165283, -1.9706108570098877, -1.6524003744125366, -1.3341898918151855, -1.015979290008545, -0.6977687478065491, -0.3795582056045532, -0.06134766340255737, 0.2568628787994385, 0.5750734806060791, 0.8932839632034302, 1.2114944458007812, 1.5297060012817383, 1.847916603088379, 2.1661272048950195, 2.484337568283081, 2.8025481700897217, 3.1207587718963623, 3.438969135284424, 3.7571797370910645, 4.075390338897705, 4.393600940704346, 4.711811542510986, 5.030022144317627, 5.348232269287109, 5.66644287109375, 5.984653472900391, 6.302864074707031, 6.621074676513672, 6.9392852783203125, 7.257495880126953, 7.575706481933594, 7.893917083740234, 8.212127685546875, 8.530338287353516, 8.848548889160156, 9.166759490966797, 9.484970092773438, 9.803180694580078, 10.121391296386719, 10.43960189819336, 10.7578125, 11.07602310180664, 11.394233703613281, 11.712443351745605]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 9.0, 8.0, 8.0, 13.0, 17.0, 12.0, 25.0, 18.0, 27.0, 23.0, 23.0, 29.0, 37.0, 40.0, 30.0, 30.0, 44.0, 39.0, 48.0, 41.0, 30.0, 38.0, 35.0, 36.0, 41.0, 50.0, 29.0, 33.0, 28.0, 20.0, 19.0, 24.0, 15.0, 9.0, 12.0, 13.0, 14.0, 6.0, 6.0, 7.0, 3.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.179008960723877, -5.988417148590088, -5.797824859619141, -5.607233047485352, -5.4166412353515625, -5.226048946380615, -5.035457134246826, -4.844864845275879, -4.65427303314209, -4.463681221008301, -4.2730889320373535, -4.0824971199035645, -3.8919050693511963, -3.701313018798828, -3.510721206665039, -3.320129156112671, -3.1295371055603027, -2.9389450550079346, -2.7483530044555664, -2.5577611923217773, -2.367169141769409, -2.176577091217041, -1.9859851598739624, -1.7953932285308838, -1.6048011779785156, -1.4142091274261475, -1.2236171960830688, -1.0330252647399902, -0.8424332141876221, -0.6518412232398987, -0.4612492322921753, -0.2706573009490967, -0.08006477355957031, 0.11052721738815308, 0.30111920833587646, 0.49171119928359985, 0.6823031902313232, 0.8728951811790466, 1.06348717212677, 1.2540791034698486, 1.4446711540222168, 1.635263204574585, 1.8258551359176636, 2.016447067260742, 2.2070391178131104, 2.3976311683654785, 2.5882229804992676, 2.7788150310516357, 2.969407081604004, 3.159999132156372, 3.3505911827087402, 3.5411829948425293, 3.7317750453948975, 3.9223670959472656, 4.112958908081055, 4.303550720214844, 4.494143009185791, 4.68473482131958, 4.875327110290527, 5.065918922424316, 5.2565107345581055, 5.447103023529053, 5.637694835662842, 5.828287124633789, 6.018878936767578]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 5.0, 3.0, 11.0, 10.0, 11.0, 16.0, 23.0, 41.0, 48.0, 50.0, 99.0, 131.0, 191.0, 287.0, 398.0, 552.0, 871.0, 1292.0, 1966.0, 2912.0, 4685.0, 7397.0, 12123.0, 21308.0, 37995.0, 75213.0, 163150.0, 387008.0, 834973.0, 1149320.0, 805344.0, 366738.0, 156895.0, 72823.0, 37631.0, 20732.0, 11879.0, 7295.0, 4402.0, 2884.0, 1797.0, 1214.0, 838.0, 558.0, 360.0, 252.0, 190.0, 126.0, 76.0, 60.0, 41.0, 18.0, 17.0, 11.0, 9.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0], "bins": [-7.140625, -6.92071533203125, -6.7008056640625, -6.48089599609375, -6.260986328125, -6.04107666015625, -5.8211669921875, -5.60125732421875, -5.38134765625, -5.16143798828125, -4.9415283203125, -4.72161865234375, -4.501708984375, -4.28179931640625, -4.0618896484375, -3.84197998046875, -3.6220703125, -3.40216064453125, -3.1822509765625, -2.96234130859375, -2.742431640625, -2.52252197265625, -2.3026123046875, -2.08270263671875, -1.86279296875, -1.64288330078125, -1.4229736328125, -1.20306396484375, -0.983154296875, -0.76324462890625, -0.5433349609375, -0.32342529296875, -0.103515625, 0.11639404296875, 0.3363037109375, 0.55621337890625, 0.776123046875, 0.99603271484375, 1.2159423828125, 1.43585205078125, 1.65576171875, 1.87567138671875, 2.0955810546875, 2.31549072265625, 2.535400390625, 2.75531005859375, 2.9752197265625, 3.19512939453125, 3.4150390625, 3.63494873046875, 3.8548583984375, 4.07476806640625, 4.294677734375, 4.51458740234375, 4.7344970703125, 4.95440673828125, 5.17431640625, 5.39422607421875, 5.6141357421875, 5.83404541015625, 6.053955078125, 6.27386474609375, 6.4937744140625, 6.71368408203125, 6.93359375]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 8.0, 3.0, 10.0, 14.0, 16.0, 12.0, 14.0, 21.0, 19.0, 27.0, 34.0, 28.0, 41.0, 36.0, 41.0, 35.0, 50.0, 50.0, 54.0, 50.0, 34.0, 36.0, 38.0, 41.0, 40.0, 28.0, 36.0, 25.0, 22.0, 27.0, 21.0, 15.0, 8.0, 15.0, 12.0, 7.0, 13.0, 6.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.65625, -4.5142822265625, -4.372314453125, -4.2303466796875, -4.08837890625, -3.9464111328125, -3.804443359375, -3.6624755859375, -3.5205078125, -3.3785400390625, -3.236572265625, -3.0946044921875, -2.95263671875, -2.8106689453125, -2.668701171875, -2.5267333984375, -2.384765625, -2.2427978515625, -2.100830078125, -1.9588623046875, -1.81689453125, -1.6749267578125, -1.532958984375, -1.3909912109375, -1.2490234375, -1.1070556640625, -0.965087890625, -0.8231201171875, -0.68115234375, -0.5391845703125, -0.397216796875, -0.2552490234375, -0.11328125, 0.0286865234375, 0.170654296875, 0.3126220703125, 0.45458984375, 0.5965576171875, 0.738525390625, 0.8804931640625, 1.0224609375, 1.1644287109375, 1.306396484375, 1.4483642578125, 1.59033203125, 1.7322998046875, 1.874267578125, 2.0162353515625, 2.158203125, 2.3001708984375, 2.442138671875, 2.5841064453125, 2.72607421875, 2.8680419921875, 3.010009765625, 3.1519775390625, 3.2939453125, 3.4359130859375, 3.577880859375, 3.7198486328125, 3.86181640625, 4.0037841796875, 4.145751953125, 4.2877197265625, 4.4296875]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 5.0, 0.0, 4.0, 9.0, 8.0, 14.0, 12.0, 22.0, 24.0, 36.0, 69.0, 85.0, 153.0, 204.0, 301.0, 404.0, 616.0, 940.0, 1451.0, 2264.0, 3438.0, 5376.0, 8986.0, 15345.0, 26337.0, 48166.0, 89287.0, 177177.0, 368219.0, 752002.0, 1106528.0, 791674.0, 392154.0, 188155.0, 94624.0, 50298.0, 28037.0, 16159.0, 9528.0, 5723.0, 3655.0, 2305.0, 1526.0, 954.0, 657.0, 438.0, 292.0, 195.0, 139.0, 79.0, 54.0, 50.0, 38.0, 28.0, 19.0, 11.0, 9.0, 7.0, 7.0, 1.0, 2.0, 0.0, 2.0], "bins": [-7.0078125, -6.78564453125, -6.5634765625, -6.34130859375, -6.119140625, -5.89697265625, -5.6748046875, -5.45263671875, -5.23046875, -5.00830078125, -4.7861328125, -4.56396484375, -4.341796875, -4.11962890625, -3.8974609375, -3.67529296875, -3.453125, -3.23095703125, -3.0087890625, -2.78662109375, -2.564453125, -2.34228515625, -2.1201171875, -1.89794921875, -1.67578125, -1.45361328125, -1.2314453125, -1.00927734375, -0.787109375, -0.56494140625, -0.3427734375, -0.12060546875, 0.1015625, 0.32373046875, 0.5458984375, 0.76806640625, 0.990234375, 1.21240234375, 1.4345703125, 1.65673828125, 1.87890625, 2.10107421875, 2.3232421875, 2.54541015625, 2.767578125, 2.98974609375, 3.2119140625, 3.43408203125, 3.65625, 3.87841796875, 4.1005859375, 4.32275390625, 4.544921875, 4.76708984375, 4.9892578125, 5.21142578125, 5.43359375, 5.65576171875, 5.8779296875, 6.10009765625, 6.322265625, 6.54443359375, 6.7666015625, 6.98876953125, 7.2109375]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 6.0, 5.0, 6.0, 9.0, 13.0, 18.0, 24.0, 28.0, 31.0, 38.0, 37.0, 79.0, 104.0, 130.0, 146.0, 206.0, 218.0, 273.0, 322.0, 358.0, 346.0, 308.0, 294.0, 220.0, 189.0, 145.0, 128.0, 90.0, 69.0, 54.0, 50.0, 31.0, 21.0, 21.0, 24.0, 10.0, 9.0, 7.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-3.166015625, -3.082489013671875, -2.99896240234375, -2.915435791015625, -2.8319091796875, -2.748382568359375, -2.66485595703125, -2.581329345703125, -2.497802734375, -2.414276123046875, -2.33074951171875, -2.247222900390625, -2.1636962890625, -2.080169677734375, -1.99664306640625, -1.913116455078125, -1.82958984375, -1.746063232421875, -1.66253662109375, -1.579010009765625, -1.4954833984375, -1.411956787109375, -1.32843017578125, -1.244903564453125, -1.161376953125, -1.077850341796875, -0.99432373046875, -0.910797119140625, -0.8272705078125, -0.743743896484375, -0.66021728515625, -0.576690673828125, -0.4931640625, -0.409637451171875, -0.32611083984375, -0.242584228515625, -0.1590576171875, -0.075531005859375, 0.00799560546875, 0.091522216796875, 0.175048828125, 0.258575439453125, 0.34210205078125, 0.425628662109375, 0.5091552734375, 0.592681884765625, 0.67620849609375, 0.759735107421875, 0.84326171875, 0.926788330078125, 1.01031494140625, 1.093841552734375, 1.1773681640625, 1.260894775390625, 1.34442138671875, 1.427947998046875, 1.511474609375, 1.595001220703125, 1.67852783203125, 1.762054443359375, 1.8455810546875, 1.929107666015625, 2.01263427734375, 2.096160888671875, 2.1796875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 5.0, 5.0, 13.0, 7.0, 24.0, 29.0, 43.0, 63.0, 52.0, 94.0, 83.0, 101.0, 81.0, 97.0, 63.0, 53.0, 48.0, 37.0, 26.0, 12.0, 15.0, 16.0, 11.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.35332202911377, -10.997031211853027, -10.640740394592285, -10.28445053100586, -9.928159713745117, -9.571868896484375, -9.215578079223633, -8.85928726196289, -8.502996444702148, -8.146705627441406, -7.790415287017822, -7.43412446975708, -7.077833652496338, -6.721543312072754, -6.365252494812012, -6.0089616775512695, -5.6526713371276855, -5.296380519866943, -4.940090179443359, -4.583799362182617, -4.227508544921875, -3.871217966079712, -3.514927387237549, -3.1586365699768066, -2.8023459911346436, -2.4460554122924805, -2.0897645950317383, -1.7334740161895752, -1.3771833181381226, -1.02089262008667, -0.6646020412445068, -0.30831122398376465, 0.04797935485839844, 0.4042700231075287, 0.7605606913566589, 1.1168513298034668, 1.4731420278549194, 1.829432725906372, 2.185723304748535, 2.5420141220092773, 2.8983047008514404, 3.2545952796936035, 3.6108860969543457, 3.967176675796509, 4.323467254638672, 4.679758071899414, 5.036048889160156, 5.392339706420898, 5.748630046844482, 6.104920864105225, 6.461211204528809, 6.817502021789551, 7.173792839050293, 7.530083656311035, 7.886373996734619, 8.242664337158203, 8.598955154418945, 8.955245971679688, 9.31153678894043, 9.667827606201172, 10.024117469787598, 10.38040828704834, 10.736699104309082, 11.092989921569824, 11.449280738830566]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 10.0, 7.0, 15.0, 14.0, 14.0, 13.0, 18.0, 25.0, 17.0, 27.0, 28.0, 23.0, 24.0, 33.0, 39.0, 36.0, 38.0, 40.0, 42.0, 40.0, 45.0, 46.0, 31.0, 37.0, 44.0, 36.0, 34.0, 19.0, 22.0, 30.0, 23.0, 13.0, 19.0, 17.0, 16.0, 13.0, 15.0, 6.0, 11.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.965344429016113, -4.798496246337891, -4.631648063659668, -4.464799880981445, -4.297951698303223, -4.131103992462158, -3.9642558097839355, -3.797407627105713, -3.6305594444274902, -3.4637112617492676, -3.296863079071045, -3.1300151348114014, -2.9631669521331787, -2.796318769454956, -2.6294708251953125, -2.46262264251709, -2.295774459838867, -2.1289262771606445, -1.9620782136917114, -1.7952301502227783, -1.6283819675445557, -1.461533784866333, -1.2946857213974, -1.1278376579284668, -0.9609894752502441, -0.7941413521766663, -0.6272932291030884, -0.4604451060295105, -0.2935969829559326, -0.12674885988235474, 0.040099263191223145, 0.20694732666015625, 0.3737959861755371, 0.540644109249115, 0.7074922323226929, 0.8743403553962708, 1.0411884784698486, 1.2080366611480713, 1.3748847246170044, 1.5417327880859375, 1.7085809707641602, 1.8754291534423828, 2.0422773361206055, 2.209125280380249, 2.3759734630584717, 2.5428216457366943, 2.709669589996338, 2.8765177726745605, 3.043365955352783, 3.210214138031006, 3.3770623207092285, 3.543910264968872, 3.7107584476470947, 3.8776066303253174, 4.044454574584961, 4.211302757263184, 4.378150939941406, 4.544999122619629, 4.711847305297852, 4.878695487976074, 5.045543670654297, 5.212391376495361, 5.379239559173584, 5.546087741851807, 5.712935924530029]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 11.0, 7.0, 9.0, 26.0, 34.0, 41.0, 59.0, 98.0, 153.0, 262.0, 414.0, 738.0, 1435.0, 2678.0, 5398.0, 11237.0, 24063.0, 52833.0, 112758.0, 211222.0, 264683.0, 185031.0, 93333.0, 43034.0, 19975.0, 9438.0, 4558.0, 2245.0, 1165.0, 635.0, 347.0, 236.0, 120.0, 93.0, 59.0, 45.0, 21.0, 11.0, 16.0, 10.0, 10.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.55859375, -5.35552978515625, -5.1524658203125, -4.94940185546875, -4.746337890625, -4.54327392578125, -4.3402099609375, -4.13714599609375, -3.93408203125, -3.73101806640625, -3.5279541015625, -3.32489013671875, -3.121826171875, -2.91876220703125, -2.7156982421875, -2.51263427734375, -2.3095703125, -2.10650634765625, -1.9034423828125, -1.70037841796875, -1.497314453125, -1.29425048828125, -1.0911865234375, -0.88812255859375, -0.68505859375, -0.48199462890625, -0.2789306640625, -0.07586669921875, 0.127197265625, 0.33026123046875, 0.5333251953125, 0.73638916015625, 0.939453125, 1.14251708984375, 1.3455810546875, 1.54864501953125, 1.751708984375, 1.95477294921875, 2.1578369140625, 2.36090087890625, 2.56396484375, 2.76702880859375, 2.9700927734375, 3.17315673828125, 3.376220703125, 3.57928466796875, 3.7823486328125, 3.98541259765625, 4.1884765625, 4.39154052734375, 4.5946044921875, 4.79766845703125, 5.000732421875, 5.20379638671875, 5.4068603515625, 5.60992431640625, 5.81298828125, 6.01605224609375, 6.2191162109375, 6.42218017578125, 6.625244140625, 6.82830810546875, 7.0313720703125, 7.23443603515625, 7.4375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 6.0, 8.0, 7.0, 11.0, 9.0, 17.0, 18.0, 26.0, 25.0, 31.0, 18.0, 16.0, 35.0, 31.0, 37.0, 30.0, 46.0, 36.0, 34.0, 36.0, 51.0, 44.0, 39.0, 46.0, 36.0, 41.0, 40.0, 18.0, 24.0, 34.0, 16.0, 17.0, 22.0, 14.0, 17.0, 18.0, 4.0, 4.0, 7.0, 9.0, 6.0, 1.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.16796875, -4.99029541015625, -4.8126220703125, -4.63494873046875, -4.457275390625, -4.27960205078125, -4.1019287109375, -3.92425537109375, -3.74658203125, -3.56890869140625, -3.3912353515625, -3.21356201171875, -3.035888671875, -2.85821533203125, -2.6805419921875, -2.50286865234375, -2.3251953125, -2.14752197265625, -1.9698486328125, -1.79217529296875, -1.614501953125, -1.43682861328125, -1.2591552734375, -1.08148193359375, -0.90380859375, -0.72613525390625, -0.5484619140625, -0.37078857421875, -0.193115234375, -0.01544189453125, 0.1622314453125, 0.33990478515625, 0.517578125, 0.69525146484375, 0.8729248046875, 1.05059814453125, 1.228271484375, 1.40594482421875, 1.5836181640625, 1.76129150390625, 1.93896484375, 2.11663818359375, 2.2943115234375, 2.47198486328125, 2.649658203125, 2.82733154296875, 3.0050048828125, 3.18267822265625, 3.3603515625, 3.53802490234375, 3.7156982421875, 3.89337158203125, 4.071044921875, 4.24871826171875, 4.4263916015625, 4.60406494140625, 4.78173828125, 4.95941162109375, 5.1370849609375, 5.31475830078125, 5.492431640625, 5.67010498046875, 5.8477783203125, 6.02545166015625, 6.203125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 12.0, 13.0, 14.0, 23.0, 36.0, 44.0, 55.0, 69.0, 94.0, 121.0, 162.0, 234.0, 354.0, 458.0, 843.0, 1207.0, 1883.0, 3030.0, 5213.0, 9305.0, 16645.0, 31907.0, 62399.0, 122016.0, 211682.0, 242193.0, 159300.0, 84444.0, 43070.0, 22223.0, 11963.0, 6869.0, 3791.0, 2382.0, 1495.0, 927.0, 624.0, 431.0, 295.0, 207.0, 124.0, 116.0, 70.0, 40.0, 45.0, 33.0, 25.0, 18.0, 20.0, 11.0, 7.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0], "bins": [-6.28125, -6.0863037109375, -5.891357421875, -5.6964111328125, -5.50146484375, -5.3065185546875, -5.111572265625, -4.9166259765625, -4.7216796875, -4.5267333984375, -4.331787109375, -4.1368408203125, -3.94189453125, -3.7469482421875, -3.552001953125, -3.3570556640625, -3.162109375, -2.9671630859375, -2.772216796875, -2.5772705078125, -2.38232421875, -2.1873779296875, -1.992431640625, -1.7974853515625, -1.6025390625, -1.4075927734375, -1.212646484375, -1.0177001953125, -0.82275390625, -0.6278076171875, -0.432861328125, -0.2379150390625, -0.04296875, 0.1519775390625, 0.346923828125, 0.5418701171875, 0.73681640625, 0.9317626953125, 1.126708984375, 1.3216552734375, 1.5166015625, 1.7115478515625, 1.906494140625, 2.1014404296875, 2.29638671875, 2.4913330078125, 2.686279296875, 2.8812255859375, 3.076171875, 3.2711181640625, 3.466064453125, 3.6610107421875, 3.85595703125, 4.0509033203125, 4.245849609375, 4.4407958984375, 4.6357421875, 4.8306884765625, 5.025634765625, 5.2205810546875, 5.41552734375, 5.6104736328125, 5.805419921875, 6.0003662109375, 6.1953125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 3.0, 5.0, 1.0, 8.0, 15.0, 3.0, 13.0, 19.0, 16.0, 13.0, 25.0, 25.0, 27.0, 36.0, 24.0, 27.0, 42.0, 45.0, 44.0, 47.0, 31.0, 38.0, 45.0, 28.0, 25.0, 38.0, 48.0, 31.0, 29.0, 38.0, 25.0, 18.0, 27.0, 31.0, 25.0, 18.0, 8.0, 13.0, 10.0, 13.0, 5.0, 3.0, 5.0, 5.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.37109375, -3.26348876953125, -3.1558837890625, -3.04827880859375, -2.940673828125, -2.83306884765625, -2.7254638671875, -2.61785888671875, -2.51025390625, -2.40264892578125, -2.2950439453125, -2.18743896484375, -2.079833984375, -1.97222900390625, -1.8646240234375, -1.75701904296875, -1.6494140625, -1.54180908203125, -1.4342041015625, -1.32659912109375, -1.218994140625, -1.11138916015625, -1.0037841796875, -0.89617919921875, -0.78857421875, -0.68096923828125, -0.5733642578125, -0.46575927734375, -0.358154296875, -0.25054931640625, -0.1429443359375, -0.03533935546875, 0.072265625, 0.17987060546875, 0.2874755859375, 0.39508056640625, 0.502685546875, 0.61029052734375, 0.7178955078125, 0.82550048828125, 0.93310546875, 1.04071044921875, 1.1483154296875, 1.25592041015625, 1.363525390625, 1.47113037109375, 1.5787353515625, 1.68634033203125, 1.7939453125, 1.90155029296875, 2.0091552734375, 2.11676025390625, 2.224365234375, 2.33197021484375, 2.4395751953125, 2.54718017578125, 2.65478515625, 2.76239013671875, 2.8699951171875, 2.97760009765625, 3.085205078125, 3.19281005859375, 3.3004150390625, 3.40802001953125, 3.515625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 4.0, 6.0, 3.0, 5.0, 6.0, 19.0, 19.0, 22.0, 27.0, 47.0, 75.0, 103.0, 126.0, 193.0, 315.0, 460.0, 798.0, 1357.0, 2511.0, 4915.0, 10111.0, 23398.0, 58628.0, 162834.0, 364598.0, 257811.0, 94789.0, 35857.0, 14686.0, 6847.0, 3307.0, 1760.0, 1038.0, 634.0, 382.0, 268.0, 180.0, 125.0, 86.0, 60.0, 54.0, 26.0, 21.0, 20.0, 6.0, 4.0, 11.0, 3.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.96875, -4.82147216796875, -4.6741943359375, -4.52691650390625, -4.379638671875, -4.23236083984375, -4.0850830078125, -3.93780517578125, -3.79052734375, -3.64324951171875, -3.4959716796875, -3.34869384765625, -3.201416015625, -3.05413818359375, -2.9068603515625, -2.75958251953125, -2.6123046875, -2.46502685546875, -2.3177490234375, -2.17047119140625, -2.023193359375, -1.87591552734375, -1.7286376953125, -1.58135986328125, -1.43408203125, -1.28680419921875, -1.1395263671875, -0.99224853515625, -0.844970703125, -0.69769287109375, -0.5504150390625, -0.40313720703125, -0.255859375, -0.10858154296875, 0.0386962890625, 0.18597412109375, 0.333251953125, 0.48052978515625, 0.6278076171875, 0.77508544921875, 0.92236328125, 1.06964111328125, 1.2169189453125, 1.36419677734375, 1.511474609375, 1.65875244140625, 1.8060302734375, 1.95330810546875, 2.1005859375, 2.24786376953125, 2.3951416015625, 2.54241943359375, 2.689697265625, 2.83697509765625, 2.9842529296875, 3.13153076171875, 3.27880859375, 3.42608642578125, 3.5733642578125, 3.72064208984375, 3.867919921875, 4.01519775390625, 4.1624755859375, 4.30975341796875, 4.45703125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 8.0, 6.0, 11.0, 19.0, 15.0, 15.0, 31.0, 39.0, 55.0, 59.0, 77.0, 77.0, 77.0, 96.0, 73.0, 61.0, 43.0, 59.0, 54.0, 25.0, 22.0, 16.0, 19.0, 11.0, 5.0, 8.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00020837783813476562, -0.00020242482423782349, -0.00019647181034088135, -0.0001905187964439392, -0.00018456578254699707, -0.00017861276865005493, -0.0001726597547531128, -0.00016670674085617065, -0.00016075372695922852, -0.00015480071306228638, -0.00014884769916534424, -0.0001428946852684021, -0.00013694167137145996, -0.00013098865747451782, -0.00012503564357757568, -0.00011908262968063354, -0.0001131296157836914, -0.00010717660188674927, -0.00010122358798980713, -9.527057409286499e-05, -8.931756019592285e-05, -8.336454629898071e-05, -7.741153240203857e-05, -7.145851850509644e-05, -6.55055046081543e-05, -5.955249071121216e-05, -5.359947681427002e-05, -4.764646291732788e-05, -4.169344902038574e-05, -3.5740435123443604e-05, -2.9787421226501465e-05, -2.3834407329559326e-05, -1.7881393432617188e-05, -1.1928379535675049e-05, -5.97536563873291e-06, -2.2351741790771484e-08, 5.930662155151367e-06, 1.1883676052093506e-05, 1.7836689949035645e-05, 2.3789703845977783e-05, 2.9742717742919922e-05, 3.569573163986206e-05, 4.16487455368042e-05, 4.760175943374634e-05, 5.3554773330688477e-05, 5.9507787227630615e-05, 6.546080112457275e-05, 7.141381502151489e-05, 7.736682891845703e-05, 8.331984281539917e-05, 8.927285671234131e-05, 9.522587060928345e-05, 0.00010117888450622559, 0.00010713189840316772, 0.00011308491230010986, 0.000119037926197052, 0.00012499094009399414, 0.00013094395399093628, 0.00013689696788787842, 0.00014284998178482056, 0.0001488029956817627, 0.00015475600957870483, 0.00016070902347564697, 0.0001666620373725891, 0.00017261505126953125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 6.0, 12.0, 16.0, 34.0, 31.0, 52.0, 93.0, 128.0, 191.0, 314.0, 636.0, 983.0, 1890.0, 3654.0, 7222.0, 15090.0, 32484.0, 71996.0, 153791.0, 257673.0, 245041.0, 138046.0, 63374.0, 28703.0, 13218.0, 6491.0, 3347.0, 1707.0, 959.0, 520.0, 298.0, 202.0, 126.0, 61.0, 54.0, 33.0, 23.0, 22.0, 13.0, 6.0, 6.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1640625, -3.061737060546875, -2.95941162109375, -2.857086181640625, -2.7547607421875, -2.652435302734375, -2.55010986328125, -2.447784423828125, -2.345458984375, -2.243133544921875, -2.14080810546875, -2.038482666015625, -1.9361572265625, -1.833831787109375, -1.73150634765625, -1.629180908203125, -1.52685546875, -1.424530029296875, -1.32220458984375, -1.219879150390625, -1.1175537109375, -1.015228271484375, -0.91290283203125, -0.810577392578125, -0.708251953125, -0.605926513671875, -0.50360107421875, -0.401275634765625, -0.2989501953125, -0.196624755859375, -0.09429931640625, 0.008026123046875, 0.1103515625, 0.212677001953125, 0.31500244140625, 0.417327880859375, 0.5196533203125, 0.621978759765625, 0.72430419921875, 0.826629638671875, 0.928955078125, 1.031280517578125, 1.13360595703125, 1.235931396484375, 1.3382568359375, 1.440582275390625, 1.54290771484375, 1.645233154296875, 1.74755859375, 1.849884033203125, 1.95220947265625, 2.054534912109375, 2.1568603515625, 2.259185791015625, 2.36151123046875, 2.463836669921875, 2.566162109375, 2.668487548828125, 2.77081298828125, 2.873138427734375, 2.9754638671875, 3.077789306640625, 3.18011474609375, 3.282440185546875, 3.384765625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 11.0, 6.0, 5.0, 4.0, 16.0, 17.0, 24.0, 25.0, 28.0, 36.0, 43.0, 75.0, 61.0, 64.0, 75.0, 71.0, 73.0, 65.0, 59.0, 43.0, 41.0, 39.0, 20.0, 23.0, 14.0, 17.0, 11.0, 9.0, 7.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90283203125, -0.8705215454101562, -0.8382110595703125, -0.8059005737304688, -0.773590087890625, -0.7412796020507812, -0.7089691162109375, -0.6766586303710938, -0.64434814453125, -0.6120376586914062, -0.5797271728515625, -0.5474166870117188, -0.515106201171875, -0.48279571533203125, -0.4504852294921875, -0.41817474365234375, -0.3858642578125, -0.35355377197265625, -0.3212432861328125, -0.28893280029296875, -0.256622314453125, -0.22431182861328125, -0.1920013427734375, -0.15969085693359375, -0.12738037109375, -0.09506988525390625, -0.0627593994140625, -0.03044891357421875, 0.001861572265625, 0.03417205810546875, 0.0664825439453125, 0.09879302978515625, 0.131103515625, 0.16341400146484375, 0.1957244873046875, 0.22803497314453125, 0.260345458984375, 0.29265594482421875, 0.3249664306640625, 0.35727691650390625, 0.38958740234375, 0.42189788818359375, 0.4542083740234375, 0.48651885986328125, 0.518829345703125, 0.5511398315429688, 0.5834503173828125, 0.6157608032226562, 0.6480712890625, 0.6803817749023438, 0.7126922607421875, 0.7450027465820312, 0.777313232421875, 0.8096237182617188, 0.8419342041015625, 0.8742446899414062, 0.90655517578125, 0.9388656616210938, 0.9711761474609375, 1.0034866333007812, 1.035797119140625, 1.0681076049804688, 1.1004180908203125, 1.1327285766601562, 1.1650390625]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 7.0, 5.0, 8.0, 8.0, 8.0, 19.0, 25.0, 27.0, 55.0, 59.0, 74.0, 82.0, 103.0, 101.0, 80.0, 68.0, 69.0, 52.0, 40.0, 28.0, 22.0, 14.0, 12.0, 15.0, 6.0, 9.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.238876342773438, -9.889521598815918, -9.540165901184082, -9.190811157226562, -8.841455459594727, -8.492100715637207, -8.142745971679688, -7.79339075088501, -7.444035530090332, -7.094680309295654, -6.745325088500977, -6.395970344543457, -6.046615123748779, -5.697259902954102, -5.347905158996582, -4.998549938201904, -4.649194717407227, -4.299839496612549, -3.95048451423645, -3.6011295318603516, -3.251774311065674, -2.902419090270996, -2.5530641078948975, -2.203709125518799, -1.854353904724121, -1.504998803138733, -1.1556437015533447, -0.8062885999679565, -0.45693349838256836, -0.10757839679718018, 0.241776704788208, 0.5911316871643066, 0.940485954284668, 1.2898410558700562, 1.6391961574554443, 1.9885512590408325, 2.3379063606262207, 2.6872615814208984, 3.036616563796997, 3.3859715461730957, 3.7353267669677734, 4.084681987762451, 4.434037208557129, 4.783391952514648, 5.132747173309326, 5.482102394104004, 5.831457138061523, 6.180812358856201, 6.530167579650879, 6.879522800445557, 7.228878021240234, 7.578232765197754, 7.927587985992432, 8.27694320678711, 8.626297950744629, 8.975652694702148, 9.325008392333984, 9.674363136291504, 10.02371883392334, 10.37307357788086, 10.722429275512695, 11.071784019470215, 11.421138763427734, 11.77049446105957, 12.11984920501709]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 9.0, 1.0, 14.0, 10.0, 10.0, 16.0, 6.0, 18.0, 22.0, 21.0, 21.0, 30.0, 27.0, 33.0, 30.0, 32.0, 29.0, 41.0, 41.0, 46.0, 36.0, 39.0, 52.0, 32.0, 40.0, 39.0, 37.0, 41.0, 19.0, 27.0, 21.0, 26.0, 14.0, 28.0, 13.0, 16.0, 17.0, 13.0, 14.0, 3.0, 3.0, 2.0, 5.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.970677852630615, -4.806047439575195, -4.641416549682617, -4.476786136627197, -4.312155723571777, -4.147525310516357, -3.9828946590423584, -3.8182640075683594, -3.6536335945129395, -3.4890031814575195, -3.3243725299835205, -3.1597418785095215, -2.9951114654541016, -2.8304810523986816, -2.6658504009246826, -2.5012197494506836, -2.3365893363952637, -2.1719589233398438, -2.0073282718658447, -1.8426977396011353, -1.6780672073364258, -1.5134366750717163, -1.3488061428070068, -1.1841756105422974, -1.019545078277588, -0.8549145460128784, -0.690284013748169, -0.5256534814834595, -0.36102294921875, -0.19639241695404053, -0.031761884689331055, 0.13286864757537842, 0.2974987030029297, 0.46212923526763916, 0.6267597675323486, 0.7913902997970581, 0.9560208320617676, 1.120651364326477, 1.2852818965911865, 1.449912428855896, 1.6145429611206055, 1.779173493385315, 1.9438040256500244, 2.1084346771240234, 2.2730650901794434, 2.4376955032348633, 2.6023261547088623, 2.7669568061828613, 2.9315872192382812, 3.096217632293701, 3.2608482837677, 3.425478935241699, 3.590109348297119, 3.754739761352539, 3.919370412826538, 4.084001064300537, 4.248631477355957, 4.413261890411377, 4.577892303466797, 4.742523193359375, 4.907153606414795, 5.071784019470215, 5.236414909362793, 5.401045322418213, 5.565675735473633]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 8.0, 9.0, 7.0, 12.0, 18.0, 34.0, 48.0, 68.0, 109.0, 188.0, 295.0, 437.0, 647.0, 1048.0, 1814.0, 2768.0, 4438.0, 7205.0, 11768.0, 18826.0, 30167.0, 48267.0, 73299.0, 104791.0, 135463.0, 149044.0, 137799.0, 108862.0, 76713.0, 50375.0, 32094.0, 19609.0, 12357.0, 7420.0, 4696.0, 2900.0, 1757.0, 1125.0, 730.0, 481.0, 317.0, 190.0, 114.0, 80.0, 65.0, 30.0, 20.0, 15.0, 15.0, 11.0, 3.0, 3.0, 4.0, 2.0, 0.0, 3.0], "bins": [-4.68359375, -4.54400634765625, -4.4044189453125, -4.26483154296875, -4.125244140625, -3.98565673828125, -3.8460693359375, -3.70648193359375, -3.56689453125, -3.42730712890625, -3.2877197265625, -3.14813232421875, -3.008544921875, -2.86895751953125, -2.7293701171875, -2.58978271484375, -2.4501953125, -2.31060791015625, -2.1710205078125, -2.03143310546875, -1.891845703125, -1.75225830078125, -1.6126708984375, -1.47308349609375, -1.33349609375, -1.19390869140625, -1.0543212890625, -0.91473388671875, -0.775146484375, -0.63555908203125, -0.4959716796875, -0.35638427734375, -0.216796875, -0.07720947265625, 0.0623779296875, 0.20196533203125, 0.341552734375, 0.48114013671875, 0.6207275390625, 0.76031494140625, 0.89990234375, 1.03948974609375, 1.1790771484375, 1.31866455078125, 1.458251953125, 1.59783935546875, 1.7374267578125, 1.87701416015625, 2.0166015625, 2.15618896484375, 2.2957763671875, 2.43536376953125, 2.574951171875, 2.71453857421875, 2.8541259765625, 2.99371337890625, 3.13330078125, 3.27288818359375, 3.4124755859375, 3.55206298828125, 3.691650390625, 3.83123779296875, 3.9708251953125, 4.11041259765625, 4.25]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 5.0, 10.0, 8.0, 14.0, 12.0, 8.0, 15.0, 18.0, 18.0, 15.0, 16.0, 24.0, 27.0, 30.0, 31.0, 42.0, 29.0, 35.0, 34.0, 39.0, 34.0, 39.0, 40.0, 44.0, 41.0, 37.0, 28.0, 35.0, 44.0, 26.0, 29.0, 25.0, 18.0, 14.0, 18.0, 22.0, 11.0, 11.0, 6.0, 12.0, 7.0, 8.0, 2.0, 3.0, 4.0, 3.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7109375, -4.5465087890625, -4.382080078125, -4.2176513671875, -4.05322265625, -3.8887939453125, -3.724365234375, -3.5599365234375, -3.3955078125, -3.2310791015625, -3.066650390625, -2.9022216796875, -2.73779296875, -2.5733642578125, -2.408935546875, -2.2445068359375, -2.080078125, -1.9156494140625, -1.751220703125, -1.5867919921875, -1.42236328125, -1.2579345703125, -1.093505859375, -0.9290771484375, -0.7646484375, -0.6002197265625, -0.435791015625, -0.2713623046875, -0.10693359375, 0.0574951171875, 0.221923828125, 0.3863525390625, 0.55078125, 0.7152099609375, 0.879638671875, 1.0440673828125, 1.20849609375, 1.3729248046875, 1.537353515625, 1.7017822265625, 1.8662109375, 2.0306396484375, 2.195068359375, 2.3594970703125, 2.52392578125, 2.6883544921875, 2.852783203125, 3.0172119140625, 3.181640625, 3.3460693359375, 3.510498046875, 3.6749267578125, 3.83935546875, 4.0037841796875, 4.168212890625, 4.3326416015625, 4.4970703125, 4.6614990234375, 4.825927734375, 4.9903564453125, 5.15478515625, 5.3192138671875, 5.483642578125, 5.6480712890625, 5.8125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 12.0, 16.0, 20.0, 25.0, 33.0, 61.0, 90.0, 118.0, 194.0, 311.0, 428.0, 717.0, 1018.0, 1530.0, 2403.0, 3618.0, 5698.0, 9040.0, 13638.0, 21098.0, 32312.0, 48700.0, 69294.0, 96327.0, 121142.0, 135058.0, 129288.0, 107641.0, 81225.0, 56809.0, 38351.0, 25101.0, 16599.0, 10889.0, 6875.0, 4434.0, 2856.0, 1977.0, 1238.0, 844.0, 484.0, 332.0, 220.0, 177.0, 90.0, 64.0, 52.0, 33.0, 28.0, 12.0, 12.0, 8.0, 7.0, 2.0, 3.0], "bins": [-4.2578125, -4.135162353515625, -4.01251220703125, -3.889862060546875, -3.7672119140625, -3.644561767578125, -3.52191162109375, -3.399261474609375, -3.276611328125, -3.153961181640625, -3.03131103515625, -2.908660888671875, -2.7860107421875, -2.663360595703125, -2.54071044921875, -2.418060302734375, -2.29541015625, -2.172760009765625, -2.05010986328125, -1.927459716796875, -1.8048095703125, -1.682159423828125, -1.55950927734375, -1.436859130859375, -1.314208984375, -1.191558837890625, -1.06890869140625, -0.946258544921875, -0.8236083984375, -0.700958251953125, -0.57830810546875, -0.455657958984375, -0.3330078125, -0.210357666015625, -0.08770751953125, 0.034942626953125, 0.1575927734375, 0.280242919921875, 0.40289306640625, 0.525543212890625, 0.648193359375, 0.770843505859375, 0.89349365234375, 1.016143798828125, 1.1387939453125, 1.261444091796875, 1.38409423828125, 1.506744384765625, 1.62939453125, 1.752044677734375, 1.87469482421875, 1.997344970703125, 2.1199951171875, 2.242645263671875, 2.36529541015625, 2.487945556640625, 2.610595703125, 2.733245849609375, 2.85589599609375, 2.978546142578125, 3.1011962890625, 3.223846435546875, 3.34649658203125, 3.469146728515625, 3.591796875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 8.0, 7.0, 6.0, 13.0, 7.0, 15.0, 19.0, 18.0, 14.0, 15.0, 27.0, 21.0, 27.0, 31.0, 29.0, 41.0, 50.0, 43.0, 47.0, 32.0, 41.0, 44.0, 37.0, 37.0, 38.0, 33.0, 26.0, 32.0, 27.0, 36.0, 23.0, 28.0, 21.0, 21.0, 15.0, 20.0, 8.0, 20.0, 9.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.025390625, -2.91668701171875, -2.8079833984375, -2.69927978515625, -2.590576171875, -2.48187255859375, -2.3731689453125, -2.26446533203125, -2.15576171875, -2.04705810546875, -1.9383544921875, -1.82965087890625, -1.720947265625, -1.61224365234375, -1.5035400390625, -1.39483642578125, -1.2861328125, -1.17742919921875, -1.0687255859375, -0.96002197265625, -0.851318359375, -0.74261474609375, -0.6339111328125, -0.52520751953125, -0.41650390625, -0.30780029296875, -0.1990966796875, -0.09039306640625, 0.018310546875, 0.12701416015625, 0.2357177734375, 0.34442138671875, 0.453125, 0.56182861328125, 0.6705322265625, 0.77923583984375, 0.887939453125, 0.99664306640625, 1.1053466796875, 1.21405029296875, 1.32275390625, 1.43145751953125, 1.5401611328125, 1.64886474609375, 1.757568359375, 1.86627197265625, 1.9749755859375, 2.08367919921875, 2.1923828125, 2.30108642578125, 2.4097900390625, 2.51849365234375, 2.627197265625, 2.73590087890625, 2.8446044921875, 2.95330810546875, 3.06201171875, 3.17071533203125, 3.2794189453125, 3.38812255859375, 3.496826171875, 3.60552978515625, 3.7142333984375, 3.82293701171875, 3.931640625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 9.0, 6.0, 12.0, 18.0, 20.0, 31.0, 63.0, 87.0, 130.0, 225.0, 348.0, 645.0, 1042.0, 1767.0, 3056.0, 5428.0, 9644.0, 18146.0, 33171.0, 62210.0, 109828.0, 172745.0, 207121.0, 173834.0, 111156.0, 62676.0, 34025.0, 18245.0, 9861.0, 5452.0, 3168.0, 1765.0, 1027.0, 630.0, 350.0, 230.0, 123.0, 92.0, 64.0, 35.0, 28.0, 14.0, 10.0, 11.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.87109375, -2.7738037109375, -2.676513671875, -2.5792236328125, -2.48193359375, -2.3846435546875, -2.287353515625, -2.1900634765625, -2.0927734375, -1.9954833984375, -1.898193359375, -1.8009033203125, -1.70361328125, -1.6063232421875, -1.509033203125, -1.4117431640625, -1.314453125, -1.2171630859375, -1.119873046875, -1.0225830078125, -0.92529296875, -0.8280029296875, -0.730712890625, -0.6334228515625, -0.5361328125, -0.4388427734375, -0.341552734375, -0.2442626953125, -0.14697265625, -0.0496826171875, 0.047607421875, 0.1448974609375, 0.2421875, 0.3394775390625, 0.436767578125, 0.5340576171875, 0.63134765625, 0.7286376953125, 0.825927734375, 0.9232177734375, 1.0205078125, 1.1177978515625, 1.215087890625, 1.3123779296875, 1.40966796875, 1.5069580078125, 1.604248046875, 1.7015380859375, 1.798828125, 1.8961181640625, 1.993408203125, 2.0906982421875, 2.18798828125, 2.2852783203125, 2.382568359375, 2.4798583984375, 2.5771484375, 2.6744384765625, 2.771728515625, 2.8690185546875, 2.96630859375, 3.0635986328125, 3.160888671875, 3.2581787109375, 3.35546875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 5.0, 5.0, 10.0, 9.0, 5.0, 8.0, 16.0, 16.0, 20.0, 32.0, 32.0, 28.0, 44.0, 56.0, 53.0, 54.0, 57.0, 65.0, 64.0, 59.0, 62.0, 39.0, 43.0, 36.0, 31.0, 39.0, 26.0, 15.0, 13.0, 8.0, 17.0, 7.0, 7.0, 7.0, 3.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024306774139404297, -0.000235067680478096, -0.00022706761956214905, -0.0002190675586462021, -0.00021106749773025513, -0.00020306743681430817, -0.0001950673758983612, -0.00018706731498241425, -0.00017906725406646729, -0.00017106719315052032, -0.00016306713223457336, -0.0001550670713186264, -0.00014706701040267944, -0.00013906694948673248, -0.00013106688857078552, -0.00012306682765483856, -0.0001150667667388916, -0.00010706670582294464, -9.906664490699768e-05, -9.106658399105072e-05, -8.306652307510376e-05, -7.50664621591568e-05, -6.706640124320984e-05, -5.906634032726288e-05, -5.106627941131592e-05, -4.306621849536896e-05, -3.5066157579422e-05, -2.7066096663475037e-05, -1.9066035747528076e-05, -1.1065974831581116e-05, -3.0659139156341553e-06, 4.934147000312805e-06, 1.2934207916259766e-05, 2.0934268832206726e-05, 2.8934329748153687e-05, 3.693439066410065e-05, 4.493445158004761e-05, 5.293451249599457e-05, 6.093457341194153e-05, 6.893463432788849e-05, 7.693469524383545e-05, 8.493475615978241e-05, 9.293481707572937e-05, 0.00010093487799167633, 0.00010893493890762329, 0.00011693499982357025, 0.0001249350607395172, 0.00013293512165546417, 0.00014093518257141113, 0.0001489352434873581, 0.00015693530440330505, 0.00016493536531925201, 0.00017293542623519897, 0.00018093548715114594, 0.0001889355480670929, 0.00019693560898303986, 0.00020493566989898682, 0.00021293573081493378, 0.00022093579173088074, 0.0002289358526468277, 0.00023693591356277466, 0.0002449359744787216, 0.0002529360353946686, 0.00026093609631061554, 0.0002689361572265625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 1.0, 13.0, 18.0, 39.0, 42.0, 45.0, 78.0, 107.0, 180.0, 279.0, 429.0, 653.0, 1026.0, 1625.0, 2516.0, 3996.0, 6781.0, 10837.0, 17945.0, 30323.0, 50293.0, 80770.0, 122299.0, 160389.0, 168370.0, 139118.0, 95818.0, 61077.0, 37114.0, 22011.0, 12996.0, 7903.0, 4918.0, 2993.0, 1980.0, 1230.0, 767.0, 517.0, 368.0, 227.0, 163.0, 116.0, 64.0, 41.0, 30.0, 22.0, 22.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.603515625, -2.52508544921875, -2.4466552734375, -2.36822509765625, -2.289794921875, -2.21136474609375, -2.1329345703125, -2.05450439453125, -1.97607421875, -1.89764404296875, -1.8192138671875, -1.74078369140625, -1.662353515625, -1.58392333984375, -1.5054931640625, -1.42706298828125, -1.3486328125, -1.27020263671875, -1.1917724609375, -1.11334228515625, -1.034912109375, -0.95648193359375, -0.8780517578125, -0.79962158203125, -0.72119140625, -0.64276123046875, -0.5643310546875, -0.48590087890625, -0.407470703125, -0.32904052734375, -0.2506103515625, -0.17218017578125, -0.09375, -0.01531982421875, 0.0631103515625, 0.14154052734375, 0.219970703125, 0.29840087890625, 0.3768310546875, 0.45526123046875, 0.53369140625, 0.61212158203125, 0.6905517578125, 0.76898193359375, 0.847412109375, 0.92584228515625, 1.0042724609375, 1.08270263671875, 1.1611328125, 1.23956298828125, 1.3179931640625, 1.39642333984375, 1.474853515625, 1.55328369140625, 1.6317138671875, 1.71014404296875, 1.78857421875, 1.86700439453125, 1.9454345703125, 2.02386474609375, 2.102294921875, 2.18072509765625, 2.2591552734375, 2.33758544921875, 2.416015625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 4.0, 3.0, 5.0, 18.0, 11.0, 12.0, 18.0, 22.0, 36.0, 29.0, 28.0, 30.0, 43.0, 40.0, 44.0, 51.0, 48.0, 60.0, 54.0, 53.0, 50.0, 55.0, 39.0, 35.0, 42.0, 31.0, 22.0, 24.0, 21.0, 22.0, 6.0, 12.0, 12.0, 5.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.04296875, -1.0161056518554688, -0.9892425537109375, -0.9623794555664062, -0.935516357421875, -0.9086532592773438, -0.8817901611328125, -0.8549270629882812, -0.82806396484375, -0.8012008666992188, -0.7743377685546875, -0.7474746704101562, -0.720611572265625, -0.6937484741210938, -0.6668853759765625, -0.6400222778320312, -0.6131591796875, -0.5862960815429688, -0.5594329833984375, -0.5325698852539062, -0.505706787109375, -0.47884368896484375, -0.4519805908203125, -0.42511749267578125, -0.39825439453125, -0.37139129638671875, -0.3445281982421875, -0.31766510009765625, -0.290802001953125, -0.26393890380859375, -0.2370758056640625, -0.21021270751953125, -0.183349609375, -0.15648651123046875, -0.1296234130859375, -0.10276031494140625, -0.075897216796875, -0.04903411865234375, -0.0221710205078125, 0.00469207763671875, 0.03155517578125, 0.05841827392578125, 0.0852813720703125, 0.11214447021484375, 0.139007568359375, 0.16587066650390625, 0.1927337646484375, 0.21959686279296875, 0.2464599609375, 0.27332305908203125, 0.3001861572265625, 0.32704925537109375, 0.353912353515625, 0.38077545166015625, 0.4076385498046875, 0.43450164794921875, 0.46136474609375, 0.48822784423828125, 0.5150909423828125, 0.5419540405273438, 0.568817138671875, 0.5956802368164062, 0.6225433349609375, 0.6494064331054688, 0.67626953125]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 9.0, 9.0, 8.0, 12.0, 15.0, 23.0, 38.0, 47.0, 53.0, 61.0, 87.0, 92.0, 86.0, 84.0, 89.0, 64.0, 51.0, 44.0, 28.0, 27.0, 20.0, 8.0, 17.0, 8.0, 6.0, 7.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.054876327514648, -8.726757049560547, -8.398637771606445, -8.070518493652344, -7.742399215698242, -7.414279937744141, -7.086161136627197, -6.758041858673096, -6.429922580718994, -6.101803302764893, -5.773684024810791, -5.4455647468566895, -5.117445945739746, -4.7893266677856445, -4.461207389831543, -4.133088111877441, -3.80496883392334, -3.4768495559692383, -3.1487302780151367, -2.8206112384796143, -2.4924919605255127, -2.164372682571411, -1.8362535238265991, -1.508134365081787, -1.1800150871276855, -0.8518958687782288, -0.523776650428772, -0.19565743207931519, 0.1324617862701416, 0.46058106422424316, 0.7887002229690552, 1.1168193817138672, 1.4449377059936523, 1.773056983947754, 2.1011762619018555, 2.429295301437378, 2.7574145793914795, 3.085533857345581, 3.4136528968811035, 3.741772174835205, 4.069891452789307, 4.398010730743408, 4.72613000869751, 5.054249286651611, 5.382368087768555, 5.710487365722656, 6.038606643676758, 6.366725921630859, 6.694845199584961, 7.0229644775390625, 7.351083755493164, 7.679203033447266, 8.007322311401367, 8.335441589355469, 8.66356086730957, 8.991680145263672, 9.319799423217773, 9.647918701171875, 9.976037979125977, 10.304157257080078, 10.63227653503418, 10.960395812988281, 11.288515090942383, 11.616634368896484, 11.94475269317627]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 3.0, 5.0, 4.0, 8.0, 4.0, 8.0, 8.0, 15.0, 15.0, 14.0, 21.0, 18.0, 17.0, 28.0, 28.0, 21.0, 27.0, 39.0, 42.0, 38.0, 30.0, 46.0, 37.0, 31.0, 43.0, 37.0, 37.0, 39.0, 25.0, 39.0, 30.0, 24.0, 37.0, 26.0, 16.0, 25.0, 14.0, 25.0, 8.0, 8.0, 9.0, 9.0, 8.0, 13.0, 8.0, 5.0, 3.0, 2.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.073388576507568, -4.918100357055664, -4.762812614440918, -4.607524871826172, -4.452236652374268, -4.296948432922363, -4.141660690307617, -3.986372709274292, -3.831084728240967, -3.6757967472076416, -3.5205087661743164, -3.365220785140991, -3.209932804107666, -3.054644823074341, -2.8993568420410156, -2.7440688610076904, -2.5887808799743652, -2.43349289894104, -2.278204917907715, -2.1229169368743896, -1.9676289558410645, -1.8123409748077393, -1.657052993774414, -1.5017650127410889, -1.3464770317077637, -1.1911890506744385, -1.0359010696411133, -0.8806130886077881, -0.7253251075744629, -0.5700371265411377, -0.4147491455078125, -0.2594611644744873, -0.10417366027832031, 0.05111432075500488, 0.20640230178833008, 0.3616902828216553, 0.5169782638549805, 0.6722662448883057, 0.8275542259216309, 0.982842206954956, 1.1381301879882812, 1.2934181690216064, 1.4487061500549316, 1.6039941310882568, 1.759282112121582, 1.9145700931549072, 2.0698580741882324, 2.2251460552215576, 2.380434036254883, 2.535722017288208, 2.691009998321533, 2.8462979793548584, 3.0015859603881836, 3.156873941421509, 3.312161922454834, 3.467449903488159, 3.6227378845214844, 3.7780258655548096, 3.9333138465881348, 4.088602066040039, 4.243889808654785, 4.399177551269531, 4.5544657707214355, 4.70975399017334, 4.865041732788086]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 10.0, 18.0, 17.0, 15.0, 35.0, 47.0, 76.0, 133.0, 183.0, 274.0, 426.0, 763.0, 1244.0, 1984.0, 3281.0, 5769.0, 10413.0, 20228.0, 40328.0, 88191.0, 224046.0, 611448.0, 1261866.0, 1115483.0, 483081.0, 179061.0, 73297.0, 33661.0, 17078.0, 9191.0, 5100.0, 2895.0, 1732.0, 1074.0, 632.0, 425.0, 229.0, 173.0, 137.0, 70.0, 38.0, 41.0, 32.0, 15.0, 17.0, 13.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-8.34375, -8.10455322265625, -7.8653564453125, -7.62615966796875, -7.386962890625, -7.14776611328125, -6.9085693359375, -6.66937255859375, -6.43017578125, -6.19097900390625, -5.9517822265625, -5.71258544921875, -5.473388671875, -5.23419189453125, -4.9949951171875, -4.75579833984375, -4.5166015625, -4.27740478515625, -4.0382080078125, -3.79901123046875, -3.559814453125, -3.32061767578125, -3.0814208984375, -2.84222412109375, -2.60302734375, -2.36383056640625, -2.1246337890625, -1.88543701171875, -1.646240234375, -1.40704345703125, -1.1678466796875, -0.92864990234375, -0.689453125, -0.45025634765625, -0.2110595703125, 0.02813720703125, 0.267333984375, 0.50653076171875, 0.7457275390625, 0.98492431640625, 1.22412109375, 1.46331787109375, 1.7025146484375, 1.94171142578125, 2.180908203125, 2.42010498046875, 2.6593017578125, 2.89849853515625, 3.1376953125, 3.37689208984375, 3.6160888671875, 3.85528564453125, 4.094482421875, 4.33367919921875, 4.5728759765625, 4.81207275390625, 5.05126953125, 5.29046630859375, 5.5296630859375, 5.76885986328125, 6.008056640625, 6.24725341796875, 6.4864501953125, 6.72564697265625, 6.96484375]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 7.0, 9.0, 10.0, 8.0, 12.0, 12.0, 9.0, 19.0, 30.0, 19.0, 35.0, 23.0, 27.0, 24.0, 26.0, 32.0, 33.0, 42.0, 49.0, 52.0, 41.0, 36.0, 45.0, 35.0, 44.0, 36.0, 36.0, 33.0, 27.0, 35.0, 22.0, 15.0, 19.0, 10.0, 13.0, 16.0, 7.0, 10.0, 6.0, 9.0, 3.0, 6.0, 4.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.6796875, -3.56591796875, -3.4521484375, -3.33837890625, -3.224609375, -3.11083984375, -2.9970703125, -2.88330078125, -2.76953125, -2.65576171875, -2.5419921875, -2.42822265625, -2.314453125, -2.20068359375, -2.0869140625, -1.97314453125, -1.859375, -1.74560546875, -1.6318359375, -1.51806640625, -1.404296875, -1.29052734375, -1.1767578125, -1.06298828125, -0.94921875, -0.83544921875, -0.7216796875, -0.60791015625, -0.494140625, -0.38037109375, -0.2666015625, -0.15283203125, -0.0390625, 0.07470703125, 0.1884765625, 0.30224609375, 0.416015625, 0.52978515625, 0.6435546875, 0.75732421875, 0.87109375, 0.98486328125, 1.0986328125, 1.21240234375, 1.326171875, 1.43994140625, 1.5537109375, 1.66748046875, 1.78125, 1.89501953125, 2.0087890625, 2.12255859375, 2.236328125, 2.35009765625, 2.4638671875, 2.57763671875, 2.69140625, 2.80517578125, 2.9189453125, 3.03271484375, 3.146484375, 3.26025390625, 3.3740234375, 3.48779296875, 3.6015625]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 10.0, 7.0, 12.0, 17.0, 27.0, 45.0, 74.0, 85.0, 130.0, 215.0, 302.0, 454.0, 682.0, 1054.0, 1643.0, 2574.0, 4124.0, 6613.0, 11132.0, 19174.0, 34521.0, 64041.0, 126148.0, 262576.0, 570948.0, 1070342.0, 1011462.0, 516261.0, 237239.0, 115471.0, 59349.0, 32247.0, 17779.0, 10432.0, 6315.0, 3863.0, 2429.0, 1519.0, 940.0, 723.0, 413.0, 286.0, 188.0, 135.0, 93.0, 71.0, 42.0, 31.0, 17.0, 12.0, 10.0, 8.0, 6.0, 3.0, 0.0, 1.0, 1.0], "bins": [-7.21875, -6.99957275390625, -6.7803955078125, -6.56121826171875, -6.342041015625, -6.12286376953125, -5.9036865234375, -5.68450927734375, -5.46533203125, -5.24615478515625, -5.0269775390625, -4.80780029296875, -4.588623046875, -4.36944580078125, -4.1502685546875, -3.93109130859375, -3.7119140625, -3.49273681640625, -3.2735595703125, -3.05438232421875, -2.835205078125, -2.61602783203125, -2.3968505859375, -2.17767333984375, -1.95849609375, -1.73931884765625, -1.5201416015625, -1.30096435546875, -1.081787109375, -0.86260986328125, -0.6434326171875, -0.42425537109375, -0.205078125, 0.01409912109375, 0.2332763671875, 0.45245361328125, 0.671630859375, 0.89080810546875, 1.1099853515625, 1.32916259765625, 1.54833984375, 1.76751708984375, 1.9866943359375, 2.20587158203125, 2.425048828125, 2.64422607421875, 2.8634033203125, 3.08258056640625, 3.3017578125, 3.52093505859375, 3.7401123046875, 3.95928955078125, 4.178466796875, 4.39764404296875, 4.6168212890625, 4.83599853515625, 5.05517578125, 5.27435302734375, 5.4935302734375, 5.71270751953125, 5.931884765625, 6.15106201171875, 6.3702392578125, 6.58941650390625, 6.80859375]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 8.0, 3.0, 9.0, 10.0, 10.0, 6.0, 23.0, 25.0, 25.0, 34.0, 47.0, 58.0, 84.0, 102.0, 121.0, 158.0, 203.0, 215.0, 251.0, 276.0, 301.0, 320.0, 308.0, 280.0, 241.0, 194.0, 148.0, 129.0, 109.0, 84.0, 79.0, 42.0, 36.0, 30.0, 28.0, 13.0, 12.0, 9.0, 6.0, 12.0, 5.0, 2.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.517578125, -2.4479217529296875, -2.378265380859375, -2.3086090087890625, -2.23895263671875, -2.1692962646484375, -2.099639892578125, -2.0299835205078125, -1.9603271484375, -1.8906707763671875, -1.821014404296875, -1.7513580322265625, -1.68170166015625, -1.6120452880859375, -1.542388916015625, -1.4727325439453125, -1.403076171875, -1.3334197998046875, -1.263763427734375, -1.1941070556640625, -1.12445068359375, -1.0547943115234375, -0.985137939453125, -0.9154815673828125, -0.8458251953125, -0.7761688232421875, -0.706512451171875, -0.6368560791015625, -0.56719970703125, -0.4975433349609375, -0.427886962890625, -0.3582305908203125, -0.28857421875, -0.2189178466796875, -0.149261474609375, -0.0796051025390625, -0.00994873046875, 0.0597076416015625, 0.129364013671875, 0.1990203857421875, 0.2686767578125, 0.3383331298828125, 0.407989501953125, 0.4776458740234375, 0.54730224609375, 0.6169586181640625, 0.686614990234375, 0.7562713623046875, 0.825927734375, 0.8955841064453125, 0.965240478515625, 1.0348968505859375, 1.10455322265625, 1.1742095947265625, 1.243865966796875, 1.3135223388671875, 1.3831787109375, 1.4528350830078125, 1.522491455078125, 1.5921478271484375, 1.66180419921875, 1.7314605712890625, 1.801116943359375, 1.8707733154296875, 1.9404296875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 5.0, 8.0, 8.0, 14.0, 13.0, 17.0, 29.0, 34.0, 39.0, 54.0, 56.0, 98.0, 117.0, 86.0, 98.0, 79.0, 74.0, 55.0, 25.0, 22.0, 17.0, 15.0, 6.0, 14.0, 4.0, 7.0, 2.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.846148490905762, -8.509147644042969, -8.172146797180176, -7.835146427154541, -7.498146057128906, -7.161145210266113, -6.82414436340332, -6.487143516540527, -6.150143146514893, -5.8131422996521, -5.476141929626465, -5.139141082763672, -4.802140235900879, -4.465139865875244, -4.128139019012451, -3.7911384105682373, -3.4541378021240234, -3.1171371936798096, -2.7801365852355957, -2.4431357383728027, -2.106135129928589, -1.769134521484375, -1.432133674621582, -1.0951330661773682, -0.7581324577331543, -0.42113178968429565, -0.08413112163543701, 0.2528696060180664, 0.5898702144622803, 0.9268708229064941, 1.263871669769287, 1.600872278213501, 1.9378719329833984, 2.2748725414276123, 2.611873149871826, 2.948873996734619, 3.285874605178833, 3.622875213623047, 3.95987606048584, 4.296876907348633, 4.633877277374268, 4.9708781242370605, 5.307878494262695, 5.644879341125488, 5.981880187988281, 6.318880558013916, 6.655881404876709, 6.992881774902344, 7.329882621765137, 7.66688346862793, 8.003884315490723, 8.340885162353516, 8.677885055541992, 9.014885902404785, 9.351886749267578, 9.688887596130371, 10.025888442993164, 10.362889289855957, 10.69989013671875, 11.036890029907227, 11.37389087677002, 11.710891723632812, 12.047892570495605, 12.384893417358398, 12.721893310546875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 7.0, 10.0, 12.0, 11.0, 15.0, 11.0, 12.0, 28.0, 23.0, 21.0, 28.0, 47.0, 38.0, 37.0, 33.0, 51.0, 40.0, 41.0, 54.0, 48.0, 40.0, 43.0, 33.0, 42.0, 41.0, 30.0, 37.0, 19.0, 25.0, 20.0, 16.0, 16.0, 13.0, 13.0, 9.0, 11.0, 8.0, 1.0, 3.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0195159912109375, -4.8498053550720215, -4.6800947189331055, -4.510384559631348, -4.340673923492432, -4.170963287353516, -4.0012526512146, -3.8315422534942627, -3.661831855773926, -3.4921212196350098, -3.322410821914673, -3.152700185775757, -2.98298978805542, -2.813279151916504, -2.643568515777588, -2.473858118057251, -2.304147481918335, -2.134436845779419, -1.964726448059082, -1.795015811920166, -1.625305414199829, -1.455594778060913, -1.2858842611312866, -1.1161737442016602, -0.9464632272720337, -0.7767527103424072, -0.6070421934127808, -0.4373316168785095, -0.26762109994888306, -0.09791058301925659, 0.07179999351501465, 0.2415105104446411, 0.4112210273742676, 0.580931544303894, 0.7506420612335205, 0.9203526377677917, 1.0900630950927734, 1.2597737312316895, 1.429484248161316, 1.5991947650909424, 1.7689052820205688, 1.9386157989501953, 2.1083264350891113, 2.2780368328094482, 2.4477474689483643, 2.617457866668701, 2.787168502807617, 2.956879138946533, 3.12658953666687, 3.296300172805786, 3.466010570526123, 3.635721206665039, 3.805431604385376, 3.975142240524292, 4.144852638244629, 4.314563274383545, 4.484273910522461, 4.653984546661377, 4.823695182800293, 4.993405342102051, 5.163115978240967, 5.332826614379883, 5.502537250518799, 5.672247886657715, 5.841958045959473]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 6.0, 6.0, 14.0, 16.0, 22.0, 27.0, 64.0, 73.0, 97.0, 158.0, 239.0, 462.0, 680.0, 1105.0, 1933.0, 3325.0, 5924.0, 10689.0, 19111.0, 35316.0, 63349.0, 108570.0, 169819.0, 205485.0, 169383.0, 109258.0, 63428.0, 35616.0, 19432.0, 10651.0, 5989.0, 3302.0, 1986.0, 1143.0, 685.0, 448.0, 280.0, 186.0, 95.0, 57.0, 45.0, 30.0, 19.0, 18.0, 8.0, 10.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.890625, -4.75286865234375, -4.6151123046875, -4.47735595703125, -4.339599609375, -4.20184326171875, -4.0640869140625, -3.92633056640625, -3.78857421875, -3.65081787109375, -3.5130615234375, -3.37530517578125, -3.237548828125, -3.09979248046875, -2.9620361328125, -2.82427978515625, -2.6865234375, -2.54876708984375, -2.4110107421875, -2.27325439453125, -2.135498046875, -1.99774169921875, -1.8599853515625, -1.72222900390625, -1.58447265625, -1.44671630859375, -1.3089599609375, -1.17120361328125, -1.033447265625, -0.89569091796875, -0.7579345703125, -0.62017822265625, -0.482421875, -0.34466552734375, -0.2069091796875, -0.06915283203125, 0.068603515625, 0.20635986328125, 0.3441162109375, 0.48187255859375, 0.61962890625, 0.75738525390625, 0.8951416015625, 1.03289794921875, 1.170654296875, 1.30841064453125, 1.4461669921875, 1.58392333984375, 1.7216796875, 1.85943603515625, 1.9971923828125, 2.13494873046875, 2.272705078125, 2.41046142578125, 2.5482177734375, 2.68597412109375, 2.82373046875, 2.96148681640625, 3.0992431640625, 3.23699951171875, 3.374755859375, 3.51251220703125, 3.6502685546875, 3.78802490234375, 3.92578125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 1.0, 6.0, 11.0, 12.0, 12.0, 11.0, 18.0, 15.0, 25.0, 26.0, 25.0, 32.0, 41.0, 34.0, 38.0, 45.0, 31.0, 44.0, 52.0, 51.0, 57.0, 45.0, 28.0, 38.0, 36.0, 34.0, 41.0, 23.0, 28.0, 30.0, 18.0, 14.0, 13.0, 14.0, 11.0, 10.0, 10.0, 9.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4609375, -5.2816162109375, -5.102294921875, -4.9229736328125, -4.74365234375, -4.5643310546875, -4.385009765625, -4.2056884765625, -4.0263671875, -3.8470458984375, -3.667724609375, -3.4884033203125, -3.30908203125, -3.1297607421875, -2.950439453125, -2.7711181640625, -2.591796875, -2.4124755859375, -2.233154296875, -2.0538330078125, -1.87451171875, -1.6951904296875, -1.515869140625, -1.3365478515625, -1.1572265625, -0.9779052734375, -0.798583984375, -0.6192626953125, -0.43994140625, -0.2606201171875, -0.081298828125, 0.0980224609375, 0.27734375, 0.4566650390625, 0.635986328125, 0.8153076171875, 0.99462890625, 1.1739501953125, 1.353271484375, 1.5325927734375, 1.7119140625, 1.8912353515625, 2.070556640625, 2.2498779296875, 2.42919921875, 2.6085205078125, 2.787841796875, 2.9671630859375, 3.146484375, 3.3258056640625, 3.505126953125, 3.6844482421875, 3.86376953125, 4.0430908203125, 4.222412109375, 4.4017333984375, 4.5810546875, 4.7603759765625, 4.939697265625, 5.1190185546875, 5.29833984375, 5.4776611328125, 5.656982421875, 5.8363037109375, 6.015625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 9.0, 9.0, 24.0, 27.0, 35.0, 56.0, 93.0, 154.0, 281.0, 421.0, 712.0, 1146.0, 1880.0, 3376.0, 6020.0, 11109.0, 21647.0, 42601.0, 84881.0, 161221.0, 248038.0, 214957.0, 121408.0, 61841.0, 31003.0, 16119.0, 8345.0, 4638.0, 2629.0, 1501.0, 859.0, 512.0, 368.0, 225.0, 118.0, 93.0, 67.0, 45.0, 28.0, 19.0, 19.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.5, -5.326904296875, -5.15380859375, -4.980712890625, -4.8076171875, -4.634521484375, -4.46142578125, -4.288330078125, -4.115234375, -3.942138671875, -3.76904296875, -3.595947265625, -3.4228515625, -3.249755859375, -3.07666015625, -2.903564453125, -2.73046875, -2.557373046875, -2.38427734375, -2.211181640625, -2.0380859375, -1.864990234375, -1.69189453125, -1.518798828125, -1.345703125, -1.172607421875, -0.99951171875, -0.826416015625, -0.6533203125, -0.480224609375, -0.30712890625, -0.134033203125, 0.0390625, 0.212158203125, 0.38525390625, 0.558349609375, 0.7314453125, 0.904541015625, 1.07763671875, 1.250732421875, 1.423828125, 1.596923828125, 1.77001953125, 1.943115234375, 2.1162109375, 2.289306640625, 2.46240234375, 2.635498046875, 2.80859375, 2.981689453125, 3.15478515625, 3.327880859375, 3.5009765625, 3.674072265625, 3.84716796875, 4.020263671875, 4.193359375, 4.366455078125, 4.53955078125, 4.712646484375, 4.8857421875, 5.058837890625, 5.23193359375, 5.405029296875, 5.578125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 7.0, 0.0, 8.0, 7.0, 6.0, 11.0, 14.0, 12.0, 11.0, 16.0, 28.0, 23.0, 24.0, 37.0, 34.0, 33.0, 33.0, 27.0, 39.0, 42.0, 42.0, 44.0, 29.0, 31.0, 41.0, 47.0, 37.0, 32.0, 34.0, 40.0, 21.0, 25.0, 25.0, 20.0, 18.0, 12.0, 13.0, 13.0, 10.0, 11.0, 7.0, 8.0, 6.0, 7.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.966796875, -2.8758544921875, -2.784912109375, -2.6939697265625, -2.60302734375, -2.5120849609375, -2.421142578125, -2.3302001953125, -2.2392578125, -2.1483154296875, -2.057373046875, -1.9664306640625, -1.87548828125, -1.7845458984375, -1.693603515625, -1.6026611328125, -1.51171875, -1.4207763671875, -1.329833984375, -1.2388916015625, -1.14794921875, -1.0570068359375, -0.966064453125, -0.8751220703125, -0.7841796875, -0.6932373046875, -0.602294921875, -0.5113525390625, -0.42041015625, -0.3294677734375, -0.238525390625, -0.1475830078125, -0.056640625, 0.0343017578125, 0.125244140625, 0.2161865234375, 0.30712890625, 0.3980712890625, 0.489013671875, 0.5799560546875, 0.6708984375, 0.7618408203125, 0.852783203125, 0.9437255859375, 1.03466796875, 1.1256103515625, 1.216552734375, 1.3074951171875, 1.3984375, 1.4893798828125, 1.580322265625, 1.6712646484375, 1.76220703125, 1.8531494140625, 1.944091796875, 2.0350341796875, 2.1259765625, 2.2169189453125, 2.307861328125, 2.3988037109375, 2.48974609375, 2.5806884765625, 2.671630859375, 2.7625732421875, 2.853515625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 11.0, 20.0, 21.0, 44.0, 63.0, 100.0, 167.0, 272.0, 416.0, 635.0, 1092.0, 1824.0, 3151.0, 5566.0, 9747.0, 18545.0, 35798.0, 73760.0, 155091.0, 271516.0, 233064.0, 118409.0, 56859.0, 28297.0, 14770.0, 8114.0, 4528.0, 2622.0, 1528.0, 957.0, 587.0, 341.0, 228.0, 139.0, 91.0, 60.0, 45.0, 33.0, 14.0, 10.0, 11.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.669921875, -2.590972900390625, -2.51202392578125, -2.433074951171875, -2.3541259765625, -2.275177001953125, -2.19622802734375, -2.117279052734375, -2.038330078125, -1.959381103515625, -1.88043212890625, -1.801483154296875, -1.7225341796875, -1.643585205078125, -1.56463623046875, -1.485687255859375, -1.40673828125, -1.327789306640625, -1.24884033203125, -1.169891357421875, -1.0909423828125, -1.011993408203125, -0.93304443359375, -0.854095458984375, -0.775146484375, -0.696197509765625, -0.61724853515625, -0.538299560546875, -0.4593505859375, -0.380401611328125, -0.30145263671875, -0.222503662109375, -0.1435546875, -0.064605712890625, 0.01434326171875, 0.093292236328125, 0.1722412109375, 0.251190185546875, 0.33013916015625, 0.409088134765625, 0.488037109375, 0.566986083984375, 0.64593505859375, 0.724884033203125, 0.8038330078125, 0.882781982421875, 0.96173095703125, 1.040679931640625, 1.11962890625, 1.198577880859375, 1.27752685546875, 1.356475830078125, 1.4354248046875, 1.514373779296875, 1.59332275390625, 1.672271728515625, 1.751220703125, 1.830169677734375, 1.90911865234375, 1.988067626953125, 2.0670166015625, 2.145965576171875, 2.22491455078125, 2.303863525390625, 2.3828125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 6.0, 6.0, 6.0, 14.0, 11.0, 18.0, 28.0, 25.0, 43.0, 52.0, 53.0, 74.0, 85.0, 98.0, 73.0, 72.0, 77.0, 57.0, 36.0, 37.0, 34.0, 21.0, 26.0, 6.0, 7.0, 10.0, 6.0, 4.0, 3.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011140108108520508, -0.00010639335960149765, -0.00010138563811779022, -9.63779166340828e-05, -9.137019515037537e-05, -8.636247366666794e-05, -8.135475218296051e-05, -7.634703069925308e-05, -7.133930921554565e-05, -6.633158773183823e-05, -6.13238662481308e-05, -5.631614476442337e-05, -5.130842328071594e-05, -4.6300701797008514e-05, -4.1292980313301086e-05, -3.628525882959366e-05, -3.127753734588623e-05, -2.6269815862178802e-05, -2.1262094378471375e-05, -1.6254372894763947e-05, -1.1246651411056519e-05, -6.2389299273490906e-06, -1.2312084436416626e-06, 3.7765130400657654e-06, 8.784234523773193e-06, 1.3791956007480621e-05, 1.879967749118805e-05, 2.3807398974895477e-05, 2.8815120458602905e-05, 3.382284194231033e-05, 3.883056342601776e-05, 4.383828490972519e-05, 4.884600639343262e-05, 5.3853727877140045e-05, 5.886144936084747e-05, 6.38691708445549e-05, 6.887689232826233e-05, 7.388461381196976e-05, 7.889233529567719e-05, 8.390005677938461e-05, 8.890777826309204e-05, 9.391549974679947e-05, 9.89232212305069e-05, 0.00010393094271421432, 0.00010893866419792175, 0.00011394638568162918, 0.00011895410716533661, 0.00012396182864904404, 0.00012896955013275146, 0.0001339772716164589, 0.00013898499310016632, 0.00014399271458387375, 0.00014900043606758118, 0.0001540081575512886, 0.00015901587903499603, 0.00016402360051870346, 0.0001690313220024109, 0.00017403904348611832, 0.00017904676496982574, 0.00018405448645353317, 0.0001890622079372406, 0.00019406992942094803, 0.00019907765090465546, 0.00020408537238836288, 0.0002090930938720703]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 8.0, 14.0, 19.0, 26.0, 39.0, 34.0, 60.0, 94.0, 131.0, 192.0, 252.0, 401.0, 531.0, 875.0, 1323.0, 2152.0, 3498.0, 6014.0, 10853.0, 20057.0, 38468.0, 76284.0, 141733.0, 213074.0, 216667.0, 146625.0, 79865.0, 40999.0, 20899.0, 11206.0, 6221.0, 3640.0, 2138.0, 1419.0, 864.0, 562.0, 390.0, 233.0, 206.0, 154.0, 95.0, 71.0, 47.0, 33.0, 27.0, 23.0, 15.0, 6.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0], "bins": [-2.22265625, -2.1573486328125, -2.092041015625, -2.0267333984375, -1.96142578125, -1.8961181640625, -1.830810546875, -1.7655029296875, -1.7001953125, -1.6348876953125, -1.569580078125, -1.5042724609375, -1.43896484375, -1.3736572265625, -1.308349609375, -1.2430419921875, -1.177734375, -1.1124267578125, -1.047119140625, -0.9818115234375, -0.91650390625, -0.8511962890625, -0.785888671875, -0.7205810546875, -0.6552734375, -0.5899658203125, -0.524658203125, -0.4593505859375, -0.39404296875, -0.3287353515625, -0.263427734375, -0.1981201171875, -0.1328125, -0.0675048828125, -0.002197265625, 0.0631103515625, 0.12841796875, 0.1937255859375, 0.259033203125, 0.3243408203125, 0.3896484375, 0.4549560546875, 0.520263671875, 0.5855712890625, 0.65087890625, 0.7161865234375, 0.781494140625, 0.8468017578125, 0.912109375, 0.9774169921875, 1.042724609375, 1.1080322265625, 1.17333984375, 1.2386474609375, 1.303955078125, 1.3692626953125, 1.4345703125, 1.4998779296875, 1.565185546875, 1.6304931640625, 1.69580078125, 1.7611083984375, 1.826416015625, 1.8917236328125, 1.95703125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 6.0, 5.0, 10.0, 8.0, 18.0, 19.0, 20.0, 36.0, 51.0, 62.0, 49.0, 70.0, 62.0, 71.0, 69.0, 64.0, 57.0, 47.0, 43.0, 53.0, 37.0, 33.0, 23.0, 21.0, 14.0, 16.0, 3.0, 8.0, 3.0, 5.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.76513671875, -0.739593505859375, -0.71405029296875, -0.688507080078125, -0.6629638671875, -0.637420654296875, -0.61187744140625, -0.586334228515625, -0.560791015625, -0.535247802734375, -0.50970458984375, -0.484161376953125, -0.4586181640625, -0.433074951171875, -0.40753173828125, -0.381988525390625, -0.3564453125, -0.330902099609375, -0.30535888671875, -0.279815673828125, -0.2542724609375, -0.228729248046875, -0.20318603515625, -0.177642822265625, -0.152099609375, -0.126556396484375, -0.10101318359375, -0.075469970703125, -0.0499267578125, -0.024383544921875, 0.00115966796875, 0.026702880859375, 0.05224609375, 0.077789306640625, 0.10333251953125, 0.128875732421875, 0.1544189453125, 0.179962158203125, 0.20550537109375, 0.231048583984375, 0.256591796875, 0.282135009765625, 0.30767822265625, 0.333221435546875, 0.3587646484375, 0.384307861328125, 0.40985107421875, 0.435394287109375, 0.4609375, 0.486480712890625, 0.51202392578125, 0.537567138671875, 0.5631103515625, 0.588653564453125, 0.61419677734375, 0.639739990234375, 0.665283203125, 0.690826416015625, 0.71636962890625, 0.741912841796875, 0.7674560546875, 0.792999267578125, 0.81854248046875, 0.844085693359375, 0.86962890625]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 8.0, 8.0, 7.0, 12.0, 20.0, 28.0, 29.0, 43.0, 49.0, 68.0, 99.0, 112.0, 97.0, 104.0, 65.0, 82.0, 41.0, 33.0, 24.0, 11.0, 16.0, 11.0, 9.0, 4.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.14549732208252, -8.808816909790039, -8.472137451171875, -8.135457038879395, -7.7987775802612305, -7.462097644805908, -7.125417709350586, -6.7887372970581055, -6.452057838439941, -6.115377902984619, -5.778697967529297, -5.442018032073975, -5.105338096618652, -4.76865816116333, -4.431978225708008, -4.095297813415527, -3.758617877960205, -3.421937942504883, -3.0852580070495605, -2.7485780715942383, -2.411898136138916, -2.0752182006835938, -1.7385380268096924, -1.4018580913543701, -1.0651781558990479, -0.7284982204437256, -0.39181822538375854, -0.055138230323791504, 0.28154170513153076, 0.618221640586853, 0.9549016952514648, 1.291581630706787, 1.6282615661621094, 1.9649415016174316, 2.301621437072754, 2.638301372528076, 2.9749813079833984, 3.3116612434387207, 3.648341417312622, 3.9850213527679443, 4.3217010498046875, 4.65838098526001, 4.995060920715332, 5.331740856170654, 5.668420791625977, 6.005100727081299, 6.341780662536621, 6.678461074829102, 7.015141010284424, 7.351820945739746, 7.688500881195068, 8.02518081665039, 8.361861228942871, 8.698540687561035, 9.035221099853516, 9.37190055847168, 9.70858097076416, 10.04526138305664, 10.381940841674805, 10.718621253967285, 11.05530071258545, 11.39198112487793, 11.728660583496094, 12.065340995788574, 12.402020454406738]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 7.0, 1.0, 6.0, 4.0, 10.0, 13.0, 14.0, 9.0, 16.0, 15.0, 22.0, 23.0, 16.0, 42.0, 41.0, 41.0, 34.0, 39.0, 46.0, 45.0, 42.0, 56.0, 40.0, 44.0, 39.0, 38.0, 40.0, 38.0, 38.0, 24.0, 29.0, 21.0, 21.0, 13.0, 16.0, 14.0, 12.0, 12.0, 7.0, 2.0, 5.0, 5.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.905910015106201, -4.7390899658203125, -4.572269916534424, -4.405449867248535, -4.2386298179626465, -4.071809768676758, -3.90498948097229, -3.7381694316864014, -3.5713493824005127, -3.404529333114624, -3.2377092838287354, -3.0708889961242676, -2.904068946838379, -2.7372488975524902, -2.5704288482666016, -2.403608798980713, -2.236788749694824, -2.0699687004089355, -1.9031486511230469, -1.7363284826278687, -1.56950843334198, -1.4026883840560913, -1.235868215560913, -1.0690481662750244, -0.9022281169891357, -0.7354080677032471, -0.5685879588127136, -0.4017678499221802, -0.2349478006362915, -0.06812775135040283, 0.09869241714477539, 0.26551246643066406, 0.43233299255371094, 0.5991530418395996, 0.7659731507301331, 0.9327932596206665, 1.0996133089065552, 1.2664333581924438, 1.433253526687622, 1.6000735759735107, 1.7668936252593994, 1.933713674545288, 2.1005337238311768, 2.2673540115356445, 2.434174060821533, 2.600994110107422, 2.7678141593933105, 2.934634208679199, 3.101454257965088, 3.2682743072509766, 3.4350943565368652, 3.601914405822754, 3.7687344551086426, 3.9355545043945312, 4.102375030517578, 4.269194602966309, 4.4360151290893555, 4.602835178375244, 4.769655227661133, 4.9364752769470215, 5.10329532623291, 5.270115375518799, 5.4369354248046875, 5.603755950927734, 5.770575523376465]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 6.0, 13.0, 9.0, 16.0, 22.0, 45.0, 70.0, 97.0, 154.0, 218.0, 317.0, 517.0, 803.0, 1264.0, 1921.0, 3104.0, 5068.0, 8230.0, 13678.0, 22937.0, 37799.0, 62602.0, 100420.0, 143767.0, 173493.0, 159503.0, 117742.0, 76950.0, 46680.0, 27826.0, 16852.0, 9905.0, 6213.0, 3725.0, 2383.0, 1504.0, 935.0, 621.0, 416.0, 242.0, 175.0, 114.0, 57.0, 55.0, 32.0, 24.0, 16.0, 7.0, 6.0, 6.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.90625, -4.7562255859375, -4.606201171875, -4.4561767578125, -4.30615234375, -4.1561279296875, -4.006103515625, -3.8560791015625, -3.7060546875, -3.5560302734375, -3.406005859375, -3.2559814453125, -3.10595703125, -2.9559326171875, -2.805908203125, -2.6558837890625, -2.505859375, -2.3558349609375, -2.205810546875, -2.0557861328125, -1.90576171875, -1.7557373046875, -1.605712890625, -1.4556884765625, -1.3056640625, -1.1556396484375, -1.005615234375, -0.8555908203125, -0.70556640625, -0.5555419921875, -0.405517578125, -0.2554931640625, -0.10546875, 0.0445556640625, 0.194580078125, 0.3446044921875, 0.49462890625, 0.6446533203125, 0.794677734375, 0.9447021484375, 1.0947265625, 1.2447509765625, 1.394775390625, 1.5447998046875, 1.69482421875, 1.8448486328125, 1.994873046875, 2.1448974609375, 2.294921875, 2.4449462890625, 2.594970703125, 2.7449951171875, 2.89501953125, 3.0450439453125, 3.195068359375, 3.3450927734375, 3.4951171875, 3.6451416015625, 3.795166015625, 3.9451904296875, 4.09521484375, 4.2452392578125, 4.395263671875, 4.5452880859375, 4.6953125]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 7.0, 9.0, 9.0, 5.0, 13.0, 14.0, 16.0, 19.0, 13.0, 29.0, 29.0, 32.0, 30.0, 38.0, 36.0, 42.0, 52.0, 53.0, 47.0, 30.0, 48.0, 49.0, 37.0, 48.0, 37.0, 35.0, 33.0, 27.0, 27.0, 21.0, 21.0, 21.0, 11.0, 11.0, 11.0, 5.0, 6.0, 6.0, 9.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.34375, -5.16766357421875, -4.9915771484375, -4.81549072265625, -4.639404296875, -4.46331787109375, -4.2872314453125, -4.11114501953125, -3.93505859375, -3.75897216796875, -3.5828857421875, -3.40679931640625, -3.230712890625, -3.05462646484375, -2.8785400390625, -2.70245361328125, -2.5263671875, -2.35028076171875, -2.1741943359375, -1.99810791015625, -1.822021484375, -1.64593505859375, -1.4698486328125, -1.29376220703125, -1.11767578125, -0.94158935546875, -0.7655029296875, -0.58941650390625, -0.413330078125, -0.23724365234375, -0.0611572265625, 0.11492919921875, 0.291015625, 0.46710205078125, 0.6431884765625, 0.81927490234375, 0.995361328125, 1.17144775390625, 1.3475341796875, 1.52362060546875, 1.69970703125, 1.87579345703125, 2.0518798828125, 2.22796630859375, 2.404052734375, 2.58013916015625, 2.7562255859375, 2.93231201171875, 3.1083984375, 3.28448486328125, 3.4605712890625, 3.63665771484375, 3.812744140625, 3.98883056640625, 4.1649169921875, 4.34100341796875, 4.51708984375, 4.69317626953125, 4.8692626953125, 5.04534912109375, 5.221435546875, 5.39752197265625, 5.5736083984375, 5.74969482421875, 5.92578125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 3.0, 6.0, 2.0, 4.0, 4.0, 10.0, 10.0, 8.0, 14.0, 23.0, 29.0, 43.0, 52.0, 64.0, 92.0, 135.0, 159.0, 243.0, 344.0, 504.0, 799.0, 1355.0, 2272.0, 3991.0, 7518.0, 14920.0, 31423.0, 66426.0, 134683.0, 221750.0, 238393.0, 161022.0, 83082.0, 39592.0, 18598.0, 9314.0, 4912.0, 2523.0, 1392.0, 896.0, 584.0, 370.0, 277.0, 189.0, 117.0, 106.0, 89.0, 52.0, 44.0, 31.0, 29.0, 19.0, 17.0, 13.0, 8.0, 7.0, 2.0, 1.0, 2.0, 5.0, 0.0, 0.0, 2.0], "bins": [-6.64453125, -6.43121337890625, -6.2178955078125, -6.00457763671875, -5.791259765625, -5.57794189453125, -5.3646240234375, -5.15130615234375, -4.93798828125, -4.72467041015625, -4.5113525390625, -4.29803466796875, -4.084716796875, -3.87139892578125, -3.6580810546875, -3.44476318359375, -3.2314453125, -3.01812744140625, -2.8048095703125, -2.59149169921875, -2.378173828125, -2.16485595703125, -1.9515380859375, -1.73822021484375, -1.52490234375, -1.31158447265625, -1.0982666015625, -0.88494873046875, -0.671630859375, -0.45831298828125, -0.2449951171875, -0.03167724609375, 0.181640625, 0.39495849609375, 0.6082763671875, 0.82159423828125, 1.034912109375, 1.24822998046875, 1.4615478515625, 1.67486572265625, 1.88818359375, 2.10150146484375, 2.3148193359375, 2.52813720703125, 2.741455078125, 2.95477294921875, 3.1680908203125, 3.38140869140625, 3.5947265625, 3.80804443359375, 4.0213623046875, 4.23468017578125, 4.447998046875, 4.66131591796875, 4.8746337890625, 5.08795166015625, 5.30126953125, 5.51458740234375, 5.7279052734375, 5.94122314453125, 6.154541015625, 6.36785888671875, 6.5811767578125, 6.79449462890625, 7.0078125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 5.0, 4.0, 7.0, 4.0, 11.0, 8.0, 4.0, 9.0, 11.0, 10.0, 12.0, 15.0, 28.0, 19.0, 46.0, 25.0, 30.0, 43.0, 29.0, 33.0, 38.0, 37.0, 32.0, 37.0, 45.0, 52.0, 46.0, 45.0, 36.0, 35.0, 28.0, 26.0, 34.0, 32.0, 27.0, 16.0, 19.0, 9.0, 16.0, 7.0, 5.0, 3.0, 8.0, 3.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.080078125, -2.981231689453125, -2.88238525390625, -2.783538818359375, -2.6846923828125, -2.585845947265625, -2.48699951171875, -2.388153076171875, -2.289306640625, -2.190460205078125, -2.09161376953125, -1.992767333984375, -1.8939208984375, -1.795074462890625, -1.69622802734375, -1.597381591796875, -1.49853515625, -1.399688720703125, -1.30084228515625, -1.201995849609375, -1.1031494140625, -1.004302978515625, -0.90545654296875, -0.806610107421875, -0.707763671875, -0.608917236328125, -0.51007080078125, -0.411224365234375, -0.3123779296875, -0.213531494140625, -0.11468505859375, -0.015838623046875, 0.0830078125, 0.181854248046875, 0.28070068359375, 0.379547119140625, 0.4783935546875, 0.577239990234375, 0.67608642578125, 0.774932861328125, 0.873779296875, 0.972625732421875, 1.07147216796875, 1.170318603515625, 1.2691650390625, 1.368011474609375, 1.46685791015625, 1.565704345703125, 1.66455078125, 1.763397216796875, 1.86224365234375, 1.961090087890625, 2.0599365234375, 2.158782958984375, 2.25762939453125, 2.356475830078125, 2.455322265625, 2.554168701171875, 2.65301513671875, 2.751861572265625, 2.8507080078125, 2.949554443359375, 3.04840087890625, 3.147247314453125, 3.24609375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 8.0, 6.0, 8.0, 11.0, 17.0, 24.0, 32.0, 49.0, 80.0, 99.0, 127.0, 186.0, 292.0, 428.0, 618.0, 978.0, 1464.0, 2632.0, 4459.0, 8337.0, 15813.0, 32806.0, 68461.0, 137617.0, 223869.0, 236050.0, 155632.0, 79248.0, 38233.0, 18596.0, 9495.0, 5047.0, 2887.0, 1718.0, 1134.0, 660.0, 437.0, 322.0, 201.0, 134.0, 92.0, 71.0, 53.0, 38.0, 18.0, 23.0, 12.0, 7.0, 6.0, 6.0, 3.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.05078125, -2.95574951171875, -2.8607177734375, -2.76568603515625, -2.670654296875, -2.57562255859375, -2.4805908203125, -2.38555908203125, -2.29052734375, -2.19549560546875, -2.1004638671875, -2.00543212890625, -1.910400390625, -1.81536865234375, -1.7203369140625, -1.62530517578125, -1.5302734375, -1.43524169921875, -1.3402099609375, -1.24517822265625, -1.150146484375, -1.05511474609375, -0.9600830078125, -0.86505126953125, -0.77001953125, -0.67498779296875, -0.5799560546875, -0.48492431640625, -0.389892578125, -0.29486083984375, -0.1998291015625, -0.10479736328125, -0.009765625, 0.08526611328125, 0.1802978515625, 0.27532958984375, 0.370361328125, 0.46539306640625, 0.5604248046875, 0.65545654296875, 0.75048828125, 0.84552001953125, 0.9405517578125, 1.03558349609375, 1.130615234375, 1.22564697265625, 1.3206787109375, 1.41571044921875, 1.5107421875, 1.60577392578125, 1.7008056640625, 1.79583740234375, 1.890869140625, 1.98590087890625, 2.0809326171875, 2.17596435546875, 2.27099609375, 2.36602783203125, 2.4610595703125, 2.55609130859375, 2.651123046875, 2.74615478515625, 2.8411865234375, 2.93621826171875, 3.03125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 7.0, 2.0, 7.0, 7.0, 15.0, 8.0, 15.0, 13.0, 21.0, 27.0, 22.0, 37.0, 48.0, 65.0, 49.0, 66.0, 57.0, 63.0, 73.0, 66.0, 51.0, 43.0, 52.0, 36.0, 31.0, 33.0, 19.0, 18.0, 7.0, 8.0, 9.0, 7.0, 3.0, 3.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021791458129882812, -0.0002105608582496643, -0.0002032071352005005, -0.00019585341215133667, -0.00018849968910217285, -0.00018114596605300903, -0.00017379224300384521, -0.0001664385199546814, -0.00015908479690551758, -0.00015173107385635376, -0.00014437735080718994, -0.00013702362775802612, -0.0001296699047088623, -0.00012231618165969849, -0.00011496245861053467, -0.00010760873556137085, -0.00010025501251220703, -9.290128946304321e-05, -8.55475664138794e-05, -7.819384336471558e-05, -7.084012031555176e-05, -6.348639726638794e-05, -5.613267421722412e-05, -4.87789511680603e-05, -4.1425228118896484e-05, -3.4071505069732666e-05, -2.6717782020568848e-05, -1.936405897140503e-05, -1.2010335922241211e-05, -4.656612873077393e-06, 2.6971101760864258e-06, 1.0050833225250244e-05, 1.7404556274414062e-05, 2.475827932357788e-05, 3.21120023727417e-05, 3.946572542190552e-05, 4.6819448471069336e-05, 5.4173171520233154e-05, 6.152689456939697e-05, 6.888061761856079e-05, 7.623434066772461e-05, 8.358806371688843e-05, 9.094178676605225e-05, 9.829550981521606e-05, 0.00010564923286437988, 0.0001130029559135437, 0.00012035667896270752, 0.00012771040201187134, 0.00013506412506103516, 0.00014241784811019897, 0.0001497715711593628, 0.0001571252942085266, 0.00016447901725769043, 0.00017183274030685425, 0.00017918646335601807, 0.00018654018640518188, 0.0001938939094543457, 0.00020124763250350952, 0.00020860135555267334, 0.00021595507860183716, 0.00022330880165100098, 0.0002306625247001648, 0.0002380162477493286, 0.00024536997079849243, 0.00025272369384765625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 2.0, 8.0, 4.0, 13.0, 12.0, 19.0, 29.0, 58.0, 48.0, 80.0, 140.0, 187.0, 266.0, 402.0, 644.0, 982.0, 1752.0, 3108.0, 6077.0, 12981.0, 29850.0, 73451.0, 176039.0, 299294.0, 244461.0, 114464.0, 46038.0, 19367.0, 8609.0, 4313.0, 2199.0, 1280.0, 805.0, 509.0, 324.0, 240.0, 161.0, 94.0, 78.0, 39.0, 45.0, 26.0, 21.0, 15.0, 8.0, 7.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.560546875, -3.444732666015625, -3.32891845703125, -3.213104248046875, -3.0972900390625, -2.981475830078125, -2.86566162109375, -2.749847412109375, -2.634033203125, -2.518218994140625, -2.40240478515625, -2.286590576171875, -2.1707763671875, -2.054962158203125, -1.93914794921875, -1.823333740234375, -1.70751953125, -1.591705322265625, -1.47589111328125, -1.360076904296875, -1.2442626953125, -1.128448486328125, -1.01263427734375, -0.896820068359375, -0.781005859375, -0.665191650390625, -0.54937744140625, -0.433563232421875, -0.3177490234375, -0.201934814453125, -0.08612060546875, 0.029693603515625, 0.1455078125, 0.261322021484375, 0.37713623046875, 0.492950439453125, 0.6087646484375, 0.724578857421875, 0.84039306640625, 0.956207275390625, 1.072021484375, 1.187835693359375, 1.30364990234375, 1.419464111328125, 1.5352783203125, 1.651092529296875, 1.76690673828125, 1.882720947265625, 1.99853515625, 2.114349365234375, 2.23016357421875, 2.345977783203125, 2.4617919921875, 2.577606201171875, 2.69342041015625, 2.809234619140625, 2.925048828125, 3.040863037109375, 3.15667724609375, 3.272491455078125, 3.3883056640625, 3.504119873046875, 3.61993408203125, 3.735748291015625, 3.8515625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 7.0, 9.0, 18.0, 11.0, 13.0, 25.0, 23.0, 49.0, 41.0, 63.0, 72.0, 71.0, 90.0, 88.0, 80.0, 73.0, 60.0, 49.0, 43.0, 35.0, 19.0, 15.0, 15.0, 8.0, 3.0, 2.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0234375, -0.9903106689453125, -0.957183837890625, -0.9240570068359375, -0.89093017578125, -0.8578033447265625, -0.824676513671875, -0.7915496826171875, -0.7584228515625, -0.7252960205078125, -0.692169189453125, -0.6590423583984375, -0.62591552734375, -0.5927886962890625, -0.559661865234375, -0.5265350341796875, -0.493408203125, -0.4602813720703125, -0.427154541015625, -0.3940277099609375, -0.36090087890625, -0.3277740478515625, -0.294647216796875, -0.2615203857421875, -0.2283935546875, -0.1952667236328125, -0.162139892578125, -0.1290130615234375, -0.09588623046875, -0.0627593994140625, -0.029632568359375, 0.0034942626953125, 0.03662109375, 0.0697479248046875, 0.102874755859375, 0.1360015869140625, 0.16912841796875, 0.2022552490234375, 0.235382080078125, 0.2685089111328125, 0.3016357421875, 0.3347625732421875, 0.367889404296875, 0.4010162353515625, 0.43414306640625, 0.4672698974609375, 0.500396728515625, 0.5335235595703125, 0.566650390625, 0.5997772216796875, 0.632904052734375, 0.6660308837890625, 0.69915771484375, 0.7322845458984375, 0.765411376953125, 0.7985382080078125, 0.8316650390625, 0.8647918701171875, 0.897918701171875, 0.9310455322265625, 0.96417236328125, 0.9972991943359375, 1.030426025390625, 1.0635528564453125, 1.0966796875]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 6.0, 9.0, 16.0, 8.0, 18.0, 24.0, 29.0, 37.0, 51.0, 57.0, 84.0, 98.0, 98.0, 93.0, 75.0, 72.0, 57.0, 35.0, 37.0, 21.0, 14.0, 12.0, 10.0, 11.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.431387901306152, -8.125255584716797, -7.819123268127441, -7.512991428375244, -7.206859111785889, -6.900726795196533, -6.594594955444336, -6.2884626388549805, -5.982330322265625, -5.6761980056762695, -5.370065689086914, -5.063933849334717, -4.757801532745361, -4.451669216156006, -4.145537376403809, -3.839405059814453, -3.5332727432250977, -3.227140426635742, -2.921008348464966, -2.6148762702941895, -2.308743953704834, -2.0026116371154785, -1.6964795589447021, -1.3903474807739258, -1.0842151641845703, -0.7780829668045044, -0.4719507694244385, -0.16581857204437256, 0.14031362533569336, 0.4464458227157593, 0.7525780200958252, 1.0587100982666016, 1.3648433685302734, 1.6709755659103394, 1.9771077632904053, 2.2832398414611816, 2.589372158050537, 2.8955044746398926, 3.201636552810669, 3.5077686309814453, 3.813900947570801, 4.120033264160156, 4.426165580749512, 4.732297420501709, 5.0384297370910645, 5.34456205368042, 5.650693893432617, 5.956826210021973, 6.262958526611328, 6.569090843200684, 6.875223159790039, 7.181354999542236, 7.487487316131592, 7.793619632720947, 8.099751472473145, 8.4058837890625, 8.712016105651855, 9.018148422241211, 9.324280738830566, 9.630413055419922, 9.936544418334961, 10.242676734924316, 10.548809051513672, 10.854941368103027, 11.161073684692383]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 7.0, 12.0, 10.0, 7.0, 13.0, 22.0, 21.0, 22.0, 20.0, 25.0, 31.0, 32.0, 38.0, 38.0, 37.0, 55.0, 33.0, 46.0, 48.0, 52.0, 47.0, 42.0, 37.0, 46.0, 44.0, 30.0, 27.0, 18.0, 16.0, 20.0, 20.0, 21.0, 11.0, 14.0, 6.0, 7.0, 5.0, 6.0, 9.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.728944778442383, -4.568073749542236, -4.407203197479248, -4.246332168579102, -4.085461616516113, -3.924590826034546, -3.7637200355529785, -3.602849006652832, -3.4419784545898438, -3.2811076641082764, -3.120236873626709, -2.9593660831451416, -2.798495292663574, -2.637624502182007, -2.4767537117004395, -2.315882682800293, -2.1550118923187256, -1.9941411018371582, -1.8332703113555908, -1.6723995208740234, -1.511528730392456, -1.3506579399108887, -1.1897870302200317, -1.0289162397384644, -0.868045449256897, -0.7071746587753296, -0.5463038682937622, -0.38543301820755005, -0.22456222772598267, -0.06369143724441528, 0.09717941284179688, 0.25805020332336426, 0.41892099380493164, 0.579791784286499, 0.7406625747680664, 0.9015334248542786, 1.0624041557312012, 1.2232749462127686, 1.3841458559036255, 1.5450166463851929, 1.7058874368667603, 1.8667582273483276, 2.0276291370391846, 2.188499927520752, 2.3493707180023193, 2.5102415084838867, 2.671112298965454, 2.8319830894470215, 2.992853879928589, 3.1537246704101562, 3.3145954608917236, 3.475466251373291, 3.6363370418548584, 3.797207832336426, 3.9580788612365723, 4.1189494132995605, 4.279820442199707, 4.4406914710998535, 4.601562023162842, 4.762433052062988, 4.923303604125977, 5.084174633026123, 5.245045185089111, 5.405916213989258, 5.566786766052246]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 9.0, 13.0, 6.0, 22.0, 29.0, 24.0, 51.0, 83.0, 163.0, 230.0, 332.0, 632.0, 1098.0, 1913.0, 3490.0, 6683.0, 13854.0, 31073.0, 80035.0, 254327.0, 909314.0, 1694677.0, 829262.0, 232124.0, 76069.0, 29755.0, 13491.0, 6776.0, 3694.0, 2003.0, 1195.0, 692.0, 441.0, 269.0, 159.0, 113.0, 67.0, 31.0, 24.0, 21.0, 16.0, 9.0, 5.0, 8.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.5625, -9.2679443359375, -8.973388671875, -8.6788330078125, -8.38427734375, -8.0897216796875, -7.795166015625, -7.5006103515625, -7.2060546875, -6.9114990234375, -6.616943359375, -6.3223876953125, -6.02783203125, -5.7332763671875, -5.438720703125, -5.1441650390625, -4.849609375, -4.5550537109375, -4.260498046875, -3.9659423828125, -3.67138671875, -3.3768310546875, -3.082275390625, -2.7877197265625, -2.4931640625, -2.1986083984375, -1.904052734375, -1.6094970703125, -1.31494140625, -1.0203857421875, -0.725830078125, -0.4312744140625, -0.13671875, 0.1578369140625, 0.452392578125, 0.7469482421875, 1.04150390625, 1.3360595703125, 1.630615234375, 1.9251708984375, 2.2197265625, 2.5142822265625, 2.808837890625, 3.1033935546875, 3.39794921875, 3.6925048828125, 3.987060546875, 4.2816162109375, 4.576171875, 4.8707275390625, 5.165283203125, 5.4598388671875, 5.75439453125, 6.0489501953125, 6.343505859375, 6.6380615234375, 6.9326171875, 7.2271728515625, 7.521728515625, 7.8162841796875, 8.11083984375, 8.4053955078125, 8.699951171875, 8.9945068359375, 9.2890625]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 10.0, 11.0, 15.0, 9.0, 18.0, 28.0, 29.0, 34.0, 21.0, 40.0, 37.0, 46.0, 39.0, 54.0, 41.0, 60.0, 52.0, 51.0, 61.0, 37.0, 55.0, 51.0, 31.0, 30.0, 19.0, 16.0, 21.0, 17.0, 17.0, 17.0, 13.0, 4.0, 3.0, 6.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.884765625, -3.750213623046875, -3.61566162109375, -3.481109619140625, -3.3465576171875, -3.212005615234375, -3.07745361328125, -2.942901611328125, -2.808349609375, -2.673797607421875, -2.53924560546875, -2.404693603515625, -2.2701416015625, -2.135589599609375, -2.00103759765625, -1.866485595703125, -1.73193359375, -1.597381591796875, -1.46282958984375, -1.328277587890625, -1.1937255859375, -1.059173583984375, -0.92462158203125, -0.790069580078125, -0.655517578125, -0.520965576171875, -0.38641357421875, -0.251861572265625, -0.1173095703125, 0.017242431640625, 0.15179443359375, 0.286346435546875, 0.4208984375, 0.555450439453125, 0.69000244140625, 0.824554443359375, 0.9591064453125, 1.093658447265625, 1.22821044921875, 1.362762451171875, 1.497314453125, 1.631866455078125, 1.76641845703125, 1.900970458984375, 2.0355224609375, 2.170074462890625, 2.30462646484375, 2.439178466796875, 2.57373046875, 2.708282470703125, 2.84283447265625, 2.977386474609375, 3.1119384765625, 3.246490478515625, 3.38104248046875, 3.515594482421875, 3.650146484375, 3.784698486328125, 3.91925048828125, 4.053802490234375, 4.1883544921875, 4.322906494140625, 4.45745849609375, 4.592010498046875, 4.7265625]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 5.0, 1.0, 6.0, 5.0, 11.0, 11.0, 16.0, 22.0, 46.0, 60.0, 58.0, 103.0, 158.0, 206.0, 332.0, 550.0, 802.0, 1285.0, 2076.0, 3260.0, 5605.0, 9486.0, 17163.0, 31322.0, 59331.0, 121401.0, 261273.0, 581822.0, 1104003.0, 1027741.0, 512074.0, 229198.0, 106581.0, 52945.0, 27771.0, 15269.0, 8681.0, 5085.0, 3103.0, 1917.0, 1251.0, 765.0, 485.0, 330.0, 215.0, 149.0, 95.0, 76.0, 40.0, 24.0, 25.0, 17.0, 18.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-7.3671875, -7.14337158203125, -6.9195556640625, -6.69573974609375, -6.471923828125, -6.24810791015625, -6.0242919921875, -5.80047607421875, -5.57666015625, -5.35284423828125, -5.1290283203125, -4.90521240234375, -4.681396484375, -4.45758056640625, -4.2337646484375, -4.00994873046875, -3.7861328125, -3.56231689453125, -3.3385009765625, -3.11468505859375, -2.890869140625, -2.66705322265625, -2.4432373046875, -2.21942138671875, -1.99560546875, -1.77178955078125, -1.5479736328125, -1.32415771484375, -1.100341796875, -0.87652587890625, -0.6527099609375, -0.42889404296875, -0.205078125, 0.01873779296875, 0.2425537109375, 0.46636962890625, 0.690185546875, 0.91400146484375, 1.1378173828125, 1.36163330078125, 1.58544921875, 1.80926513671875, 2.0330810546875, 2.25689697265625, 2.480712890625, 2.70452880859375, 2.9283447265625, 3.15216064453125, 3.3759765625, 3.59979248046875, 3.8236083984375, 4.04742431640625, 4.271240234375, 4.49505615234375, 4.7188720703125, 4.94268798828125, 5.16650390625, 5.39031982421875, 5.6141357421875, 5.83795166015625, 6.061767578125, 6.28558349609375, 6.5093994140625, 6.73321533203125, 6.95703125]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 5.0, 1.0, 6.0, 4.0, 6.0, 4.0, 10.0, 13.0, 20.0, 9.0, 26.0, 35.0, 48.0, 71.0, 99.0, 106.0, 124.0, 145.0, 183.0, 237.0, 303.0, 313.0, 330.0, 314.0, 339.0, 284.0, 240.0, 180.0, 152.0, 110.0, 79.0, 63.0, 48.0, 36.0, 38.0, 17.0, 23.0, 12.0, 7.0, 11.0, 6.0, 11.0, 5.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-2.544921875, -2.4739227294921875, -2.402923583984375, -2.3319244384765625, -2.26092529296875, -2.1899261474609375, -2.118927001953125, -2.0479278564453125, -1.9769287109375, -1.9059295654296875, -1.834930419921875, -1.7639312744140625, -1.69293212890625, -1.6219329833984375, -1.550933837890625, -1.4799346923828125, -1.408935546875, -1.3379364013671875, -1.266937255859375, -1.1959381103515625, -1.12493896484375, -1.0539398193359375, -0.982940673828125, -0.9119415283203125, -0.8409423828125, -0.7699432373046875, -0.698944091796875, -0.6279449462890625, -0.55694580078125, -0.4859466552734375, -0.414947509765625, -0.3439483642578125, -0.27294921875, -0.2019500732421875, -0.130950927734375, -0.0599517822265625, 0.01104736328125, 0.0820465087890625, 0.153045654296875, 0.2240447998046875, 0.2950439453125, 0.3660430908203125, 0.437042236328125, 0.5080413818359375, 0.57904052734375, 0.6500396728515625, 0.721038818359375, 0.7920379638671875, 0.863037109375, 0.9340362548828125, 1.005035400390625, 1.0760345458984375, 1.14703369140625, 1.2180328369140625, 1.289031982421875, 1.3600311279296875, 1.4310302734375, 1.5020294189453125, 1.573028564453125, 1.6440277099609375, 1.71502685546875, 1.7860260009765625, 1.857025146484375, 1.9280242919921875, 1.9990234375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 9.0, 4.0, 4.0, 9.0, 14.0, 19.0, 18.0, 30.0, 33.0, 35.0, 58.0, 64.0, 82.0, 86.0, 110.0, 94.0, 79.0, 63.0, 52.0, 30.0, 31.0, 24.0, 12.0, 13.0, 9.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.282023429870605, -7.975139617919922, -7.66825532913208, -7.3613715171813965, -7.054487228393555, -6.747603416442871, -6.4407196044921875, -6.133835792541504, -5.826951503753662, -5.5200676918029785, -5.213183403015137, -4.906299591064453, -4.5994157791137695, -4.292531490325928, -3.985647678375244, -3.6787636280059814, -3.3718795776367188, -3.064995527267456, -2.7581114768981934, -2.4512276649475098, -2.144343614578247, -1.8374595642089844, -1.5305756330490112, -1.223691701889038, -0.9168076515197754, -0.6099236607551575, -0.30303966999053955, 0.003844320774078369, 0.3107283115386963, 0.617612361907959, 0.9244962930679321, 1.2313802242279053, 1.538264274597168, 1.8451483249664307, 2.1520323753356934, 2.458916187286377, 2.7658002376556396, 3.0726842880249023, 3.379568099975586, 3.6864521503448486, 3.9933362007141113, 4.300220012664795, 4.607104301452637, 4.91398811340332, 5.220871925354004, 5.527756214141846, 5.834640026092529, 6.141524314880371, 6.448408126831055, 6.755291938781738, 7.06217622756958, 7.369060039520264, 7.6759443283081055, 7.982828140258789, 8.289711952209473, 8.596595764160156, 8.903480529785156, 9.21036434173584, 9.517248153686523, 9.824132919311523, 10.131016731262207, 10.43790054321289, 10.744784355163574, 11.051668167114258, 11.358551979064941]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 9.0, 8.0, 11.0, 15.0, 15.0, 21.0, 17.0, 23.0, 39.0, 28.0, 27.0, 42.0, 37.0, 51.0, 38.0, 38.0, 44.0, 52.0, 38.0, 58.0, 65.0, 33.0, 39.0, 31.0, 29.0, 34.0, 25.0, 22.0, 12.0, 26.0, 17.0, 14.0, 8.0, 10.0, 9.0, 4.0, 1.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.997282028198242, -4.833381175994873, -4.669480800628662, -4.505579948425293, -4.341679096221924, -4.177778244018555, -4.013877868652344, -3.8499770164489746, -3.6860764026641846, -3.5221757888793945, -3.3582749366760254, -3.1943743228912354, -3.0304737091064453, -2.866572856903076, -2.702672243118286, -2.538771629333496, -2.374870777130127, -2.210970163345337, -2.0470693111419678, -1.8831686973571777, -1.7192679643630981, -1.5553672313690186, -1.3914666175842285, -1.227565884590149, -1.0636651515960693, -0.8997644186019897, -0.7358637452125549, -0.5719630718231201, -0.4080623388290405, -0.24416160583496094, -0.08026093244552612, 0.08363974094390869, 0.24754095077514648, 0.4114416539669037, 0.5753423571586609, 0.7392430305480957, 0.9031437635421753, 1.0670444965362549, 1.230945110321045, 1.3948458433151245, 1.558746576309204, 1.7226473093032837, 1.8865480422973633, 2.0504486560821533, 2.2143492698669434, 2.3782501220703125, 2.5421507358551025, 2.7060513496398926, 2.8699522018432617, 3.0338528156280518, 3.197753667831421, 3.361654281616211, 3.52555513381958, 3.68945574760437, 3.85335636138916, 4.017257213592529, 4.181158065795898, 4.345058917999268, 4.5089592933654785, 4.672860145568848, 4.836760997772217, 5.000661849975586, 5.164562225341797, 5.328463077545166, 5.492363452911377]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 9.0, 14.0, 15.0, 24.0, 28.0, 66.0, 92.0, 143.0, 225.0, 361.0, 488.0, 933.0, 1514.0, 2849.0, 5372.0, 11398.0, 25401.0, 59095.0, 134977.0, 255785.0, 272573.0, 153238.0, 68114.0, 29305.0, 13112.0, 6046.0, 3061.0, 1736.0, 1002.0, 562.0, 341.0, 234.0, 121.0, 112.0, 61.0, 43.0, 31.0, 30.0, 12.0, 6.0, 7.0, 6.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.32421875, -6.138671875, -5.953125, -5.767578125, -5.58203125, -5.396484375, -5.2109375, -5.025390625, -4.83984375, -4.654296875, -4.46875, -4.283203125, -4.09765625, -3.912109375, -3.7265625, -3.541015625, -3.35546875, -3.169921875, -2.984375, -2.798828125, -2.61328125, -2.427734375, -2.2421875, -2.056640625, -1.87109375, -1.685546875, -1.5, -1.314453125, -1.12890625, -0.943359375, -0.7578125, -0.572265625, -0.38671875, -0.201171875, -0.015625, 0.169921875, 0.35546875, 0.541015625, 0.7265625, 0.912109375, 1.09765625, 1.283203125, 1.46875, 1.654296875, 1.83984375, 2.025390625, 2.2109375, 2.396484375, 2.58203125, 2.767578125, 2.953125, 3.138671875, 3.32421875, 3.509765625, 3.6953125, 3.880859375, 4.06640625, 4.251953125, 4.4375, 4.623046875, 4.80859375, 4.994140625, 5.1796875, 5.365234375, 5.55078125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 7.0, 6.0, 7.0, 13.0, 6.0, 15.0, 17.0, 19.0, 24.0, 27.0, 32.0, 34.0, 29.0, 37.0, 36.0, 42.0, 57.0, 32.0, 54.0, 43.0, 38.0, 55.0, 42.0, 54.0, 49.0, 31.0, 20.0, 35.0, 25.0, 28.0, 15.0, 16.0, 18.0, 9.0, 10.0, 4.0, 5.0, 5.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.703125, -4.52935791015625, -4.3555908203125, -4.18182373046875, -4.008056640625, -3.83428955078125, -3.6605224609375, -3.48675537109375, -3.31298828125, -3.13922119140625, -2.9654541015625, -2.79168701171875, -2.617919921875, -2.44415283203125, -2.2703857421875, -2.09661865234375, -1.9228515625, -1.74908447265625, -1.5753173828125, -1.40155029296875, -1.227783203125, -1.05401611328125, -0.8802490234375, -0.70648193359375, -0.53271484375, -0.35894775390625, -0.1851806640625, -0.01141357421875, 0.162353515625, 0.33612060546875, 0.5098876953125, 0.68365478515625, 0.857421875, 1.03118896484375, 1.2049560546875, 1.37872314453125, 1.552490234375, 1.72625732421875, 1.9000244140625, 2.07379150390625, 2.24755859375, 2.42132568359375, 2.5950927734375, 2.76885986328125, 2.942626953125, 3.11639404296875, 3.2901611328125, 3.46392822265625, 3.6376953125, 3.81146240234375, 3.9852294921875, 4.15899658203125, 4.332763671875, 4.50653076171875, 4.6802978515625, 4.85406494140625, 5.02783203125, 5.20159912109375, 5.3753662109375, 5.54913330078125, 5.722900390625, 5.89666748046875, 6.0704345703125, 6.24420166015625, 6.41796875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 11.0, 7.0, 5.0, 12.0, 12.0, 13.0, 25.0, 50.0, 70.0, 100.0, 118.0, 167.0, 260.0, 431.0, 644.0, 1126.0, 1887.0, 3628.0, 7202.0, 16276.0, 38847.0, 98307.0, 239479.0, 337173.0, 178185.0, 71461.0, 28311.0, 12231.0, 5620.0, 2802.0, 1594.0, 891.0, 550.0, 327.0, 213.0, 141.0, 106.0, 66.0, 42.0, 44.0, 37.0, 21.0, 16.0, 13.0, 14.0, 3.0, 4.0, 5.0, 3.0, 4.0, 3.0, 5.0, 0.0, 2.0], "bins": [-7.32421875, -7.10443115234375, -6.8846435546875, -6.66485595703125, -6.445068359375, -6.22528076171875, -6.0054931640625, -5.78570556640625, -5.56591796875, -5.34613037109375, -5.1263427734375, -4.90655517578125, -4.686767578125, -4.46697998046875, -4.2471923828125, -4.02740478515625, -3.8076171875, -3.58782958984375, -3.3680419921875, -3.14825439453125, -2.928466796875, -2.70867919921875, -2.4888916015625, -2.26910400390625, -2.04931640625, -1.82952880859375, -1.6097412109375, -1.38995361328125, -1.170166015625, -0.95037841796875, -0.7305908203125, -0.51080322265625, -0.291015625, -0.07122802734375, 0.1485595703125, 0.36834716796875, 0.588134765625, 0.80792236328125, 1.0277099609375, 1.24749755859375, 1.46728515625, 1.68707275390625, 1.9068603515625, 2.12664794921875, 2.346435546875, 2.56622314453125, 2.7860107421875, 3.00579833984375, 3.2255859375, 3.44537353515625, 3.6651611328125, 3.88494873046875, 4.104736328125, 4.32452392578125, 4.5443115234375, 4.76409912109375, 4.98388671875, 5.20367431640625, 5.4234619140625, 5.64324951171875, 5.863037109375, 6.08282470703125, 6.3026123046875, 6.52239990234375, 6.7421875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 4.0, 7.0, 8.0, 9.0, 18.0, 14.0, 22.0, 25.0, 28.0, 29.0, 25.0, 30.0, 31.0, 39.0, 38.0, 35.0, 41.0, 45.0, 49.0, 51.0, 48.0, 50.0, 47.0, 40.0, 34.0, 20.0, 34.0, 20.0, 28.0, 23.0, 17.0, 15.0, 14.0, 15.0, 8.0, 12.0, 10.0, 6.0, 3.0, 6.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.83984375, -2.743743896484375, -2.64764404296875, -2.551544189453125, -2.4554443359375, -2.359344482421875, -2.26324462890625, -2.167144775390625, -2.071044921875, -1.974945068359375, -1.87884521484375, -1.782745361328125, -1.6866455078125, -1.590545654296875, -1.49444580078125, -1.398345947265625, -1.30224609375, -1.206146240234375, -1.11004638671875, -1.013946533203125, -0.9178466796875, -0.821746826171875, -0.72564697265625, -0.629547119140625, -0.533447265625, -0.437347412109375, -0.34124755859375, -0.245147705078125, -0.1490478515625, -0.052947998046875, 0.04315185546875, 0.139251708984375, 0.2353515625, 0.331451416015625, 0.42755126953125, 0.523651123046875, 0.6197509765625, 0.715850830078125, 0.81195068359375, 0.908050537109375, 1.004150390625, 1.100250244140625, 1.19635009765625, 1.292449951171875, 1.3885498046875, 1.484649658203125, 1.58074951171875, 1.676849365234375, 1.77294921875, 1.869049072265625, 1.96514892578125, 2.061248779296875, 2.1573486328125, 2.253448486328125, 2.34954833984375, 2.445648193359375, 2.541748046875, 2.637847900390625, 2.73394775390625, 2.830047607421875, 2.9261474609375, 3.022247314453125, 3.11834716796875, 3.214447021484375, 3.310546875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 1.0, 7.0, 5.0, 11.0, 11.0, 19.0, 16.0, 31.0, 38.0, 45.0, 58.0, 87.0, 131.0, 152.0, 216.0, 276.0, 392.0, 618.0, 844.0, 1211.0, 1909.0, 3309.0, 6407.0, 15072.0, 45105.0, 176874.0, 487075.0, 219297.0, 54889.0, 17234.0, 7086.0, 3650.0, 2029.0, 1378.0, 844.0, 586.0, 442.0, 300.0, 249.0, 160.0, 140.0, 84.0, 56.0, 56.0, 36.0, 33.0, 33.0, 18.0, 13.0, 9.0, 5.0, 3.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.5703125, -4.42083740234375, -4.2713623046875, -4.12188720703125, -3.972412109375, -3.82293701171875, -3.6734619140625, -3.52398681640625, -3.37451171875, -3.22503662109375, -3.0755615234375, -2.92608642578125, -2.776611328125, -2.62713623046875, -2.4776611328125, -2.32818603515625, -2.1787109375, -2.02923583984375, -1.8797607421875, -1.73028564453125, -1.580810546875, -1.43133544921875, -1.2818603515625, -1.13238525390625, -0.98291015625, -0.83343505859375, -0.6839599609375, -0.53448486328125, -0.385009765625, -0.23553466796875, -0.0860595703125, 0.06341552734375, 0.212890625, 0.36236572265625, 0.5118408203125, 0.66131591796875, 0.810791015625, 0.96026611328125, 1.1097412109375, 1.25921630859375, 1.40869140625, 1.55816650390625, 1.7076416015625, 1.85711669921875, 2.006591796875, 2.15606689453125, 2.3055419921875, 2.45501708984375, 2.6044921875, 2.75396728515625, 2.9034423828125, 3.05291748046875, 3.202392578125, 3.35186767578125, 3.5013427734375, 3.65081787109375, 3.80029296875, 3.94976806640625, 4.0992431640625, 4.24871826171875, 4.398193359375, 4.54766845703125, 4.6971435546875, 4.84661865234375, 4.99609375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 7.0, 11.0, 13.0, 15.0, 32.0, 39.0, 53.0, 72.0, 85.0, 107.0, 102.0, 113.0, 80.0, 72.0, 56.0, 45.0, 30.0, 23.0, 10.0, 11.0, 8.0, 5.0, 4.0, 0.0, 4.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00023245811462402344, -0.00022612139582633972, -0.000219784677028656, -0.0002134479582309723, -0.00020711123943328857, -0.00020077452063560486, -0.00019443780183792114, -0.00018810108304023743, -0.0001817643642425537, -0.00017542764544487, -0.00016909092664718628, -0.00016275420784950256, -0.00015641748905181885, -0.00015008077025413513, -0.00014374405145645142, -0.0001374073326587677, -0.00013107061386108398, -0.00012473389506340027, -0.00011839717626571655, -0.00011206045746803284, -0.00010572373867034912, -9.93870198726654e-05, -9.305030107498169e-05, -8.671358227729797e-05, -8.037686347961426e-05, -7.404014468193054e-05, -6.770342588424683e-05, -6.136670708656311e-05, -5.5029988288879395e-05, -4.869326949119568e-05, -4.235655069351196e-05, -3.601983189582825e-05, -2.968311309814453e-05, -2.3346394300460815e-05, -1.70096755027771e-05, -1.0672956705093384e-05, -4.336237907409668e-06, 2.000480890274048e-06, 8.337199687957764e-06, 1.467391848564148e-05, 2.1010637283325195e-05, 2.734735608100891e-05, 3.368407487869263e-05, 4.002079367637634e-05, 4.635751247406006e-05, 5.2694231271743774e-05, 5.903095006942749e-05, 6.53676688671112e-05, 7.170438766479492e-05, 7.804110646247864e-05, 8.437782526016235e-05, 9.071454405784607e-05, 9.705126285552979e-05, 0.0001033879816532135, 0.00010972470045089722, 0.00011606141924858093, 0.00012239813804626465, 0.00012873485684394836, 0.00013507157564163208, 0.0001414082944393158, 0.0001477450132369995, 0.00015408173203468323, 0.00016041845083236694, 0.00016675516963005066, 0.00017309188842773438]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 0.0, 5.0, 2.0, 4.0, 7.0, 19.0, 28.0, 39.0, 40.0, 45.0, 62.0, 87.0, 91.0, 148.0, 154.0, 218.0, 287.0, 370.0, 462.0, 705.0, 1116.0, 1623.0, 2771.0, 5723.0, 16118.0, 64709.0, 297005.0, 463328.0, 142954.0, 30955.0, 8942.0, 3854.0, 2078.0, 1330.0, 864.0, 576.0, 443.0, 287.0, 243.0, 200.0, 165.0, 120.0, 102.0, 79.0, 52.0, 41.0, 24.0, 25.0, 16.0, 13.0, 16.0, 7.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0], "bins": [-5.09765625, -4.9443359375, -4.791015625, -4.6376953125, -4.484375, -4.3310546875, -4.177734375, -4.0244140625, -3.87109375, -3.7177734375, -3.564453125, -3.4111328125, -3.2578125, -3.1044921875, -2.951171875, -2.7978515625, -2.64453125, -2.4912109375, -2.337890625, -2.1845703125, -2.03125, -1.8779296875, -1.724609375, -1.5712890625, -1.41796875, -1.2646484375, -1.111328125, -0.9580078125, -0.8046875, -0.6513671875, -0.498046875, -0.3447265625, -0.19140625, -0.0380859375, 0.115234375, 0.2685546875, 0.421875, 0.5751953125, 0.728515625, 0.8818359375, 1.03515625, 1.1884765625, 1.341796875, 1.4951171875, 1.6484375, 1.8017578125, 1.955078125, 2.1083984375, 2.26171875, 2.4150390625, 2.568359375, 2.7216796875, 2.875, 3.0283203125, 3.181640625, 3.3349609375, 3.48828125, 3.6416015625, 3.794921875, 3.9482421875, 4.1015625, 4.2548828125, 4.408203125, 4.5615234375, 4.71484375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 24.0, 33.0, 79.0, 121.0, 172.0, 156.0, 149.0, 112.0, 67.0, 28.0, 18.0, 9.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.74609375, -1.6920318603515625, -1.637969970703125, -1.5839080810546875, -1.52984619140625, -1.4757843017578125, -1.421722412109375, -1.3676605224609375, -1.3135986328125, -1.2595367431640625, -1.205474853515625, -1.1514129638671875, -1.09735107421875, -1.0432891845703125, -0.989227294921875, -0.9351654052734375, -0.881103515625, -0.8270416259765625, -0.772979736328125, -0.7189178466796875, -0.66485595703125, -0.6107940673828125, -0.556732177734375, -0.5026702880859375, -0.4486083984375, -0.3945465087890625, -0.340484619140625, -0.2864227294921875, -0.23236083984375, -0.1782989501953125, -0.124237060546875, -0.0701751708984375, -0.01611328125, 0.0379486083984375, 0.092010498046875, 0.1460723876953125, 0.20013427734375, 0.2541961669921875, 0.308258056640625, 0.3623199462890625, 0.4163818359375, 0.4704437255859375, 0.524505615234375, 0.5785675048828125, 0.63262939453125, 0.6866912841796875, 0.740753173828125, 0.7948150634765625, 0.848876953125, 0.9029388427734375, 0.957000732421875, 1.0110626220703125, 1.06512451171875, 1.1191864013671875, 1.173248291015625, 1.2273101806640625, 1.2813720703125, 1.3354339599609375, 1.389495849609375, 1.4435577392578125, 1.49761962890625, 1.5516815185546875, 1.605743408203125, 1.6598052978515625, 1.7138671875]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 6.0, 8.0, 4.0, 8.0, 13.0, 11.0, 16.0, 19.0, 20.0, 38.0, 41.0, 53.0, 68.0, 86.0, 102.0, 118.0, 85.0, 80.0, 56.0, 49.0, 27.0, 34.0, 19.0, 8.0, 11.0, 9.0, 5.0, 5.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.044318199157715, -7.732737064361572, -7.42115592956543, -7.109575271606445, -6.797994136810303, -6.48641300201416, -6.174832344055176, -5.863251209259033, -5.551670074462891, -5.240088939666748, -4.9285078048706055, -4.616927146911621, -4.3053460121154785, -3.993764877319336, -3.6821839809417725, -3.370603084564209, -3.0590219497680664, -2.747440814971924, -2.4358599185943604, -2.124279022216797, -1.8126978874206543, -1.5011168718338013, -1.1895358562469482, -0.8779549598693848, -0.5663738250732422, -0.25479280948638916, 0.05678820610046387, 0.3683692216873169, 0.6799502372741699, 0.991531252861023, 1.303112268447876, 1.6146931648254395, 1.9262752532958984, 2.237856388092041, 2.5494372844696045, 2.861018180847168, 3.1725993156433105, 3.484180450439453, 3.7957613468170166, 4.10734224319458, 4.418923377990723, 4.730504512786865, 5.042085647583008, 5.353666305541992, 5.665247440338135, 5.976828575134277, 6.288409233093262, 6.599990367889404, 6.911571502685547, 7.2231526374816895, 7.534733772277832, 7.846314430236816, 8.157896041870117, 8.469476699829102, 8.781057357788086, 9.09263801574707, 9.404219627380371, 9.715800285339355, 10.027381896972656, 10.33896255493164, 10.650543212890625, 10.962124824523926, 11.27370548248291, 11.585287094116211, 11.896867752075195]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 0.0, 5.0, 7.0, 9.0, 10.0, 11.0, 15.0, 19.0, 23.0, 32.0, 30.0, 30.0, 29.0, 43.0, 42.0, 45.0, 45.0, 40.0, 45.0, 44.0, 49.0, 56.0, 48.0, 39.0, 39.0, 27.0, 37.0, 30.0, 23.0, 17.0, 25.0, 18.0, 14.0, 18.0, 7.0, 12.0, 7.0, 3.0, 2.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.159510135650635, -4.9949188232421875, -4.83032751083374, -4.665735721588135, -4.5011444091796875, -4.33655309677124, -4.171961784362793, -4.0073699951171875, -3.8427786827087402, -3.678187370300293, -3.5135958194732666, -3.3490045070648193, -3.184412956237793, -3.0198216438293457, -2.8552303314208984, -2.690638780593872, -2.526047468185425, -2.3614561557769775, -2.196864604949951, -2.032273292541504, -1.8676817417144775, -1.7030904293060303, -1.5384989976882935, -1.3739075660705566, -1.2093161344528198, -1.044724702835083, -0.8801332712173462, -0.7155418992042542, -0.5509504675865173, -0.3863590359687805, -0.22176766395568848, -0.05717623233795166, 0.10741519927978516, 0.272006630897522, 0.4365980327129364, 0.6011894345283508, 0.7657808661460876, 0.9303722977638245, 1.0949636697769165, 1.2595551013946533, 1.4241465330123901, 1.588737964630127, 1.7533293962478638, 1.9179208278656006, 2.082512140274048, 2.247103691101074, 2.4116950035095215, 2.5762863159179688, 2.740877866744995, 2.9054691791534424, 3.0700607299804688, 3.234652042388916, 3.3992435932159424, 3.5638349056243896, 3.728426456451416, 3.8930177688598633, 4.0576090812683105, 4.222200393676758, 4.386791706085205, 4.5513834953308105, 4.715974807739258, 4.880566120147705, 5.045157432556152, 5.209749221801758, 5.374340534210205]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 9.0, 5.0, 12.0, 26.0, 14.0, 21.0, 44.0, 64.0, 98.0, 145.0, 228.0, 349.0, 524.0, 821.0, 1301.0, 2027.0, 3429.0, 5581.0, 9594.0, 16933.0, 28415.0, 48847.0, 83707.0, 133169.0, 177804.0, 181615.0, 138578.0, 88846.0, 52418.0, 30061.0, 17737.0, 10405.0, 6155.0, 3574.0, 2190.0, 1331.0, 834.0, 533.0, 348.0, 228.0, 154.0, 107.0, 79.0, 62.0, 38.0, 40.0, 17.0, 14.0, 10.0, 8.0, 4.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-4.89453125, -4.7369384765625, -4.579345703125, -4.4217529296875, -4.26416015625, -4.1065673828125, -3.948974609375, -3.7913818359375, -3.6337890625, -3.4761962890625, -3.318603515625, -3.1610107421875, -3.00341796875, -2.8458251953125, -2.688232421875, -2.5306396484375, -2.373046875, -2.2154541015625, -2.057861328125, -1.9002685546875, -1.74267578125, -1.5850830078125, -1.427490234375, -1.2698974609375, -1.1123046875, -0.9547119140625, -0.797119140625, -0.6395263671875, -0.48193359375, -0.3243408203125, -0.166748046875, -0.0091552734375, 0.1484375, 0.3060302734375, 0.463623046875, 0.6212158203125, 0.77880859375, 0.9364013671875, 1.093994140625, 1.2515869140625, 1.4091796875, 1.5667724609375, 1.724365234375, 1.8819580078125, 2.03955078125, 2.1971435546875, 2.354736328125, 2.5123291015625, 2.669921875, 2.8275146484375, 2.985107421875, 3.1427001953125, 3.30029296875, 3.4578857421875, 3.615478515625, 3.7730712890625, 3.9306640625, 4.0882568359375, 4.245849609375, 4.4034423828125, 4.56103515625, 4.7186279296875, 4.876220703125, 5.0338134765625, 5.19140625]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 12.0, 8.0, 6.0, 5.0, 18.0, 25.0, 20.0, 26.0, 25.0, 28.0, 32.0, 43.0, 37.0, 38.0, 38.0, 45.0, 49.0, 47.0, 53.0, 49.0, 42.0, 46.0, 47.0, 38.0, 30.0, 35.0, 28.0, 20.0, 18.0, 13.0, 10.0, 18.0, 9.0, 9.0, 10.0, 5.0, 6.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.890625, -5.71575927734375, -5.5408935546875, -5.36602783203125, -5.191162109375, -5.01629638671875, -4.8414306640625, -4.66656494140625, -4.49169921875, -4.31683349609375, -4.1419677734375, -3.96710205078125, -3.792236328125, -3.61737060546875, -3.4425048828125, -3.26763916015625, -3.0927734375, -2.91790771484375, -2.7430419921875, -2.56817626953125, -2.393310546875, -2.21844482421875, -2.0435791015625, -1.86871337890625, -1.69384765625, -1.51898193359375, -1.3441162109375, -1.16925048828125, -0.994384765625, -0.81951904296875, -0.6446533203125, -0.46978759765625, -0.294921875, -0.12005615234375, 0.0548095703125, 0.22967529296875, 0.404541015625, 0.57940673828125, 0.7542724609375, 0.92913818359375, 1.10400390625, 1.27886962890625, 1.4537353515625, 1.62860107421875, 1.803466796875, 1.97833251953125, 2.1531982421875, 2.32806396484375, 2.5029296875, 2.67779541015625, 2.8526611328125, 3.02752685546875, 3.202392578125, 3.37725830078125, 3.5521240234375, 3.72698974609375, 3.90185546875, 4.07672119140625, 4.2515869140625, 4.42645263671875, 4.601318359375, 4.77618408203125, 4.9510498046875, 5.12591552734375, 5.30078125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 6.0, 9.0, 8.0, 5.0, 14.0, 19.0, 17.0, 38.0, 47.0, 71.0, 124.0, 174.0, 243.0, 376.0, 561.0, 838.0, 1379.0, 2106.0, 3291.0, 5355.0, 8968.0, 14782.0, 24706.0, 41422.0, 68798.0, 106277.0, 149366.0, 171206.0, 153061.0, 111880.0, 72370.0, 43935.0, 26086.0, 15777.0, 9479.0, 5852.0, 3572.0, 2157.0, 1451.0, 954.0, 603.0, 382.0, 262.0, 192.0, 103.0, 85.0, 35.0, 39.0, 23.0, 20.0, 11.0, 8.0, 7.0, 11.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.6171875, -4.47088623046875, -4.3245849609375, -4.17828369140625, -4.031982421875, -3.88568115234375, -3.7393798828125, -3.59307861328125, -3.44677734375, -3.30047607421875, -3.1541748046875, -3.00787353515625, -2.861572265625, -2.71527099609375, -2.5689697265625, -2.42266845703125, -2.2763671875, -2.13006591796875, -1.9837646484375, -1.83746337890625, -1.691162109375, -1.54486083984375, -1.3985595703125, -1.25225830078125, -1.10595703125, -0.95965576171875, -0.8133544921875, -0.66705322265625, -0.520751953125, -0.37445068359375, -0.2281494140625, -0.08184814453125, 0.064453125, 0.21075439453125, 0.3570556640625, 0.50335693359375, 0.649658203125, 0.79595947265625, 0.9422607421875, 1.08856201171875, 1.23486328125, 1.38116455078125, 1.5274658203125, 1.67376708984375, 1.820068359375, 1.96636962890625, 2.1126708984375, 2.25897216796875, 2.4052734375, 2.55157470703125, 2.6978759765625, 2.84417724609375, 2.990478515625, 3.13677978515625, 3.2830810546875, 3.42938232421875, 3.57568359375, 3.72198486328125, 3.8682861328125, 4.01458740234375, 4.160888671875, 4.30718994140625, 4.4534912109375, 4.59979248046875, 4.74609375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 4.0, 7.0, 3.0, 11.0, 14.0, 23.0, 27.0, 23.0, 24.0, 24.0, 24.0, 42.0, 34.0, 39.0, 34.0, 39.0, 38.0, 23.0, 44.0, 53.0, 37.0, 37.0, 44.0, 41.0, 29.0, 28.0, 27.0, 26.0, 28.0, 26.0, 29.0, 18.0, 15.0, 11.0, 10.0, 11.0, 12.0, 8.0, 3.0, 4.0, 3.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.96875, -2.8792724609375, -2.789794921875, -2.7003173828125, -2.61083984375, -2.5213623046875, -2.431884765625, -2.3424072265625, -2.2529296875, -2.1634521484375, -2.073974609375, -1.9844970703125, -1.89501953125, -1.8055419921875, -1.716064453125, -1.6265869140625, -1.537109375, -1.4476318359375, -1.358154296875, -1.2686767578125, -1.17919921875, -1.0897216796875, -1.000244140625, -0.9107666015625, -0.8212890625, -0.7318115234375, -0.642333984375, -0.5528564453125, -0.46337890625, -0.3739013671875, -0.284423828125, -0.1949462890625, -0.10546875, -0.0159912109375, 0.073486328125, 0.1629638671875, 0.25244140625, 0.3419189453125, 0.431396484375, 0.5208740234375, 0.6103515625, 0.6998291015625, 0.789306640625, 0.8787841796875, 0.96826171875, 1.0577392578125, 1.147216796875, 1.2366943359375, 1.326171875, 1.4156494140625, 1.505126953125, 1.5946044921875, 1.68408203125, 1.7735595703125, 1.863037109375, 1.9525146484375, 2.0419921875, 2.1314697265625, 2.220947265625, 2.3104248046875, 2.39990234375, 2.4893798828125, 2.578857421875, 2.6683349609375, 2.7578125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 5.0, 10.0, 8.0, 28.0, 20.0, 37.0, 45.0, 51.0, 57.0, 70.0, 90.0, 129.0, 160.0, 242.0, 344.0, 424.0, 573.0, 915.0, 1395.0, 2519.0, 4562.0, 8763.0, 18039.0, 38493.0, 81953.0, 161565.0, 245188.0, 224747.0, 132442.0, 64285.0, 30134.0, 14349.0, 7125.0, 3685.0, 2035.0, 1225.0, 800.0, 529.0, 361.0, 278.0, 200.0, 163.0, 110.0, 104.0, 54.0, 56.0, 56.0, 37.0, 36.0, 17.0, 18.0, 9.0, 11.0, 7.0, 2.0, 4.0, 0.0, 1.0], "bins": [-3.017578125, -2.925689697265625, -2.83380126953125, -2.741912841796875, -2.6500244140625, -2.558135986328125, -2.46624755859375, -2.374359130859375, -2.282470703125, -2.190582275390625, -2.09869384765625, -2.006805419921875, -1.9149169921875, -1.823028564453125, -1.73114013671875, -1.639251708984375, -1.54736328125, -1.455474853515625, -1.36358642578125, -1.271697998046875, -1.1798095703125, -1.087921142578125, -0.99603271484375, -0.904144287109375, -0.812255859375, -0.720367431640625, -0.62847900390625, -0.536590576171875, -0.4447021484375, -0.352813720703125, -0.26092529296875, -0.169036865234375, -0.0771484375, 0.014739990234375, 0.10662841796875, 0.198516845703125, 0.2904052734375, 0.382293701171875, 0.47418212890625, 0.566070556640625, 0.657958984375, 0.749847412109375, 0.84173583984375, 0.933624267578125, 1.0255126953125, 1.117401123046875, 1.20928955078125, 1.301177978515625, 1.39306640625, 1.484954833984375, 1.57684326171875, 1.668731689453125, 1.7606201171875, 1.852508544921875, 1.94439697265625, 2.036285400390625, 2.128173828125, 2.220062255859375, 2.31195068359375, 2.403839111328125, 2.4957275390625, 2.587615966796875, 2.67950439453125, 2.771392822265625, 2.86328125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 13.0, 13.0, 11.0, 18.0, 20.0, 28.0, 46.0, 51.0, 63.0, 69.0, 82.0, 76.0, 83.0, 75.0, 67.0, 56.0, 58.0, 46.0, 30.0, 20.0, 12.0, 18.0, 5.0, 9.0, 4.0, 4.0, 6.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00034880638122558594, -0.00034005753695964813, -0.00033130869269371033, -0.0003225598484277725, -0.0003138110041618347, -0.0003050621598958969, -0.0002963133156299591, -0.0002875644713640213, -0.0002788156270980835, -0.0002700667828321457, -0.0002613179385662079, -0.0002525690943002701, -0.00024382025003433228, -0.00023507140576839447, -0.00022632256150245667, -0.00021757371723651886, -0.00020882487297058105, -0.00020007602870464325, -0.00019132718443870544, -0.00018257834017276764, -0.00017382949590682983, -0.00016508065164089203, -0.00015633180737495422, -0.00014758296310901642, -0.0001388341188430786, -0.0001300852745771408, -0.000121336430311203, -0.0001125875860452652, -0.00010383874177932739, -9.508989751338959e-05, -8.634105324745178e-05, -7.759220898151398e-05, -6.884336471557617e-05, -6.009452044963837e-05, -5.134567618370056e-05, -4.2596831917762756e-05, -3.384798765182495e-05, -2.5099143385887146e-05, -1.635029911994934e-05, -7.601454854011536e-06, 1.1473894119262695e-06, 9.896233677864075e-06, 1.864507794380188e-05, 2.7393922209739685e-05, 3.614276647567749e-05, 4.4891610741615295e-05, 5.36404550075531e-05, 6.23892992734909e-05, 7.113814353942871e-05, 7.988698780536652e-05, 8.863583207130432e-05, 9.738467633724213e-05, 0.00010613352060317993, 0.00011488236486911774, 0.00012363120913505554, 0.00013238005340099335, 0.00014112889766693115, 0.00014987774193286896, 0.00015862658619880676, 0.00016737543046474457, 0.00017612427473068237, 0.00018487311899662018, 0.00019362196326255798, 0.0002023708075284958, 0.0002111196517944336]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 5.0, 4.0, 11.0, 16.0, 10.0, 18.0, 20.0, 28.0, 48.0, 73.0, 110.0, 168.0, 322.0, 623.0, 1271.0, 2799.0, 7273.0, 20867.0, 66427.0, 205613.0, 379688.0, 241629.0, 81092.0, 25380.0, 8725.0, 3253.0, 1402.0, 712.0, 381.0, 198.0, 119.0, 91.0, 43.0, 39.0, 16.0, 18.0, 19.0, 15.0, 10.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.96484375, -4.8170166015625, -4.669189453125, -4.5213623046875, -4.37353515625, -4.2257080078125, -4.077880859375, -3.9300537109375, -3.7822265625, -3.6343994140625, -3.486572265625, -3.3387451171875, -3.19091796875, -3.0430908203125, -2.895263671875, -2.7474365234375, -2.599609375, -2.4517822265625, -2.303955078125, -2.1561279296875, -2.00830078125, -1.8604736328125, -1.712646484375, -1.5648193359375, -1.4169921875, -1.2691650390625, -1.121337890625, -0.9735107421875, -0.82568359375, -0.6778564453125, -0.530029296875, -0.3822021484375, -0.234375, -0.0865478515625, 0.061279296875, 0.2091064453125, 0.35693359375, 0.5047607421875, 0.652587890625, 0.8004150390625, 0.9482421875, 1.0960693359375, 1.243896484375, 1.3917236328125, 1.53955078125, 1.6873779296875, 1.835205078125, 1.9830322265625, 2.130859375, 2.2786865234375, 2.426513671875, 2.5743408203125, 2.72216796875, 2.8699951171875, 3.017822265625, 3.1656494140625, 3.3134765625, 3.4613037109375, 3.609130859375, 3.7569580078125, 3.90478515625, 4.0526123046875, 4.200439453125, 4.3482666015625, 4.49609375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 15.0, 7.0, 17.0, 11.0, 27.0, 33.0, 33.0, 58.0, 52.0, 64.0, 68.0, 81.0, 77.0, 77.0, 80.0, 53.0, 59.0, 53.0, 41.0, 22.0, 22.0, 14.0, 11.0, 15.0, 9.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2822265625, -1.2505264282226562, -1.2188262939453125, -1.1871261596679688, -1.155426025390625, -1.1237258911132812, -1.0920257568359375, -1.0603256225585938, -1.02862548828125, -0.9969253540039062, -0.9652252197265625, -0.9335250854492188, -0.901824951171875, -0.8701248168945312, -0.8384246826171875, -0.8067245483398438, -0.7750244140625, -0.7433242797851562, -0.7116241455078125, -0.6799240112304688, -0.648223876953125, -0.6165237426757812, -0.5848236083984375, -0.5531234741210938, -0.52142333984375, -0.48972320556640625, -0.4580230712890625, -0.42632293701171875, -0.394622802734375, -0.36292266845703125, -0.3312225341796875, -0.29952239990234375, -0.267822265625, -0.23612213134765625, -0.2044219970703125, -0.17272186279296875, -0.141021728515625, -0.10932159423828125, -0.0776214599609375, -0.04592132568359375, -0.01422119140625, 0.01747894287109375, 0.0491790771484375, 0.08087921142578125, 0.112579345703125, 0.14427947998046875, 0.1759796142578125, 0.20767974853515625, 0.2393798828125, 0.27108001708984375, 0.3027801513671875, 0.33448028564453125, 0.366180419921875, 0.39788055419921875, 0.4295806884765625, 0.46128082275390625, 0.49298095703125, 0.5246810913085938, 0.5563812255859375, 0.5880813598632812, 0.619781494140625, 0.6514816284179688, 0.6831817626953125, 0.7148818969726562, 0.74658203125]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 5.0, 13.0, 18.0, 18.0, 21.0, 22.0, 28.0, 49.0, 60.0, 68.0, 102.0, 92.0, 97.0, 113.0, 75.0, 52.0, 40.0, 31.0, 29.0, 15.0, 13.0, 11.0, 4.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.124826431274414, -8.80727767944336, -8.489727973937988, -8.172179222106934, -7.8546295166015625, -7.53708028793335, -7.219531059265137, -6.901982307434082, -6.584432601928711, -6.266883373260498, -5.949334144592285, -5.631784915924072, -5.314235687255859, -4.9966864585876465, -4.679137229919434, -4.361588478088379, -4.044039249420166, -3.726490020751953, -3.4089407920837402, -3.0913915634155273, -2.7738423347473145, -2.4562931060791016, -2.1387441158294678, -1.8211948871612549, -1.503645658493042, -1.186096429824829, -0.868547260761261, -0.5509980916976929, -0.23344886302947998, 0.08410036563873291, 0.40164947509765625, 0.7191987037658691, 1.036747932434082, 1.354297161102295, 1.6718463897705078, 1.9893954992294312, 2.3069448471069336, 2.6244940757751465, 2.9420430660247803, 3.259592294692993, 3.577141523361206, 3.894690752029419, 4.212239742279053, 4.529788970947266, 4.8473381996154785, 5.164887428283691, 5.482436656951904, 5.799985885620117, 6.11753511428833, 6.435084342956543, 6.752633571624756, 7.070182800292969, 7.387732028961182, 7.7052812576293945, 8.02283000946045, 8.34037971496582, 8.657928466796875, 8.97547721862793, 9.2930269241333, 9.610575675964355, 9.928125381469727, 10.245674133300781, 10.563223838806152, 10.880772590637207, 11.198322296142578]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 9.0, 5.0, 16.0, 14.0, 19.0, 18.0, 15.0, 21.0, 24.0, 34.0, 41.0, 43.0, 42.0, 38.0, 44.0, 43.0, 54.0, 50.0, 44.0, 46.0, 39.0, 52.0, 36.0, 29.0, 40.0, 22.0, 23.0, 23.0, 19.0, 24.0, 13.0, 8.0, 15.0, 15.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.089992046356201, -4.92699670791626, -4.764001846313477, -4.601006507873535, -4.438011169433594, -4.2750163078308105, -4.112020969390869, -3.949025869369507, -3.7860307693481445, -3.6230356693267822, -3.46004056930542, -3.2970452308654785, -3.134050130844116, -2.971055030822754, -2.8080596923828125, -2.64506459236145, -2.482069492340088, -2.3190743923187256, -2.1560792922973633, -1.9930839538574219, -1.8300888538360596, -1.6670937538146973, -1.5040985345840454, -1.3411033153533936, -1.1781082153320312, -1.015113115310669, -0.8521178960800171, -0.68912273645401, -0.5261275768280029, -0.36313241720199585, -0.20013725757598877, -0.037142038345336914, 0.1258525848388672, 0.28884774446487427, 0.45184290409088135, 0.6148380637168884, 0.7778332233428955, 0.9408283829689026, 1.1038235425949097, 1.2668187618255615, 1.4298138618469238, 1.5928089618682861, 1.755804181098938, 1.9187994003295898, 2.081794500350952, 2.2447896003723145, 2.407784938812256, 2.570780038833618, 2.7337751388549805, 2.8967702388763428, 3.059765338897705, 3.2227606773376465, 3.385755777359009, 3.548750877380371, 3.7117462158203125, 3.874741315841675, 4.037736415863037, 4.2007317543029785, 4.363726615905762, 4.526721954345703, 4.6897172927856445, 4.852712154388428, 5.015707492828369, 5.178702354431152, 5.341697692871094]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 7.0, 2.0, 2.0, 11.0, 11.0, 24.0, 18.0, 33.0, 52.0, 81.0, 98.0, 139.0, 206.0, 295.0, 427.0, 655.0, 1028.0, 1634.0, 2527.0, 4306.0, 7350.0, 13389.0, 26268.0, 55055.0, 129156.0, 346722.0, 919553.0, 1379129.0, 796317.0, 292754.0, 111888.0, 49362.0, 24314.0, 12913.0, 7203.0, 4208.0, 2528.0, 1552.0, 1000.0, 706.0, 452.0, 293.0, 191.0, 124.0, 80.0, 69.0, 45.0, 33.0, 20.0, 19.0, 7.0, 9.0, 4.0, 5.0, 3.0, 3.0, 2.0, 3.0], "bins": [-7.62890625, -7.400634765625, -7.17236328125, -6.944091796875, -6.7158203125, -6.487548828125, -6.25927734375, -6.031005859375, -5.802734375, -5.574462890625, -5.34619140625, -5.117919921875, -4.8896484375, -4.661376953125, -4.43310546875, -4.204833984375, -3.9765625, -3.748291015625, -3.52001953125, -3.291748046875, -3.0634765625, -2.835205078125, -2.60693359375, -2.378662109375, -2.150390625, -1.922119140625, -1.69384765625, -1.465576171875, -1.2373046875, -1.009033203125, -0.78076171875, -0.552490234375, -0.32421875, -0.095947265625, 0.13232421875, 0.360595703125, 0.5888671875, 0.817138671875, 1.04541015625, 1.273681640625, 1.501953125, 1.730224609375, 1.95849609375, 2.186767578125, 2.4150390625, 2.643310546875, 2.87158203125, 3.099853515625, 3.328125, 3.556396484375, 3.78466796875, 4.012939453125, 4.2412109375, 4.469482421875, 4.69775390625, 4.926025390625, 5.154296875, 5.382568359375, 5.61083984375, 5.839111328125, 6.0673828125, 6.295654296875, 6.52392578125, 6.752197265625, 6.98046875]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 5.0, 6.0, 13.0, 11.0, 13.0, 19.0, 16.0, 18.0, 19.0, 21.0, 29.0, 39.0, 42.0, 45.0, 45.0, 44.0, 62.0, 57.0, 55.0, 52.0, 58.0, 29.0, 37.0, 32.0, 27.0, 32.0, 24.0, 24.0, 31.0, 20.0, 16.0, 16.0, 13.0, 10.0, 5.0, 4.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9375, -3.8143310546875, -3.691162109375, -3.5679931640625, -3.44482421875, -3.3216552734375, -3.198486328125, -3.0753173828125, -2.9521484375, -2.8289794921875, -2.705810546875, -2.5826416015625, -2.45947265625, -2.3363037109375, -2.213134765625, -2.0899658203125, -1.966796875, -1.8436279296875, -1.720458984375, -1.5972900390625, -1.47412109375, -1.3509521484375, -1.227783203125, -1.1046142578125, -0.9814453125, -0.8582763671875, -0.735107421875, -0.6119384765625, -0.48876953125, -0.3656005859375, -0.242431640625, -0.1192626953125, 0.00390625, 0.1270751953125, 0.250244140625, 0.3734130859375, 0.49658203125, 0.6197509765625, 0.742919921875, 0.8660888671875, 0.9892578125, 1.1124267578125, 1.235595703125, 1.3587646484375, 1.48193359375, 1.6051025390625, 1.728271484375, 1.8514404296875, 1.974609375, 2.0977783203125, 2.220947265625, 2.3441162109375, 2.46728515625, 2.5904541015625, 2.713623046875, 2.8367919921875, 2.9599609375, 3.0831298828125, 3.206298828125, 3.3294677734375, 3.45263671875, 3.5758056640625, 3.698974609375, 3.8221435546875, 3.9453125]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 4.0, 4.0, 8.0, 10.0, 24.0, 13.0, 34.0, 42.0, 68.0, 87.0, 149.0, 186.0, 276.0, 441.0, 644.0, 1060.0, 1728.0, 2733.0, 4567.0, 8082.0, 14428.0, 27094.0, 54775.0, 116687.0, 267303.0, 642831.0, 1253124.0, 1004653.0, 437803.0, 184706.0, 83017.0, 40224.0, 20479.0, 10942.0, 6201.0, 3696.0, 2274.0, 1373.0, 847.0, 550.0, 364.0, 243.0, 174.0, 121.0, 61.0, 54.0, 30.0, 24.0, 19.0, 9.0, 9.0, 7.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.44921875, -7.20721435546875, -6.9652099609375, -6.72320556640625, -6.481201171875, -6.23919677734375, -5.9971923828125, -5.75518798828125, -5.51318359375, -5.27117919921875, -5.0291748046875, -4.78717041015625, -4.545166015625, -4.30316162109375, -4.0611572265625, -3.81915283203125, -3.5771484375, -3.33514404296875, -3.0931396484375, -2.85113525390625, -2.609130859375, -2.36712646484375, -2.1251220703125, -1.88311767578125, -1.64111328125, -1.39910888671875, -1.1571044921875, -0.91510009765625, -0.673095703125, -0.43109130859375, -0.1890869140625, 0.05291748046875, 0.294921875, 0.53692626953125, 0.7789306640625, 1.02093505859375, 1.262939453125, 1.50494384765625, 1.7469482421875, 1.98895263671875, 2.23095703125, 2.47296142578125, 2.7149658203125, 2.95697021484375, 3.198974609375, 3.44097900390625, 3.6829833984375, 3.92498779296875, 4.1669921875, 4.40899658203125, 4.6510009765625, 4.89300537109375, 5.135009765625, 5.37701416015625, 5.6190185546875, 5.86102294921875, 6.10302734375, 6.34503173828125, 6.5870361328125, 6.82904052734375, 7.071044921875, 7.31304931640625, 7.5550537109375, 7.79705810546875, 8.0390625]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 3.0, 5.0, 5.0, 4.0, 10.0, 9.0, 15.0, 17.0, 23.0, 33.0, 36.0, 52.0, 47.0, 88.0, 118.0, 148.0, 192.0, 225.0, 283.0, 308.0, 334.0, 351.0, 307.0, 289.0, 275.0, 199.0, 180.0, 111.0, 113.0, 73.0, 62.0, 53.0, 31.0, 19.0, 14.0, 10.0, 5.0, 8.0, 4.0, 6.0, 6.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.23046875, -2.156524658203125, -2.08258056640625, -2.008636474609375, -1.9346923828125, -1.860748291015625, -1.78680419921875, -1.712860107421875, -1.638916015625, -1.564971923828125, -1.49102783203125, -1.417083740234375, -1.3431396484375, -1.269195556640625, -1.19525146484375, -1.121307373046875, -1.04736328125, -0.973419189453125, -0.89947509765625, -0.825531005859375, -0.7515869140625, -0.677642822265625, -0.60369873046875, -0.529754638671875, -0.455810546875, -0.381866455078125, -0.30792236328125, -0.233978271484375, -0.1600341796875, -0.086090087890625, -0.01214599609375, 0.061798095703125, 0.1357421875, 0.209686279296875, 0.28363037109375, 0.357574462890625, 0.4315185546875, 0.505462646484375, 0.57940673828125, 0.653350830078125, 0.727294921875, 0.801239013671875, 0.87518310546875, 0.949127197265625, 1.0230712890625, 1.097015380859375, 1.17095947265625, 1.244903564453125, 1.31884765625, 1.392791748046875, 1.46673583984375, 1.540679931640625, 1.6146240234375, 1.688568115234375, 1.76251220703125, 1.836456298828125, 1.910400390625, 1.984344482421875, 2.05828857421875, 2.132232666015625, 2.2061767578125, 2.280120849609375, 2.35406494140625, 2.428009033203125, 2.501953125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 8.0, 3.0, 1.0, 3.0, 11.0, 10.0, 16.0, 12.0, 32.0, 24.0, 29.0, 48.0, 51.0, 56.0, 69.0, 90.0, 93.0, 77.0, 86.0, 66.0, 49.0, 49.0, 33.0, 21.0, 21.0, 15.0, 10.0, 6.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.17936897277832, -8.893779754638672, -8.60819149017334, -8.322602272033691, -8.03701400756836, -7.751424789428711, -7.465836048126221, -7.1802473068237305, -6.89465856552124, -6.60906982421875, -6.32348108291626, -6.0378923416137695, -5.752303123474121, -5.466714859008789, -5.181125640869141, -4.89553689956665, -4.60994815826416, -4.32435941696167, -4.03877067565918, -3.7531816959381104, -3.46759295463562, -3.18200421333313, -2.8964152336120605, -2.6108264923095703, -2.32523775100708, -2.03964900970459, -1.75406014919281, -1.4684712886810303, -1.18288254737854, -0.8972938060760498, -0.61170494556427, -0.32611608505249023, -0.040526390075683594, 0.24506241083145142, 0.5306512117385864, 0.8162400126457214, 1.1018288135528564, 1.3874175548553467, 1.6730064153671265, 1.9585952758789062, 2.2441840171813965, 2.5297727584838867, 2.815361499786377, 3.1009504795074463, 3.3865392208099365, 3.6721279621124268, 3.957716941833496, 4.243305683135986, 4.528894424438477, 4.814483165740967, 5.100071907043457, 5.385660648345947, 5.6712493896484375, 5.956838607788086, 6.242427349090576, 6.528016090393066, 6.813604831695557, 7.099193572998047, 7.384782314300537, 7.670371055603027, 7.955960273742676, 8.241548538208008, 8.527137756347656, 8.812726974487305, 9.098315238952637]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 9.0, 6.0, 7.0, 8.0, 11.0, 10.0, 22.0, 18.0, 30.0, 22.0, 28.0, 28.0, 43.0, 41.0, 53.0, 46.0, 46.0, 38.0, 49.0, 49.0, 46.0, 49.0, 32.0, 40.0, 41.0, 34.0, 23.0, 36.0, 20.0, 24.0, 23.0, 14.0, 13.0, 15.0, 8.0, 8.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3765716552734375, -4.217191219329834, -4.057810306549072, -3.8984296321868896, -3.739048957824707, -3.5796685218811035, -3.420287847518921, -3.2609071731567383, -3.1015264987945557, -2.942145824432373, -2.7827651500701904, -2.623384475708008, -2.4640040397644043, -2.3046231269836426, -2.145242691040039, -1.9858620166778564, -1.8264813423156738, -1.6671006679534912, -1.5077199935913086, -1.3483394384384155, -1.188958764076233, -1.0295780897140503, -0.8701974749565125, -0.7108168601989746, -0.551436185836792, -0.39205554127693176, -0.23267489671707153, -0.0732942521572113, 0.08608639240264893, 0.24546706676483154, 0.4048476815223694, 0.5642282962799072, 0.7236084938049316, 0.8829891681671143, 1.0423698425292969, 1.20175039768219, 1.3611310720443726, 1.5205117464065552, 1.6798923015594482, 1.8392729759216309, 1.9986536502838135, 2.158034324645996, 2.3174149990081787, 2.4767956733703613, 2.636176109313965, 2.7955570220947266, 2.95493745803833, 3.1143181324005127, 3.2736988067626953, 3.433079481124878, 3.5924601554870605, 3.751840829849243, 3.911221504211426, 4.070601940155029, 4.229982852935791, 4.3893632888793945, 4.548744201660156, 4.70812463760376, 4.8675055503845215, 5.026885986328125, 5.186266899108887, 5.34564733505249, 5.505028247833252, 5.6644086837768555, 5.823789119720459]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 7.0, 6.0, 4.0, 11.0, 26.0, 36.0, 52.0, 73.0, 107.0, 195.0, 308.0, 527.0, 840.0, 1388.0, 2590.0, 4672.0, 8653.0, 17353.0, 37485.0, 81235.0, 174517.0, 283598.0, 225020.0, 111016.0, 50153.0, 23693.0, 11506.0, 5920.0, 3113.0, 1788.0, 1037.0, 600.0, 340.0, 229.0, 157.0, 111.0, 58.0, 38.0, 30.0, 23.0, 7.0, 13.0, 4.0, 5.0, 6.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.5703125, -5.38885498046875, -5.2073974609375, -5.02593994140625, -4.844482421875, -4.66302490234375, -4.4815673828125, -4.30010986328125, -4.11865234375, -3.93719482421875, -3.7557373046875, -3.57427978515625, -3.392822265625, -3.21136474609375, -3.0299072265625, -2.84844970703125, -2.6669921875, -2.48553466796875, -2.3040771484375, -2.12261962890625, -1.941162109375, -1.75970458984375, -1.5782470703125, -1.39678955078125, -1.21533203125, -1.03387451171875, -0.8524169921875, -0.67095947265625, -0.489501953125, -0.30804443359375, -0.1265869140625, 0.05487060546875, 0.236328125, 0.41778564453125, 0.5992431640625, 0.78070068359375, 0.962158203125, 1.14361572265625, 1.3250732421875, 1.50653076171875, 1.68798828125, 1.86944580078125, 2.0509033203125, 2.23236083984375, 2.413818359375, 2.59527587890625, 2.7767333984375, 2.95819091796875, 3.1396484375, 3.32110595703125, 3.5025634765625, 3.68402099609375, 3.865478515625, 4.04693603515625, 4.2283935546875, 4.40985107421875, 4.59130859375, 4.77276611328125, 4.9542236328125, 5.13568115234375, 5.317138671875, 5.49859619140625, 5.6800537109375, 5.86151123046875, 6.04296875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 6.0, 9.0, 8.0, 8.0, 6.0, 7.0, 14.0, 18.0, 14.0, 18.0, 26.0, 32.0, 34.0, 30.0, 36.0, 38.0, 48.0, 45.0, 40.0, 46.0, 52.0, 48.0, 44.0, 51.0, 43.0, 40.0, 34.0, 25.0, 35.0, 28.0, 16.0, 17.0, 16.0, 14.0, 12.0, 9.0, 16.0, 10.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.91015625, -4.74749755859375, -4.5848388671875, -4.42218017578125, -4.259521484375, -4.09686279296875, -3.9342041015625, -3.77154541015625, -3.60888671875, -3.44622802734375, -3.2835693359375, -3.12091064453125, -2.958251953125, -2.79559326171875, -2.6329345703125, -2.47027587890625, -2.3076171875, -2.14495849609375, -1.9822998046875, -1.81964111328125, -1.656982421875, -1.49432373046875, -1.3316650390625, -1.16900634765625, -1.00634765625, -0.84368896484375, -0.6810302734375, -0.51837158203125, -0.355712890625, -0.19305419921875, -0.0303955078125, 0.13226318359375, 0.294921875, 0.45758056640625, 0.6202392578125, 0.78289794921875, 0.945556640625, 1.10821533203125, 1.2708740234375, 1.43353271484375, 1.59619140625, 1.75885009765625, 1.9215087890625, 2.08416748046875, 2.246826171875, 2.40948486328125, 2.5721435546875, 2.73480224609375, 2.8974609375, 3.06011962890625, 3.2227783203125, 3.38543701171875, 3.548095703125, 3.71075439453125, 3.8734130859375, 4.03607177734375, 4.19873046875, 4.36138916015625, 4.5240478515625, 4.68670654296875, 4.849365234375, 5.01202392578125, 5.1746826171875, 5.33734130859375, 5.5]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 3.0, 8.0, 4.0, 19.0, 17.0, 26.0, 37.0, 64.0, 74.0, 125.0, 178.0, 273.0, 476.0, 711.0, 1052.0, 1814.0, 3031.0, 5308.0, 9890.0, 19538.0, 42190.0, 95148.0, 213504.0, 311963.0, 186617.0, 81804.0, 36646.0, 17078.0, 8867.0, 4867.0, 2753.0, 1575.0, 1037.0, 597.0, 444.0, 253.0, 174.0, 118.0, 79.0, 60.0, 48.0, 35.0, 15.0, 7.0, 10.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.62890625, -6.42437744140625, -6.2198486328125, -6.01531982421875, -5.810791015625, -5.60626220703125, -5.4017333984375, -5.19720458984375, -4.99267578125, -4.78814697265625, -4.5836181640625, -4.37908935546875, -4.174560546875, -3.97003173828125, -3.7655029296875, -3.56097412109375, -3.3564453125, -3.15191650390625, -2.9473876953125, -2.74285888671875, -2.538330078125, -2.33380126953125, -2.1292724609375, -1.92474365234375, -1.72021484375, -1.51568603515625, -1.3111572265625, -1.10662841796875, -0.902099609375, -0.69757080078125, -0.4930419921875, -0.28851318359375, -0.083984375, 0.12054443359375, 0.3250732421875, 0.52960205078125, 0.734130859375, 0.93865966796875, 1.1431884765625, 1.34771728515625, 1.55224609375, 1.75677490234375, 1.9613037109375, 2.16583251953125, 2.370361328125, 2.57489013671875, 2.7794189453125, 2.98394775390625, 3.1884765625, 3.39300537109375, 3.5975341796875, 3.80206298828125, 4.006591796875, 4.21112060546875, 4.4156494140625, 4.62017822265625, 4.82470703125, 5.02923583984375, 5.2337646484375, 5.43829345703125, 5.642822265625, 5.84735107421875, 6.0518798828125, 6.25640869140625, 6.4609375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 6.0, 4.0, 4.0, 7.0, 8.0, 13.0, 17.0, 10.0, 15.0, 27.0, 26.0, 20.0, 29.0, 20.0, 26.0, 43.0, 36.0, 43.0, 47.0, 37.0, 43.0, 34.0, 34.0, 53.0, 36.0, 27.0, 29.0, 39.0, 33.0, 28.0, 29.0, 24.0, 19.0, 21.0, 22.0, 19.0, 16.0, 20.0, 10.0, 8.0, 5.0, 10.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.818359375, -2.733062744140625, -2.64776611328125, -2.562469482421875, -2.4771728515625, -2.391876220703125, -2.30657958984375, -2.221282958984375, -2.135986328125, -2.050689697265625, -1.96539306640625, -1.880096435546875, -1.7947998046875, -1.709503173828125, -1.62420654296875, -1.538909912109375, -1.45361328125, -1.368316650390625, -1.28302001953125, -1.197723388671875, -1.1124267578125, -1.027130126953125, -0.94183349609375, -0.856536865234375, -0.771240234375, -0.685943603515625, -0.60064697265625, -0.515350341796875, -0.4300537109375, -0.344757080078125, -0.25946044921875, -0.174163818359375, -0.0888671875, -0.003570556640625, 0.08172607421875, 0.167022705078125, 0.2523193359375, 0.337615966796875, 0.42291259765625, 0.508209228515625, 0.593505859375, 0.678802490234375, 0.76409912109375, 0.849395751953125, 0.9346923828125, 1.019989013671875, 1.10528564453125, 1.190582275390625, 1.27587890625, 1.361175537109375, 1.44647216796875, 1.531768798828125, 1.6170654296875, 1.702362060546875, 1.78765869140625, 1.872955322265625, 1.958251953125, 2.043548583984375, 2.12884521484375, 2.214141845703125, 2.2994384765625, 2.384735107421875, 2.47003173828125, 2.555328369140625, 2.640625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 16.0, 11.0, 15.0, 24.0, 28.0, 34.0, 48.0, 74.0, 99.0, 113.0, 161.0, 232.0, 346.0, 449.0, 724.0, 988.0, 1464.0, 2270.0, 3751.0, 6367.0, 12169.0, 25872.0, 65131.0, 189061.0, 400142.0, 208083.0, 71418.0, 28157.0, 13115.0, 6851.0, 3884.0, 2420.0, 1599.0, 1061.0, 731.0, 446.0, 300.0, 233.0, 198.0, 142.0, 87.0, 82.0, 49.0, 25.0, 30.0, 17.0, 10.0, 10.0, 5.0, 4.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-3.6171875, -3.498779296875, -3.38037109375, -3.261962890625, -3.1435546875, -3.025146484375, -2.90673828125, -2.788330078125, -2.669921875, -2.551513671875, -2.43310546875, -2.314697265625, -2.1962890625, -2.077880859375, -1.95947265625, -1.841064453125, -1.72265625, -1.604248046875, -1.48583984375, -1.367431640625, -1.2490234375, -1.130615234375, -1.01220703125, -0.893798828125, -0.775390625, -0.656982421875, -0.53857421875, -0.420166015625, -0.3017578125, -0.183349609375, -0.06494140625, 0.053466796875, 0.171875, 0.290283203125, 0.40869140625, 0.527099609375, 0.6455078125, 0.763916015625, 0.88232421875, 1.000732421875, 1.119140625, 1.237548828125, 1.35595703125, 1.474365234375, 1.5927734375, 1.711181640625, 1.82958984375, 1.947998046875, 2.06640625, 2.184814453125, 2.30322265625, 2.421630859375, 2.5400390625, 2.658447265625, 2.77685546875, 2.895263671875, 3.013671875, 3.132080078125, 3.25048828125, 3.368896484375, 3.4873046875, 3.605712890625, 3.72412109375, 3.842529296875, 3.9609375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 7.0, 3.0, 5.0, 3.0, 4.0, 7.0, 10.0, 8.0, 10.0, 24.0, 24.0, 30.0, 38.0, 41.0, 74.0, 79.0, 87.0, 101.0, 90.0, 75.0, 56.0, 61.0, 25.0, 34.0, 31.0, 19.0, 14.0, 14.0, 10.0, 3.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014448165893554688, -0.00013866834342479706, -0.00013285502791404724, -0.00012704171240329742, -0.00012122839689254761, -0.00011541508138179779, -0.00010960176587104797, -0.00010378845036029816, -9.797513484954834e-05, -9.216181933879852e-05, -8.63485038280487e-05, -8.053518831729889e-05, -7.472187280654907e-05, -6.890855729579926e-05, -6.309524178504944e-05, -5.728192627429962e-05, -5.1468610763549805e-05, -4.565529525279999e-05, -3.984197974205017e-05, -3.4028664231300354e-05, -2.8215348720550537e-05, -2.240203320980072e-05, -1.6588717699050903e-05, -1.0775402188301086e-05, -4.9620866775512695e-06, 8.512288331985474e-07, 6.664544343948364e-06, 1.2477859854698181e-05, 1.8291175365447998e-05, 2.4104490876197815e-05, 2.9917806386947632e-05, 3.573112189769745e-05, 4.1544437408447266e-05, 4.735775291919708e-05, 5.31710684299469e-05, 5.8984383940696716e-05, 6.479769945144653e-05, 7.061101496219635e-05, 7.642433047294617e-05, 8.223764598369598e-05, 8.80509614944458e-05, 9.386427700519562e-05, 9.967759251594543e-05, 0.00010549090802669525, 0.00011130422353744507, 0.00011711753904819489, 0.0001229308545589447, 0.00012874417006969452, 0.00013455748558044434, 0.00014037080109119415, 0.00014618411660194397, 0.0001519974321126938, 0.0001578107476234436, 0.00016362406313419342, 0.00016943737864494324, 0.00017525069415569305, 0.00018106400966644287, 0.0001868773251771927, 0.0001926906406879425, 0.00019850395619869232, 0.00020431727170944214, 0.00021013058722019196, 0.00021594390273094177, 0.0002217572182416916, 0.0002275705337524414]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 6.0, 8.0, 4.0, 9.0, 16.0, 27.0, 33.0, 56.0, 66.0, 121.0, 160.0, 244.0, 339.0, 577.0, 839.0, 1352.0, 2100.0, 3521.0, 6047.0, 11851.0, 26875.0, 72533.0, 212363.0, 372850.0, 210786.0, 72010.0, 26498.0, 11859.0, 6092.0, 3500.0, 2014.0, 1300.0, 824.0, 550.0, 375.0, 253.0, 147.0, 118.0, 73.0, 40.0, 37.0, 31.0, 17.0, 13.0, 9.0, 8.0, 8.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.30078125, -3.188873291015625, -3.07696533203125, -2.965057373046875, -2.8531494140625, -2.741241455078125, -2.62933349609375, -2.517425537109375, -2.405517578125, -2.293609619140625, -2.18170166015625, -2.069793701171875, -1.9578857421875, -1.845977783203125, -1.73406982421875, -1.622161865234375, -1.51025390625, -1.398345947265625, -1.28643798828125, -1.174530029296875, -1.0626220703125, -0.950714111328125, -0.83880615234375, -0.726898193359375, -0.614990234375, -0.503082275390625, -0.39117431640625, -0.279266357421875, -0.1673583984375, -0.055450439453125, 0.05645751953125, 0.168365478515625, 0.2802734375, 0.392181396484375, 0.50408935546875, 0.615997314453125, 0.7279052734375, 0.839813232421875, 0.95172119140625, 1.063629150390625, 1.175537109375, 1.287445068359375, 1.39935302734375, 1.511260986328125, 1.6231689453125, 1.735076904296875, 1.84698486328125, 1.958892822265625, 2.07080078125, 2.182708740234375, 2.29461669921875, 2.406524658203125, 2.5184326171875, 2.630340576171875, 2.74224853515625, 2.854156494140625, 2.966064453125, 3.077972412109375, 3.18988037109375, 3.301788330078125, 3.4136962890625, 3.525604248046875, 3.63751220703125, 3.749420166015625, 3.861328125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 6.0, 5.0, 1.0, 10.0, 10.0, 20.0, 10.0, 21.0, 33.0, 45.0, 59.0, 72.0, 85.0, 96.0, 77.0, 73.0, 72.0, 87.0, 52.0, 52.0, 27.0, 31.0, 12.0, 5.0, 10.0, 6.0, 4.0, 8.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90625, -0.878387451171875, -0.85052490234375, -0.822662353515625, -0.7947998046875, -0.766937255859375, -0.73907470703125, -0.711212158203125, -0.683349609375, -0.655487060546875, -0.62762451171875, -0.599761962890625, -0.5718994140625, -0.544036865234375, -0.51617431640625, -0.488311767578125, -0.46044921875, -0.432586669921875, -0.40472412109375, -0.376861572265625, -0.3489990234375, -0.321136474609375, -0.29327392578125, -0.265411376953125, -0.237548828125, -0.209686279296875, -0.18182373046875, -0.153961181640625, -0.1260986328125, -0.098236083984375, -0.07037353515625, -0.042510986328125, -0.0146484375, 0.013214111328125, 0.04107666015625, 0.068939208984375, 0.0968017578125, 0.124664306640625, 0.15252685546875, 0.180389404296875, 0.208251953125, 0.236114501953125, 0.26397705078125, 0.291839599609375, 0.3197021484375, 0.347564697265625, 0.37542724609375, 0.403289794921875, 0.43115234375, 0.459014892578125, 0.48687744140625, 0.514739990234375, 0.5426025390625, 0.570465087890625, 0.59832763671875, 0.626190185546875, 0.654052734375, 0.681915283203125, 0.70977783203125, 0.737640380859375, 0.7655029296875, 0.793365478515625, 0.82122802734375, 0.849090576171875, 0.876953125]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 3.0, 8.0, 13.0, 12.0, 16.0, 18.0, 20.0, 25.0, 44.0, 30.0, 43.0, 54.0, 73.0, 81.0, 95.0, 77.0, 77.0, 63.0, 45.0, 55.0, 38.0, 26.0, 17.0, 16.0, 14.0, 9.0, 8.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.284247398376465, -8.018978118896484, -7.75370979309082, -7.48844051361084, -7.223171710968018, -6.957902908325195, -6.692633628845215, -6.427364826202393, -6.16209602355957, -5.896827220916748, -5.631558418273926, -5.366289138793945, -5.101020336151123, -4.835751533508301, -4.57048225402832, -4.305213451385498, -4.039944648742676, -3.7746758460998535, -3.509406805038452, -3.244137763977051, -2.9788689613342285, -2.7136001586914062, -2.448331117630005, -2.1830620765686035, -1.9177932739257812, -1.6525243520736694, -1.3872554302215576, -1.1219865083694458, -0.856717586517334, -0.5914486646652222, -0.32617974281311035, -0.060910820960998535, 0.20435714721679688, 0.4696260690689087, 0.7348949909210205, 1.0001639127731323, 1.2654328346252441, 1.530701756477356, 1.7959706783294678, 2.061239719390869, 2.3265085220336914, 2.5917773246765137, 2.857046365737915, 3.1223154067993164, 3.3875842094421387, 3.652853012084961, 3.9181220531463623, 4.183391094207764, 4.448659896850586, 4.713928699493408, 4.9791975021362305, 5.244466781616211, 5.509735584259033, 5.7750043869018555, 6.040273666381836, 6.305542469024658, 6.5708112716674805, 6.836080074310303, 7.101348876953125, 7.3666181564331055, 7.631886959075928, 7.89715576171875, 8.16242504119873, 8.427693367004395, 8.692962646484375]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 7.0, 9.0, 7.0, 10.0, 9.0, 18.0, 29.0, 21.0, 26.0, 23.0, 32.0, 38.0, 45.0, 63.0, 34.0, 44.0, 49.0, 43.0, 49.0, 54.0, 47.0, 42.0, 41.0, 34.0, 38.0, 21.0, 27.0, 29.0, 27.0, 20.0, 15.0, 10.0, 13.0, 11.0, 3.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.414175987243652, -4.2537431716918945, -4.093310832977295, -3.932878017425537, -3.7724454402923584, -3.6120128631591797, -3.451580047607422, -3.291147470474243, -3.1307148933410645, -2.9702823162078857, -2.809849739074707, -2.649416923522949, -2.4889843463897705, -2.328551769256592, -2.168118953704834, -2.0076863765716553, -1.8472537994384766, -1.6868212223052979, -1.5263885259628296, -1.3659558296203613, -1.2055232524871826, -1.045090675354004, -0.8846579790115356, -0.7242252826690674, -0.5637927055358887, -0.4033600687980652, -0.2429274320602417, -0.08249479532241821, 0.07793784141540527, 0.23837047815322876, 0.39880311489105225, 0.5592358112335205, 0.719667911529541, 0.8801005482673645, 1.040533185005188, 1.2009658813476562, 1.361398458480835, 1.5218310356140137, 1.682263731956482, 1.8426964282989502, 2.003129005432129, 2.1635615825653076, 2.3239941596984863, 2.484426975250244, 2.644859552383423, 2.8052921295166016, 2.9657249450683594, 3.126157522201538, 3.286590099334717, 3.4470226764678955, 3.607455253601074, 3.767888069152832, 3.9283206462860107, 4.0887532234191895, 4.249186038970947, 4.409618377685547, 4.570051193237305, 4.7304840087890625, 4.890916347503662, 5.05134916305542, 5.2117815017700195, 5.372214317321777, 5.532647132873535, 5.693079948425293, 5.853512287139893]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 6.0, 8.0, 14.0, 26.0, 26.0, 44.0, 77.0, 87.0, 153.0, 208.0, 272.0, 513.0, 782.0, 1144.0, 1924.0, 3306.0, 5386.0, 9531.0, 16652.0, 29752.0, 53741.0, 93621.0, 148544.0, 192682.0, 182480.0, 128805.0, 77604.0, 43578.0, 24288.0, 13684.0, 7779.0, 4552.0, 2650.0, 1593.0, 1085.0, 664.0, 438.0, 283.0, 181.0, 137.0, 78.0, 57.0, 37.0, 23.0, 19.0, 17.0, 6.0, 7.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.6640625, -5.49151611328125, -5.3189697265625, -5.14642333984375, -4.973876953125, -4.80133056640625, -4.6287841796875, -4.45623779296875, -4.28369140625, -4.11114501953125, -3.9385986328125, -3.76605224609375, -3.593505859375, -3.42095947265625, -3.2484130859375, -3.07586669921875, -2.9033203125, -2.73077392578125, -2.5582275390625, -2.38568115234375, -2.213134765625, -2.04058837890625, -1.8680419921875, -1.69549560546875, -1.52294921875, -1.35040283203125, -1.1778564453125, -1.00531005859375, -0.832763671875, -0.66021728515625, -0.4876708984375, -0.31512451171875, -0.142578125, 0.02996826171875, 0.2025146484375, 0.37506103515625, 0.547607421875, 0.72015380859375, 0.8927001953125, 1.06524658203125, 1.23779296875, 1.41033935546875, 1.5828857421875, 1.75543212890625, 1.927978515625, 2.10052490234375, 2.2730712890625, 2.44561767578125, 2.6181640625, 2.79071044921875, 2.9632568359375, 3.13580322265625, 3.308349609375, 3.48089599609375, 3.6534423828125, 3.82598876953125, 3.99853515625, 4.17108154296875, 4.3436279296875, 4.51617431640625, 4.688720703125, 4.86126708984375, 5.0338134765625, 5.20635986328125, 5.37890625]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 7.0, 10.0, 9.0, 8.0, 17.0, 9.0, 14.0, 15.0, 18.0, 21.0, 23.0, 28.0, 22.0, 25.0, 31.0, 38.0, 42.0, 40.0, 37.0, 42.0, 33.0, 49.0, 42.0, 35.0, 47.0, 34.0, 36.0, 31.0, 37.0, 22.0, 32.0, 27.0, 18.0, 16.0, 15.0, 10.0, 15.0, 8.0, 9.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-4.83203125, -4.68865966796875, -4.5452880859375, -4.40191650390625, -4.258544921875, -4.11517333984375, -3.9718017578125, -3.82843017578125, -3.68505859375, -3.54168701171875, -3.3983154296875, -3.25494384765625, -3.111572265625, -2.96820068359375, -2.8248291015625, -2.68145751953125, -2.5380859375, -2.39471435546875, -2.2513427734375, -2.10797119140625, -1.964599609375, -1.82122802734375, -1.6778564453125, -1.53448486328125, -1.39111328125, -1.24774169921875, -1.1043701171875, -0.96099853515625, -0.817626953125, -0.67425537109375, -0.5308837890625, -0.38751220703125, -0.244140625, -0.10076904296875, 0.0426025390625, 0.18597412109375, 0.329345703125, 0.47271728515625, 0.6160888671875, 0.75946044921875, 0.90283203125, 1.04620361328125, 1.1895751953125, 1.33294677734375, 1.476318359375, 1.61968994140625, 1.7630615234375, 1.90643310546875, 2.0498046875, 2.19317626953125, 2.3365478515625, 2.47991943359375, 2.623291015625, 2.76666259765625, 2.9100341796875, 3.05340576171875, 3.19677734375, 3.34014892578125, 3.4835205078125, 3.62689208984375, 3.770263671875, 3.91363525390625, 4.0570068359375, 4.20037841796875, 4.34375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 15.0, 11.0, 26.0, 37.0, 32.0, 54.0, 89.0, 116.0, 212.0, 325.0, 546.0, 862.0, 1430.0, 2600.0, 4728.0, 8984.0, 17782.0, 35313.0, 70796.0, 134385.0, 211192.0, 225317.0, 158418.0, 85904.0, 43914.0, 21396.0, 11008.0, 5534.0, 3001.0, 1752.0, 1030.0, 615.0, 373.0, 281.0, 178.0, 114.0, 55.0, 43.0, 23.0, 23.0, 11.0, 10.0, 3.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.14453125, -5.9337158203125, -5.722900390625, -5.5120849609375, -5.30126953125, -5.0904541015625, -4.879638671875, -4.6688232421875, -4.4580078125, -4.2471923828125, -4.036376953125, -3.8255615234375, -3.61474609375, -3.4039306640625, -3.193115234375, -2.9822998046875, -2.771484375, -2.5606689453125, -2.349853515625, -2.1390380859375, -1.92822265625, -1.7174072265625, -1.506591796875, -1.2957763671875, -1.0849609375, -0.8741455078125, -0.663330078125, -0.4525146484375, -0.24169921875, -0.0308837890625, 0.179931640625, 0.3907470703125, 0.6015625, 0.8123779296875, 1.023193359375, 1.2340087890625, 1.44482421875, 1.6556396484375, 1.866455078125, 2.0772705078125, 2.2880859375, 2.4989013671875, 2.709716796875, 2.9205322265625, 3.13134765625, 3.3421630859375, 3.552978515625, 3.7637939453125, 3.974609375, 4.1854248046875, 4.396240234375, 4.6070556640625, 4.81787109375, 5.0286865234375, 5.239501953125, 5.4503173828125, 5.6611328125, 5.8719482421875, 6.082763671875, 6.2935791015625, 6.50439453125, 6.7152099609375, 6.926025390625, 7.1368408203125, 7.34765625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 7.0, 11.0, 12.0, 15.0, 16.0, 21.0, 14.0, 19.0, 28.0, 31.0, 24.0, 31.0, 34.0, 40.0, 37.0, 50.0, 34.0, 53.0, 43.0, 42.0, 30.0, 60.0, 34.0, 46.0, 42.0, 35.0, 34.0, 18.0, 26.0, 24.0, 22.0, 10.0, 15.0, 7.0, 11.0, 6.0, 5.0, 2.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.755859375, -2.659088134765625, -2.56231689453125, -2.465545654296875, -2.3687744140625, -2.272003173828125, -2.17523193359375, -2.078460693359375, -1.981689453125, -1.884918212890625, -1.78814697265625, -1.691375732421875, -1.5946044921875, -1.497833251953125, -1.40106201171875, -1.304290771484375, -1.20751953125, -1.110748291015625, -1.01397705078125, -0.917205810546875, -0.8204345703125, -0.723663330078125, -0.62689208984375, -0.530120849609375, -0.433349609375, -0.336578369140625, -0.23980712890625, -0.143035888671875, -0.0462646484375, 0.050506591796875, 0.14727783203125, 0.244049072265625, 0.3408203125, 0.437591552734375, 0.53436279296875, 0.631134033203125, 0.7279052734375, 0.824676513671875, 0.92144775390625, 1.018218994140625, 1.114990234375, 1.211761474609375, 1.30853271484375, 1.405303955078125, 1.5020751953125, 1.598846435546875, 1.69561767578125, 1.792388916015625, 1.88916015625, 1.985931396484375, 2.08270263671875, 2.179473876953125, 2.2762451171875, 2.373016357421875, 2.46978759765625, 2.566558837890625, 2.663330078125, 2.760101318359375, 2.85687255859375, 2.953643798828125, 3.0504150390625, 3.147186279296875, 3.24395751953125, 3.340728759765625, 3.4375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 1.0, 5.0, 6.0, 10.0, 24.0, 25.0, 34.0, 52.0, 89.0, 107.0, 157.0, 239.0, 402.0, 572.0, 843.0, 1314.0, 2019.0, 3111.0, 4797.0, 7717.0, 12498.0, 20550.0, 34477.0, 56616.0, 90757.0, 135053.0, 170768.0, 165373.0, 125921.0, 82728.0, 51313.0, 31127.0, 18627.0, 11410.0, 7208.0, 4418.0, 2849.0, 1798.0, 1168.0, 780.0, 523.0, 332.0, 250.0, 152.0, 102.0, 82.0, 54.0, 45.0, 23.0, 15.0, 9.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.033203125, -1.971405029296875, -1.90960693359375, -1.847808837890625, -1.7860107421875, -1.724212646484375, -1.66241455078125, -1.600616455078125, -1.538818359375, -1.477020263671875, -1.41522216796875, -1.353424072265625, -1.2916259765625, -1.229827880859375, -1.16802978515625, -1.106231689453125, -1.04443359375, -0.982635498046875, -0.92083740234375, -0.859039306640625, -0.7972412109375, -0.735443115234375, -0.67364501953125, -0.611846923828125, -0.550048828125, -0.488250732421875, -0.42645263671875, -0.364654541015625, -0.3028564453125, -0.241058349609375, -0.17926025390625, -0.117462158203125, -0.0556640625, 0.006134033203125, 0.06793212890625, 0.129730224609375, 0.1915283203125, 0.253326416015625, 0.31512451171875, 0.376922607421875, 0.438720703125, 0.500518798828125, 0.56231689453125, 0.624114990234375, 0.6859130859375, 0.747711181640625, 0.80950927734375, 0.871307373046875, 0.93310546875, 0.994903564453125, 1.05670166015625, 1.118499755859375, 1.1802978515625, 1.242095947265625, 1.30389404296875, 1.365692138671875, 1.427490234375, 1.489288330078125, 1.55108642578125, 1.612884521484375, 1.6746826171875, 1.736480712890625, 1.79827880859375, 1.860076904296875, 1.921875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 2.0, 4.0, 2.0, 7.0, 10.0, 7.0, 11.0, 14.0, 18.0, 21.0, 34.0, 50.0, 61.0, 73.0, 71.0, 85.0, 87.0, 76.0, 72.0, 55.0, 49.0, 49.0, 30.0, 27.0, 14.0, 15.0, 12.0, 14.0, 10.0, 9.0, 5.0, 8.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003025531768798828, -0.0002929605543613434, -0.00028336793184280396, -0.0002737753093242645, -0.0002641826868057251, -0.00025459006428718567, -0.00024499744176864624, -0.0002354048192501068, -0.00022581219673156738, -0.00021621957421302795, -0.00020662695169448853, -0.0001970343291759491, -0.00018744170665740967, -0.00017784908413887024, -0.0001682564616203308, -0.00015866383910179138, -0.00014907121658325195, -0.00013947859406471252, -0.0001298859715461731, -0.00012029334902763367, -0.00011070072650909424, -0.00010110810399055481, -9.151548147201538e-05, -8.192285895347595e-05, -7.233023643493652e-05, -6.27376139163971e-05, -5.3144991397857666e-05, -4.355236887931824e-05, -3.395974636077881e-05, -2.436712384223938e-05, -1.4774501323699951e-05, -5.1818788051605225e-06, 4.410743713378906e-06, 1.4003366231918335e-05, 2.3595988750457764e-05, 3.318861126899719e-05, 4.278123378753662e-05, 5.237385630607605e-05, 6.196647882461548e-05, 7.155910134315491e-05, 8.115172386169434e-05, 9.074434638023376e-05, 0.0001003369688987732, 0.00010992959141731262, 0.00011952221393585205, 0.00012911483645439148, 0.0001387074589729309, 0.00014830008149147034, 0.00015789270401000977, 0.0001674853265285492, 0.00017707794904708862, 0.00018667057156562805, 0.00019626319408416748, 0.0002058558166027069, 0.00021544843912124634, 0.00022504106163978577, 0.0002346336841583252, 0.0002442263066768646, 0.00025381892919540405, 0.0002634115517139435, 0.0002730041742324829, 0.00028259679675102234, 0.00029218941926956177, 0.0003017820417881012, 0.0003113746643066406]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 9.0, 10.0, 21.0, 41.0, 39.0, 103.0, 135.0, 237.0, 427.0, 650.0, 1106.0, 2013.0, 3602.0, 6371.0, 11890.0, 22469.0, 42185.0, 79367.0, 139372.0, 202237.0, 205286.0, 147988.0, 84946.0, 45777.0, 23875.0, 12779.0, 6803.0, 3843.0, 2041.0, 1176.0, 691.0, 410.0, 236.0, 147.0, 95.0, 57.0, 39.0, 30.0, 21.0, 11.0, 5.0, 4.0, 2.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.587890625, -2.514068603515625, -2.44024658203125, -2.366424560546875, -2.2926025390625, -2.218780517578125, -2.14495849609375, -2.071136474609375, -1.997314453125, -1.923492431640625, -1.84967041015625, -1.775848388671875, -1.7020263671875, -1.628204345703125, -1.55438232421875, -1.480560302734375, -1.40673828125, -1.332916259765625, -1.25909423828125, -1.185272216796875, -1.1114501953125, -1.037628173828125, -0.96380615234375, -0.889984130859375, -0.816162109375, -0.742340087890625, -0.66851806640625, -0.594696044921875, -0.5208740234375, -0.447052001953125, -0.37322998046875, -0.299407958984375, -0.2255859375, -0.151763916015625, -0.07794189453125, -0.004119873046875, 0.0697021484375, 0.143524169921875, 0.21734619140625, 0.291168212890625, 0.364990234375, 0.438812255859375, 0.51263427734375, 0.586456298828125, 0.6602783203125, 0.734100341796875, 0.80792236328125, 0.881744384765625, 0.95556640625, 1.029388427734375, 1.10321044921875, 1.177032470703125, 1.2508544921875, 1.324676513671875, 1.39849853515625, 1.472320556640625, 1.546142578125, 1.619964599609375, 1.69378662109375, 1.767608642578125, 1.8414306640625, 1.915252685546875, 1.98907470703125, 2.062896728515625, 2.13671875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 2.0, 2.0, 2.0, 5.0, 2.0, 4.0, 6.0, 10.0, 4.0, 11.0, 18.0, 25.0, 22.0, 12.0, 27.0, 35.0, 32.0, 33.0, 27.0, 36.0, 31.0, 41.0, 49.0, 42.0, 50.0, 51.0, 25.0, 48.0, 38.0, 37.0, 38.0, 29.0, 23.0, 25.0, 27.0, 16.0, 18.0, 16.0, 13.0, 16.0, 19.0, 6.0, 8.0, 4.0, 3.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.412353515625, -0.3975410461425781, -0.38272857666015625, -0.3679161071777344, -0.3531036376953125, -0.3382911682128906, -0.32347869873046875, -0.3086662292480469, -0.293853759765625, -0.2790412902832031, -0.26422882080078125, -0.24941635131835938, -0.2346038818359375, -0.21979141235351562, -0.20497894287109375, -0.19016647338867188, -0.17535400390625, -0.16054153442382812, -0.14572906494140625, -0.13091659545898438, -0.1161041259765625, -0.10129165649414062, -0.08647918701171875, -0.07166671752929688, -0.056854248046875, -0.042041778564453125, -0.02722930908203125, -0.012416839599609375, 0.0023956298828125, 0.017208099365234375, 0.03202056884765625, 0.046833038330078125, 0.0616455078125, 0.07645797729492188, 0.09127044677734375, 0.10608291625976562, 0.1208953857421875, 0.13570785522460938, 0.15052032470703125, 0.16533279418945312, 0.180145263671875, 0.19495773315429688, 0.20977020263671875, 0.22458267211914062, 0.2393951416015625, 0.2542076110839844, 0.26902008056640625, 0.2838325500488281, 0.29864501953125, 0.3134574890136719, 0.32826995849609375, 0.3430824279785156, 0.3578948974609375, 0.3727073669433594, 0.38751983642578125, 0.4023323059082031, 0.417144775390625, 0.4319572448730469, 0.44676971435546875, 0.4615821838378906, 0.4763946533203125, 0.4912071228027344, 0.5060195922851562, 0.5208320617675781, 0.53564453125]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 0.0, 4.0, 6.0, 4.0, 5.0, 14.0, 12.0, 19.0, 16.0, 33.0, 17.0, 25.0, 49.0, 53.0, 59.0, 68.0, 78.0, 95.0, 74.0, 75.0, 72.0, 55.0, 48.0, 37.0, 23.0, 17.0, 12.0, 11.0, 6.0, 0.0, 9.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.282942771911621, -7.014131546020508, -6.745320796966553, -6.4765095710754395, -6.207698345184326, -5.938887596130371, -5.670076370239258, -5.4012651443481445, -5.132453918457031, -4.863642692565918, -4.594831943511963, -4.32602071762085, -4.057209491729736, -3.788398504257202, -3.519587516784668, -3.2507762908935547, -2.9819655418395996, -2.7131545543670654, -2.444343328475952, -2.175532341003418, -1.9067212343215942, -1.6379101276397705, -1.3690991401672363, -1.1002880334854126, -0.8314769268035889, -0.5626658201217651, -0.2938547730445862, -0.025043725967407227, 0.2437673807144165, 0.5125784873962402, 0.7813894748687744, 1.0502005815505981, 1.3190116882324219, 1.5878227949142456, 1.8566339015960693, 2.1254448890686035, 2.394256114959717, 2.663067102432251, 2.931878089904785, 3.2006893157958984, 3.4695003032684326, 3.738311290740967, 4.00712251663208, 4.275933265686035, 4.544744491577148, 4.813555717468262, 5.082366943359375, 5.35117769241333, 5.619988918304443, 5.888800144195557, 6.157610893249512, 6.426422119140625, 6.695233345031738, 6.964044570922852, 7.232855319976807, 7.50166654586792, 7.770477294921875, 8.039288520812988, 8.308099746704102, 8.576910018920898, 8.845721244812012, 9.114532470703125, 9.383343696594238, 9.652154922485352, 9.920966148376465]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 5.0, 8.0, 8.0, 14.0, 20.0, 12.0, 17.0, 24.0, 25.0, 28.0, 26.0, 52.0, 40.0, 39.0, 55.0, 31.0, 57.0, 49.0, 53.0, 46.0, 46.0, 47.0, 39.0, 37.0, 25.0, 26.0, 25.0, 26.0, 20.0, 25.0, 17.0, 11.0, 13.0, 8.0, 5.0, 6.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.709172248840332, -4.549365997314453, -4.389560222625732, -4.2297539710998535, -4.069948196411133, -3.910141944885254, -3.750335931777954, -3.5905299186706543, -3.4307236671447754, -3.2709176540374756, -3.111111640930176, -2.951305389404297, -2.791499376296997, -2.6316933631896973, -2.4718873500823975, -2.3120813369750977, -2.152275323867798, -1.992469310760498, -1.8326631784439087, -1.6728571653366089, -1.5130510330200195, -1.3532450199127197, -1.19343900680542, -1.0336328744888306, -0.8738268613815308, -0.7140207886695862, -0.5542147159576416, -0.3944087028503418, -0.23460263013839722, -0.07479655742645264, 0.08500945568084717, 0.24481558799743652, 0.40462160110473633, 0.5644276738166809, 0.7242337465286255, 0.8840397596359253, 1.0438458919525146, 1.2036519050598145, 1.3634579181671143, 1.5232640504837036, 1.6830700635910034, 1.8428760766983032, 2.0026822090148926, 2.1624882221221924, 2.322294235229492, 2.482100486755371, 2.641906261444092, 2.8017125129699707, 2.9615185260772705, 3.1213245391845703, 3.28113055229187, 3.44093656539917, 3.600742816925049, 3.7605488300323486, 3.9203548431396484, 4.080161094665527, 4.239966869354248, 4.399773120880127, 4.559578895568848, 4.719385147094727, 4.879190921783447, 5.038997173309326, 5.198802947998047, 5.358609199523926, 5.518415451049805]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 6.0, 6.0, 7.0, 28.0, 27.0, 34.0, 58.0, 78.0, 113.0, 217.0, 278.0, 487.0, 808.0, 1325.0, 2236.0, 4183.0, 7942.0, 15336.0, 32063.0, 74477.0, 195248.0, 584754.0, 1401308.0, 1190817.0, 428741.0, 143166.0, 56825.0, 25567.0, 12574.0, 6591.0, 3632.0, 2078.0, 1215.0, 738.0, 467.0, 299.0, 197.0, 110.0, 84.0, 40.0, 42.0, 23.0, 17.0, 13.0, 8.0, 6.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.5078125, -8.2489013671875, -7.989990234375, -7.7310791015625, -7.47216796875, -7.2132568359375, -6.954345703125, -6.6954345703125, -6.4365234375, -6.1776123046875, -5.918701171875, -5.6597900390625, -5.40087890625, -5.1419677734375, -4.883056640625, -4.6241455078125, -4.365234375, -4.1063232421875, -3.847412109375, -3.5885009765625, -3.32958984375, -3.0706787109375, -2.811767578125, -2.5528564453125, -2.2939453125, -2.0350341796875, -1.776123046875, -1.5172119140625, -1.25830078125, -0.9993896484375, -0.740478515625, -0.4815673828125, -0.22265625, 0.0362548828125, 0.295166015625, 0.5540771484375, 0.81298828125, 1.0718994140625, 1.330810546875, 1.5897216796875, 1.8486328125, 2.1075439453125, 2.366455078125, 2.6253662109375, 2.88427734375, 3.1431884765625, 3.402099609375, 3.6610107421875, 3.919921875, 4.1788330078125, 4.437744140625, 4.6966552734375, 4.95556640625, 5.2144775390625, 5.473388671875, 5.7322998046875, 5.9912109375, 6.2501220703125, 6.509033203125, 6.7679443359375, 7.02685546875, 7.2857666015625, 7.544677734375, 7.8035888671875, 8.0625]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 3.0, 5.0, 6.0, 9.0, 7.0, 8.0, 11.0, 18.0, 14.0, 18.0, 32.0, 31.0, 32.0, 47.0, 46.0, 34.0, 44.0, 53.0, 48.0, 45.0, 51.0, 47.0, 51.0, 47.0, 46.0, 44.0, 24.0, 29.0, 31.0, 15.0, 27.0, 24.0, 16.0, 9.0, 7.0, 7.0, 8.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5, -3.3780517578125, -3.256103515625, -3.1341552734375, -3.01220703125, -2.8902587890625, -2.768310546875, -2.6463623046875, -2.5244140625, -2.4024658203125, -2.280517578125, -2.1585693359375, -2.03662109375, -1.9146728515625, -1.792724609375, -1.6707763671875, -1.548828125, -1.4268798828125, -1.304931640625, -1.1829833984375, -1.06103515625, -0.9390869140625, -0.817138671875, -0.6951904296875, -0.5732421875, -0.4512939453125, -0.329345703125, -0.2073974609375, -0.08544921875, 0.0364990234375, 0.158447265625, 0.2803955078125, 0.40234375, 0.5242919921875, 0.646240234375, 0.7681884765625, 0.89013671875, 1.0120849609375, 1.134033203125, 1.2559814453125, 1.3779296875, 1.4998779296875, 1.621826171875, 1.7437744140625, 1.86572265625, 1.9876708984375, 2.109619140625, 2.2315673828125, 2.353515625, 2.4754638671875, 2.597412109375, 2.7193603515625, 2.84130859375, 2.9632568359375, 3.085205078125, 3.2071533203125, 3.3291015625, 3.4510498046875, 3.572998046875, 3.6949462890625, 3.81689453125, 3.9388427734375, 4.060791015625, 4.1827392578125, 4.3046875]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 7.0, 8.0, 6.0, 10.0, 22.0, 26.0, 34.0, 63.0, 105.0, 148.0, 223.0, 357.0, 513.0, 839.0, 1327.0, 2195.0, 3781.0, 6404.0, 11704.0, 21178.0, 41416.0, 84851.0, 186143.0, 424970.0, 928754.0, 1211830.0, 694739.0, 304408.0, 134819.0, 63148.0, 31530.0, 16458.0, 9050.0, 5124.0, 3085.0, 1820.0, 1162.0, 711.0, 422.0, 297.0, 180.0, 117.0, 92.0, 70.0, 55.0, 30.0, 11.0, 22.0, 10.0, 7.0, 1.0, 2.0, 1.0, 2.0], "bins": [-8.0859375, -7.85687255859375, -7.6278076171875, -7.39874267578125, -7.169677734375, -6.94061279296875, -6.7115478515625, -6.48248291015625, -6.25341796875, -6.02435302734375, -5.7952880859375, -5.56622314453125, -5.337158203125, -5.10809326171875, -4.8790283203125, -4.64996337890625, -4.4208984375, -4.19183349609375, -3.9627685546875, -3.73370361328125, -3.504638671875, -3.27557373046875, -3.0465087890625, -2.81744384765625, -2.58837890625, -2.35931396484375, -2.1302490234375, -1.90118408203125, -1.672119140625, -1.44305419921875, -1.2139892578125, -0.98492431640625, -0.755859375, -0.52679443359375, -0.2977294921875, -0.06866455078125, 0.160400390625, 0.38946533203125, 0.6185302734375, 0.84759521484375, 1.07666015625, 1.30572509765625, 1.5347900390625, 1.76385498046875, 1.992919921875, 2.22198486328125, 2.4510498046875, 2.68011474609375, 2.9091796875, 3.13824462890625, 3.3673095703125, 3.59637451171875, 3.825439453125, 4.05450439453125, 4.2835693359375, 4.51263427734375, 4.74169921875, 4.97076416015625, 5.1998291015625, 5.42889404296875, 5.657958984375, 5.88702392578125, 6.1160888671875, 6.34515380859375, 6.57421875]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 9.0, 6.0, 10.0, 12.0, 13.0, 14.0, 25.0, 26.0, 37.0, 45.0, 54.0, 65.0, 88.0, 127.0, 139.0, 194.0, 228.0, 245.0, 277.0, 299.0, 338.0, 274.0, 264.0, 294.0, 203.0, 162.0, 144.0, 115.0, 73.0, 54.0, 59.0, 41.0, 29.0, 26.0, 28.0, 14.0, 7.0, 11.0, 6.0, 2.0, 4.0, 2.0, 2.0, 4.0, 1.0, 4.0], "bins": [-2.478515625, -2.413665771484375, -2.34881591796875, -2.283966064453125, -2.2191162109375, -2.154266357421875, -2.08941650390625, -2.024566650390625, -1.959716796875, -1.894866943359375, -1.83001708984375, -1.765167236328125, -1.7003173828125, -1.635467529296875, -1.57061767578125, -1.505767822265625, -1.44091796875, -1.376068115234375, -1.31121826171875, -1.246368408203125, -1.1815185546875, -1.116668701171875, -1.05181884765625, -0.986968994140625, -0.922119140625, -0.857269287109375, -0.79241943359375, -0.727569580078125, -0.6627197265625, -0.597869873046875, -0.53302001953125, -0.468170166015625, -0.4033203125, -0.338470458984375, -0.27362060546875, -0.208770751953125, -0.1439208984375, -0.079071044921875, -0.01422119140625, 0.050628662109375, 0.115478515625, 0.180328369140625, 0.24517822265625, 0.310028076171875, 0.3748779296875, 0.439727783203125, 0.50457763671875, 0.569427490234375, 0.63427734375, 0.699127197265625, 0.76397705078125, 0.828826904296875, 0.8936767578125, 0.958526611328125, 1.02337646484375, 1.088226318359375, 1.153076171875, 1.217926025390625, 1.28277587890625, 1.347625732421875, 1.4124755859375, 1.477325439453125, 1.54217529296875, 1.607025146484375, 1.671875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 0.0, 4.0, 6.0, 8.0, 8.0, 18.0, 14.0, 12.0, 21.0, 21.0, 17.0, 31.0, 41.0, 46.0, 57.0, 69.0, 65.0, 64.0, 80.0, 61.0, 52.0, 59.0, 53.0, 32.0, 39.0, 28.0, 22.0, 13.0, 16.0, 10.0, 13.0, 5.0, 3.0, 1.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.507089614868164, -7.277308464050293, -7.047527313232422, -6.817746162414551, -6.58796501159668, -6.358183860778809, -6.1284027099609375, -5.898621082305908, -5.668839931488037, -5.439058780670166, -5.209277629852295, -4.979496479034424, -4.749715328216553, -4.519933700561523, -4.290152549743652, -4.060371398925781, -3.8305904865264893, -3.600809335708618, -3.371028184890747, -3.141246795654297, -2.911465644836426, -2.6816844940185547, -2.4519033432006836, -2.2221221923828125, -1.9923409223556519, -1.7625597715377808, -1.5327785015106201, -1.302997350692749, -1.073216199874878, -0.8434349298477173, -0.6136537790298462, -0.38387250900268555, -0.15409135818481445, 0.07568983733654022, 0.3054710328578949, 0.5352522134780884, 0.7650334239006042, 0.9948146343231201, 1.2245957851409912, 1.4543770551681519, 1.684158205986023, 1.913939356803894, 2.1437206268310547, 2.373501777648926, 2.603282928466797, 2.833064079284668, 3.062845230102539, 3.2926266193389893, 3.5224077701568604, 3.7521889209747314, 3.9819700717926025, 4.211751461029053, 4.441532611846924, 4.671313762664795, 4.901094913482666, 5.130876064300537, 5.360657215118408, 5.590438365936279, 5.82021951675415, 6.0500006675720215, 6.279781818389893, 6.509563446044922, 6.739344596862793, 6.969125747680664, 7.198906898498535]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 3.0, 7.0, 3.0, 10.0, 14.0, 16.0, 14.0, 18.0, 21.0, 31.0, 35.0, 21.0, 32.0, 44.0, 37.0, 53.0, 46.0, 59.0, 58.0, 54.0, 46.0, 44.0, 47.0, 42.0, 41.0, 29.0, 26.0, 34.0, 26.0, 19.0, 22.0, 17.0, 11.0, 9.0, 4.0, 5.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.126667022705078, -4.96545934677124, -4.804251194000244, -4.643043518066406, -4.48183536529541, -4.320627689361572, -4.159419536590576, -3.9982118606567383, -3.837003707885742, -3.675795793533325, -3.514587879180908, -3.353379964828491, -3.192172050476074, -3.0309641361236572, -2.8697562217712402, -2.7085485458374023, -2.5473406314849854, -2.3861327171325684, -2.2249248027801514, -2.0637168884277344, -1.9025089740753174, -1.7413010597229004, -1.580093264579773, -1.418885350227356, -1.257677435874939, -1.096469521522522, -0.935261607170105, -0.7740537524223328, -0.6128458380699158, -0.4516379237174988, -0.29043006896972656, -0.12922215461730957, 0.03198575973510742, 0.19319365918636322, 0.354401558637619, 0.5156094431877136, 0.6768173575401306, 0.8380252718925476, 0.9992331266403198, 1.1604410409927368, 1.3216489553451538, 1.4828568696975708, 1.6440647840499878, 1.8052725791931152, 1.9664804935455322, 2.127688407897949, 2.288896322250366, 2.450104236602783, 2.6113121509552, 2.772520065307617, 2.933727979660034, 3.094935894012451, 3.256143808364868, 3.417351722717285, 3.578559398651123, 3.739767551422119, 3.900975227355957, 4.062182903289795, 4.223391056060791, 4.384598731994629, 4.545806884765625, 4.707014560699463, 4.868222713470459, 5.029430389404297, 5.190638542175293]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 10.0, 13.0, 12.0, 25.0, 27.0, 32.0, 52.0, 77.0, 136.0, 186.0, 254.0, 395.0, 614.0, 898.0, 1363.0, 2144.0, 3294.0, 5103.0, 7855.0, 12713.0, 19966.0, 31888.0, 50468.0, 78631.0, 116158.0, 149502.0, 158849.0, 135279.0, 97655.0, 64180.0, 40806.0, 25512.0, 16109.0, 10134.0, 6402.0, 4094.0, 2660.0, 1686.0, 1079.0, 754.0, 513.0, 341.0, 211.0, 127.0, 116.0, 75.0, 50.0, 37.0, 21.0, 18.0, 15.0, 4.0, 6.0, 4.0, 0.0, 2.0, 4.0], "bins": [-2.775390625, -2.69195556640625, -2.6085205078125, -2.52508544921875, -2.441650390625, -2.35821533203125, -2.2747802734375, -2.19134521484375, -2.10791015625, -2.02447509765625, -1.9410400390625, -1.85760498046875, -1.774169921875, -1.69073486328125, -1.6072998046875, -1.52386474609375, -1.4404296875, -1.35699462890625, -1.2735595703125, -1.19012451171875, -1.106689453125, -1.02325439453125, -0.9398193359375, -0.85638427734375, -0.77294921875, -0.68951416015625, -0.6060791015625, -0.52264404296875, -0.439208984375, -0.35577392578125, -0.2723388671875, -0.18890380859375, -0.10546875, -0.02203369140625, 0.0614013671875, 0.14483642578125, 0.228271484375, 0.31170654296875, 0.3951416015625, 0.47857666015625, 0.56201171875, 0.64544677734375, 0.7288818359375, 0.81231689453125, 0.895751953125, 0.97918701171875, 1.0626220703125, 1.14605712890625, 1.2294921875, 1.31292724609375, 1.3963623046875, 1.47979736328125, 1.563232421875, 1.64666748046875, 1.7301025390625, 1.81353759765625, 1.89697265625, 1.98040771484375, 2.0638427734375, 2.14727783203125, 2.230712890625, 2.31414794921875, 2.3975830078125, 2.48101806640625, 2.564453125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 3.0, 3.0, 4.0, 6.0, 6.0, 10.0, 16.0, 11.0, 15.0, 23.0, 25.0, 35.0, 29.0, 36.0, 32.0, 43.0, 47.0, 50.0, 44.0, 56.0, 58.0, 60.0, 42.0, 53.0, 51.0, 34.0, 31.0, 40.0, 20.0, 28.0, 22.0, 17.0, 10.0, 15.0, 10.0, 7.0, 7.0, 2.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.671875, -5.495361328125, -5.31884765625, -5.142333984375, -4.9658203125, -4.789306640625, -4.61279296875, -4.436279296875, -4.259765625, -4.083251953125, -3.90673828125, -3.730224609375, -3.5537109375, -3.377197265625, -3.20068359375, -3.024169921875, -2.84765625, -2.671142578125, -2.49462890625, -2.318115234375, -2.1416015625, -1.965087890625, -1.78857421875, -1.612060546875, -1.435546875, -1.259033203125, -1.08251953125, -0.906005859375, -0.7294921875, -0.552978515625, -0.37646484375, -0.199951171875, -0.0234375, 0.153076171875, 0.32958984375, 0.506103515625, 0.6826171875, 0.859130859375, 1.03564453125, 1.212158203125, 1.388671875, 1.565185546875, 1.74169921875, 1.918212890625, 2.0947265625, 2.271240234375, 2.44775390625, 2.624267578125, 2.80078125, 2.977294921875, 3.15380859375, 3.330322265625, 3.5068359375, 3.683349609375, 3.85986328125, 4.036376953125, 4.212890625, 4.389404296875, 4.56591796875, 4.742431640625, 4.9189453125, 5.095458984375, 5.27197265625, 5.448486328125, 5.625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 15.0, 22.0, 20.0, 39.0, 43.0, 62.0, 67.0, 110.0, 163.0, 242.0, 381.0, 583.0, 905.0, 1481.0, 2225.0, 3795.0, 6512.0, 11163.0, 19950.0, 36031.0, 64842.0, 115528.0, 190734.0, 223372.0, 159773.0, 92420.0, 51042.0, 28218.0, 16088.0, 9086.0, 5239.0, 3169.0, 1901.0, 1138.0, 727.0, 507.0, 330.0, 188.0, 111.0, 97.0, 74.0, 40.0, 42.0, 20.0, 16.0, 14.0, 5.0, 6.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0], "bins": [-3.99609375, -3.8760986328125, -3.756103515625, -3.6361083984375, -3.51611328125, -3.3961181640625, -3.276123046875, -3.1561279296875, -3.0361328125, -2.9161376953125, -2.796142578125, -2.6761474609375, -2.55615234375, -2.4361572265625, -2.316162109375, -2.1961669921875, -2.076171875, -1.9561767578125, -1.836181640625, -1.7161865234375, -1.59619140625, -1.4761962890625, -1.356201171875, -1.2362060546875, -1.1162109375, -0.9962158203125, -0.876220703125, -0.7562255859375, -0.63623046875, -0.5162353515625, -0.396240234375, -0.2762451171875, -0.15625, -0.0362548828125, 0.083740234375, 0.2037353515625, 0.32373046875, 0.4437255859375, 0.563720703125, 0.6837158203125, 0.8037109375, 0.9237060546875, 1.043701171875, 1.1636962890625, 1.28369140625, 1.4036865234375, 1.523681640625, 1.6436767578125, 1.763671875, 1.8836669921875, 2.003662109375, 2.1236572265625, 2.24365234375, 2.3636474609375, 2.483642578125, 2.6036376953125, 2.7236328125, 2.8436279296875, 2.963623046875, 3.0836181640625, 3.20361328125, 3.3236083984375, 3.443603515625, 3.5635986328125, 3.68359375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 4.0, 4.0, 11.0, 10.0, 22.0, 16.0, 11.0, 14.0, 21.0, 24.0, 20.0, 37.0, 29.0, 28.0, 40.0, 43.0, 38.0, 39.0, 29.0, 51.0, 47.0, 49.0, 33.0, 43.0, 31.0, 29.0, 29.0, 26.0, 32.0, 26.0, 29.0, 28.0, 21.0, 14.0, 14.0, 9.0, 10.0, 11.0, 5.0, 6.0, 3.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.736328125, -2.6539306640625, -2.571533203125, -2.4891357421875, -2.40673828125, -2.3243408203125, -2.241943359375, -2.1595458984375, -2.0771484375, -1.9947509765625, -1.912353515625, -1.8299560546875, -1.74755859375, -1.6651611328125, -1.582763671875, -1.5003662109375, -1.41796875, -1.3355712890625, -1.253173828125, -1.1707763671875, -1.08837890625, -1.0059814453125, -0.923583984375, -0.8411865234375, -0.7587890625, -0.6763916015625, -0.593994140625, -0.5115966796875, -0.42919921875, -0.3468017578125, -0.264404296875, -0.1820068359375, -0.099609375, -0.0172119140625, 0.065185546875, 0.1475830078125, 0.22998046875, 0.3123779296875, 0.394775390625, 0.4771728515625, 0.5595703125, 0.6419677734375, 0.724365234375, 0.8067626953125, 0.88916015625, 0.9715576171875, 1.053955078125, 1.1363525390625, 1.21875, 1.3011474609375, 1.383544921875, 1.4659423828125, 1.54833984375, 1.6307373046875, 1.713134765625, 1.7955322265625, 1.8779296875, 1.9603271484375, 2.042724609375, 2.1251220703125, 2.20751953125, 2.2899169921875, 2.372314453125, 2.4547119140625, 2.537109375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 6.0, 5.0, 9.0, 13.0, 16.0, 16.0, 36.0, 55.0, 78.0, 132.0, 197.0, 351.0, 561.0, 1025.0, 1766.0, 3226.0, 5481.0, 10718.0, 19835.0, 38534.0, 75970.0, 146521.0, 244633.0, 228375.0, 130393.0, 67404.0, 34073.0, 17938.0, 9293.0, 5061.0, 2849.0, 1605.0, 953.0, 544.0, 319.0, 218.0, 140.0, 70.0, 51.0, 25.0, 20.0, 14.0, 12.0, 7.0, 4.0, 0.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.060546875, -1.9959716796875, -1.931396484375, -1.8668212890625, -1.80224609375, -1.7376708984375, -1.673095703125, -1.6085205078125, -1.5439453125, -1.4793701171875, -1.414794921875, -1.3502197265625, -1.28564453125, -1.2210693359375, -1.156494140625, -1.0919189453125, -1.02734375, -0.9627685546875, -0.898193359375, -0.8336181640625, -0.76904296875, -0.7044677734375, -0.639892578125, -0.5753173828125, -0.5107421875, -0.4461669921875, -0.381591796875, -0.3170166015625, -0.25244140625, -0.1878662109375, -0.123291015625, -0.0587158203125, 0.005859375, 0.0704345703125, 0.135009765625, 0.1995849609375, 0.26416015625, 0.3287353515625, 0.393310546875, 0.4578857421875, 0.5224609375, 0.5870361328125, 0.651611328125, 0.7161865234375, 0.78076171875, 0.8453369140625, 0.909912109375, 0.9744873046875, 1.0390625, 1.1036376953125, 1.168212890625, 1.2327880859375, 1.29736328125, 1.3619384765625, 1.426513671875, 1.4910888671875, 1.5556640625, 1.6202392578125, 1.684814453125, 1.7493896484375, 1.81396484375, 1.8785400390625, 1.943115234375, 2.0076904296875, 2.072265625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 4.0, 3.0, 5.0, 3.0, 4.0, 6.0, 7.0, 6.0, 10.0, 14.0, 14.0, 26.0, 20.0, 38.0, 23.0, 29.0, 46.0, 43.0, 49.0, 64.0, 63.0, 74.0, 58.0, 57.0, 46.0, 33.0, 49.0, 43.0, 32.0, 19.0, 21.0, 20.0, 12.0, 16.0, 7.0, 9.0, 4.0, 7.0, 5.0, 7.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.988380432128906e-05, -8.70702788233757e-05, -8.425675332546234e-05, -8.144322782754898e-05, -7.862970232963562e-05, -7.581617683172226e-05, -7.30026513338089e-05, -7.018912583589554e-05, -6.737560033798218e-05, -6.456207484006882e-05, -6.174854934215546e-05, -5.8935023844242096e-05, -5.6121498346328735e-05, -5.3307972848415375e-05, -5.0494447350502014e-05, -4.7680921852588654e-05, -4.486739635467529e-05, -4.205387085676193e-05, -3.924034535884857e-05, -3.642681986093521e-05, -3.361329436302185e-05, -3.079976886510849e-05, -2.798624336719513e-05, -2.517271786928177e-05, -2.2359192371368408e-05, -1.9545666873455048e-05, -1.6732141375541687e-05, -1.3918615877628326e-05, -1.1105090379714966e-05, -8.291564881801605e-06, -5.478039383888245e-06, -2.664513885974884e-06, 1.4901161193847656e-07, 2.962537109851837e-06, 5.776062607765198e-06, 8.589588105678558e-06, 1.1403113603591919e-05, 1.421663910150528e-05, 1.703016459941864e-05, 1.9843690097332e-05, 2.265721559524536e-05, 2.5470741093158722e-05, 2.8284266591072083e-05, 3.109779208898544e-05, 3.3911317586898804e-05, 3.6724843084812164e-05, 3.9538368582725525e-05, 4.2351894080638885e-05, 4.5165419578552246e-05, 4.797894507646561e-05, 5.079247057437897e-05, 5.360599607229233e-05, 5.641952157020569e-05, 5.923304706811905e-05, 6.204657256603241e-05, 6.486009806394577e-05, 6.767362356185913e-05, 7.048714905977249e-05, 7.330067455768585e-05, 7.611420005559921e-05, 7.892772555351257e-05, 8.174125105142593e-05, 8.45547765493393e-05, 8.736830204725266e-05, 9.018182754516602e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 5.0, 7.0, 6.0, 6.0, 7.0, 14.0, 15.0, 34.0, 36.0, 53.0, 69.0, 104.0, 144.0, 236.0, 333.0, 480.0, 826.0, 1165.0, 1858.0, 2983.0, 4781.0, 7621.0, 12202.0, 19621.0, 30967.0, 49042.0, 74254.0, 107321.0, 138018.0, 151043.0, 137209.0, 105671.0, 72962.0, 47975.0, 30075.0, 19009.0, 11921.0, 7410.0, 4665.0, 2908.0, 1939.0, 1204.0, 778.0, 515.0, 340.0, 237.0, 157.0, 105.0, 73.0, 51.0, 37.0, 23.0, 19.0, 11.0, 7.0, 6.0, 5.0, 4.0, 0.0, 0.0, 2.0], "bins": [-1.2685546875, -1.2294921875, -1.1904296875, -1.1513671875, -1.1123046875, -1.0732421875, -1.0341796875, -0.9951171875, -0.9560546875, -0.9169921875, -0.8779296875, -0.8388671875, -0.7998046875, -0.7607421875, -0.7216796875, -0.6826171875, -0.6435546875, -0.6044921875, -0.5654296875, -0.5263671875, -0.4873046875, -0.4482421875, -0.4091796875, -0.3701171875, -0.3310546875, -0.2919921875, -0.2529296875, -0.2138671875, -0.1748046875, -0.1357421875, -0.0966796875, -0.0576171875, -0.0185546875, 0.0205078125, 0.0595703125, 0.0986328125, 0.1376953125, 0.1767578125, 0.2158203125, 0.2548828125, 0.2939453125, 0.3330078125, 0.3720703125, 0.4111328125, 0.4501953125, 0.4892578125, 0.5283203125, 0.5673828125, 0.6064453125, 0.6455078125, 0.6845703125, 0.7236328125, 0.7626953125, 0.8017578125, 0.8408203125, 0.8798828125, 0.9189453125, 0.9580078125, 0.9970703125, 1.0361328125, 1.0751953125, 1.1142578125, 1.1533203125, 1.1923828125, 1.2314453125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 2.0, 11.0, 14.0, 13.0, 15.0, 12.0, 14.0, 20.0, 25.0, 36.0, 34.0, 44.0, 42.0, 42.0, 52.0, 44.0, 44.0, 41.0, 46.0, 52.0, 42.0, 47.0, 43.0, 34.0, 29.0, 30.0, 26.0, 30.0, 26.0, 13.0, 16.0, 13.0, 10.0, 6.0, 11.0, 5.0, 7.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.462890625, -0.44986724853515625, -0.4368438720703125, -0.42382049560546875, -0.410797119140625, -0.39777374267578125, -0.3847503662109375, -0.37172698974609375, -0.35870361328125, -0.34568023681640625, -0.3326568603515625, -0.31963348388671875, -0.306610107421875, -0.29358673095703125, -0.2805633544921875, -0.26753997802734375, -0.2545166015625, -0.24149322509765625, -0.2284698486328125, -0.21544647216796875, -0.202423095703125, -0.18939971923828125, -0.1763763427734375, -0.16335296630859375, -0.15032958984375, -0.13730621337890625, -0.1242828369140625, -0.11125946044921875, -0.098236083984375, -0.08521270751953125, -0.0721893310546875, -0.05916595458984375, -0.046142578125, -0.03311920166015625, -0.0200958251953125, -0.00707244873046875, 0.005950927734375, 0.01897430419921875, 0.0319976806640625, 0.04502105712890625, 0.05804443359375, 0.07106781005859375, 0.0840911865234375, 0.09711456298828125, 0.110137939453125, 0.12316131591796875, 0.1361846923828125, 0.14920806884765625, 0.1622314453125, 0.17525482177734375, 0.1882781982421875, 0.20130157470703125, 0.214324951171875, 0.22734832763671875, 0.2403717041015625, 0.25339508056640625, 0.26641845703125, 0.27944183349609375, 0.2924652099609375, 0.30548858642578125, 0.318511962890625, 0.33153533935546875, 0.3445587158203125, 0.35758209228515625, 0.37060546875]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 6.0, 5.0, 9.0, 13.0, 17.0, 12.0, 17.0, 20.0, 18.0, 28.0, 40.0, 27.0, 52.0, 59.0, 76.0, 72.0, 51.0, 66.0, 59.0, 56.0, 67.0, 43.0, 38.0, 27.0, 21.0, 28.0, 13.0, 19.0, 4.0, 13.0, 3.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.75745964050293, -6.534886360168457, -6.312313556671143, -6.08974027633667, -5.867166996002197, -5.644594192504883, -5.42202091217041, -5.1994476318359375, -4.976874351501465, -4.754301071166992, -4.531728267669678, -4.309154987335205, -4.086581707000732, -3.864008665084839, -3.6414356231689453, -3.4188623428344727, -3.196289539337158, -2.9737164974212646, -2.751143217086792, -2.5285701751708984, -2.305996894836426, -2.0834238529205322, -1.8608508110046387, -1.6382776498794556, -1.4157044887542725, -1.1931313276290894, -0.970558226108551, -0.7479851245880127, -0.5254119634628296, -0.3028388023376465, -0.08026576042175293, 0.14230740070343018, 0.3648800849914551, 0.5874532461166382, 0.8100263476371765, 1.0325994491577148, 1.255172610282898, 1.477745771408081, 1.7003188133239746, 1.9228919744491577, 2.145465135574341, 2.3680381774902344, 2.590611457824707, 2.8131844997406006, 3.035757541656494, 3.258330821990967, 3.4809038639068604, 3.703476905822754, 3.9260501861572266, 4.148623466491699, 4.371196269989014, 4.593769550323486, 4.816342830657959, 5.038915634155273, 5.261488914489746, 5.484062194824219, 5.706635475158691, 5.929208755493164, 6.1517815589904785, 6.374354839324951, 6.596928119659424, 6.819500923156738, 7.042074203491211, 7.264647483825684, 7.487220287322998]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0, 5.0, 4.0, 8.0, 11.0, 14.0, 18.0, 12.0, 16.0, 26.0, 26.0, 34.0, 31.0, 34.0, 34.0, 45.0, 51.0, 44.0, 60.0, 57.0, 50.0, 40.0, 48.0, 54.0, 37.0, 32.0, 29.0, 28.0, 37.0, 18.0, 22.0, 24.0, 18.0, 11.0, 7.0, 5.0, 5.0, 3.0, 3.0, 0.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.892008304595947, -4.736620903015137, -4.581233024597168, -4.425845623016357, -4.270457744598389, -4.115070343017578, -3.9596827030181885, -3.804295063018799, -3.648907423019409, -3.4935197830200195, -3.33813214302063, -3.1827445030212402, -3.0273571014404297, -2.871969223022461, -2.7165818214416504, -2.5611941814422607, -2.405806541442871, -2.2504189014434814, -2.095031261444092, -1.9396437406539917, -1.784256100654602, -1.6288684606552124, -1.4734809398651123, -1.3180932998657227, -1.162705659866333, -1.0073180198669434, -0.8519304394721985, -0.6965428590774536, -0.541155219078064, -0.3857675790786743, -0.23037999868392944, -0.07499241828918457, 0.08039522171020508, 0.23578283190727234, 0.3911704421043396, 0.5465580224990845, 0.7019456624984741, 0.8573333024978638, 1.0127208232879639, 1.1681084632873535, 1.3234961032867432, 1.4788837432861328, 1.6342713832855225, 1.7896589040756226, 1.9450465440750122, 2.1004343032836914, 2.255821704864502, 2.4112093448638916, 2.5665969848632812, 2.721984624862671, 2.8773722648620605, 3.03275990486145, 3.18814754486084, 3.3435349464416504, 3.49892258644104, 3.6543102264404297, 3.8096978664398193, 3.965085506439209, 4.1204729080200195, 4.275860786437988, 4.431248188018799, 4.586636066436768, 4.742023468017578, 4.897411346435547, 5.052798748016357]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 10.0, 6.0, 18.0, 20.0, 33.0, 44.0, 78.0, 130.0, 225.0, 365.0, 562.0, 1117.0, 2158.0, 4691.0, 9717.0, 21331.0, 46683.0, 101242.0, 192673.0, 257286.0, 204917.0, 109961.0, 51048.0, 23299.0, 10674.0, 5051.0, 2374.0, 1253.0, 675.0, 358.0, 199.0, 125.0, 83.0, 55.0, 23.0, 24.0, 17.0, 10.0, 7.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.44140625, -7.22607421875, -7.0107421875, -6.79541015625, -6.580078125, -6.36474609375, -6.1494140625, -5.93408203125, -5.71875, -5.50341796875, -5.2880859375, -5.07275390625, -4.857421875, -4.64208984375, -4.4267578125, -4.21142578125, -3.99609375, -3.78076171875, -3.5654296875, -3.35009765625, -3.134765625, -2.91943359375, -2.7041015625, -2.48876953125, -2.2734375, -2.05810546875, -1.8427734375, -1.62744140625, -1.412109375, -1.19677734375, -0.9814453125, -0.76611328125, -0.55078125, -0.33544921875, -0.1201171875, 0.09521484375, 0.310546875, 0.52587890625, 0.7412109375, 0.95654296875, 1.171875, 1.38720703125, 1.6025390625, 1.81787109375, 2.033203125, 2.24853515625, 2.4638671875, 2.67919921875, 2.89453125, 3.10986328125, 3.3251953125, 3.54052734375, 3.755859375, 3.97119140625, 4.1865234375, 4.40185546875, 4.6171875, 4.83251953125, 5.0478515625, 5.26318359375, 5.478515625, 5.69384765625, 5.9091796875, 6.12451171875, 6.33984375]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 6.0, 5.0, 4.0, 10.0, 6.0, 12.0, 12.0, 10.0, 14.0, 22.0, 17.0, 22.0, 37.0, 21.0, 37.0, 38.0, 48.0, 41.0, 40.0, 59.0, 43.0, 55.0, 51.0, 50.0, 37.0, 36.0, 36.0, 28.0, 26.0, 38.0, 17.0, 25.0, 19.0, 17.0, 16.0, 12.0, 10.0, 11.0, 5.0, 3.0, 7.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.91796875, -4.76336669921875, -4.6087646484375, -4.45416259765625, -4.299560546875, -4.14495849609375, -3.9903564453125, -3.83575439453125, -3.68115234375, -3.52655029296875, -3.3719482421875, -3.21734619140625, -3.062744140625, -2.90814208984375, -2.7535400390625, -2.59893798828125, -2.4443359375, -2.28973388671875, -2.1351318359375, -1.98052978515625, -1.825927734375, -1.67132568359375, -1.5167236328125, -1.36212158203125, -1.20751953125, -1.05291748046875, -0.8983154296875, -0.74371337890625, -0.589111328125, -0.43450927734375, -0.2799072265625, -0.12530517578125, 0.029296875, 0.18389892578125, 0.3385009765625, 0.49310302734375, 0.647705078125, 0.80230712890625, 0.9569091796875, 1.11151123046875, 1.26611328125, 1.42071533203125, 1.5753173828125, 1.72991943359375, 1.884521484375, 2.03912353515625, 2.1937255859375, 2.34832763671875, 2.5029296875, 2.65753173828125, 2.8121337890625, 2.96673583984375, 3.121337890625, 3.27593994140625, 3.4305419921875, 3.58514404296875, 3.73974609375, 3.89434814453125, 4.0489501953125, 4.20355224609375, 4.358154296875, 4.51275634765625, 4.6673583984375, 4.82196044921875, 4.9765625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 6.0, 8.0, 10.0, 14.0, 25.0, 45.0, 54.0, 105.0, 144.0, 210.0, 354.0, 531.0, 951.0, 1506.0, 2525.0, 4346.0, 7668.0, 13243.0, 23696.0, 42463.0, 74906.0, 123453.0, 172996.0, 188627.0, 153567.0, 101225.0, 59542.0, 33059.0, 18445.0, 10148.0, 5869.0, 3538.0, 2026.0, 1247.0, 740.0, 465.0, 266.0, 198.0, 111.0, 81.0, 58.0, 15.0, 21.0, 14.0, 10.0, 9.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.93359375, -4.77069091796875, -4.6077880859375, -4.44488525390625, -4.281982421875, -4.11907958984375, -3.9561767578125, -3.79327392578125, -3.63037109375, -3.46746826171875, -3.3045654296875, -3.14166259765625, -2.978759765625, -2.81585693359375, -2.6529541015625, -2.49005126953125, -2.3271484375, -2.16424560546875, -2.0013427734375, -1.83843994140625, -1.675537109375, -1.51263427734375, -1.3497314453125, -1.18682861328125, -1.02392578125, -0.86102294921875, -0.6981201171875, -0.53521728515625, -0.372314453125, -0.20941162109375, -0.0465087890625, 0.11639404296875, 0.279296875, 0.44219970703125, 0.6051025390625, 0.76800537109375, 0.930908203125, 1.09381103515625, 1.2567138671875, 1.41961669921875, 1.58251953125, 1.74542236328125, 1.9083251953125, 2.07122802734375, 2.234130859375, 2.39703369140625, 2.5599365234375, 2.72283935546875, 2.8857421875, 3.04864501953125, 3.2115478515625, 3.37445068359375, 3.537353515625, 3.70025634765625, 3.8631591796875, 4.02606201171875, 4.18896484375, 4.35186767578125, 4.5147705078125, 4.67767333984375, 4.840576171875, 5.00347900390625, 5.1663818359375, 5.32928466796875, 5.4921875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 5.0, 4.0, 5.0, 5.0, 2.0, 7.0, 9.0, 14.0, 9.0, 18.0, 5.0, 17.0, 21.0, 22.0, 32.0, 31.0, 25.0, 27.0, 32.0, 39.0, 38.0, 38.0, 49.0, 42.0, 28.0, 35.0, 40.0, 39.0, 37.0, 38.0, 33.0, 27.0, 25.0, 29.0, 38.0, 23.0, 15.0, 19.0, 15.0, 15.0, 12.0, 13.0, 8.0, 9.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.78515625, -2.70452880859375, -2.6239013671875, -2.54327392578125, -2.462646484375, -2.38201904296875, -2.3013916015625, -2.22076416015625, -2.14013671875, -2.05950927734375, -1.9788818359375, -1.89825439453125, -1.817626953125, -1.73699951171875, -1.6563720703125, -1.57574462890625, -1.4951171875, -1.41448974609375, -1.3338623046875, -1.25323486328125, -1.172607421875, -1.09197998046875, -1.0113525390625, -0.93072509765625, -0.85009765625, -0.76947021484375, -0.6888427734375, -0.60821533203125, -0.527587890625, -0.44696044921875, -0.3663330078125, -0.28570556640625, -0.205078125, -0.12445068359375, -0.0438232421875, 0.03680419921875, 0.117431640625, 0.19805908203125, 0.2786865234375, 0.35931396484375, 0.43994140625, 0.52056884765625, 0.6011962890625, 0.68182373046875, 0.762451171875, 0.84307861328125, 0.9237060546875, 1.00433349609375, 1.0849609375, 1.16558837890625, 1.2462158203125, 1.32684326171875, 1.407470703125, 1.48809814453125, 1.5687255859375, 1.64935302734375, 1.72998046875, 1.81060791015625, 1.8912353515625, 1.97186279296875, 2.052490234375, 2.13311767578125, 2.2137451171875, 2.29437255859375, 2.375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 12.0, 14.0, 14.0, 30.0, 35.0, 68.0, 81.0, 134.0, 164.0, 318.0, 502.0, 824.0, 1228.0, 1955.0, 3097.0, 5270.0, 8604.0, 14891.0, 25652.0, 44293.0, 76838.0, 123670.0, 175307.0, 187766.0, 147548.0, 94756.0, 56230.0, 32365.0, 18918.0, 10934.0, 6543.0, 4019.0, 2441.0, 1500.0, 922.0, 585.0, 360.0, 227.0, 158.0, 107.0, 47.0, 43.0, 27.0, 20.0, 12.0, 7.0, 3.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.056640625, -1.9927978515625, -1.928955078125, -1.8651123046875, -1.80126953125, -1.7374267578125, -1.673583984375, -1.6097412109375, -1.5458984375, -1.4820556640625, -1.418212890625, -1.3543701171875, -1.29052734375, -1.2266845703125, -1.162841796875, -1.0989990234375, -1.03515625, -0.9713134765625, -0.907470703125, -0.8436279296875, -0.77978515625, -0.7159423828125, -0.652099609375, -0.5882568359375, -0.5244140625, -0.4605712890625, -0.396728515625, -0.3328857421875, -0.26904296875, -0.2052001953125, -0.141357421875, -0.0775146484375, -0.013671875, 0.0501708984375, 0.114013671875, 0.1778564453125, 0.24169921875, 0.3055419921875, 0.369384765625, 0.4332275390625, 0.4970703125, 0.5609130859375, 0.624755859375, 0.6885986328125, 0.75244140625, 0.8162841796875, 0.880126953125, 0.9439697265625, 1.0078125, 1.0716552734375, 1.135498046875, 1.1993408203125, 1.26318359375, 1.3270263671875, 1.390869140625, 1.4547119140625, 1.5185546875, 1.5823974609375, 1.646240234375, 1.7100830078125, 1.77392578125, 1.8377685546875, 1.901611328125, 1.9654541015625, 2.029296875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 8.0, 4.0, 8.0, 8.0, 11.0, 20.0, 19.0, 36.0, 29.0, 37.0, 43.0, 69.0, 56.0, 53.0, 67.0, 63.0, 45.0, 62.0, 47.0, 53.0, 58.0, 43.0, 31.0, 27.0, 21.0, 14.0, 9.0, 18.0, 5.0, 2.0, 9.0, 4.0, 2.0, 6.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000209808349609375, -0.00020316801965236664, -0.00019652768969535828, -0.00018988735973834991, -0.00018324702978134155, -0.0001766066998243332, -0.00016996636986732483, -0.00016332603991031647, -0.0001566857099533081, -0.00015004537999629974, -0.00014340505003929138, -0.00013676472008228302, -0.00013012439012527466, -0.0001234840601682663, -0.00011684373021125793, -0.00011020340025424957, -0.00010356307029724121, -9.692274034023285e-05, -9.028241038322449e-05, -8.364208042621613e-05, -7.700175046920776e-05, -7.03614205121994e-05, -6.372109055519104e-05, -5.708076059818268e-05, -5.0440430641174316e-05, -4.3800100684165955e-05, -3.715977072715759e-05, -3.051944077014923e-05, -2.387911081314087e-05, -1.7238780856132507e-05, -1.0598450899124146e-05, -3.958120942115784e-06, 2.682209014892578e-06, 9.32253897190094e-06, 1.5962868928909302e-05, 2.2603198885917664e-05, 2.9243528842926025e-05, 3.588385879993439e-05, 4.252418875694275e-05, 4.916451871395111e-05, 5.580484867095947e-05, 6.244517862796783e-05, 6.90855085849762e-05, 7.572583854198456e-05, 8.236616849899292e-05, 8.900649845600128e-05, 9.564682841300964e-05, 0.000102287158370018, 0.00010892748832702637, 0.00011556781828403473, 0.0001222081482410431, 0.00012884847819805145, 0.00013548880815505981, 0.00014212913811206818, 0.00014876946806907654, 0.0001554097980260849, 0.00016205012798309326, 0.00016869045794010162, 0.00017533078789710999, 0.00018197111785411835, 0.0001886114478111267, 0.00019525177776813507, 0.00020189210772514343, 0.0002085324376821518, 0.00021517276763916016]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 7.0, 7.0, 15.0, 18.0, 22.0, 32.0, 54.0, 89.0, 152.0, 216.0, 315.0, 513.0, 913.0, 1566.0, 2483.0, 4612.0, 8381.0, 15286.0, 29767.0, 57955.0, 108770.0, 180719.0, 222041.0, 181300.0, 109791.0, 58357.0, 30130.0, 15771.0, 8448.0, 4509.0, 2481.0, 1434.0, 865.0, 574.0, 334.0, 216.0, 125.0, 105.0, 58.0, 47.0, 31.0, 14.0, 10.0, 6.0, 7.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.193359375, -2.1214599609375, -2.049560546875, -1.9776611328125, -1.90576171875, -1.8338623046875, -1.761962890625, -1.6900634765625, -1.6181640625, -1.5462646484375, -1.474365234375, -1.4024658203125, -1.33056640625, -1.2586669921875, -1.186767578125, -1.1148681640625, -1.04296875, -0.9710693359375, -0.899169921875, -0.8272705078125, -0.75537109375, -0.6834716796875, -0.611572265625, -0.5396728515625, -0.4677734375, -0.3958740234375, -0.323974609375, -0.2520751953125, -0.18017578125, -0.1082763671875, -0.036376953125, 0.0355224609375, 0.107421875, 0.1793212890625, 0.251220703125, 0.3231201171875, 0.39501953125, 0.4669189453125, 0.538818359375, 0.6107177734375, 0.6826171875, 0.7545166015625, 0.826416015625, 0.8983154296875, 0.97021484375, 1.0421142578125, 1.114013671875, 1.1859130859375, 1.2578125, 1.3297119140625, 1.401611328125, 1.4735107421875, 1.54541015625, 1.6173095703125, 1.689208984375, 1.7611083984375, 1.8330078125, 1.9049072265625, 1.976806640625, 2.0487060546875, 2.12060546875, 2.1925048828125, 2.264404296875, 2.3363037109375, 2.408203125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 7.0, 2.0, 5.0, 10.0, 8.0, 6.0, 18.0, 13.0, 25.0, 22.0, 28.0, 28.0, 30.0, 30.0, 28.0, 48.0, 45.0, 50.0, 40.0, 57.0, 57.0, 49.0, 43.0, 43.0, 52.0, 33.0, 31.0, 34.0, 22.0, 28.0, 25.0, 15.0, 9.0, 7.0, 13.0, 8.0, 10.0, 5.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.58984375, -0.5725784301757812, -0.5553131103515625, -0.5380477905273438, -0.520782470703125, -0.5035171508789062, -0.4862518310546875, -0.46898651123046875, -0.45172119140625, -0.43445587158203125, -0.4171905517578125, -0.39992523193359375, -0.382659912109375, -0.36539459228515625, -0.3481292724609375, -0.33086395263671875, -0.3135986328125, -0.29633331298828125, -0.2790679931640625, -0.26180267333984375, -0.244537353515625, -0.22727203369140625, -0.2100067138671875, -0.19274139404296875, -0.17547607421875, -0.15821075439453125, -0.1409454345703125, -0.12368011474609375, -0.106414794921875, -0.08914947509765625, -0.0718841552734375, -0.05461883544921875, -0.037353515625, -0.02008819580078125, -0.0028228759765625, 0.01444244384765625, 0.031707763671875, 0.04897308349609375, 0.0662384033203125, 0.08350372314453125, 0.10076904296875, 0.11803436279296875, 0.1352996826171875, 0.15256500244140625, 0.169830322265625, 0.18709564208984375, 0.2043609619140625, 0.22162628173828125, 0.2388916015625, 0.25615692138671875, 0.2734222412109375, 0.29068756103515625, 0.307952880859375, 0.32521820068359375, 0.3424835205078125, 0.35974884033203125, 0.37701416015625, 0.39427947998046875, 0.4115447998046875, 0.42881011962890625, 0.446075439453125, 0.46334075927734375, 0.4806060791015625, 0.49787139892578125, 0.51513671875]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 3.0, 6.0, 9.0, 11.0, 18.0, 17.0, 23.0, 13.0, 22.0, 23.0, 33.0, 49.0, 43.0, 63.0, 56.0, 58.0, 70.0, 59.0, 63.0, 62.0, 53.0, 37.0, 47.0, 27.0, 33.0, 19.0, 14.0, 17.0, 11.0, 8.0, 10.0, 9.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.388792514801025, -6.171700954437256, -5.954609394073486, -5.737517833709717, -5.520426273345947, -5.303334712982178, -5.086243152618408, -4.869151592254639, -4.652060031890869, -4.4349684715271, -4.21787691116333, -4.0007853507995605, -3.783693790435791, -3.5666022300720215, -3.349510669708252, -3.1324191093444824, -2.915327548980713, -2.6982359886169434, -2.481144428253174, -2.2640528678894043, -2.0469613075256348, -1.8298697471618652, -1.6127781867980957, -1.3956866264343262, -1.1785950660705566, -0.9615035057067871, -0.7444119453430176, -0.527320384979248, -0.3102288246154785, -0.09313726425170898, 0.12395429611206055, 0.3410458564758301, 0.5581374168395996, 0.7752289772033691, 0.9923205375671387, 1.2094120979309082, 1.4265036582946777, 1.6435952186584473, 1.8606867790222168, 2.0777783393859863, 2.294869899749756, 2.5119614601135254, 2.729053020477295, 2.9461445808410645, 3.163236141204834, 3.3803277015686035, 3.597419261932373, 3.8145108222961426, 4.031602382659912, 4.248693943023682, 4.465785503387451, 4.682877063751221, 4.89996862411499, 5.11706018447876, 5.334151744842529, 5.551243305206299, 5.768334865570068, 5.985426425933838, 6.202517986297607, 6.419609546661377, 6.6367011070251465, 6.853792667388916, 7.0708842277526855, 7.287975788116455, 7.505067348480225]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 1.0, 7.0, 14.0, 7.0, 9.0, 21.0, 18.0, 26.0, 38.0, 24.0, 36.0, 33.0, 36.0, 54.0, 47.0, 44.0, 48.0, 56.0, 56.0, 60.0, 51.0, 45.0, 28.0, 41.0, 29.0, 31.0, 31.0, 24.0, 12.0, 12.0, 21.0, 11.0, 9.0, 3.0, 9.0, 0.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.146744728088379, -4.987565040588379, -4.828384876251221, -4.6692047119140625, -4.5100250244140625, -4.3508453369140625, -4.191665172576904, -4.032485008239746, -3.873305320739746, -3.714125394821167, -3.554945468902588, -3.395765542984009, -3.2365856170654297, -3.0774056911468506, -2.9182257652282715, -2.7590458393096924, -2.5998659133911133, -2.440685987472534, -2.281506061553955, -2.122326135635376, -1.9631462097167969, -1.8039662837982178, -1.6447863578796387, -1.4856064319610596, -1.3264265060424805, -1.1672465801239014, -1.0080666542053223, -0.8488867282867432, -0.6897068023681641, -0.530526876449585, -0.37134695053100586, -0.21216702461242676, -0.05298662185668945, 0.10619330406188965, 0.26537322998046875, 0.42455315589904785, 0.583733081817627, 0.742913007736206, 0.9020929336547852, 1.0612728595733643, 1.2204527854919434, 1.3796327114105225, 1.5388126373291016, 1.6979925632476807, 1.8571724891662598, 2.016352415084839, 2.175532341003418, 2.334712266921997, 2.493892192840576, 2.6530721187591553, 2.8122520446777344, 2.9714319705963135, 3.1306118965148926, 3.2897918224334717, 3.448971748352051, 3.60815167427063, 3.767331600189209, 3.926511526107788, 4.085691452026367, 4.244871139526367, 4.404051303863525, 4.563231468200684, 4.722411155700684, 4.881590843200684, 5.040771007537842]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 7.0, 5.0, 17.0, 21.0, 25.0, 36.0, 69.0, 82.0, 131.0, 231.0, 350.0, 568.0, 973.0, 1680.0, 2767.0, 5096.0, 9745.0, 20074.0, 45225.0, 116064.0, 341232.0, 1036173.0, 1541147.0, 707640.0, 222456.0, 78640.0, 32156.0, 14821.0, 7383.0, 3964.0, 2218.0, 1252.0, 726.0, 458.0, 296.0, 194.0, 99.0, 93.0, 45.0, 42.0, 26.0, 15.0, 11.0, 15.0, 11.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.6796875, -8.41912841796875, -8.1585693359375, -7.89801025390625, -7.637451171875, -7.37689208984375, -7.1163330078125, -6.85577392578125, -6.59521484375, -6.33465576171875, -6.0740966796875, -5.81353759765625, -5.552978515625, -5.29241943359375, -5.0318603515625, -4.77130126953125, -4.5107421875, -4.25018310546875, -3.9896240234375, -3.72906494140625, -3.468505859375, -3.20794677734375, -2.9473876953125, -2.68682861328125, -2.42626953125, -2.16571044921875, -1.9051513671875, -1.64459228515625, -1.384033203125, -1.12347412109375, -0.8629150390625, -0.60235595703125, -0.341796875, -0.08123779296875, 0.1793212890625, 0.43988037109375, 0.700439453125, 0.96099853515625, 1.2215576171875, 1.48211669921875, 1.74267578125, 2.00323486328125, 2.2637939453125, 2.52435302734375, 2.784912109375, 3.04547119140625, 3.3060302734375, 3.56658935546875, 3.8271484375, 4.08770751953125, 4.3482666015625, 4.60882568359375, 4.869384765625, 5.12994384765625, 5.3905029296875, 5.65106201171875, 5.91162109375, 6.17218017578125, 6.4327392578125, 6.69329833984375, 6.953857421875, 7.21441650390625, 7.4749755859375, 7.73553466796875, 7.99609375]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 4.0, 2.0, 7.0, 5.0, 11.0, 12.0, 18.0, 19.0, 17.0, 35.0, 32.0, 38.0, 36.0, 43.0, 39.0, 29.0, 43.0, 47.0, 47.0, 51.0, 62.0, 55.0, 46.0, 49.0, 41.0, 32.0, 28.0, 32.0, 20.0, 20.0, 15.0, 11.0, 12.0, 11.0, 12.0, 4.0, 8.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.91796875, -3.799163818359375, -3.68035888671875, -3.561553955078125, -3.4427490234375, -3.323944091796875, -3.20513916015625, -3.086334228515625, -2.967529296875, -2.848724365234375, -2.72991943359375, -2.611114501953125, -2.4923095703125, -2.373504638671875, -2.25469970703125, -2.135894775390625, -2.01708984375, -1.898284912109375, -1.77947998046875, -1.660675048828125, -1.5418701171875, -1.423065185546875, -1.30426025390625, -1.185455322265625, -1.066650390625, -0.947845458984375, -0.82904052734375, -0.710235595703125, -0.5914306640625, -0.472625732421875, -0.35382080078125, -0.235015869140625, -0.1162109375, 0.002593994140625, 0.12139892578125, 0.240203857421875, 0.3590087890625, 0.477813720703125, 0.59661865234375, 0.715423583984375, 0.834228515625, 0.953033447265625, 1.07183837890625, 1.190643310546875, 1.3094482421875, 1.428253173828125, 1.54705810546875, 1.665863037109375, 1.78466796875, 1.903472900390625, 2.02227783203125, 2.141082763671875, 2.2598876953125, 2.378692626953125, 2.49749755859375, 2.616302490234375, 2.735107421875, 2.853912353515625, 2.97271728515625, 3.091522216796875, 3.2103271484375, 3.329132080078125, 3.44793701171875, 3.566741943359375, 3.685546875]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 8.0, 16.0, 14.0, 22.0, 24.0, 39.0, 55.0, 73.0, 124.0, 173.0, 282.0, 412.0, 674.0, 1025.0, 1711.0, 2626.0, 4494.0, 7675.0, 13561.0, 25259.0, 48642.0, 97089.0, 209106.0, 466660.0, 964655.0, 1150781.0, 640240.0, 288736.0, 132224.0, 63898.0, 32342.0, 17466.0, 9695.0, 5580.0, 3283.0, 2031.0, 1218.0, 820.0, 487.0, 347.0, 237.0, 159.0, 94.0, 69.0, 49.0, 34.0, 23.0, 22.0, 10.0, 4.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 4.0], "bins": [-7.13671875, -6.91510009765625, -6.6934814453125, -6.47186279296875, -6.250244140625, -6.02862548828125, -5.8070068359375, -5.58538818359375, -5.36376953125, -5.14215087890625, -4.9205322265625, -4.69891357421875, -4.477294921875, -4.25567626953125, -4.0340576171875, -3.81243896484375, -3.5908203125, -3.36920166015625, -3.1475830078125, -2.92596435546875, -2.704345703125, -2.48272705078125, -2.2611083984375, -2.03948974609375, -1.81787109375, -1.59625244140625, -1.3746337890625, -1.15301513671875, -0.931396484375, -0.70977783203125, -0.4881591796875, -0.26654052734375, -0.044921875, 0.17669677734375, 0.3983154296875, 0.61993408203125, 0.841552734375, 1.06317138671875, 1.2847900390625, 1.50640869140625, 1.72802734375, 1.94964599609375, 2.1712646484375, 2.39288330078125, 2.614501953125, 2.83612060546875, 3.0577392578125, 3.27935791015625, 3.5009765625, 3.72259521484375, 3.9442138671875, 4.16583251953125, 4.387451171875, 4.60906982421875, 4.8306884765625, 5.05230712890625, 5.27392578125, 5.49554443359375, 5.7171630859375, 5.93878173828125, 6.160400390625, 6.38201904296875, 6.6036376953125, 6.82525634765625, 7.046875]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 5.0, 7.0, 7.0, 5.0, 5.0, 7.0, 18.0, 12.0, 25.0, 44.0, 46.0, 49.0, 76.0, 102.0, 121.0, 143.0, 193.0, 257.0, 315.0, 331.0, 370.0, 346.0, 328.0, 260.0, 231.0, 176.0, 154.0, 109.0, 96.0, 64.0, 54.0, 27.0, 17.0, 20.0, 12.0, 12.0, 16.0, 7.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5625, -2.490875244140625, -2.41925048828125, -2.347625732421875, -2.2760009765625, -2.204376220703125, -2.13275146484375, -2.061126708984375, -1.989501953125, -1.917877197265625, -1.84625244140625, -1.774627685546875, -1.7030029296875, -1.631378173828125, -1.55975341796875, -1.488128662109375, -1.41650390625, -1.344879150390625, -1.27325439453125, -1.201629638671875, -1.1300048828125, -1.058380126953125, -0.98675537109375, -0.915130615234375, -0.843505859375, -0.771881103515625, -0.70025634765625, -0.628631591796875, -0.5570068359375, -0.485382080078125, -0.41375732421875, -0.342132568359375, -0.2705078125, -0.198883056640625, -0.12725830078125, -0.055633544921875, 0.0159912109375, 0.087615966796875, 0.15924072265625, 0.230865478515625, 0.302490234375, 0.374114990234375, 0.44573974609375, 0.517364501953125, 0.5889892578125, 0.660614013671875, 0.73223876953125, 0.803863525390625, 0.87548828125, 0.947113037109375, 1.01873779296875, 1.090362548828125, 1.1619873046875, 1.233612060546875, 1.30523681640625, 1.376861572265625, 1.448486328125, 1.520111083984375, 1.59173583984375, 1.663360595703125, 1.7349853515625, 1.806610107421875, 1.87823486328125, 1.949859619140625, 2.021484375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 6.0, 2.0, 4.0, 7.0, 14.0, 10.0, 14.0, 24.0, 20.0, 41.0, 28.0, 41.0, 49.0, 72.0, 78.0, 65.0, 85.0, 67.0, 63.0, 55.0, 63.0, 39.0, 38.0, 26.0, 24.0, 13.0, 11.0, 14.0, 7.0, 10.0, 5.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.568060874938965, -8.318124771118164, -8.068188667297363, -7.8182525634765625, -7.568316459655762, -7.318380355834961, -7.06844425201416, -6.818508148193359, -6.568572044372559, -6.318635940551758, -6.068699836730957, -5.818763732910156, -5.5688276290893555, -5.318891525268555, -5.068955421447754, -4.819019317626953, -4.569083213806152, -4.319147109985352, -4.069211006164551, -3.81927490234375, -3.569338798522949, -3.3194026947021484, -3.0694665908813477, -2.819530487060547, -2.569594383239746, -2.3196582794189453, -2.0697221755981445, -1.8197860717773438, -1.569849967956543, -1.3199138641357422, -1.0699777603149414, -0.8200416564941406, -0.570106029510498, -0.32016992568969727, -0.07023382186889648, 0.1797022819519043, 0.4296383857727051, 0.6795744895935059, 0.9295105934143066, 1.1794466972351074, 1.4293828010559082, 1.679318904876709, 1.9292550086975098, 2.1791911125183105, 2.4291272163391113, 2.679063320159912, 2.928999423980713, 3.1789355278015137, 3.4288716316223145, 3.6788077354431152, 3.928743839263916, 4.178679943084717, 4.428616046905518, 4.678552150726318, 4.928488254547119, 5.17842435836792, 5.428360462188721, 5.6782965660095215, 5.928232669830322, 6.178168773651123, 6.428104877471924, 6.678040981292725, 6.927977085113525, 7.177913188934326, 7.427849292755127]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 4.0, 2.0, 6.0, 10.0, 17.0, 20.0, 26.0, 14.0, 20.0, 18.0, 27.0, 35.0, 30.0, 29.0, 41.0, 31.0, 31.0, 40.0, 45.0, 46.0, 43.0, 38.0, 41.0, 30.0, 53.0, 24.0, 29.0, 29.0, 32.0, 21.0, 20.0, 21.0, 21.0, 22.0, 17.0, 8.0, 8.0, 5.0, 7.0, 6.0, 7.0, 5.0, 3.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.169615268707275, -4.043285369873047, -3.91695499420166, -3.7906248569488525, -3.664294719696045, -3.5379648208618164, -3.411634683609009, -3.285304546356201, -3.1589744091033936, -3.032644271850586, -2.9063141345977783, -2.7799839973449707, -2.653654098510742, -2.5273237228393555, -2.400993824005127, -2.2746636867523193, -2.1483335494995117, -2.022003412246704, -1.8956732749938965, -1.7693432569503784, -1.6430131196975708, -1.5166829824447632, -1.3903529644012451, -1.2640228271484375, -1.1376926898956299, -1.0113625526428223, -0.8850324749946594, -0.7587023973464966, -0.632372260093689, -0.5060421228408813, -0.3797120451927185, -0.25338196754455566, -0.12705206871032715, -0.0007219612598419189, 0.1256081461906433, 0.25193825364112854, 0.37826836109161377, 0.5045984983444214, 0.6309285759925842, 0.7572586536407471, 0.8835887908935547, 1.0099189281463623, 1.13624906539917, 1.262579083442688, 1.3889092206954956, 1.5152393579483032, 1.6415693759918213, 1.767899513244629, 1.8942296504974365, 2.020559787750244, 2.1468899250030518, 2.2732200622558594, 2.399549961090088, 2.5258803367614746, 2.652210235595703, 2.7785403728485107, 2.9048705101013184, 3.031200647354126, 3.1575307846069336, 3.283860921859741, 3.410191059112549, 3.5365209579467773, 3.662851095199585, 3.7891812324523926, 3.9155113697052]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0, 6.0, 10.0, 9.0, 15.0, 23.0, 36.0, 46.0, 89.0, 111.0, 206.0, 330.0, 526.0, 857.0, 1401.0, 2417.0, 3984.0, 6840.0, 11726.0, 20661.0, 36311.0, 64651.0, 109280.0, 165406.0, 196061.0, 166764.0, 109992.0, 64538.0, 36784.0, 20802.0, 11691.0, 6968.0, 3946.0, 2398.0, 1454.0, 843.0, 499.0, 309.0, 203.0, 127.0, 89.0, 55.0, 31.0, 23.0, 14.0, 12.0, 4.0, 2.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0], "bins": [-3.4296875, -3.330291748046875, -3.23089599609375, -3.131500244140625, -3.0321044921875, -2.932708740234375, -2.83331298828125, -2.733917236328125, -2.634521484375, -2.535125732421875, -2.43572998046875, -2.336334228515625, -2.2369384765625, -2.137542724609375, -2.03814697265625, -1.938751220703125, -1.83935546875, -1.739959716796875, -1.64056396484375, -1.541168212890625, -1.4417724609375, -1.342376708984375, -1.24298095703125, -1.143585205078125, -1.044189453125, -0.944793701171875, -0.84539794921875, -0.746002197265625, -0.6466064453125, -0.547210693359375, -0.44781494140625, -0.348419189453125, -0.2490234375, -0.149627685546875, -0.05023193359375, 0.049163818359375, 0.1485595703125, 0.247955322265625, 0.34735107421875, 0.446746826171875, 0.546142578125, 0.645538330078125, 0.74493408203125, 0.844329833984375, 0.9437255859375, 1.043121337890625, 1.14251708984375, 1.241912841796875, 1.34130859375, 1.440704345703125, 1.54010009765625, 1.639495849609375, 1.7388916015625, 1.838287353515625, 1.93768310546875, 2.037078857421875, 2.136474609375, 2.235870361328125, 2.33526611328125, 2.434661865234375, 2.5340576171875, 2.633453369140625, 2.73284912109375, 2.832244873046875, 2.931640625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 4.0, 0.0, 4.0, 4.0, 8.0, 10.0, 10.0, 12.0, 20.0, 18.0, 18.0, 23.0, 16.0, 28.0, 29.0, 35.0, 28.0, 36.0, 41.0, 42.0, 41.0, 49.0, 58.0, 37.0, 39.0, 47.0, 27.0, 26.0, 33.0, 36.0, 23.0, 32.0, 24.0, 24.0, 18.0, 20.0, 17.0, 12.0, 9.0, 13.0, 8.0, 4.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.15234375, -4.01324462890625, -3.8741455078125, -3.73504638671875, -3.595947265625, -3.45684814453125, -3.3177490234375, -3.17864990234375, -3.03955078125, -2.90045166015625, -2.7613525390625, -2.62225341796875, -2.483154296875, -2.34405517578125, -2.2049560546875, -2.06585693359375, -1.9267578125, -1.78765869140625, -1.6485595703125, -1.50946044921875, -1.370361328125, -1.23126220703125, -1.0921630859375, -0.95306396484375, -0.81396484375, -0.67486572265625, -0.5357666015625, -0.39666748046875, -0.257568359375, -0.11846923828125, 0.0206298828125, 0.15972900390625, 0.298828125, 0.43792724609375, 0.5770263671875, 0.71612548828125, 0.855224609375, 0.99432373046875, 1.1334228515625, 1.27252197265625, 1.41162109375, 1.55072021484375, 1.6898193359375, 1.82891845703125, 1.968017578125, 2.10711669921875, 2.2462158203125, 2.38531494140625, 2.5244140625, 2.66351318359375, 2.8026123046875, 2.94171142578125, 3.080810546875, 3.21990966796875, 3.3590087890625, 3.49810791015625, 3.63720703125, 3.77630615234375, 3.9154052734375, 4.05450439453125, 4.193603515625, 4.33270263671875, 4.4718017578125, 4.61090087890625, 4.75]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 13.0, 22.0, 18.0, 34.0, 40.0, 64.0, 81.0, 139.0, 180.0, 268.0, 385.0, 554.0, 792.0, 1191.0, 1771.0, 2712.0, 4077.0, 6220.0, 9655.0, 15069.0, 24007.0, 38049.0, 60442.0, 93929.0, 138190.0, 171804.0, 157934.0, 114283.0, 74934.0, 47821.0, 30127.0, 18878.0, 12010.0, 7750.0, 5038.0, 3240.0, 2185.0, 1457.0, 980.0, 684.0, 434.0, 327.0, 223.0, 182.0, 123.0, 87.0, 47.0, 31.0, 30.0, 12.0, 11.0, 5.0, 11.0, 7.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.890625, -2.799560546875, -2.70849609375, -2.617431640625, -2.5263671875, -2.435302734375, -2.34423828125, -2.253173828125, -2.162109375, -2.071044921875, -1.97998046875, -1.888916015625, -1.7978515625, -1.706787109375, -1.61572265625, -1.524658203125, -1.43359375, -1.342529296875, -1.25146484375, -1.160400390625, -1.0693359375, -0.978271484375, -0.88720703125, -0.796142578125, -0.705078125, -0.614013671875, -0.52294921875, -0.431884765625, -0.3408203125, -0.249755859375, -0.15869140625, -0.067626953125, 0.0234375, 0.114501953125, 0.20556640625, 0.296630859375, 0.3876953125, 0.478759765625, 0.56982421875, 0.660888671875, 0.751953125, 0.843017578125, 0.93408203125, 1.025146484375, 1.1162109375, 1.207275390625, 1.29833984375, 1.389404296875, 1.48046875, 1.571533203125, 1.66259765625, 1.753662109375, 1.8447265625, 1.935791015625, 2.02685546875, 2.117919921875, 2.208984375, 2.300048828125, 2.39111328125, 2.482177734375, 2.5732421875, 2.664306640625, 2.75537109375, 2.846435546875, 2.9375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 4.0, 1.0, 5.0, 3.0, 4.0, 5.0, 8.0, 5.0, 13.0, 13.0, 17.0, 19.0, 25.0, 23.0, 25.0, 19.0, 27.0, 23.0, 40.0, 25.0, 38.0, 31.0, 34.0, 28.0, 38.0, 38.0, 53.0, 49.0, 39.0, 35.0, 32.0, 30.0, 34.0, 23.0, 21.0, 31.0, 25.0, 15.0, 17.0, 20.0, 15.0, 14.0, 9.0, 6.0, 10.0, 5.0, 8.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.423828125, -2.34619140625, -2.2685546875, -2.19091796875, -2.11328125, -2.03564453125, -1.9580078125, -1.88037109375, -1.802734375, -1.72509765625, -1.6474609375, -1.56982421875, -1.4921875, -1.41455078125, -1.3369140625, -1.25927734375, -1.181640625, -1.10400390625, -1.0263671875, -0.94873046875, -0.87109375, -0.79345703125, -0.7158203125, -0.63818359375, -0.560546875, -0.48291015625, -0.4052734375, -0.32763671875, -0.25, -0.17236328125, -0.0947265625, -0.01708984375, 0.060546875, 0.13818359375, 0.2158203125, 0.29345703125, 0.37109375, 0.44873046875, 0.5263671875, 0.60400390625, 0.681640625, 0.75927734375, 0.8369140625, 0.91455078125, 0.9921875, 1.06982421875, 1.1474609375, 1.22509765625, 1.302734375, 1.38037109375, 1.4580078125, 1.53564453125, 1.61328125, 1.69091796875, 1.7685546875, 1.84619140625, 1.923828125, 2.00146484375, 2.0791015625, 2.15673828125, 2.234375, 2.31201171875, 2.3896484375, 2.46728515625, 2.544921875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 6.0, 9.0, 8.0, 7.0, 17.0, 20.0, 26.0, 29.0, 42.0, 68.0, 114.0, 164.0, 251.0, 377.0, 589.0, 868.0, 1438.0, 2415.0, 4198.0, 7487.0, 13915.0, 27382.0, 55300.0, 115547.0, 226909.0, 274043.0, 160821.0, 76977.0, 37435.0, 18689.0, 9961.0, 5480.0, 3052.0, 1744.0, 1118.0, 680.0, 440.0, 312.0, 177.0, 134.0, 96.0, 57.0, 52.0, 29.0, 21.0, 18.0, 11.0, 8.0, 8.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8994140625, -1.8344268798828125, -1.769439697265625, -1.7044525146484375, -1.63946533203125, -1.5744781494140625, -1.509490966796875, -1.4445037841796875, -1.3795166015625, -1.3145294189453125, -1.249542236328125, -1.1845550537109375, -1.11956787109375, -1.0545806884765625, -0.989593505859375, -0.9246063232421875, -0.859619140625, -0.7946319580078125, -0.729644775390625, -0.6646575927734375, -0.59967041015625, -0.5346832275390625, -0.469696044921875, -0.4047088623046875, -0.3397216796875, -0.2747344970703125, -0.209747314453125, -0.1447601318359375, -0.07977294921875, -0.0147857666015625, 0.050201416015625, 0.1151885986328125, 0.18017578125, 0.2451629638671875, 0.310150146484375, 0.3751373291015625, 0.44012451171875, 0.5051116943359375, 0.570098876953125, 0.6350860595703125, 0.7000732421875, 0.7650604248046875, 0.830047607421875, 0.8950347900390625, 0.96002197265625, 1.0250091552734375, 1.089996337890625, 1.1549835205078125, 1.219970703125, 1.2849578857421875, 1.349945068359375, 1.4149322509765625, 1.47991943359375, 1.5449066162109375, 1.609893798828125, 1.6748809814453125, 1.7398681640625, 1.8048553466796875, 1.869842529296875, 1.9348297119140625, 1.99981689453125, 2.0648040771484375, 2.129791259765625, 2.1947784423828125, 2.259765625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 11.0, 7.0, 12.0, 12.0, 15.0, 16.0, 31.0, 30.0, 44.0, 58.0, 56.0, 64.0, 75.0, 76.0, 88.0, 71.0, 53.0, 52.0, 50.0, 39.0, 28.0, 19.0, 22.0, 23.0, 11.0, 13.0, 5.0, 4.0, 3.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00015425682067871094, -0.00014993548393249512, -0.0001456141471862793, -0.00014129281044006348, -0.00013697147369384766, -0.00013265013694763184, -0.00012832880020141602, -0.0001240074634552002, -0.00011968612670898438, -0.00011536478996276855, -0.00011104345321655273, -0.00010672211647033691, -0.0001024007797241211, -9.807944297790527e-05, -9.375810623168945e-05, -8.943676948547363e-05, -8.511543273925781e-05, -8.079409599304199e-05, -7.647275924682617e-05, -7.215142250061035e-05, -6.783008575439453e-05, -6.350874900817871e-05, -5.918741226196289e-05, -5.486607551574707e-05, -5.054473876953125e-05, -4.622340202331543e-05, -4.190206527709961e-05, -3.758072853088379e-05, -3.325939178466797e-05, -2.893805503845215e-05, -2.4616718292236328e-05, -2.0295381546020508e-05, -1.5974044799804688e-05, -1.1652708053588867e-05, -7.331371307373047e-06, -3.0100345611572266e-06, 1.3113021850585938e-06, 5.632638931274414e-06, 9.953975677490234e-06, 1.4275312423706055e-05, 1.8596649169921875e-05, 2.2917985916137695e-05, 2.7239322662353516e-05, 3.1560659408569336e-05, 3.5881996154785156e-05, 4.0203332901000977e-05, 4.45246696472168e-05, 4.884600639343262e-05, 5.316734313964844e-05, 5.748867988586426e-05, 6.181001663208008e-05, 6.61313533782959e-05, 7.045269012451172e-05, 7.477402687072754e-05, 7.909536361694336e-05, 8.341670036315918e-05, 8.7738037109375e-05, 9.205937385559082e-05, 9.638071060180664e-05, 0.00010070204734802246, 0.00010502338409423828, 0.0001093447208404541, 0.00011366605758666992, 0.00011798739433288574, 0.00012230873107910156]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 7.0, 11.0, 19.0, 38.0, 55.0, 63.0, 109.0, 199.0, 301.0, 513.0, 822.0, 1470.0, 2615.0, 4874.0, 9375.0, 19144.0, 41029.0, 88232.0, 176137.0, 257422.0, 217186.0, 119724.0, 56605.0, 26062.0, 12400.0, 6315.0, 3330.0, 1826.0, 1063.0, 606.0, 369.0, 231.0, 138.0, 104.0, 63.0, 38.0, 24.0, 8.0, 11.0, 9.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.1328125, -2.0695343017578125, -2.006256103515625, -1.9429779052734375, -1.87969970703125, -1.8164215087890625, -1.753143310546875, -1.6898651123046875, -1.6265869140625, -1.5633087158203125, -1.500030517578125, -1.4367523193359375, -1.37347412109375, -1.3101959228515625, -1.246917724609375, -1.1836395263671875, -1.120361328125, -1.0570831298828125, -0.993804931640625, -0.9305267333984375, -0.86724853515625, -0.8039703369140625, -0.740692138671875, -0.6774139404296875, -0.6141357421875, -0.5508575439453125, -0.487579345703125, -0.4243011474609375, -0.36102294921875, -0.2977447509765625, -0.234466552734375, -0.1711883544921875, -0.10791015625, -0.0446319580078125, 0.018646240234375, 0.0819244384765625, 0.14520263671875, 0.2084808349609375, 0.271759033203125, 0.3350372314453125, 0.3983154296875, 0.4615936279296875, 0.524871826171875, 0.5881500244140625, 0.65142822265625, 0.7147064208984375, 0.777984619140625, 0.8412628173828125, 0.904541015625, 0.9678192138671875, 1.031097412109375, 1.0943756103515625, 1.15765380859375, 1.2209320068359375, 1.284210205078125, 1.3474884033203125, 1.4107666015625, 1.4740447998046875, 1.537322998046875, 1.6006011962890625, 1.66387939453125, 1.7271575927734375, 1.790435791015625, 1.8537139892578125, 1.9169921875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 10.0, 14.0, 8.0, 9.0, 10.0, 13.0, 20.0, 23.0, 21.0, 36.0, 26.0, 40.0, 38.0, 55.0, 45.0, 56.0, 65.0, 73.0, 51.0, 57.0, 50.0, 44.0, 43.0, 37.0, 36.0, 22.0, 17.0, 15.0, 16.0, 16.0, 13.0, 6.0, 4.0, 7.0, 5.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.385009765625, -0.3710136413574219, -0.35701751708984375, -0.3430213928222656, -0.3290252685546875, -0.3150291442871094, -0.30103302001953125, -0.2870368957519531, -0.273040771484375, -0.2590446472167969, -0.24504852294921875, -0.23105239868164062, -0.2170562744140625, -0.20306015014648438, -0.18906402587890625, -0.17506790161132812, -0.16107177734375, -0.14707565307617188, -0.13307952880859375, -0.11908340454101562, -0.1050872802734375, -0.09109115600585938, -0.07709503173828125, -0.06309890747070312, -0.049102783203125, -0.035106658935546875, -0.02111053466796875, -0.007114410400390625, 0.0068817138671875, 0.020877838134765625, 0.03487396240234375, 0.048870086669921875, 0.0628662109375, 0.07686233520507812, 0.09085845947265625, 0.10485458374023438, 0.1188507080078125, 0.13284683227539062, 0.14684295654296875, 0.16083908081054688, 0.174835205078125, 0.18883132934570312, 0.20282745361328125, 0.21682357788085938, 0.2308197021484375, 0.24481582641601562, 0.25881195068359375, 0.2728080749511719, 0.28680419921875, 0.3008003234863281, 0.31479644775390625, 0.3287925720214844, 0.3427886962890625, 0.3567848205566406, 0.37078094482421875, 0.3847770690917969, 0.398773193359375, 0.4127693176269531, 0.42676544189453125, 0.4407615661621094, 0.4547576904296875, 0.4687538146972656, 0.48274993896484375, 0.4967460632324219, 0.5107421875]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 5.0, 5.0, 3.0, 16.0, 13.0, 14.0, 24.0, 21.0, 39.0, 35.0, 40.0, 51.0, 73.0, 76.0, 63.0, 85.0, 78.0, 60.0, 54.0, 54.0, 41.0, 35.0, 31.0, 15.0, 15.0, 14.0, 10.0, 5.0, 8.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.66557502746582, -8.418362617492676, -8.171150207519531, -7.9239373207092285, -7.676724433898926, -7.429512023925781, -7.182299613952637, -6.935086727142334, -6.687873840332031, -6.440661430358887, -6.193448543548584, -5.9462361335754395, -5.699023246765137, -5.451810836791992, -5.204598426818848, -4.957385540008545, -4.7101731300354, -4.462960720062256, -4.215747833251953, -3.9685354232788086, -3.721322536468506, -3.4741101264953613, -3.2268974781036377, -2.979684829711914, -2.7324721813201904, -2.485259532928467, -2.238046884536743, -1.990834355354309, -1.7436217069625854, -1.4964090585708618, -1.2491965293884277, -1.001983880996704, -0.7547707557678223, -0.5075581073760986, -0.2603455185890198, -0.013132929801940918, 0.23407971858978271, 0.48129236698150635, 0.7285048961639404, 0.9757175445556641, 1.2229301929473877, 1.4701428413391113, 1.717355489730835, 1.964568018913269, 2.211780548095703, 2.458993434906006, 2.7062058448791504, 2.953418493270874, 3.2006311416625977, 3.4478437900543213, 3.695056438446045, 3.9422688484191895, 4.189481735229492, 4.436694145202637, 4.683906555175781, 4.931119441986084, 5.178332328796387, 5.425544738769531, 5.672757625579834, 5.9199700355529785, 6.167182922363281, 6.414395332336426, 6.66160774230957, 6.908820629119873, 7.156033039093018]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 7.0, 2.0, 4.0, 11.0, 12.0, 20.0, 28.0, 17.0, 14.0, 22.0, 30.0, 29.0, 32.0, 35.0, 32.0, 36.0, 38.0, 35.0, 50.0, 49.0, 38.0, 44.0, 42.0, 31.0, 46.0, 32.0, 20.0, 42.0, 29.0, 15.0, 26.0, 22.0, 19.0, 19.0, 9.0, 14.0, 7.0, 2.0, 10.0, 5.0, 5.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.1894402503967285, -4.062045574188232, -3.9346511363983154, -3.8072564601898193, -3.6798620223999023, -3.5524673461914062, -3.42507266998291, -3.297678232192993, -3.170283794403076, -3.04288911819458, -2.915494680404663, -2.788100004196167, -2.66070556640625, -2.533310890197754, -2.405916213989258, -2.278521776199341, -2.1511270999908447, -2.0237324237823486, -1.8963379859924316, -1.7689433097839355, -1.6415488719940186, -1.5141541957855225, -1.386759638786316, -1.2593650817871094, -1.1319705247879028, -1.0045759677886963, -0.8771814107894897, -0.7497867941856384, -0.6223922371864319, -0.49499768018722534, -0.367603063583374, -0.24020850658416748, -0.11281371116638184, 0.014580860733985901, 0.14197543263435364, 0.26937001943588257, 0.3967645764350891, 0.5241591334342957, 0.651553750038147, 0.7789483070373535, 0.9063428640365601, 1.0337374210357666, 1.1611319780349731, 1.2885265350341797, 1.4159212112426758, 1.5433156490325928, 1.6707103252410889, 1.7981048822402954, 1.925499439239502, 2.052894115447998, 2.180288553237915, 2.307683229446411, 2.435077667236328, 2.562472343444824, 2.6898670196533203, 2.8172614574432373, 2.9446558952331543, 3.0720505714416504, 3.1994450092315674, 3.3268396854400635, 3.4542341232299805, 3.5816287994384766, 3.7090234756469727, 3.8364179134368896, 3.9638125896453857]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 3.0, 8.0, 20.0, 20.0, 32.0, 46.0, 79.0, 104.0, 167.0, 297.0, 446.0, 687.0, 1067.0, 1818.0, 3035.0, 5196.0, 9205.0, 16322.0, 28885.0, 51791.0, 90325.0, 144065.0, 190691.0, 183706.0, 133115.0, 81232.0, 45868.0, 25950.0, 14528.0, 8080.0, 4615.0, 2732.0, 1636.0, 1027.0, 611.0, 418.0, 269.0, 145.0, 112.0, 72.0, 48.0, 25.0, 17.0, 7.0, 9.0, 8.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-5.484375, -5.306884765625, -5.12939453125, -4.951904296875, -4.7744140625, -4.596923828125, -4.41943359375, -4.241943359375, -4.064453125, -3.886962890625, -3.70947265625, -3.531982421875, -3.3544921875, -3.177001953125, -2.99951171875, -2.822021484375, -2.64453125, -2.467041015625, -2.28955078125, -2.112060546875, -1.9345703125, -1.757080078125, -1.57958984375, -1.402099609375, -1.224609375, -1.047119140625, -0.86962890625, -0.692138671875, -0.5146484375, -0.337158203125, -0.15966796875, 0.017822265625, 0.1953125, 0.372802734375, 0.55029296875, 0.727783203125, 0.9052734375, 1.082763671875, 1.26025390625, 1.437744140625, 1.615234375, 1.792724609375, 1.97021484375, 2.147705078125, 2.3251953125, 2.502685546875, 2.68017578125, 2.857666015625, 3.03515625, 3.212646484375, 3.39013671875, 3.567626953125, 3.7451171875, 3.922607421875, 4.10009765625, 4.277587890625, 4.455078125, 4.632568359375, 4.81005859375, 4.987548828125, 5.1650390625, 5.342529296875, 5.52001953125, 5.697509765625, 5.875]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 2.0, 5.0, 12.0, 19.0, 11.0, 15.0, 15.0, 27.0, 31.0, 25.0, 33.0, 34.0, 27.0, 32.0, 36.0, 45.0, 48.0, 38.0, 50.0, 45.0, 45.0, 55.0, 43.0, 37.0, 38.0, 29.0, 26.0, 25.0, 17.0, 28.0, 17.0, 18.0, 11.0, 17.0, 6.0, 8.0, 8.0, 1.0, 4.0, 2.0, 6.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.01953125, -4.8702392578125, -4.720947265625, -4.5716552734375, -4.42236328125, -4.2730712890625, -4.123779296875, -3.9744873046875, -3.8251953125, -3.6759033203125, -3.526611328125, -3.3773193359375, -3.22802734375, -3.0787353515625, -2.929443359375, -2.7801513671875, -2.630859375, -2.4815673828125, -2.332275390625, -2.1829833984375, -2.03369140625, -1.8843994140625, -1.735107421875, -1.5858154296875, -1.4365234375, -1.2872314453125, -1.137939453125, -0.9886474609375, -0.83935546875, -0.6900634765625, -0.540771484375, -0.3914794921875, -0.2421875, -0.0928955078125, 0.056396484375, 0.2056884765625, 0.35498046875, 0.5042724609375, 0.653564453125, 0.8028564453125, 0.9521484375, 1.1014404296875, 1.250732421875, 1.4000244140625, 1.54931640625, 1.6986083984375, 1.847900390625, 1.9971923828125, 2.146484375, 2.2957763671875, 2.445068359375, 2.5943603515625, 2.74365234375, 2.8929443359375, 3.042236328125, 3.1915283203125, 3.3408203125, 3.4901123046875, 3.639404296875, 3.7886962890625, 3.93798828125, 4.0872802734375, 4.236572265625, 4.3858642578125, 4.53515625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 7.0, 14.0, 19.0, 36.0, 54.0, 78.0, 83.0, 119.0, 203.0, 268.0, 406.0, 630.0, 903.0, 1364.0, 2071.0, 3225.0, 4776.0, 7571.0, 12188.0, 19247.0, 30649.0, 47907.0, 73980.0, 106532.0, 138380.0, 150542.0, 137991.0, 105519.0, 72940.0, 47833.0, 30269.0, 19102.0, 12109.0, 7521.0, 4860.0, 3004.0, 1980.0, 1368.0, 915.0, 588.0, 428.0, 298.0, 154.0, 147.0, 86.0, 45.0, 40.0, 36.0, 26.0, 18.0, 10.0, 3.0, 5.0, 4.0, 2.0, 2.0], "bins": [-4.6171875, -4.47930908203125, -4.3414306640625, -4.20355224609375, -4.065673828125, -3.92779541015625, -3.7899169921875, -3.65203857421875, -3.51416015625, -3.37628173828125, -3.2384033203125, -3.10052490234375, -2.962646484375, -2.82476806640625, -2.6868896484375, -2.54901123046875, -2.4111328125, -2.27325439453125, -2.1353759765625, -1.99749755859375, -1.859619140625, -1.72174072265625, -1.5838623046875, -1.44598388671875, -1.30810546875, -1.17022705078125, -1.0323486328125, -0.89447021484375, -0.756591796875, -0.61871337890625, -0.4808349609375, -0.34295654296875, -0.205078125, -0.06719970703125, 0.0706787109375, 0.20855712890625, 0.346435546875, 0.48431396484375, 0.6221923828125, 0.76007080078125, 0.89794921875, 1.03582763671875, 1.1737060546875, 1.31158447265625, 1.449462890625, 1.58734130859375, 1.7252197265625, 1.86309814453125, 2.0009765625, 2.13885498046875, 2.2767333984375, 2.41461181640625, 2.552490234375, 2.69036865234375, 2.8282470703125, 2.96612548828125, 3.10400390625, 3.24188232421875, 3.3797607421875, 3.51763916015625, 3.655517578125, 3.79339599609375, 3.9312744140625, 4.06915283203125, 4.20703125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 7.0, 4.0, 10.0, 13.0, 12.0, 13.0, 17.0, 27.0, 28.0, 27.0, 30.0, 35.0, 31.0, 29.0, 44.0, 42.0, 45.0, 43.0, 39.0, 29.0, 38.0, 47.0, 36.0, 35.0, 42.0, 35.0, 41.0, 31.0, 21.0, 23.0, 22.0, 19.0, 19.0, 19.0, 9.0, 12.0, 5.0, 8.0, 5.0, 3.0, 6.0, 1.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.00390625, -2.917327880859375, -2.83074951171875, -2.744171142578125, -2.6575927734375, -2.571014404296875, -2.48443603515625, -2.397857666015625, -2.311279296875, -2.224700927734375, -2.13812255859375, -2.051544189453125, -1.9649658203125, -1.878387451171875, -1.79180908203125, -1.705230712890625, -1.61865234375, -1.532073974609375, -1.44549560546875, -1.358917236328125, -1.2723388671875, -1.185760498046875, -1.09918212890625, -1.012603759765625, -0.926025390625, -0.839447021484375, -0.75286865234375, -0.666290283203125, -0.5797119140625, -0.493133544921875, -0.40655517578125, -0.319976806640625, -0.2333984375, -0.146820068359375, -0.06024169921875, 0.026336669921875, 0.1129150390625, 0.199493408203125, 0.28607177734375, 0.372650146484375, 0.459228515625, 0.545806884765625, 0.63238525390625, 0.718963623046875, 0.8055419921875, 0.892120361328125, 0.97869873046875, 1.065277099609375, 1.15185546875, 1.238433837890625, 1.32501220703125, 1.411590576171875, 1.4981689453125, 1.584747314453125, 1.67132568359375, 1.757904052734375, 1.844482421875, 1.931060791015625, 2.01763916015625, 2.104217529296875, 2.1907958984375, 2.277374267578125, 2.36395263671875, 2.450531005859375, 2.537109375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 11.0, 19.0, 20.0, 37.0, 50.0, 65.0, 112.0, 132.0, 173.0, 248.0, 378.0, 545.0, 777.0, 1268.0, 1879.0, 3177.0, 5505.0, 9817.0, 18416.0, 36199.0, 72541.0, 139870.0, 218760.0, 226060.0, 149274.0, 78977.0, 38957.0, 19696.0, 10447.0, 5826.0, 3285.0, 2040.0, 1298.0, 818.0, 559.0, 376.0, 271.0, 197.0, 125.0, 99.0, 69.0, 53.0, 35.0, 38.0, 10.0, 14.0, 11.0, 6.0, 2.0, 3.0, 3.0, 2.0, 3.0], "bins": [-2.701171875, -2.621856689453125, -2.54254150390625, -2.463226318359375, -2.3839111328125, -2.304595947265625, -2.22528076171875, -2.145965576171875, -2.066650390625, -1.987335205078125, -1.90802001953125, -1.828704833984375, -1.7493896484375, -1.670074462890625, -1.59075927734375, -1.511444091796875, -1.43212890625, -1.352813720703125, -1.27349853515625, -1.194183349609375, -1.1148681640625, -1.035552978515625, -0.95623779296875, -0.876922607421875, -0.797607421875, -0.718292236328125, -0.63897705078125, -0.559661865234375, -0.4803466796875, -0.401031494140625, -0.32171630859375, -0.242401123046875, -0.1630859375, -0.083770751953125, -0.00445556640625, 0.074859619140625, 0.1541748046875, 0.233489990234375, 0.31280517578125, 0.392120361328125, 0.471435546875, 0.550750732421875, 0.63006591796875, 0.709381103515625, 0.7886962890625, 0.868011474609375, 0.94732666015625, 1.026641845703125, 1.10595703125, 1.185272216796875, 1.26458740234375, 1.343902587890625, 1.4232177734375, 1.502532958984375, 1.58184814453125, 1.661163330078125, 1.740478515625, 1.819793701171875, 1.89910888671875, 1.978424072265625, 2.0577392578125, 2.137054443359375, 2.21636962890625, 2.295684814453125, 2.375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 8.0, 4.0, 22.0, 19.0, 27.0, 27.0, 46.0, 43.0, 57.0, 92.0, 86.0, 98.0, 93.0, 79.0, 53.0, 57.0, 50.0, 34.0, 21.0, 21.0, 15.0, 9.0, 10.0, 13.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.00041484832763671875, -0.0004055984318256378, -0.0003963485360145569, -0.00038709864020347595, -0.000377848744392395, -0.0003685988485813141, -0.00035934895277023315, -0.0003500990569591522, -0.0003408491611480713, -0.00033159926533699036, -0.0003223493695259094, -0.0003130994737148285, -0.00030384957790374756, -0.0002945996820926666, -0.0002853497862815857, -0.00027609989047050476, -0.00026684999465942383, -0.0002576000988483429, -0.00024835020303726196, -0.00023910030722618103, -0.0002298504114151001, -0.00022060051560401917, -0.00021135061979293823, -0.0002021007239818573, -0.00019285082817077637, -0.00018360093235969543, -0.0001743510365486145, -0.00016510114073753357, -0.00015585124492645264, -0.0001466013491153717, -0.00013735145330429077, -0.00012810155749320984, -0.0001188516616821289, -0.00010960176587104797, -0.00010035187005996704, -9.110197424888611e-05, -8.185207843780518e-05, -7.260218262672424e-05, -6.335228681564331e-05, -5.410239100456238e-05, -4.4852495193481445e-05, -3.560259938240051e-05, -2.635270357131958e-05, -1.7102807760238647e-05, -7.852911949157715e-06, 1.3969838619232178e-06, 1.064687967300415e-05, 1.9896775484085083e-05, 2.9146671295166016e-05, 3.839656710624695e-05, 4.764646291732788e-05, 5.6896358728408813e-05, 6.614625453948975e-05, 7.539615035057068e-05, 8.464604616165161e-05, 9.389594197273254e-05, 0.00010314583778381348, 0.00011239573359489441, 0.00012164562940597534, 0.00013089552521705627, 0.0001401454210281372, 0.00014939531683921814, 0.00015864521265029907, 0.00016789510846138, 0.00017714500427246094]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 6.0, 9.0, 17.0, 12.0, 24.0, 34.0, 58.0, 67.0, 118.0, 175.0, 257.0, 414.0, 682.0, 1100.0, 1814.0, 3103.0, 5359.0, 9845.0, 19189.0, 39908.0, 83058.0, 160295.0, 239258.0, 220849.0, 131592.0, 65142.0, 31210.0, 15762.0, 8195.0, 4443.0, 2524.0, 1544.0, 898.0, 538.0, 356.0, 239.0, 146.0, 95.0, 76.0, 48.0, 30.0, 19.0, 11.0, 14.0, 4.0, 3.0, 6.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.5, -2.421478271484375, -2.34295654296875, -2.264434814453125, -2.1859130859375, -2.107391357421875, -2.02886962890625, -1.950347900390625, -1.871826171875, -1.793304443359375, -1.71478271484375, -1.636260986328125, -1.5577392578125, -1.479217529296875, -1.40069580078125, -1.322174072265625, -1.24365234375, -1.165130615234375, -1.08660888671875, -1.008087158203125, -0.9295654296875, -0.851043701171875, -0.77252197265625, -0.694000244140625, -0.615478515625, -0.536956787109375, -0.45843505859375, -0.379913330078125, -0.3013916015625, -0.222869873046875, -0.14434814453125, -0.065826416015625, 0.0126953125, 0.091217041015625, 0.16973876953125, 0.248260498046875, 0.3267822265625, 0.405303955078125, 0.48382568359375, 0.562347412109375, 0.640869140625, 0.719390869140625, 0.79791259765625, 0.876434326171875, 0.9549560546875, 1.033477783203125, 1.11199951171875, 1.190521240234375, 1.26904296875, 1.347564697265625, 1.42608642578125, 1.504608154296875, 1.5831298828125, 1.661651611328125, 1.74017333984375, 1.818695068359375, 1.897216796875, 1.975738525390625, 2.05426025390625, 2.132781982421875, 2.2113037109375, 2.289825439453125, 2.36834716796875, 2.446868896484375, 2.525390625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 2.0, 4.0, 2.0, 4.0, 7.0, 4.0, 6.0, 14.0, 8.0, 8.0, 12.0, 12.0, 14.0, 22.0, 23.0, 25.0, 33.0, 32.0, 44.0, 46.0, 42.0, 66.0, 49.0, 57.0, 54.0, 51.0, 43.0, 49.0, 41.0, 27.0, 34.0, 41.0, 30.0, 21.0, 19.0, 16.0, 11.0, 8.0, 4.0, 5.0, 5.0, 4.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46240234375, -0.444915771484375, -0.42742919921875, -0.409942626953125, -0.3924560546875, -0.374969482421875, -0.35748291015625, -0.339996337890625, -0.322509765625, -0.305023193359375, -0.28753662109375, -0.270050048828125, -0.2525634765625, -0.235076904296875, -0.21759033203125, -0.200103759765625, -0.1826171875, -0.165130615234375, -0.14764404296875, -0.130157470703125, -0.1126708984375, -0.095184326171875, -0.07769775390625, -0.060211181640625, -0.042724609375, -0.025238037109375, -0.00775146484375, 0.009735107421875, 0.0272216796875, 0.044708251953125, 0.06219482421875, 0.079681396484375, 0.09716796875, 0.114654541015625, 0.13214111328125, 0.149627685546875, 0.1671142578125, 0.184600830078125, 0.20208740234375, 0.219573974609375, 0.237060546875, 0.254547119140625, 0.27203369140625, 0.289520263671875, 0.3070068359375, 0.324493408203125, 0.34197998046875, 0.359466552734375, 0.376953125, 0.394439697265625, 0.41192626953125, 0.429412841796875, 0.4468994140625, 0.464385986328125, 0.48187255859375, 0.499359130859375, 0.516845703125, 0.534332275390625, 0.55181884765625, 0.569305419921875, 0.5867919921875, 0.604278564453125, 0.62176513671875, 0.639251708984375, 0.65673828125]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 4.0, 2.0, 5.0, 9.0, 7.0, 10.0, 12.0, 19.0, 19.0, 35.0, 41.0, 42.0, 49.0, 69.0, 64.0, 74.0, 93.0, 81.0, 67.0, 68.0, 48.0, 46.0, 32.0, 25.0, 30.0, 12.0, 9.0, 5.0, 14.0, 7.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.590655326843262, -10.321578979492188, -10.052502632141113, -9.783426284790039, -9.514350891113281, -9.245274543762207, -8.976198196411133, -8.707121849060059, -8.438045501708984, -8.16896915435791, -7.899892807006836, -7.63081693649292, -7.361740589141846, -7.0926642417907715, -6.8235883712768555, -6.554512023925781, -6.285435676574707, -6.016359329223633, -5.747282981872559, -5.478207111358643, -5.209130764007568, -4.940054416656494, -4.670978546142578, -4.401902198791504, -4.13282585144043, -3.8637495040893555, -3.5946733951568604, -3.3255972862243652, -3.056520938873291, -2.787444591522217, -2.5183684825897217, -2.2492923736572266, -1.9802160263061523, -1.7111397981643677, -1.442063570022583, -1.1729873418807983, -0.9039111137390137, -0.634834885597229, -0.36575865745544434, -0.09668242931365967, 0.172393798828125, 0.44147002696990967, 0.7105462551116943, 0.979622483253479, 1.2486987113952637, 1.5177749395370483, 1.786851167678833, 2.055927276611328, 2.3250036239624023, 2.5940799713134766, 2.8631560802459717, 3.132232189178467, 3.401308536529541, 3.6703848838806152, 3.9394609928131104, 4.2085371017456055, 4.47761344909668, 4.746689796447754, 5.015766143798828, 5.284842014312744, 5.553918361663818, 5.822994709014893, 6.092070579528809, 6.361146926879883, 6.630223274230957]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 6.0, 7.0, 7.0, 6.0, 13.0, 13.0, 12.0, 18.0, 7.0, 18.0, 26.0, 23.0, 41.0, 34.0, 46.0, 35.0, 34.0, 26.0, 28.0, 40.0, 42.0, 42.0, 48.0, 39.0, 33.0, 42.0, 33.0, 43.0, 25.0, 25.0, 30.0, 25.0, 18.0, 23.0, 17.0, 11.0, 9.0, 9.0, 6.0, 8.0, 13.0, 6.0, 2.0, 5.0, 2.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.17221736907959, -4.0430169105529785, -3.9138166904449463, -3.784616470336914, -3.6554160118103027, -3.5262157917022705, -3.3970155715942383, -3.267815113067627, -3.1386148929595947, -3.0094146728515625, -2.880214214324951, -2.751013994216919, -2.6218137741088867, -2.4926133155822754, -2.363413095474243, -2.234212875366211, -2.1050124168395996, -1.9758120775222778, -1.846611738204956, -1.7174115180969238, -1.588211178779602, -1.4590108394622803, -1.329810619354248, -1.2006102800369263, -1.0714099407196045, -0.9422096014022827, -0.8130093216896057, -0.6838090419769287, -0.5546087026596069, -0.42540836334228516, -0.29620808362960815, -0.16700780391693115, -0.03780698776245117, 0.09139332175254822, 0.2205936312675476, 0.349793940782547, 0.4789942502975464, 0.6081945896148682, 0.7373948693275452, 0.8665951490402222, 0.995795488357544, 1.1249958276748657, 1.2541961669921875, 1.3833963871002197, 1.5125967264175415, 1.6417970657348633, 1.7709972858428955, 1.9001976251602173, 2.029397964477539, 2.1585981845855713, 2.2877986431121826, 2.416998863220215, 2.546199321746826, 2.6753995418548584, 2.8045997619628906, 2.933800220489502, 3.063000440597534, 3.1922006607055664, 3.3214011192321777, 3.45060133934021, 3.579801559448242, 3.7090020179748535, 3.8382022380828857, 3.967402458190918, 4.096602916717529]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 6.0, 8.0, 15.0, 15.0, 19.0, 43.0, 60.0, 77.0, 138.0, 221.0, 388.0, 665.0, 1221.0, 2207.0, 4004.0, 7323.0, 14534.0, 30164.0, 71018.0, 195507.0, 623944.0, 1506508.0, 1140742.0, 380077.0, 124164.0, 47775.0, 21203.0, 10337.0, 5215.0, 2831.0, 1536.0, 928.0, 551.0, 314.0, 210.0, 105.0, 77.0, 50.0, 34.0, 18.0, 12.0, 11.0, 9.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5703125, -8.3006591796875, -8.031005859375, -7.7613525390625, -7.49169921875, -7.2220458984375, -6.952392578125, -6.6827392578125, -6.4130859375, -6.1434326171875, -5.873779296875, -5.6041259765625, -5.33447265625, -5.0648193359375, -4.795166015625, -4.5255126953125, -4.255859375, -3.9862060546875, -3.716552734375, -3.4468994140625, -3.17724609375, -2.9075927734375, -2.637939453125, -2.3682861328125, -2.0986328125, -1.8289794921875, -1.559326171875, -1.2896728515625, -1.02001953125, -0.7503662109375, -0.480712890625, -0.2110595703125, 0.05859375, 0.3282470703125, 0.597900390625, 0.8675537109375, 1.13720703125, 1.4068603515625, 1.676513671875, 1.9461669921875, 2.2158203125, 2.4854736328125, 2.755126953125, 3.0247802734375, 3.29443359375, 3.5640869140625, 3.833740234375, 4.1033935546875, 4.373046875, 4.6427001953125, 4.912353515625, 5.1820068359375, 5.45166015625, 5.7213134765625, 5.990966796875, 6.2606201171875, 6.5302734375, 6.7999267578125, 7.069580078125, 7.3392333984375, 7.60888671875, 7.8785400390625, 8.148193359375, 8.4178466796875, 8.6875]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 8.0, 5.0, 12.0, 5.0, 10.0, 19.0, 9.0, 18.0, 23.0, 21.0, 34.0, 38.0, 34.0, 31.0, 26.0, 43.0, 37.0, 50.0, 55.0, 44.0, 45.0, 36.0, 42.0, 46.0, 37.0, 32.0, 38.0, 35.0, 32.0, 18.0, 23.0, 17.0, 14.0, 10.0, 9.0, 8.0, 8.0, 6.0, 11.0, 4.0, 6.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.599609375, -3.4892578125, -3.37890625, -3.2685546875, -3.158203125, -3.0478515625, -2.9375, -2.8271484375, -2.716796875, -2.6064453125, -2.49609375, -2.3857421875, -2.275390625, -2.1650390625, -2.0546875, -1.9443359375, -1.833984375, -1.7236328125, -1.61328125, -1.5029296875, -1.392578125, -1.2822265625, -1.171875, -1.0615234375, -0.951171875, -0.8408203125, -0.73046875, -0.6201171875, -0.509765625, -0.3994140625, -0.2890625, -0.1787109375, -0.068359375, 0.0419921875, 0.15234375, 0.2626953125, 0.373046875, 0.4833984375, 0.59375, 0.7041015625, 0.814453125, 0.9248046875, 1.03515625, 1.1455078125, 1.255859375, 1.3662109375, 1.4765625, 1.5869140625, 1.697265625, 1.8076171875, 1.91796875, 2.0283203125, 2.138671875, 2.2490234375, 2.359375, 2.4697265625, 2.580078125, 2.6904296875, 2.80078125, 2.9111328125, 3.021484375, 3.1318359375, 3.2421875, 3.3525390625, 3.462890625]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 6.0, 12.0, 23.0, 26.0, 28.0, 54.0, 95.0, 126.0, 223.0, 392.0, 702.0, 1212.0, 2310.0, 4645.0, 9439.0, 20666.0, 47499.0, 118977.0, 331640.0, 959137.0, 1546169.0, 734860.0, 252007.0, 93027.0, 38010.0, 16767.0, 7855.0, 3824.0, 1984.0, 1063.0, 586.0, 359.0, 229.0, 115.0, 76.0, 45.0, 30.0, 20.0, 10.0, 10.0, 9.0, 2.0, 6.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-10.59375, -10.2855224609375, -9.977294921875, -9.6690673828125, -9.36083984375, -9.0526123046875, -8.744384765625, -8.4361572265625, -8.1279296875, -7.8197021484375, -7.511474609375, -7.2032470703125, -6.89501953125, -6.5867919921875, -6.278564453125, -5.9703369140625, -5.662109375, -5.3538818359375, -5.045654296875, -4.7374267578125, -4.42919921875, -4.1209716796875, -3.812744140625, -3.5045166015625, -3.1962890625, -2.8880615234375, -2.579833984375, -2.2716064453125, -1.96337890625, -1.6551513671875, -1.346923828125, -1.0386962890625, -0.73046875, -0.4222412109375, -0.114013671875, 0.1942138671875, 0.50244140625, 0.8106689453125, 1.118896484375, 1.4271240234375, 1.7353515625, 2.0435791015625, 2.351806640625, 2.6600341796875, 2.96826171875, 3.2764892578125, 3.584716796875, 3.8929443359375, 4.201171875, 4.5093994140625, 4.817626953125, 5.1258544921875, 5.43408203125, 5.7423095703125, 6.050537109375, 6.3587646484375, 6.6669921875, 6.9752197265625, 7.283447265625, 7.5916748046875, 7.89990234375, 8.2081298828125, 8.516357421875, 8.8245849609375, 9.1328125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 1.0, 6.0, 9.0, 10.0, 10.0, 10.0, 19.0, 28.0, 26.0, 45.0, 57.0, 65.0, 83.0, 97.0, 118.0, 155.0, 194.0, 253.0, 295.0, 327.0, 337.0, 333.0, 296.0, 269.0, 226.0, 164.0, 137.0, 118.0, 79.0, 72.0, 63.0, 43.0, 29.0, 25.0, 21.0, 16.0, 10.0, 10.0, 6.0, 6.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.03125, -1.962677001953125, -1.89410400390625, -1.825531005859375, -1.7569580078125, -1.688385009765625, -1.61981201171875, -1.551239013671875, -1.482666015625, -1.414093017578125, -1.34552001953125, -1.276947021484375, -1.2083740234375, -1.139801025390625, -1.07122802734375, -1.002655029296875, -0.93408203125, -0.865509033203125, -0.79693603515625, -0.728363037109375, -0.6597900390625, -0.591217041015625, -0.52264404296875, -0.454071044921875, -0.385498046875, -0.316925048828125, -0.24835205078125, -0.179779052734375, -0.1112060546875, -0.042633056640625, 0.02593994140625, 0.094512939453125, 0.1630859375, 0.231658935546875, 0.30023193359375, 0.368804931640625, 0.4373779296875, 0.505950927734375, 0.57452392578125, 0.643096923828125, 0.711669921875, 0.780242919921875, 0.84881591796875, 0.917388916015625, 0.9859619140625, 1.054534912109375, 1.12310791015625, 1.191680908203125, 1.26025390625, 1.328826904296875, 1.39739990234375, 1.465972900390625, 1.5345458984375, 1.603118896484375, 1.67169189453125, 1.740264892578125, 1.808837890625, 1.877410888671875, 1.94598388671875, 2.014556884765625, 2.0831298828125, 2.151702880859375, 2.22027587890625, 2.288848876953125, 2.357421875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 10.0, 12.0, 8.0, 20.0, 17.0, 18.0, 37.0, 29.0, 54.0, 42.0, 49.0, 55.0, 59.0, 64.0, 71.0, 74.0, 56.0, 53.0, 50.0, 43.0, 35.0, 24.0, 15.0, 19.0, 13.0, 13.0, 10.0, 9.0, 6.0, 6.0, 3.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-8.342803001403809, -8.111039161682129, -7.879275321960449, -7.6475114822387695, -7.415748119354248, -7.183984279632568, -6.952220439910889, -6.720456600189209, -6.488692760467529, -6.25692892074585, -6.02516508102417, -5.793401718139648, -5.561637878417969, -5.329874038696289, -5.098110198974609, -4.86634635925293, -4.63458251953125, -4.40281867980957, -4.171054840087891, -3.93929123878479, -3.7075273990631104, -3.4757637977600098, -3.24399995803833, -3.0122361183166504, -2.780472755432129, -2.548708915710449, -2.3169453144073486, -2.085181474685669, -1.8534176349639893, -1.6216539144515991, -1.389890193939209, -1.1581263542175293, -0.9263625144958496, -0.6945987343788147, -0.4628349840641022, -0.23107123374938965, 0.0006925463676452637, 0.23245632648468018, 0.4642200469970703, 0.69598388671875, 0.9277476072311401, 1.1595113277435303, 1.39127516746521, 1.6230388879776, 1.8548026084899902, 2.08656644821167, 2.3183302879333496, 2.5500941276550293, 2.78185772895813, 3.0136215686798096, 3.24538516998291, 3.47714900970459, 3.7089128494262695, 3.940676689147949, 4.172440528869629, 4.404204368591309, 4.63596773147583, 4.86773157119751, 5.0994954109191895, 5.331258773803711, 5.563022613525391, 5.79478645324707, 6.02655029296875, 6.25831413269043, 6.490077972412109]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 3.0, 0.0, 3.0, 3.0, 1.0, 3.0, 6.0, 10.0, 5.0, 11.0, 11.0, 17.0, 19.0, 15.0, 17.0, 23.0, 18.0, 17.0, 28.0, 38.0, 26.0, 35.0, 36.0, 29.0, 29.0, 42.0, 32.0, 45.0, 39.0, 40.0, 35.0, 40.0, 28.0, 39.0, 37.0, 24.0, 23.0, 17.0, 20.0, 26.0, 16.0, 14.0, 12.0, 8.0, 7.0, 14.0, 8.0, 8.0, 4.0, 7.0, 3.0, 2.0, 3.0, 2.0, 8.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.578434467315674, -3.460970163345337, -3.343505859375, -3.226041555404663, -3.108577251434326, -2.9911129474639893, -2.8736486434936523, -2.7561841011047363, -2.6387200355529785, -2.5212557315826416, -2.4037914276123047, -2.2863271236419678, -2.168862819671631, -2.051398515701294, -1.9339340925216675, -1.8164697885513306, -1.699005365371704, -1.5815410614013672, -1.4640767574310303, -1.3466124534606934, -1.2291481494903564, -1.1116838455200195, -0.9942194223403931, -0.8767551183700562, -0.7592908143997192, -0.6418265104293823, -0.5243622064590454, -0.4068978428840637, -0.2894335389137268, -0.1719692349433899, -0.0545048713684082, 0.06295943260192871, 0.18042397499084473, 0.29788827896118164, 0.41535261273384094, 0.5328169465065002, 0.6502812504768372, 0.7677455544471741, 0.8852099180221558, 1.0026742219924927, 1.1201385259628296, 1.2376028299331665, 1.3550671339035034, 1.4725315570831299, 1.5899958610534668, 1.7074601650238037, 1.8249244689941406, 1.9423887729644775, 2.0598530769348145, 2.1773173809051514, 2.2947816848754883, 2.412245988845825, 2.529710292816162, 2.647174596786499, 2.764638900756836, 2.882103443145752, 2.9995675086975098, 3.1170318126678467, 3.2344961166381836, 3.3519604206085205, 3.4694247245788574, 3.5868890285491943, 3.7043533325195312, 3.8218178749084473, 3.939282178878784]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 3.0, 10.0, 9.0, 10.0, 21.0, 36.0, 55.0, 63.0, 113.0, 166.0, 250.0, 388.0, 550.0, 779.0, 1291.0, 2181.0, 3958.0, 7851.0, 17993.0, 46803.0, 132439.0, 316747.0, 309460.0, 127531.0, 45139.0, 17178.0, 7766.0, 3780.0, 2220.0, 1293.0, 780.0, 566.0, 360.0, 280.0, 175.0, 110.0, 66.0, 47.0, 39.0, 16.0, 11.0, 9.0, 9.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.83984375, -7.609130859375, -7.37841796875, -7.147705078125, -6.9169921875, -6.686279296875, -6.45556640625, -6.224853515625, -5.994140625, -5.763427734375, -5.53271484375, -5.302001953125, -5.0712890625, -4.840576171875, -4.60986328125, -4.379150390625, -4.1484375, -3.917724609375, -3.68701171875, -3.456298828125, -3.2255859375, -2.994873046875, -2.76416015625, -2.533447265625, -2.302734375, -2.072021484375, -1.84130859375, -1.610595703125, -1.3798828125, -1.149169921875, -0.91845703125, -0.687744140625, -0.45703125, -0.226318359375, 0.00439453125, 0.235107421875, 0.4658203125, 0.696533203125, 0.92724609375, 1.157958984375, 1.388671875, 1.619384765625, 1.85009765625, 2.080810546875, 2.3115234375, 2.542236328125, 2.77294921875, 3.003662109375, 3.234375, 3.465087890625, 3.69580078125, 3.926513671875, 4.1572265625, 4.387939453125, 4.61865234375, 4.849365234375, 5.080078125, 5.310791015625, 5.54150390625, 5.772216796875, 6.0029296875, 6.233642578125, 6.46435546875, 6.695068359375, 6.92578125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 2.0, 9.0, 7.0, 15.0, 9.0, 10.0, 15.0, 18.0, 25.0, 16.0, 25.0, 20.0, 26.0, 31.0, 33.0, 41.0, 45.0, 45.0, 49.0, 46.0, 39.0, 43.0, 49.0, 39.0, 27.0, 39.0, 31.0, 35.0, 30.0, 35.0, 25.0, 17.0, 13.0, 14.0, 13.0, 6.0, 12.0, 11.0, 5.0, 7.0, 7.0, 5.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-4.48828125, -4.345703125, -4.203125, -4.060546875, -3.91796875, -3.775390625, -3.6328125, -3.490234375, -3.34765625, -3.205078125, -3.0625, -2.919921875, -2.77734375, -2.634765625, -2.4921875, -2.349609375, -2.20703125, -2.064453125, -1.921875, -1.779296875, -1.63671875, -1.494140625, -1.3515625, -1.208984375, -1.06640625, -0.923828125, -0.78125, -0.638671875, -0.49609375, -0.353515625, -0.2109375, -0.068359375, 0.07421875, 0.216796875, 0.359375, 0.501953125, 0.64453125, 0.787109375, 0.9296875, 1.072265625, 1.21484375, 1.357421875, 1.5, 1.642578125, 1.78515625, 1.927734375, 2.0703125, 2.212890625, 2.35546875, 2.498046875, 2.640625, 2.783203125, 2.92578125, 3.068359375, 3.2109375, 3.353515625, 3.49609375, 3.638671875, 3.78125, 3.923828125, 4.06640625, 4.208984375, 4.3515625, 4.494140625, 4.63671875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 5.0, 6.0, 8.0, 15.0, 15.0, 21.0, 22.0, 41.0, 41.0, 65.0, 92.0, 129.0, 210.0, 282.0, 495.0, 825.0, 1398.0, 2826.0, 6695.0, 20826.0, 91770.0, 436171.0, 380208.0, 76389.0, 17874.0, 5985.0, 2638.0, 1378.0, 781.0, 444.0, 279.0, 177.0, 117.0, 97.0, 63.0, 58.0, 22.0, 32.0, 15.0, 9.0, 11.0, 7.0, 3.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.6328125, -13.24267578125, -12.8525390625, -12.46240234375, -12.072265625, -11.68212890625, -11.2919921875, -10.90185546875, -10.51171875, -10.12158203125, -9.7314453125, -9.34130859375, -8.951171875, -8.56103515625, -8.1708984375, -7.78076171875, -7.390625, -7.00048828125, -6.6103515625, -6.22021484375, -5.830078125, -5.43994140625, -5.0498046875, -4.65966796875, -4.26953125, -3.87939453125, -3.4892578125, -3.09912109375, -2.708984375, -2.31884765625, -1.9287109375, -1.53857421875, -1.1484375, -0.75830078125, -0.3681640625, 0.02197265625, 0.412109375, 0.80224609375, 1.1923828125, 1.58251953125, 1.97265625, 2.36279296875, 2.7529296875, 3.14306640625, 3.533203125, 3.92333984375, 4.3134765625, 4.70361328125, 5.09375, 5.48388671875, 5.8740234375, 6.26416015625, 6.654296875, 7.04443359375, 7.4345703125, 7.82470703125, 8.21484375, 8.60498046875, 8.9951171875, 9.38525390625, 9.775390625, 10.16552734375, 10.5556640625, 10.94580078125, 11.3359375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 4.0, 8.0, 11.0, 10.0, 14.0, 10.0, 23.0, 33.0, 22.0, 34.0, 36.0, 32.0, 45.0, 50.0, 40.0, 63.0, 43.0, 47.0, 46.0, 40.0, 49.0, 41.0, 37.0, 44.0, 39.0, 40.0, 22.0, 24.0, 16.0, 13.0, 21.0, 11.0, 14.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.623046875, -3.518707275390625, -3.41436767578125, -3.310028076171875, -3.2056884765625, -3.101348876953125, -2.99700927734375, -2.892669677734375, -2.788330078125, -2.683990478515625, -2.57965087890625, -2.475311279296875, -2.3709716796875, -2.266632080078125, -2.16229248046875, -2.057952880859375, -1.95361328125, -1.849273681640625, -1.74493408203125, -1.640594482421875, -1.5362548828125, -1.431915283203125, -1.32757568359375, -1.223236083984375, -1.118896484375, -1.014556884765625, -0.91021728515625, -0.805877685546875, -0.7015380859375, -0.597198486328125, -0.49285888671875, -0.388519287109375, -0.2841796875, -0.179840087890625, -0.07550048828125, 0.028839111328125, 0.1331787109375, 0.237518310546875, 0.34185791015625, 0.446197509765625, 0.550537109375, 0.654876708984375, 0.75921630859375, 0.863555908203125, 0.9678955078125, 1.072235107421875, 1.17657470703125, 1.280914306640625, 1.38525390625, 1.489593505859375, 1.59393310546875, 1.698272705078125, 1.8026123046875, 1.906951904296875, 2.01129150390625, 2.115631103515625, 2.219970703125, 2.324310302734375, 2.42864990234375, 2.532989501953125, 2.6373291015625, 2.741668701171875, 2.84600830078125, 2.950347900390625, 3.0546875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 9.0, 12.0, 26.0, 34.0, 34.0, 53.0, 66.0, 96.0, 126.0, 187.0, 312.0, 444.0, 680.0, 1168.0, 2129.0, 4057.0, 9225.0, 24669.0, 79881.0, 297960.0, 431619.0, 132823.0, 37923.0, 13080.0, 5456.0, 2644.0, 1413.0, 821.0, 493.0, 311.0, 226.0, 140.0, 111.0, 85.0, 70.0, 42.0, 38.0, 26.0, 17.0, 14.0, 4.0, 3.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.91015625, -4.75762939453125, -4.6051025390625, -4.45257568359375, -4.300048828125, -4.14752197265625, -3.9949951171875, -3.84246826171875, -3.68994140625, -3.53741455078125, -3.3848876953125, -3.23236083984375, -3.079833984375, -2.92730712890625, -2.7747802734375, -2.62225341796875, -2.4697265625, -2.31719970703125, -2.1646728515625, -2.01214599609375, -1.859619140625, -1.70709228515625, -1.5545654296875, -1.40203857421875, -1.24951171875, -1.09698486328125, -0.9444580078125, -0.79193115234375, -0.639404296875, -0.48687744140625, -0.3343505859375, -0.18182373046875, -0.029296875, 0.12322998046875, 0.2757568359375, 0.42828369140625, 0.580810546875, 0.73333740234375, 0.8858642578125, 1.03839111328125, 1.19091796875, 1.34344482421875, 1.4959716796875, 1.64849853515625, 1.801025390625, 1.95355224609375, 2.1060791015625, 2.25860595703125, 2.4111328125, 2.56365966796875, 2.7161865234375, 2.86871337890625, 3.021240234375, 3.17376708984375, 3.3262939453125, 3.47882080078125, 3.63134765625, 3.78387451171875, 3.9364013671875, 4.08892822265625, 4.241455078125, 4.39398193359375, 4.5465087890625, 4.69903564453125, 4.8515625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 6.0, 22.0, 23.0, 38.0, 76.0, 91.0, 128.0, 143.0, 129.0, 110.0, 69.0, 45.0, 35.0, 24.0, 13.0, 12.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002982616424560547, -0.0002888627350330353, -0.00027946382761001587, -0.00027006492018699646, -0.00026066601276397705, -0.00025126710534095764, -0.00024186819791793823, -0.00023246929049491882, -0.00022307038307189941, -0.00021367147564888, -0.0002042725682258606, -0.0001948736608028412, -0.00018547475337982178, -0.00017607584595680237, -0.00016667693853378296, -0.00015727803111076355, -0.00014787912368774414, -0.00013848021626472473, -0.00012908130884170532, -0.00011968240141868591, -0.0001102834939956665, -0.0001008845865726471, -9.148567914962769e-05, -8.208677172660828e-05, -7.268786430358887e-05, -6.328895688056946e-05, -5.389004945755005e-05, -4.449114203453064e-05, -3.509223461151123e-05, -2.569332718849182e-05, -1.6294419765472412e-05, -6.895512342453003e-06, 2.5033950805664062e-06, 1.1902302503585815e-05, 2.1301209926605225e-05, 3.0700117349624634e-05, 4.009902477264404e-05, 4.949793219566345e-05, 5.889683961868286e-05, 6.829574704170227e-05, 7.769465446472168e-05, 8.709356188774109e-05, 9.64924693107605e-05, 0.00010589137673377991, 0.00011529028415679932, 0.00012468919157981873, 0.00013408809900283813, 0.00014348700642585754, 0.00015288591384887695, 0.00016228482127189636, 0.00017168372869491577, 0.00018108263611793518, 0.0001904815435409546, 0.000199880450963974, 0.0002092793583869934, 0.00021867826581001282, 0.00022807717323303223, 0.00023747608065605164, 0.00024687498807907104, 0.00025627389550209045, 0.00026567280292510986, 0.00027507171034812927, 0.0002844706177711487, 0.0002938695251941681, 0.0003032684326171875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 9.0, 18.0, 17.0, 26.0, 39.0, 59.0, 74.0, 120.0, 159.0, 253.0, 320.0, 490.0, 709.0, 901.0, 1371.0, 2056.0, 3183.0, 5742.0, 13686.0, 41265.0, 143240.0, 377627.0, 306688.0, 97728.0, 28923.0, 10412.0, 4776.0, 2793.0, 1788.0, 1173.0, 831.0, 576.0, 448.0, 310.0, 218.0, 155.0, 107.0, 74.0, 51.0, 39.0, 33.0, 13.0, 12.0, 8.0, 6.0, 6.0, 7.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.234375, -4.10546875, -3.9765625, -3.84765625, -3.71875, -3.58984375, -3.4609375, -3.33203125, -3.203125, -3.07421875, -2.9453125, -2.81640625, -2.6875, -2.55859375, -2.4296875, -2.30078125, -2.171875, -2.04296875, -1.9140625, -1.78515625, -1.65625, -1.52734375, -1.3984375, -1.26953125, -1.140625, -1.01171875, -0.8828125, -0.75390625, -0.625, -0.49609375, -0.3671875, -0.23828125, -0.109375, 0.01953125, 0.1484375, 0.27734375, 0.40625, 0.53515625, 0.6640625, 0.79296875, 0.921875, 1.05078125, 1.1796875, 1.30859375, 1.4375, 1.56640625, 1.6953125, 1.82421875, 1.953125, 2.08203125, 2.2109375, 2.33984375, 2.46875, 2.59765625, 2.7265625, 2.85546875, 2.984375, 3.11328125, 3.2421875, 3.37109375, 3.5, 3.62890625, 3.7578125, 3.88671875, 4.015625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 12.0, 3.0, 11.0, 40.0, 79.0, 107.0, 163.0, 164.0, 153.0, 100.0, 73.0, 48.0, 20.0, 10.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.5341796875, -1.483734130859375, -1.43328857421875, -1.382843017578125, -1.3323974609375, -1.281951904296875, -1.23150634765625, -1.181060791015625, -1.130615234375, -1.080169677734375, -1.02972412109375, -0.979278564453125, -0.9288330078125, -0.878387451171875, -0.82794189453125, -0.777496337890625, -0.72705078125, -0.676605224609375, -0.62615966796875, -0.575714111328125, -0.5252685546875, -0.474822998046875, -0.42437744140625, -0.373931884765625, -0.323486328125, -0.273040771484375, -0.22259521484375, -0.172149658203125, -0.1217041015625, -0.071258544921875, -0.02081298828125, 0.029632568359375, 0.080078125, 0.130523681640625, 0.18096923828125, 0.231414794921875, 0.2818603515625, 0.332305908203125, 0.38275146484375, 0.433197021484375, 0.483642578125, 0.534088134765625, 0.58453369140625, 0.634979248046875, 0.6854248046875, 0.735870361328125, 0.78631591796875, 0.836761474609375, 0.88720703125, 0.937652587890625, 0.98809814453125, 1.038543701171875, 1.0889892578125, 1.139434814453125, 1.18988037109375, 1.240325927734375, 1.290771484375, 1.341217041015625, 1.39166259765625, 1.442108154296875, 1.4925537109375, 1.542999267578125, 1.59344482421875, 1.643890380859375, 1.6943359375]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 6.0, 8.0, 2.0, 8.0, 5.0, 13.0, 14.0, 14.0, 24.0, 23.0, 33.0, 38.0, 43.0, 43.0, 48.0, 56.0, 66.0, 65.0, 71.0, 65.0, 59.0, 62.0, 38.0, 41.0, 35.0, 20.0, 20.0, 13.0, 11.0, 13.0, 15.0, 3.0, 7.0, 4.0, 2.0, 2.0, 3.0, 5.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.847781181335449, -7.621734619140625, -7.395688056945801, -7.169641017913818, -6.943594455718994, -6.71754789352417, -6.4915008544921875, -6.265454292297363, -6.039407730102539, -5.813361167907715, -5.587314605712891, -5.361267566680908, -5.135221004486084, -4.90917444229126, -4.683127403259277, -4.457080841064453, -4.231034278869629, -4.004987716674805, -3.7789409160614014, -3.552894115447998, -3.326847553253174, -3.1008009910583496, -2.8747541904449463, -2.648707389831543, -2.4226608276367188, -2.1966142654418945, -1.9705674648284912, -1.7445207834243774, -1.5184741020202637, -1.29242742061615, -1.0663807392120361, -0.8403340578079224, -0.6142868995666504, -0.3882402181625366, -0.16219353675842285, 0.06385314464569092, 0.2898998260498047, 0.5159465074539185, 0.7419931888580322, 0.968039870262146, 1.1940865516662598, 1.4201332330703735, 1.6461799144744873, 1.872226595878601, 2.098273277282715, 2.324319839477539, 2.5503666400909424, 2.7764134407043457, 3.00246000289917, 3.228506565093994, 3.4545533657073975, 3.680600166320801, 3.906646728515625, 4.132693290710449, 4.358739852905273, 4.584786891937256, 4.81083345413208, 5.036880016326904, 5.262927055358887, 5.488973617553711, 5.715020179748535, 5.941066741943359, 6.167113304138184, 6.393160343170166, 6.61920690536499]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 6.0, 6.0, 7.0, 9.0, 9.0, 9.0, 16.0, 14.0, 27.0, 24.0, 12.0, 28.0, 21.0, 31.0, 24.0, 41.0, 38.0, 35.0, 28.0, 35.0, 41.0, 37.0, 43.0, 37.0, 49.0, 36.0, 34.0, 37.0, 35.0, 28.0, 19.0, 21.0, 26.0, 19.0, 18.0, 14.0, 8.0, 8.0, 16.0, 13.0, 7.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.6926181316375732, -3.572848081588745, -3.453077793121338, -3.3333077430725098, -3.2135376930236816, -3.0937674045562744, -2.9739973545074463, -2.854227066040039, -2.734457015991211, -2.614686965942383, -2.4949166774749756, -2.3751466274261475, -2.2553763389587402, -2.135606288909912, -2.015836238861084, -1.8960660696029663, -1.7762959003448486, -1.656525731086731, -1.5367555618286133, -1.4169855117797852, -1.2972153425216675, -1.1774451732635498, -1.0576751232147217, -0.937904953956604, -0.8181347846984863, -0.6983646154403687, -0.5785945057868958, -0.45882436633110046, -0.3390542268753052, -0.2192840576171875, -0.0995139479637146, 0.0202561616897583, 0.14002633094787598, 0.25979647040367126, 0.37956660985946655, 0.49933674931526184, 0.6191068887710571, 0.7388770580291748, 0.8586471676826477, 0.9784172773361206, 1.0981874465942383, 1.217957615852356, 1.3377277851104736, 1.4574978351593018, 1.5772680044174194, 1.697038173675537, 1.8168082237243652, 1.936578392982483, 2.0563485622406006, 2.1761186122894287, 2.295888900756836, 2.415658950805664, 2.535429000854492, 2.6551992893218994, 2.7749693393707275, 2.8947396278381348, 3.014509677886963, 3.134279727935791, 3.2540500164031982, 3.3738200664520264, 3.4935903549194336, 3.6133604049682617, 3.73313045501709, 3.852900505065918, 3.972670793533325]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 6.0, 5.0, 5.0, 8.0, 22.0, 18.0, 24.0, 49.0, 67.0, 108.0, 199.0, 348.0, 595.0, 1084.0, 2030.0, 3974.0, 8197.0, 16959.0, 37287.0, 84823.0, 176687.0, 267605.0, 227071.0, 120141.0, 54072.0, 23883.0, 11425.0, 5512.0, 2812.0, 1532.0, 812.0, 497.0, 263.0, 155.0, 75.0, 66.0, 59.0, 24.0, 24.0, 17.0, 9.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.390625, -8.1175537109375, -7.844482421875, -7.5714111328125, -7.29833984375, -7.0252685546875, -6.752197265625, -6.4791259765625, -6.2060546875, -5.9329833984375, -5.659912109375, -5.3868408203125, -5.11376953125, -4.8406982421875, -4.567626953125, -4.2945556640625, -4.021484375, -3.7484130859375, -3.475341796875, -3.2022705078125, -2.92919921875, -2.6561279296875, -2.383056640625, -2.1099853515625, -1.8369140625, -1.5638427734375, -1.290771484375, -1.0177001953125, -0.74462890625, -0.4715576171875, -0.198486328125, 0.0745849609375, 0.34765625, 0.6207275390625, 0.893798828125, 1.1668701171875, 1.43994140625, 1.7130126953125, 1.986083984375, 2.2591552734375, 2.5322265625, 2.8052978515625, 3.078369140625, 3.3514404296875, 3.62451171875, 3.8975830078125, 4.170654296875, 4.4437255859375, 4.716796875, 4.9898681640625, 5.262939453125, 5.5360107421875, 5.80908203125, 6.0821533203125, 6.355224609375, 6.6282958984375, 6.9013671875, 7.1744384765625, 7.447509765625, 7.7205810546875, 7.99365234375, 8.2667236328125, 8.539794921875, 8.8128662109375, 9.0859375]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 5.0, 3.0, 11.0, 12.0, 10.0, 11.0, 14.0, 23.0, 30.0, 27.0, 18.0, 22.0, 35.0, 34.0, 34.0, 37.0, 25.0, 54.0, 36.0, 39.0, 41.0, 41.0, 47.0, 34.0, 36.0, 44.0, 38.0, 31.0, 29.0, 27.0, 21.0, 18.0, 15.0, 21.0, 20.0, 10.0, 5.0, 6.0, 7.0, 4.0, 3.0, 5.0, 4.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.57421875, -4.43212890625, -4.2900390625, -4.14794921875, -4.005859375, -3.86376953125, -3.7216796875, -3.57958984375, -3.4375, -3.29541015625, -3.1533203125, -3.01123046875, -2.869140625, -2.72705078125, -2.5849609375, -2.44287109375, -2.30078125, -2.15869140625, -2.0166015625, -1.87451171875, -1.732421875, -1.59033203125, -1.4482421875, -1.30615234375, -1.1640625, -1.02197265625, -0.8798828125, -0.73779296875, -0.595703125, -0.45361328125, -0.3115234375, -0.16943359375, -0.02734375, 0.11474609375, 0.2568359375, 0.39892578125, 0.541015625, 0.68310546875, 0.8251953125, 0.96728515625, 1.109375, 1.25146484375, 1.3935546875, 1.53564453125, 1.677734375, 1.81982421875, 1.9619140625, 2.10400390625, 2.24609375, 2.38818359375, 2.5302734375, 2.67236328125, 2.814453125, 2.95654296875, 3.0986328125, 3.24072265625, 3.3828125, 3.52490234375, 3.6669921875, 3.80908203125, 3.951171875, 4.09326171875, 4.2353515625, 4.37744140625, 4.51953125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 17.0, 11.0, 26.0, 33.0, 47.0, 76.0, 116.0, 172.0, 257.0, 357.0, 553.0, 800.0, 1193.0, 1898.0, 2887.0, 4443.0, 7007.0, 11174.0, 18142.0, 29103.0, 46486.0, 72115.0, 106570.0, 141297.0, 158299.0, 141930.0, 106388.0, 72593.0, 46229.0, 29140.0, 18062.0, 11105.0, 7290.0, 4474.0, 2794.0, 1774.0, 1220.0, 818.0, 544.0, 367.0, 228.0, 161.0, 114.0, 81.0, 68.0, 32.0, 19.0, 22.0, 8.0, 7.0, 6.0, 4.0, 3.0, 3.0], "bins": [-5.578125, -5.41644287109375, -5.2547607421875, -5.09307861328125, -4.931396484375, -4.76971435546875, -4.6080322265625, -4.44635009765625, -4.28466796875, -4.12298583984375, -3.9613037109375, -3.79962158203125, -3.637939453125, -3.47625732421875, -3.3145751953125, -3.15289306640625, -2.9912109375, -2.82952880859375, -2.6678466796875, -2.50616455078125, -2.344482421875, -2.18280029296875, -2.0211181640625, -1.85943603515625, -1.69775390625, -1.53607177734375, -1.3743896484375, -1.21270751953125, -1.051025390625, -0.88934326171875, -0.7276611328125, -0.56597900390625, -0.404296875, -0.24261474609375, -0.0809326171875, 0.08074951171875, 0.242431640625, 0.40411376953125, 0.5657958984375, 0.72747802734375, 0.88916015625, 1.05084228515625, 1.2125244140625, 1.37420654296875, 1.535888671875, 1.69757080078125, 1.8592529296875, 2.02093505859375, 2.1826171875, 2.34429931640625, 2.5059814453125, 2.66766357421875, 2.829345703125, 2.99102783203125, 3.1527099609375, 3.31439208984375, 3.47607421875, 3.63775634765625, 3.7994384765625, 3.96112060546875, 4.122802734375, 4.28448486328125, 4.4461669921875, 4.60784912109375, 4.76953125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 5.0, 11.0, 4.0, 11.0, 11.0, 19.0, 20.0, 20.0, 26.0, 18.0, 32.0, 34.0, 33.0, 30.0, 35.0, 32.0, 43.0, 39.0, 50.0, 46.0, 48.0, 42.0, 38.0, 37.0, 48.0, 33.0, 29.0, 38.0, 40.0, 18.0, 17.0, 18.0, 15.0, 14.0, 13.0, 15.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.275390625, -3.18011474609375, -3.0848388671875, -2.98956298828125, -2.894287109375, -2.79901123046875, -2.7037353515625, -2.60845947265625, -2.51318359375, -2.41790771484375, -2.3226318359375, -2.22735595703125, -2.132080078125, -2.03680419921875, -1.9415283203125, -1.84625244140625, -1.7509765625, -1.65570068359375, -1.5604248046875, -1.46514892578125, -1.369873046875, -1.27459716796875, -1.1793212890625, -1.08404541015625, -0.98876953125, -0.89349365234375, -0.7982177734375, -0.70294189453125, -0.607666015625, -0.51239013671875, -0.4171142578125, -0.32183837890625, -0.2265625, -0.13128662109375, -0.0360107421875, 0.05926513671875, 0.154541015625, 0.24981689453125, 0.3450927734375, 0.44036865234375, 0.53564453125, 0.63092041015625, 0.7261962890625, 0.82147216796875, 0.916748046875, 1.01202392578125, 1.1072998046875, 1.20257568359375, 1.2978515625, 1.39312744140625, 1.4884033203125, 1.58367919921875, 1.678955078125, 1.77423095703125, 1.8695068359375, 1.96478271484375, 2.06005859375, 2.15533447265625, 2.2506103515625, 2.34588623046875, 2.441162109375, 2.53643798828125, 2.6317138671875, 2.72698974609375, 2.822265625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 11.0, 8.0, 8.0, 17.0, 18.0, 24.0, 42.0, 50.0, 73.0, 139.0, 184.0, 248.0, 339.0, 475.0, 773.0, 1081.0, 1645.0, 2582.0, 4085.0, 7062.0, 13398.0, 27502.0, 64829.0, 174434.0, 339687.0, 240116.0, 93075.0, 36729.0, 17014.0, 8741.0, 5128.0, 3079.0, 1955.0, 1231.0, 810.0, 624.0, 413.0, 251.0, 189.0, 152.0, 99.0, 60.0, 38.0, 40.0, 31.0, 17.0, 17.0, 12.0, 6.0, 6.0, 7.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.2421875, -5.081787109375, -4.92138671875, -4.760986328125, -4.6005859375, -4.440185546875, -4.27978515625, -4.119384765625, -3.958984375, -3.798583984375, -3.63818359375, -3.477783203125, -3.3173828125, -3.156982421875, -2.99658203125, -2.836181640625, -2.67578125, -2.515380859375, -2.35498046875, -2.194580078125, -2.0341796875, -1.873779296875, -1.71337890625, -1.552978515625, -1.392578125, -1.232177734375, -1.07177734375, -0.911376953125, -0.7509765625, -0.590576171875, -0.43017578125, -0.269775390625, -0.109375, 0.051025390625, 0.21142578125, 0.371826171875, 0.5322265625, 0.692626953125, 0.85302734375, 1.013427734375, 1.173828125, 1.334228515625, 1.49462890625, 1.655029296875, 1.8154296875, 1.975830078125, 2.13623046875, 2.296630859375, 2.45703125, 2.617431640625, 2.77783203125, 2.938232421875, 3.0986328125, 3.259033203125, 3.41943359375, 3.579833984375, 3.740234375, 3.900634765625, 4.06103515625, 4.221435546875, 4.3818359375, 4.542236328125, 4.70263671875, 4.863037109375, 5.0234375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 9.0, 4.0, 16.0, 10.0, 23.0, 29.0, 46.0, 61.0, 97.0, 120.0, 156.0, 139.0, 89.0, 70.0, 50.0, 29.0, 11.0, 10.0, 11.0, 4.0, 5.0, 3.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0008454322814941406, -0.0008250437676906586, -0.0008046552538871765, -0.0007842667400836945, -0.0007638782262802124, -0.0007434897124767303, -0.0007231011986732483, -0.0007027126848697662, -0.0006823241710662842, -0.0006619356572628021, -0.0006415471434593201, -0.000621158629655838, -0.000600770115852356, -0.0005803816020488739, -0.0005599930882453918, -0.0005396045744419098, -0.0005192160606384277, -0.0004988275468349457, -0.0004784390330314636, -0.00045805051922798157, -0.0004376620054244995, -0.00041727349162101746, -0.0003968849778175354, -0.00037649646401405334, -0.0003561079502105713, -0.00033571943640708923, -0.0003153309226036072, -0.0002949424088001251, -0.00027455389499664307, -0.000254165381193161, -0.00023377686738967896, -0.0002133883535861969, -0.00019299983978271484, -0.0001726113259792328, -0.00015222281217575073, -0.00013183429837226868, -0.00011144578456878662, -9.105727076530457e-05, -7.066875696182251e-05, -5.0280243158340454e-05, -2.98917293548584e-05, -9.503215551376343e-06, 1.0885298252105713e-05, 3.127381205558777e-05, 5.1662325859069824e-05, 7.205083966255188e-05, 9.243935346603394e-05, 0.00011282786726951599, 0.00013321638107299805, 0.0001536048948764801, 0.00017399340867996216, 0.00019438192248344421, 0.00021477043628692627, 0.00023515895009040833, 0.0002555474638938904, 0.00027593597769737244, 0.0002963244915008545, 0.00031671300530433655, 0.0003371015191078186, 0.00035749003291130066, 0.0003778785467147827, 0.00039826706051826477, 0.0004186555743217468, 0.0004390440881252289, 0.00045943260192871094]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 10.0, 10.0, 13.0, 28.0, 29.0, 45.0, 76.0, 96.0, 174.0, 263.0, 394.0, 624.0, 887.0, 1439.0, 2201.0, 3497.0, 5693.0, 9670.0, 17202.0, 32204.0, 65876.0, 137498.0, 238489.0, 243914.0, 142511.0, 68248.0, 33824.0, 17706.0, 9891.0, 5894.0, 3687.0, 2313.0, 1468.0, 967.0, 620.0, 367.0, 235.0, 161.0, 132.0, 69.0, 47.0, 28.0, 25.0, 9.0, 9.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.40234375, -3.296112060546875, -3.18988037109375, -3.083648681640625, -2.9774169921875, -2.871185302734375, -2.76495361328125, -2.658721923828125, -2.552490234375, -2.446258544921875, -2.34002685546875, -2.233795166015625, -2.1275634765625, -2.021331787109375, -1.91510009765625, -1.808868408203125, -1.70263671875, -1.596405029296875, -1.49017333984375, -1.383941650390625, -1.2777099609375, -1.171478271484375, -1.06524658203125, -0.959014892578125, -0.852783203125, -0.746551513671875, -0.64031982421875, -0.534088134765625, -0.4278564453125, -0.321624755859375, -0.21539306640625, -0.109161376953125, -0.0029296875, 0.103302001953125, 0.20953369140625, 0.315765380859375, 0.4219970703125, 0.528228759765625, 0.63446044921875, 0.740692138671875, 0.846923828125, 0.953155517578125, 1.05938720703125, 1.165618896484375, 1.2718505859375, 1.378082275390625, 1.48431396484375, 1.590545654296875, 1.69677734375, 1.803009033203125, 1.90924072265625, 2.015472412109375, 2.1217041015625, 2.227935791015625, 2.33416748046875, 2.440399169921875, 2.546630859375, 2.652862548828125, 2.75909423828125, 2.865325927734375, 2.9715576171875, 3.077789306640625, 3.18402099609375, 3.290252685546875, 3.396484375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 8.0, 11.0, 10.0, 18.0, 18.0, 22.0, 19.0, 23.0, 47.0, 64.0, 41.0, 56.0, 56.0, 67.0, 67.0, 64.0, 61.0, 56.0, 42.0, 30.0, 30.0, 40.0, 25.0, 25.0, 15.0, 12.0, 14.0, 6.0, 9.0, 8.0, 4.0, 6.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.81640625, -0.790283203125, -0.76416015625, -0.738037109375, -0.7119140625, -0.685791015625, -0.65966796875, -0.633544921875, -0.607421875, -0.581298828125, -0.55517578125, -0.529052734375, -0.5029296875, -0.476806640625, -0.45068359375, -0.424560546875, -0.3984375, -0.372314453125, -0.34619140625, -0.320068359375, -0.2939453125, -0.267822265625, -0.24169921875, -0.215576171875, -0.189453125, -0.163330078125, -0.13720703125, -0.111083984375, -0.0849609375, -0.058837890625, -0.03271484375, -0.006591796875, 0.01953125, 0.045654296875, 0.07177734375, 0.097900390625, 0.1240234375, 0.150146484375, 0.17626953125, 0.202392578125, 0.228515625, 0.254638671875, 0.28076171875, 0.306884765625, 0.3330078125, 0.359130859375, 0.38525390625, 0.411376953125, 0.4375, 0.463623046875, 0.48974609375, 0.515869140625, 0.5419921875, 0.568115234375, 0.59423828125, 0.620361328125, 0.646484375, 0.672607421875, 0.69873046875, 0.724853515625, 0.7509765625, 0.777099609375, 0.80322265625, 0.829345703125, 0.85546875]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 3.0, 3.0, 5.0, 11.0, 7.0, 12.0, 11.0, 13.0, 16.0, 20.0, 30.0, 25.0, 31.0, 28.0, 40.0, 34.0, 39.0, 62.0, 67.0, 64.0, 57.0, 64.0, 54.0, 47.0, 52.0, 29.0, 29.0, 13.0, 26.0, 20.0, 14.0, 9.0, 10.0, 11.0, 11.0, 3.0, 6.0, 2.0, 3.0, 1.0, 4.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.40284538269043, -6.201117038726807, -5.999388694763184, -5.797659873962402, -5.595931529998779, -5.394203186035156, -5.192474365234375, -4.990746021270752, -4.789017677307129, -4.587289333343506, -4.385560989379883, -4.183832168579102, -3.9821038246154785, -3.7803754806518555, -3.5786468982696533, -3.376918315887451, -3.175189971923828, -2.973461627960205, -2.771733045578003, -2.570004463195801, -2.3682761192321777, -2.1665477752685547, -1.9648191928863525, -1.76309072971344, -1.5613622665405273, -1.3596338033676147, -1.1579053401947021, -0.9561768770217896, -0.754448413848877, -0.5527199506759644, -0.35099148750305176, -0.14926302433013916, 0.05246591567993164, 0.25419437885284424, 0.45592284202575684, 0.6576513051986694, 0.859379768371582, 1.0611082315444946, 1.2628366947174072, 1.4645651578903198, 1.6662936210632324, 1.868022084236145, 2.0697505474090576, 2.2714791297912598, 2.473207473754883, 2.674935817718506, 2.876664400100708, 3.07839298248291, 3.280121326446533, 3.4818496704101562, 3.6835782527923584, 3.8853068351745605, 4.087035179138184, 4.288763523101807, 4.49049186706543, 4.692220687866211, 4.893949031829834, 5.095677375793457, 5.297406196594238, 5.499134540557861, 5.700862884521484, 5.902591228485107, 6.1043195724487305, 6.306048393249512, 6.507776737213135]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 1.0, 3.0, 3.0, 5.0, 7.0, 9.0, 11.0, 5.0, 17.0, 13.0, 22.0, 19.0, 28.0, 26.0, 20.0, 28.0, 25.0, 33.0, 41.0, 42.0, 32.0, 41.0, 48.0, 37.0, 49.0, 45.0, 38.0, 38.0, 27.0, 43.0, 33.0, 28.0, 34.0, 34.0, 27.0, 17.0, 10.0, 12.0, 8.0, 8.0, 8.0, 8.0, 8.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-4.52749490737915, -4.39070463180542, -4.2539143562316895, -4.117124557495117, -3.9803342819213867, -3.8435440063476562, -3.706753730773926, -3.5699634552001953, -3.433173418045044, -3.2963831424713135, -3.159593105316162, -3.0228028297424316, -2.886012554168701, -2.74922251701355, -2.6124322414398193, -2.475642204284668, -2.3388519287109375, -2.202061653137207, -2.0652716159820557, -1.9284813404083252, -1.7916911840438843, -1.6549010276794434, -1.518110752105713, -1.381320595741272, -1.244530439376831, -1.1077402830123901, -0.9709500670433044, -0.8341598510742188, -0.6973696947097778, -0.5605795383453369, -0.4237893223762512, -0.2869991064071655, -0.1502084732055664, -0.0134182870388031, 0.1233718991279602, 0.2601620852947235, 0.3969522714614868, 0.5337424278259277, 0.6705326437950134, 0.8073228597640991, 0.94411301612854, 1.080903172492981, 1.2176933288574219, 1.3544836044311523, 1.4912737607955933, 1.6280639171600342, 1.7648541927337646, 1.9016443490982056, 2.0384345054626465, 2.175224781036377, 2.3120148181915283, 2.448805093765259, 2.58559513092041, 2.7223854064941406, 2.859175682067871, 2.9959659576416016, 3.132755994796753, 3.2695462703704834, 3.4063363075256348, 3.5431265830993652, 3.6799168586730957, 3.816706895828247, 3.9534971714019775, 4.090287208557129, 4.227077484130859]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 12.0, 15.0, 21.0, 31.0, 47.0, 63.0, 112.0, 181.0, 252.0, 452.0, 750.0, 1388.0, 2432.0, 4699.0, 9699.0, 21073.0, 49377.0, 129991.0, 404757.0, 1294012.0, 1497458.0, 520023.0, 156567.0, 56460.0, 23088.0, 10428.0, 5008.0, 2514.0, 1378.0, 803.0, 445.0, 273.0, 174.0, 102.0, 66.0, 50.0, 28.0, 19.0, 9.0, 5.0, 7.0, 2.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8046875, -10.496826171875, -10.18896484375, -9.881103515625, -9.5732421875, -9.265380859375, -8.95751953125, -8.649658203125, -8.341796875, -8.033935546875, -7.72607421875, -7.418212890625, -7.1103515625, -6.802490234375, -6.49462890625, -6.186767578125, -5.87890625, -5.571044921875, -5.26318359375, -4.955322265625, -4.6474609375, -4.339599609375, -4.03173828125, -3.723876953125, -3.416015625, -3.108154296875, -2.80029296875, -2.492431640625, -2.1845703125, -1.876708984375, -1.56884765625, -1.260986328125, -0.953125, -0.645263671875, -0.33740234375, -0.029541015625, 0.2783203125, 0.586181640625, 0.89404296875, 1.201904296875, 1.509765625, 1.817626953125, 2.12548828125, 2.433349609375, 2.7412109375, 3.049072265625, 3.35693359375, 3.664794921875, 3.97265625, 4.280517578125, 4.58837890625, 4.896240234375, 5.2041015625, 5.511962890625, 5.81982421875, 6.127685546875, 6.435546875, 6.743408203125, 7.05126953125, 7.359130859375, 7.6669921875, 7.974853515625, 8.28271484375, 8.590576171875, 8.8984375]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 3.0, 0.0, 7.0, 4.0, 9.0, 7.0, 14.0, 11.0, 6.0, 7.0, 17.0, 25.0, 29.0, 28.0, 19.0, 34.0, 37.0, 27.0, 30.0, 28.0, 31.0, 40.0, 32.0, 39.0, 33.0, 36.0, 36.0, 37.0, 36.0, 42.0, 35.0, 30.0, 32.0, 27.0, 30.0, 26.0, 21.0, 20.0, 12.0, 11.0, 14.0, 7.0, 6.0, 6.0, 4.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0], "bins": [-3.224609375, -3.12750244140625, -3.0303955078125, -2.93328857421875, -2.836181640625, -2.73907470703125, -2.6419677734375, -2.54486083984375, -2.44775390625, -2.35064697265625, -2.2535400390625, -2.15643310546875, -2.059326171875, -1.96221923828125, -1.8651123046875, -1.76800537109375, -1.6708984375, -1.57379150390625, -1.4766845703125, -1.37957763671875, -1.282470703125, -1.18536376953125, -1.0882568359375, -0.99114990234375, -0.89404296875, -0.79693603515625, -0.6998291015625, -0.60272216796875, -0.505615234375, -0.40850830078125, -0.3114013671875, -0.21429443359375, -0.1171875, -0.02008056640625, 0.0770263671875, 0.17413330078125, 0.271240234375, 0.36834716796875, 0.4654541015625, 0.56256103515625, 0.65966796875, 0.75677490234375, 0.8538818359375, 0.95098876953125, 1.048095703125, 1.14520263671875, 1.2423095703125, 1.33941650390625, 1.4365234375, 1.53363037109375, 1.6307373046875, 1.72784423828125, 1.824951171875, 1.92205810546875, 2.0191650390625, 2.11627197265625, 2.21337890625, 2.31048583984375, 2.4075927734375, 2.50469970703125, 2.601806640625, 2.69891357421875, 2.7960205078125, 2.89312744140625, 2.990234375]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 8.0, 13.0, 14.0, 24.0, 35.0, 34.0, 65.0, 109.0, 138.0, 217.0, 311.0, 474.0, 716.0, 1120.0, 1799.0, 2953.0, 4976.0, 8432.0, 15062.0, 28188.0, 55741.0, 114211.0, 248538.0, 546234.0, 1058596.0, 1064039.0, 552250.0, 251805.0, 116231.0, 56396.0, 28846.0, 15343.0, 8423.0, 4908.0, 2951.0, 1847.0, 1104.0, 671.0, 474.0, 338.0, 224.0, 138.0, 93.0, 57.0, 38.0, 42.0, 17.0, 13.0, 11.0, 8.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.6796875, -7.43975830078125, -7.1998291015625, -6.95989990234375, -6.719970703125, -6.48004150390625, -6.2401123046875, -6.00018310546875, -5.76025390625, -5.52032470703125, -5.2803955078125, -5.04046630859375, -4.800537109375, -4.56060791015625, -4.3206787109375, -4.08074951171875, -3.8408203125, -3.60089111328125, -3.3609619140625, -3.12103271484375, -2.881103515625, -2.64117431640625, -2.4012451171875, -2.16131591796875, -1.92138671875, -1.68145751953125, -1.4415283203125, -1.20159912109375, -0.961669921875, -0.72174072265625, -0.4818115234375, -0.24188232421875, -0.001953125, 0.23797607421875, 0.4779052734375, 0.71783447265625, 0.957763671875, 1.19769287109375, 1.4376220703125, 1.67755126953125, 1.91748046875, 2.15740966796875, 2.3973388671875, 2.63726806640625, 2.877197265625, 3.11712646484375, 3.3570556640625, 3.59698486328125, 3.8369140625, 4.07684326171875, 4.3167724609375, 4.55670166015625, 4.796630859375, 5.03656005859375, 5.2764892578125, 5.51641845703125, 5.75634765625, 5.99627685546875, 6.2362060546875, 6.47613525390625, 6.716064453125, 6.95599365234375, 7.1959228515625, 7.43585205078125, 7.67578125]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 6.0, 9.0, 10.0, 14.0, 15.0, 22.0, 29.0, 53.0, 40.0, 60.0, 64.0, 107.0, 137.0, 176.0, 197.0, 285.0, 284.0, 303.0, 304.0, 352.0, 299.0, 270.0, 227.0, 182.0, 152.0, 128.0, 94.0, 61.0, 54.0, 31.0, 23.0, 22.0, 12.0, 15.0, 12.0, 6.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.26171875, -2.187957763671875, -2.11419677734375, -2.040435791015625, -1.9666748046875, -1.892913818359375, -1.81915283203125, -1.745391845703125, -1.671630859375, -1.597869873046875, -1.52410888671875, -1.450347900390625, -1.3765869140625, -1.302825927734375, -1.22906494140625, -1.155303955078125, -1.08154296875, -1.007781982421875, -0.93402099609375, -0.860260009765625, -0.7864990234375, -0.712738037109375, -0.63897705078125, -0.565216064453125, -0.491455078125, -0.417694091796875, -0.34393310546875, -0.270172119140625, -0.1964111328125, -0.122650146484375, -0.04888916015625, 0.024871826171875, 0.0986328125, 0.172393798828125, 0.24615478515625, 0.319915771484375, 0.3936767578125, 0.467437744140625, 0.54119873046875, 0.614959716796875, 0.688720703125, 0.762481689453125, 0.83624267578125, 0.910003662109375, 0.9837646484375, 1.057525634765625, 1.13128662109375, 1.205047607421875, 1.27880859375, 1.352569580078125, 1.42633056640625, 1.500091552734375, 1.5738525390625, 1.647613525390625, 1.72137451171875, 1.795135498046875, 1.868896484375, 1.942657470703125, 2.01641845703125, 2.090179443359375, 2.1639404296875, 2.237701416015625, 2.31146240234375, 2.385223388671875, 2.458984375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 8.0, 6.0, 5.0, 8.0, 9.0, 8.0, 19.0, 13.0, 24.0, 24.0, 23.0, 24.0, 41.0, 53.0, 62.0, 71.0, 58.0, 52.0, 72.0, 64.0, 62.0, 58.0, 26.0, 41.0, 36.0, 29.0, 19.0, 26.0, 15.0, 7.0, 6.0, 3.0, 6.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-7.171698570251465, -6.946063995361328, -6.72042989730835, -6.494795799255371, -6.269161224365234, -6.043526649475098, -5.817892551422119, -5.592258453369141, -5.366623878479004, -5.140989303588867, -4.915355205535889, -4.68972110748291, -4.464086532592773, -4.238451957702637, -4.012817859649658, -3.7871835231781006, -3.561549186706543, -3.3359148502349854, -3.1102805137634277, -2.88464617729187, -2.6590118408203125, -2.433377504348755, -2.2077431678771973, -1.9821088314056396, -1.756474494934082, -1.5308401584625244, -1.3052058219909668, -1.0795714855194092, -0.8539371490478516, -0.628302812576294, -0.40266847610473633, -0.1770341396331787, 0.048600196838378906, 0.2742345333099365, 0.49986886978149414, 0.7255032062530518, 0.9511375427246094, 1.176771879196167, 1.4024062156677246, 1.6280405521392822, 1.8536748886108398, 2.0793092250823975, 2.304943561553955, 2.5305778980255127, 2.7562122344970703, 2.981846570968628, 3.2074809074401855, 3.433115243911743, 3.658749580383301, 3.8843839168548584, 4.110018253326416, 4.3356523513793945, 4.561286926269531, 4.786921501159668, 5.0125555992126465, 5.238189697265625, 5.463824272155762, 5.689458847045898, 5.915092945098877, 6.1407270431518555, 6.366361618041992, 6.591996192932129, 6.817630290985107, 7.043264389038086, 7.268898963928223]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 5.0, 7.0, 7.0, 6.0, 11.0, 16.0, 14.0, 15.0, 22.0, 25.0, 24.0, 32.0, 31.0, 33.0, 46.0, 41.0, 50.0, 36.0, 45.0, 46.0, 45.0, 35.0, 48.0, 37.0, 29.0, 38.0, 36.0, 38.0, 30.0, 22.0, 19.0, 20.0, 19.0, 12.0, 13.0, 6.0, 5.0, 6.0, 6.0, 2.0, 6.0, 6.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.1419172286987305, -4.007763862609863, -3.873610496520996, -3.739457130432129, -3.6053037643432617, -3.4711503982543945, -3.3369970321655273, -3.20284366607666, -3.068690299987793, -2.934536933898926, -2.8003835678100586, -2.6662302017211914, -2.532076835632324, -2.397923469543457, -2.26377010345459, -2.1296167373657227, -1.9954633712768555, -1.8613100051879883, -1.727156639099121, -1.593003273010254, -1.4588499069213867, -1.3246965408325195, -1.1905431747436523, -1.0563898086547852, -0.922236442565918, -0.7880830764770508, -0.6539297103881836, -0.5197763442993164, -0.3856229782104492, -0.25146961212158203, -0.11731624603271484, 0.016837120056152344, 0.15099000930786133, 0.2851433753967285, 0.4192967414855957, 0.5534501075744629, 0.6876034736633301, 0.8217568397521973, 0.9559102058410645, 1.0900635719299316, 1.2242169380187988, 1.358370304107666, 1.4925236701965332, 1.6266770362854004, 1.7608304023742676, 1.8949837684631348, 2.029137134552002, 2.163290500640869, 2.2974438667297363, 2.4315972328186035, 2.5657505989074707, 2.699903964996338, 2.834057331085205, 2.9682106971740723, 3.1023640632629395, 3.2365174293518066, 3.370670795440674, 3.504824161529541, 3.638977527618408, 3.7731308937072754, 3.9072842597961426, 4.04143762588501, 4.175590991973877, 4.309744358062744, 4.443897724151611]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 15.0, 15.0, 9.0, 32.0, 38.0, 62.0, 97.0, 133.0, 211.0, 370.0, 559.0, 1114.0, 2046.0, 3951.0, 8041.0, 16915.0, 37131.0, 80593.0, 163113.0, 253932.0, 230815.0, 131526.0, 62725.0, 28431.0, 13253.0, 6327.0, 3294.0, 1609.0, 896.0, 528.0, 267.0, 187.0, 108.0, 68.0, 45.0, 31.0, 28.0, 18.0, 13.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0], "bins": [-5.78515625, -5.62371826171875, -5.4622802734375, -5.30084228515625, -5.139404296875, -4.97796630859375, -4.8165283203125, -4.65509033203125, -4.49365234375, -4.33221435546875, -4.1707763671875, -4.00933837890625, -3.847900390625, -3.68646240234375, -3.5250244140625, -3.36358642578125, -3.2021484375, -3.04071044921875, -2.8792724609375, -2.71783447265625, -2.556396484375, -2.39495849609375, -2.2335205078125, -2.07208251953125, -1.91064453125, -1.74920654296875, -1.5877685546875, -1.42633056640625, -1.264892578125, -1.10345458984375, -0.9420166015625, -0.78057861328125, -0.619140625, -0.45770263671875, -0.2962646484375, -0.13482666015625, 0.026611328125, 0.18804931640625, 0.3494873046875, 0.51092529296875, 0.67236328125, 0.83380126953125, 0.9952392578125, 1.15667724609375, 1.318115234375, 1.47955322265625, 1.6409912109375, 1.80242919921875, 1.9638671875, 2.12530517578125, 2.2867431640625, 2.44818115234375, 2.609619140625, 2.77105712890625, 2.9324951171875, 3.09393310546875, 3.25537109375, 3.41680908203125, 3.5782470703125, 3.73968505859375, 3.901123046875, 4.06256103515625, 4.2239990234375, 4.38543701171875, 4.546875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 5.0, 10.0, 13.0, 14.0, 7.0, 15.0, 12.0, 11.0, 17.0, 28.0, 22.0, 27.0, 38.0, 29.0, 39.0, 49.0, 50.0, 46.0, 44.0, 43.0, 37.0, 48.0, 39.0, 29.0, 49.0, 38.0, 44.0, 25.0, 29.0, 22.0, 19.0, 23.0, 22.0, 11.0, 11.0, 9.0, 5.0, 4.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.72265625, -4.57403564453125, -4.4254150390625, -4.27679443359375, -4.128173828125, -3.97955322265625, -3.8309326171875, -3.68231201171875, -3.53369140625, -3.38507080078125, -3.2364501953125, -3.08782958984375, -2.939208984375, -2.79058837890625, -2.6419677734375, -2.49334716796875, -2.3447265625, -2.19610595703125, -2.0474853515625, -1.89886474609375, -1.750244140625, -1.60162353515625, -1.4530029296875, -1.30438232421875, -1.15576171875, -1.00714111328125, -0.8585205078125, -0.70989990234375, -0.561279296875, -0.41265869140625, -0.2640380859375, -0.11541748046875, 0.033203125, 0.18182373046875, 0.3304443359375, 0.47906494140625, 0.627685546875, 0.77630615234375, 0.9249267578125, 1.07354736328125, 1.22216796875, 1.37078857421875, 1.5194091796875, 1.66802978515625, 1.816650390625, 1.96527099609375, 2.1138916015625, 2.26251220703125, 2.4111328125, 2.55975341796875, 2.7083740234375, 2.85699462890625, 3.005615234375, 3.15423583984375, 3.3028564453125, 3.45147705078125, 3.60009765625, 3.74871826171875, 3.8973388671875, 4.04595947265625, 4.194580078125, 4.34320068359375, 4.4918212890625, 4.64044189453125, 4.7890625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 10.0, 9.0, 10.0, 16.0, 24.0, 14.0, 40.0, 53.0, 71.0, 105.0, 147.0, 242.0, 432.0, 640.0, 1134.0, 1978.0, 3832.0, 7859.0, 17155.0, 39680.0, 94290.0, 214437.0, 317632.0, 196749.0, 85308.0, 35541.0, 15570.0, 7352.0, 3557.0, 1875.0, 1085.0, 653.0, 374.0, 238.0, 152.0, 93.0, 64.0, 36.0, 32.0, 14.0, 16.0, 12.0, 9.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9140625, -5.71978759765625, -5.5255126953125, -5.33123779296875, -5.136962890625, -4.94268798828125, -4.7484130859375, -4.55413818359375, -4.35986328125, -4.16558837890625, -3.9713134765625, -3.77703857421875, -3.582763671875, -3.38848876953125, -3.1942138671875, -2.99993896484375, -2.8056640625, -2.61138916015625, -2.4171142578125, -2.22283935546875, -2.028564453125, -1.83428955078125, -1.6400146484375, -1.44573974609375, -1.25146484375, -1.05718994140625, -0.8629150390625, -0.66864013671875, -0.474365234375, -0.28009033203125, -0.0858154296875, 0.10845947265625, 0.302734375, 0.49700927734375, 0.6912841796875, 0.88555908203125, 1.079833984375, 1.27410888671875, 1.4683837890625, 1.66265869140625, 1.85693359375, 2.05120849609375, 2.2454833984375, 2.43975830078125, 2.634033203125, 2.82830810546875, 3.0225830078125, 3.21685791015625, 3.4111328125, 3.60540771484375, 3.7996826171875, 3.99395751953125, 4.188232421875, 4.38250732421875, 4.5767822265625, 4.77105712890625, 4.96533203125, 5.15960693359375, 5.3538818359375, 5.54815673828125, 5.742431640625, 5.93670654296875, 6.1309814453125, 6.32525634765625, 6.51953125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 8.0, 7.0, 8.0, 11.0, 7.0, 17.0, 11.0, 22.0, 15.0, 20.0, 13.0, 32.0, 24.0, 27.0, 26.0, 27.0, 34.0, 41.0, 38.0, 54.0, 40.0, 43.0, 34.0, 48.0, 47.0, 28.0, 40.0, 34.0, 22.0, 27.0, 18.0, 28.0, 25.0, 12.0, 20.0, 20.0, 13.0, 8.0, 9.0, 12.0, 5.0, 9.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.232421875, -2.15594482421875, -2.0794677734375, -2.00299072265625, -1.926513671875, -1.85003662109375, -1.7735595703125, -1.69708251953125, -1.62060546875, -1.54412841796875, -1.4676513671875, -1.39117431640625, -1.314697265625, -1.23822021484375, -1.1617431640625, -1.08526611328125, -1.0087890625, -0.93231201171875, -0.8558349609375, -0.77935791015625, -0.702880859375, -0.62640380859375, -0.5499267578125, -0.47344970703125, -0.39697265625, -0.32049560546875, -0.2440185546875, -0.16754150390625, -0.091064453125, -0.01458740234375, 0.0618896484375, 0.13836669921875, 0.21484375, 0.29132080078125, 0.3677978515625, 0.44427490234375, 0.520751953125, 0.59722900390625, 0.6737060546875, 0.75018310546875, 0.82666015625, 0.90313720703125, 0.9796142578125, 1.05609130859375, 1.132568359375, 1.20904541015625, 1.2855224609375, 1.36199951171875, 1.4384765625, 1.51495361328125, 1.5914306640625, 1.66790771484375, 1.744384765625, 1.82086181640625, 1.8973388671875, 1.97381591796875, 2.05029296875, 2.12677001953125, 2.2032470703125, 2.27972412109375, 2.356201171875, 2.43267822265625, 2.5091552734375, 2.58563232421875, 2.662109375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 8.0, 12.0, 32.0, 25.0, 19.0, 54.0, 102.0, 136.0, 218.0, 354.0, 600.0, 1112.0, 2267.0, 4441.0, 9464.0, 21324.0, 52917.0, 139139.0, 330258.0, 291309.0, 115918.0, 44011.0, 18425.0, 8206.0, 3883.0, 1905.0, 971.0, 581.0, 320.0, 190.0, 111.0, 74.0, 48.0, 43.0, 20.0, 17.0, 11.0, 8.0, 4.0, 4.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.2734375, -3.17083740234375, -3.0682373046875, -2.96563720703125, -2.863037109375, -2.76043701171875, -2.6578369140625, -2.55523681640625, -2.45263671875, -2.35003662109375, -2.2474365234375, -2.14483642578125, -2.042236328125, -1.93963623046875, -1.8370361328125, -1.73443603515625, -1.6318359375, -1.52923583984375, -1.4266357421875, -1.32403564453125, -1.221435546875, -1.11883544921875, -1.0162353515625, -0.91363525390625, -0.81103515625, -0.70843505859375, -0.6058349609375, -0.50323486328125, -0.400634765625, -0.29803466796875, -0.1954345703125, -0.09283447265625, 0.009765625, 0.11236572265625, 0.2149658203125, 0.31756591796875, 0.420166015625, 0.52276611328125, 0.6253662109375, 0.72796630859375, 0.83056640625, 0.93316650390625, 1.0357666015625, 1.13836669921875, 1.240966796875, 1.34356689453125, 1.4461669921875, 1.54876708984375, 1.6513671875, 1.75396728515625, 1.8565673828125, 1.95916748046875, 2.061767578125, 2.16436767578125, 2.2669677734375, 2.36956787109375, 2.47216796875, 2.57476806640625, 2.6773681640625, 2.77996826171875, 2.882568359375, 2.98516845703125, 3.0877685546875, 3.19036865234375, 3.29296875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 2.0, 4.0, 10.0, 9.0, 13.0, 17.0, 12.0, 27.0, 36.0, 54.0, 61.0, 67.0, 79.0, 84.0, 78.0, 80.0, 78.0, 59.0, 32.0, 44.0, 35.0, 32.0, 20.0, 14.0, 7.0, 10.0, 5.0, 5.0, 7.0, 5.0, 4.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016772747039794922, -0.0001629665493965149, -0.00015820562839508057, -0.00015344470739364624, -0.00014868378639221191, -0.0001439228653907776, -0.00013916194438934326, -0.00013440102338790894, -0.0001296401023864746, -0.00012487918138504028, -0.00012011826038360596, -0.00011535733938217163, -0.0001105964183807373, -0.00010583549737930298, -0.00010107457637786865, -9.631365537643433e-05, -9.1552734375e-05, -8.679181337356567e-05, -8.203089237213135e-05, -7.726997137069702e-05, -7.25090503692627e-05, -6.774812936782837e-05, -6.298720836639404e-05, -5.822628736495972e-05, -5.346536636352539e-05, -4.8704445362091064e-05, -4.394352436065674e-05, -3.918260335922241e-05, -3.4421682357788086e-05, -2.966076135635376e-05, -2.4899840354919434e-05, -2.0138919353485107e-05, -1.537799835205078e-05, -1.0617077350616455e-05, -5.856156349182129e-06, -1.0952353477478027e-06, 3.6656856536865234e-06, 8.42660665512085e-06, 1.3187527656555176e-05, 1.7948448657989502e-05, 2.2709369659423828e-05, 2.7470290660858154e-05, 3.223121166229248e-05, 3.699213266372681e-05, 4.175305366516113e-05, 4.651397466659546e-05, 5.1274895668029785e-05, 5.603581666946411e-05, 6.079673767089844e-05, 6.555765867233276e-05, 7.031857967376709e-05, 7.507950067520142e-05, 7.984042167663574e-05, 8.460134267807007e-05, 8.93622636795044e-05, 9.412318468093872e-05, 9.888410568237305e-05, 0.00010364502668380737, 0.0001084059476852417, 0.00011316686868667603, 0.00011792778968811035, 0.00012268871068954468, 0.000127449631690979, 0.00013221055269241333, 0.00013697147369384766]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 10.0, 7.0, 19.0, 17.0, 37.0, 53.0, 83.0, 120.0, 185.0, 279.0, 415.0, 650.0, 1046.0, 1658.0, 2696.0, 4464.0, 7565.0, 12817.0, 22438.0, 39646.0, 70663.0, 119475.0, 177096.0, 198157.0, 156994.0, 98795.0, 56967.0, 31767.0, 17847.0, 10520.0, 6217.0, 3566.0, 2308.0, 1421.0, 852.0, 609.0, 389.0, 247.0, 156.0, 101.0, 73.0, 40.0, 38.0, 22.0, 11.0, 4.0, 7.0, 4.0, 7.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.861328125, -1.805450439453125, -1.74957275390625, -1.693695068359375, -1.6378173828125, -1.581939697265625, -1.52606201171875, -1.470184326171875, -1.414306640625, -1.358428955078125, -1.30255126953125, -1.246673583984375, -1.1907958984375, -1.134918212890625, -1.07904052734375, -1.023162841796875, -0.96728515625, -0.911407470703125, -0.85552978515625, -0.799652099609375, -0.7437744140625, -0.687896728515625, -0.63201904296875, -0.576141357421875, -0.520263671875, -0.464385986328125, -0.40850830078125, -0.352630615234375, -0.2967529296875, -0.240875244140625, -0.18499755859375, -0.129119873046875, -0.0732421875, -0.017364501953125, 0.03851318359375, 0.094390869140625, 0.1502685546875, 0.206146240234375, 0.26202392578125, 0.317901611328125, 0.373779296875, 0.429656982421875, 0.48553466796875, 0.541412353515625, 0.5972900390625, 0.653167724609375, 0.70904541015625, 0.764923095703125, 0.82080078125, 0.876678466796875, 0.93255615234375, 0.988433837890625, 1.0443115234375, 1.100189208984375, 1.15606689453125, 1.211944580078125, 1.267822265625, 1.323699951171875, 1.37957763671875, 1.435455322265625, 1.4913330078125, 1.547210693359375, 1.60308837890625, 1.658966064453125, 1.71484375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 2.0, 11.0, 7.0, 11.0, 13.0, 11.0, 21.0, 26.0, 29.0, 28.0, 28.0, 43.0, 52.0, 56.0, 36.0, 49.0, 56.0, 70.0, 68.0, 35.0, 68.0, 42.0, 37.0, 35.0, 30.0, 33.0, 21.0, 16.0, 17.0, 15.0, 5.0, 9.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.583984375, -0.5670890808105469, -0.5501937866210938, -0.5332984924316406, -0.5164031982421875, -0.4995079040527344, -0.48261260986328125, -0.4657173156738281, -0.448822021484375, -0.4319267272949219, -0.41503143310546875, -0.3981361389160156, -0.3812408447265625, -0.3643455505371094, -0.34745025634765625, -0.3305549621582031, -0.31365966796875, -0.2967643737792969, -0.27986907958984375, -0.2629737854003906, -0.2460784912109375, -0.22918319702148438, -0.21228790283203125, -0.19539260864257812, -0.178497314453125, -0.16160202026367188, -0.14470672607421875, -0.12781143188476562, -0.1109161376953125, -0.09402084350585938, -0.07712554931640625, -0.060230255126953125, -0.0433349609375, -0.026439666748046875, -0.00954437255859375, 0.007350921630859375, 0.0242462158203125, 0.041141510009765625, 0.05803680419921875, 0.07493209838867188, 0.091827392578125, 0.10872268676757812, 0.12561798095703125, 0.14251327514648438, 0.1594085693359375, 0.17630386352539062, 0.19319915771484375, 0.21009445190429688, 0.22698974609375, 0.24388504028320312, 0.26078033447265625, 0.2776756286621094, 0.2945709228515625, 0.3114662170410156, 0.32836151123046875, 0.3452568054199219, 0.362152099609375, 0.3790473937988281, 0.39594268798828125, 0.4128379821777344, 0.4297332763671875, 0.4466285705566406, 0.46352386474609375, 0.4804191589355469, 0.497314453125]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 4.0, 9.0, 5.0, 6.0, 7.0, 11.0, 8.0, 14.0, 11.0, 25.0, 22.0, 28.0, 35.0, 33.0, 56.0, 56.0, 58.0, 57.0, 73.0, 47.0, 68.0, 68.0, 42.0, 48.0, 46.0, 31.0, 24.0, 24.0, 21.0, 18.0, 7.0, 5.0, 8.0, 7.0, 2.0, 2.0, 4.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.995565414428711, -6.775362014770508, -6.555158615112305, -6.334955215454102, -6.114751815795898, -5.894548416137695, -5.674345016479492, -5.454141616821289, -5.233938217163086, -5.013734817504883, -4.79353141784668, -4.573328018188477, -4.353124618530273, -4.13292121887207, -3.912717819213867, -3.692514419555664, -3.472310781478882, -3.2521073818206787, -3.0319039821624756, -2.8117005825042725, -2.5914971828460693, -2.371293544769287, -2.151090145111084, -1.9308868646621704, -1.7106834650039673, -1.4904800653457642, -1.270276665687561, -1.0500731468200684, -0.82986980676651, -0.6096663475036621, -0.389462947845459, -0.16925954818725586, 0.050943851470947266, 0.2711472511291504, 0.4913506805896759, 0.7115541100502014, 0.9317575097084045, 1.1519609689712524, 1.3721643686294556, 1.5923677682876587, 1.8125711679458618, 2.0327746868133545, 2.2529780864715576, 2.4731814861297607, 2.693384885787964, 2.913588285446167, 3.13379168510437, 3.3539950847625732, 3.5741984844207764, 3.7944018840789795, 4.014605522155762, 4.234808921813965, 4.455012321472168, 4.675215721130371, 4.895419120788574, 5.115622520446777, 5.3358259201049805, 5.556029319763184, 5.776232719421387, 5.99643611907959, 6.216639518737793, 6.436842918395996, 6.657046318054199, 6.877249717712402, 7.0974531173706055]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 3.0, 3.0, 8.0, 14.0, 10.0, 12.0, 15.0, 20.0, 26.0, 28.0, 26.0, 22.0, 34.0, 47.0, 37.0, 47.0, 36.0, 45.0, 46.0, 41.0, 42.0, 40.0, 42.0, 39.0, 32.0, 33.0, 44.0, 25.0, 31.0, 20.0, 26.0, 16.0, 16.0, 16.0, 6.0, 7.0, 5.0, 10.0, 3.0, 1.0, 3.0, 8.0, 6.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.998119592666626, -3.8669707775115967, -3.7358222007751465, -3.604673385620117, -3.473524570465088, -3.3423757553100586, -3.2112271785736084, -3.080078363418579, -2.948929786682129, -2.8177809715270996, -2.6866323947906494, -2.55548357963562, -2.424334764480591, -2.2931861877441406, -2.1620373725891113, -2.030888557434082, -1.8997397422790527, -1.768591046333313, -1.6374422311782837, -1.506293535232544, -1.3751447200775146, -1.243996024131775, -1.1128473281860352, -0.9816985726356506, -0.8505498170852661, -0.7194010615348816, -0.5882523059844971, -0.4571036100387573, -0.3259548544883728, -0.19480609893798828, -0.06365740299224854, 0.06749135255813599, 0.1986398696899414, 0.3297886252403259, 0.46093735098838806, 0.5920860767364502, 0.7232348322868347, 0.8543835878372192, 0.985532283782959, 1.1166810989379883, 1.247829794883728, 1.3789784908294678, 1.510127305984497, 1.6412760019302368, 1.7724246978759766, 1.9035735130310059, 2.034722328186035, 2.1658709049224854, 2.2970197200775146, 2.428168535232544, 2.559317111968994, 2.6904659271240234, 2.8216147422790527, 2.952763557434082, 3.0839121341705322, 3.2150609493255615, 3.3462095260620117, 3.477358341217041, 3.608506917953491, 3.7396557331085205, 3.87080454826355, 4.001953125, 4.133101940155029, 4.264250755310059, 4.395399570465088]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 9.0, 17.0, 8.0, 30.0, 25.0, 45.0, 72.0, 103.0, 144.0, 227.0, 382.0, 577.0, 886.0, 1267.0, 2016.0, 3310.0, 5151.0, 7774.0, 12516.0, 19544.0, 30489.0, 47213.0, 70196.0, 99032.0, 126640.0, 142569.0, 134835.0, 109991.0, 80119.0, 54187.0, 35927.0, 23041.0, 14651.0, 9267.0, 5899.0, 3739.0, 2342.0, 1502.0, 1005.0, 628.0, 380.0, 292.0, 179.0, 102.0, 79.0, 50.0, 40.0, 14.0, 25.0, 13.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-4.59765625, -4.4525146484375, -4.307373046875, -4.1622314453125, -4.01708984375, -3.8719482421875, -3.726806640625, -3.5816650390625, -3.4365234375, -3.2913818359375, -3.146240234375, -3.0010986328125, -2.85595703125, -2.7108154296875, -2.565673828125, -2.4205322265625, -2.275390625, -2.1302490234375, -1.985107421875, -1.8399658203125, -1.69482421875, -1.5496826171875, -1.404541015625, -1.2593994140625, -1.1142578125, -0.9691162109375, -0.823974609375, -0.6788330078125, -0.53369140625, -0.3885498046875, -0.243408203125, -0.0982666015625, 0.046875, 0.1920166015625, 0.337158203125, 0.4822998046875, 0.62744140625, 0.7725830078125, 0.917724609375, 1.0628662109375, 1.2080078125, 1.3531494140625, 1.498291015625, 1.6434326171875, 1.78857421875, 1.9337158203125, 2.078857421875, 2.2239990234375, 2.369140625, 2.5142822265625, 2.659423828125, 2.8045654296875, 2.94970703125, 3.0948486328125, 3.239990234375, 3.3851318359375, 3.5302734375, 3.6754150390625, 3.820556640625, 3.9656982421875, 4.11083984375, 4.2559814453125, 4.401123046875, 4.5462646484375, 4.69140625]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 5.0, 5.0, 9.0, 7.0, 8.0, 12.0, 19.0, 24.0, 20.0, 26.0, 18.0, 38.0, 41.0, 35.0, 34.0, 49.0, 51.0, 50.0, 46.0, 51.0, 45.0, 42.0, 44.0, 43.0, 42.0, 42.0, 28.0, 27.0, 23.0, 18.0, 16.0, 14.0, 13.0, 17.0, 4.0, 6.0, 12.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.0703125, -4.9176025390625, -4.764892578125, -4.6121826171875, -4.45947265625, -4.3067626953125, -4.154052734375, -4.0013427734375, -3.8486328125, -3.6959228515625, -3.543212890625, -3.3905029296875, -3.23779296875, -3.0850830078125, -2.932373046875, -2.7796630859375, -2.626953125, -2.4742431640625, -2.321533203125, -2.1688232421875, -2.01611328125, -1.8634033203125, -1.710693359375, -1.5579833984375, -1.4052734375, -1.2525634765625, -1.099853515625, -0.9471435546875, -0.79443359375, -0.6417236328125, -0.489013671875, -0.3363037109375, -0.18359375, -0.0308837890625, 0.121826171875, 0.2745361328125, 0.42724609375, 0.5799560546875, 0.732666015625, 0.8853759765625, 1.0380859375, 1.1907958984375, 1.343505859375, 1.4962158203125, 1.64892578125, 1.8016357421875, 1.954345703125, 2.1070556640625, 2.259765625, 2.4124755859375, 2.565185546875, 2.7178955078125, 2.87060546875, 3.0233154296875, 3.176025390625, 3.3287353515625, 3.4814453125, 3.6341552734375, 3.786865234375, 3.9395751953125, 4.09228515625, 4.2449951171875, 4.397705078125, 4.5504150390625, 4.703125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 11.0, 21.0, 30.0, 38.0, 60.0, 91.0, 127.0, 242.0, 411.0, 733.0, 1287.0, 1987.0, 3634.0, 6374.0, 11023.0, 18968.0, 33205.0, 55015.0, 87945.0, 128898.0, 162973.0, 165380.0, 134110.0, 93334.0, 58655.0, 35422.0, 20646.0, 11814.0, 6874.0, 3891.0, 2210.0, 1295.0, 718.0, 463.0, 223.0, 176.0, 92.0, 59.0, 38.0, 26.0, 16.0, 13.0, 10.0, 9.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.82421875, -5.642578125, -5.4609375, -5.279296875, -5.09765625, -4.916015625, -4.734375, -4.552734375, -4.37109375, -4.189453125, -4.0078125, -3.826171875, -3.64453125, -3.462890625, -3.28125, -3.099609375, -2.91796875, -2.736328125, -2.5546875, -2.373046875, -2.19140625, -2.009765625, -1.828125, -1.646484375, -1.46484375, -1.283203125, -1.1015625, -0.919921875, -0.73828125, -0.556640625, -0.375, -0.193359375, -0.01171875, 0.169921875, 0.3515625, 0.533203125, 0.71484375, 0.896484375, 1.078125, 1.259765625, 1.44140625, 1.623046875, 1.8046875, 1.986328125, 2.16796875, 2.349609375, 2.53125, 2.712890625, 2.89453125, 3.076171875, 3.2578125, 3.439453125, 3.62109375, 3.802734375, 3.984375, 4.166015625, 4.34765625, 4.529296875, 4.7109375, 4.892578125, 5.07421875, 5.255859375, 5.4375, 5.619140625, 5.80078125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 10.0, 9.0, 11.0, 5.0, 9.0, 8.0, 14.0, 18.0, 23.0, 23.0, 33.0, 35.0, 34.0, 34.0, 38.0, 33.0, 44.0, 43.0, 35.0, 51.0, 34.0, 42.0, 44.0, 34.0, 41.0, 51.0, 32.0, 36.0, 28.0, 20.0, 20.0, 23.0, 19.0, 15.0, 13.0, 12.0, 14.0, 5.0, 4.0, 2.0, 0.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.966796875, -2.878662109375, -2.79052734375, -2.702392578125, -2.6142578125, -2.526123046875, -2.43798828125, -2.349853515625, -2.26171875, -2.173583984375, -2.08544921875, -1.997314453125, -1.9091796875, -1.821044921875, -1.73291015625, -1.644775390625, -1.556640625, -1.468505859375, -1.38037109375, -1.292236328125, -1.2041015625, -1.115966796875, -1.02783203125, -0.939697265625, -0.8515625, -0.763427734375, -0.67529296875, -0.587158203125, -0.4990234375, -0.410888671875, -0.32275390625, -0.234619140625, -0.146484375, -0.058349609375, 0.02978515625, 0.117919921875, 0.2060546875, 0.294189453125, 0.38232421875, 0.470458984375, 0.55859375, 0.646728515625, 0.73486328125, 0.822998046875, 0.9111328125, 0.999267578125, 1.08740234375, 1.175537109375, 1.263671875, 1.351806640625, 1.43994140625, 1.528076171875, 1.6162109375, 1.704345703125, 1.79248046875, 1.880615234375, 1.96875, 2.056884765625, 2.14501953125, 2.233154296875, 2.3212890625, 2.409423828125, 2.49755859375, 2.585693359375, 2.673828125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 6.0, 11.0, 12.0, 26.0, 33.0, 37.0, 53.0, 72.0, 88.0, 122.0, 171.0, 216.0, 385.0, 515.0, 823.0, 1213.0, 2021.0, 3590.0, 6950.0, 15074.0, 39506.0, 123322.0, 327456.0, 330261.0, 125109.0, 39905.0, 15240.0, 6799.0, 3588.0, 2125.0, 1249.0, 818.0, 495.0, 371.0, 230.0, 172.0, 145.0, 97.0, 55.0, 52.0, 38.0, 27.0, 31.0, 13.0, 8.0, 10.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-7.41796875, -7.1998291015625, -6.981689453125, -6.7635498046875, -6.54541015625, -6.3272705078125, -6.109130859375, -5.8909912109375, -5.6728515625, -5.4547119140625, -5.236572265625, -5.0184326171875, -4.80029296875, -4.5821533203125, -4.364013671875, -4.1458740234375, -3.927734375, -3.7095947265625, -3.491455078125, -3.2733154296875, -3.05517578125, -2.8370361328125, -2.618896484375, -2.4007568359375, -2.1826171875, -1.9644775390625, -1.746337890625, -1.5281982421875, -1.31005859375, -1.0919189453125, -0.873779296875, -0.6556396484375, -0.4375, -0.2193603515625, -0.001220703125, 0.2169189453125, 0.43505859375, 0.6531982421875, 0.871337890625, 1.0894775390625, 1.3076171875, 1.5257568359375, 1.743896484375, 1.9620361328125, 2.18017578125, 2.3983154296875, 2.616455078125, 2.8345947265625, 3.052734375, 3.2708740234375, 3.489013671875, 3.7071533203125, 3.92529296875, 4.1434326171875, 4.361572265625, 4.5797119140625, 4.7978515625, 5.0159912109375, 5.234130859375, 5.4522705078125, 5.67041015625, 5.8885498046875, 6.106689453125, 6.3248291015625, 6.54296875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 13.0, 32.0, 67.0, 127.0, 174.0, 211.0, 158.0, 96.0, 35.0, 25.0, 12.0, 9.0, 6.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0013246536254882812, -0.001286044716835022, -0.0012474358081817627, -0.0012088268995285034, -0.0011702179908752441, -0.0011316090822219849, -0.0010930001735687256, -0.0010543912649154663, -0.001015782356262207, -0.0009771734476089478, -0.0009385645389556885, -0.0008999556303024292, -0.0008613467216491699, -0.0008227378129959106, -0.0007841289043426514, -0.0007455199956893921, -0.0007069110870361328, -0.0006683021783828735, -0.0006296932697296143, -0.000591084361076355, -0.0005524754524230957, -0.0005138665437698364, -0.00047525763511657715, -0.00043664872646331787, -0.0003980398178100586, -0.0003594309091567993, -0.00032082200050354004, -0.00028221309185028076, -0.00024360418319702148, -0.0002049952745437622, -0.00016638636589050293, -0.00012777745723724365, -8.916854858398438e-05, -5.05596399307251e-05, -1.195073127746582e-05, 2.6658177375793457e-05, 6.526708602905273e-05, 0.00010387599468231201, 0.0001424849033355713, 0.00018109381198883057, 0.00021970272064208984, 0.0002583116292953491, 0.0002969205379486084, 0.0003355294466018677, 0.00037413835525512695, 0.00041274726390838623, 0.0004513561725616455, 0.0004899650812149048, 0.0005285739898681641, 0.0005671828985214233, 0.0006057918071746826, 0.0006444007158279419, 0.0006830096244812012, 0.0007216185331344604, 0.0007602274417877197, 0.000798836350440979, 0.0008374452590942383, 0.0008760541677474976, 0.0009146630764007568, 0.0009532719850540161, 0.0009918808937072754, 0.0010304898023605347, 0.001069098711013794, 0.0011077076196670532, 0.0011463165283203125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 10.0, 14.0, 21.0, 23.0, 31.0, 53.0, 88.0, 120.0, 195.0, 332.0, 523.0, 805.0, 1343.0, 2381.0, 4528.0, 8953.0, 18876.0, 42280.0, 97736.0, 204359.0, 281303.0, 205287.0, 98029.0, 42658.0, 19067.0, 9087.0, 4514.0, 2380.0, 1408.0, 817.0, 479.0, 277.0, 187.0, 122.0, 87.0, 59.0, 32.0, 22.0, 21.0, 17.0, 6.0, 9.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.21484375, -4.0810546875, -3.947265625, -3.8134765625, -3.6796875, -3.5458984375, -3.412109375, -3.2783203125, -3.14453125, -3.0107421875, -2.876953125, -2.7431640625, -2.609375, -2.4755859375, -2.341796875, -2.2080078125, -2.07421875, -1.9404296875, -1.806640625, -1.6728515625, -1.5390625, -1.4052734375, -1.271484375, -1.1376953125, -1.00390625, -0.8701171875, -0.736328125, -0.6025390625, -0.46875, -0.3349609375, -0.201171875, -0.0673828125, 0.06640625, 0.2001953125, 0.333984375, 0.4677734375, 0.6015625, 0.7353515625, 0.869140625, 1.0029296875, 1.13671875, 1.2705078125, 1.404296875, 1.5380859375, 1.671875, 1.8056640625, 1.939453125, 2.0732421875, 2.20703125, 2.3408203125, 2.474609375, 2.6083984375, 2.7421875, 2.8759765625, 3.009765625, 3.1435546875, 3.27734375, 3.4111328125, 3.544921875, 3.6787109375, 3.8125, 3.9462890625, 4.080078125, 4.2138671875, 4.34765625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 7.0, 5.0, 10.0, 8.0, 14.0, 15.0, 12.0, 29.0, 33.0, 36.0, 34.0, 45.0, 56.0, 54.0, 67.0, 56.0, 95.0, 68.0, 56.0, 51.0, 42.0, 33.0, 35.0, 25.0, 27.0, 12.0, 10.0, 11.0, 9.0, 6.0, 8.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.978515625, -0.9477615356445312, -0.9170074462890625, -0.8862533569335938, -0.855499267578125, -0.8247451782226562, -0.7939910888671875, -0.7632369995117188, -0.73248291015625, -0.7017288208007812, -0.6709747314453125, -0.6402206420898438, -0.609466552734375, -0.5787124633789062, -0.5479583740234375, -0.5172042846679688, -0.4864501953125, -0.45569610595703125, -0.4249420166015625, -0.39418792724609375, -0.363433837890625, -0.33267974853515625, -0.3019256591796875, -0.27117156982421875, -0.24041748046875, -0.20966339111328125, -0.1789093017578125, -0.14815521240234375, -0.117401123046875, -0.08664703369140625, -0.0558929443359375, -0.02513885498046875, 0.005615234375, 0.03636932373046875, 0.0671234130859375, 0.09787750244140625, 0.128631591796875, 0.15938568115234375, 0.1901397705078125, 0.22089385986328125, 0.25164794921875, 0.28240203857421875, 0.3131561279296875, 0.34391021728515625, 0.374664306640625, 0.40541839599609375, 0.4361724853515625, 0.46692657470703125, 0.4976806640625, 0.5284347534179688, 0.5591888427734375, 0.5899429321289062, 0.620697021484375, 0.6514511108398438, 0.6822052001953125, 0.7129592895507812, 0.74371337890625, 0.7744674682617188, 0.8052215576171875, 0.8359756469726562, 0.866729736328125, 0.8974838256835938, 0.9282379150390625, 0.9589920043945312, 0.98974609375]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 9.0, 9.0, 3.0, 12.0, 10.0, 17.0, 12.0, 23.0, 24.0, 14.0, 38.0, 44.0, 53.0, 47.0, 57.0, 58.0, 70.0, 52.0, 67.0, 54.0, 68.0, 42.0, 41.0, 34.0, 27.0, 23.0, 19.0, 15.0, 16.0, 7.0, 6.0, 10.0, 8.0, 4.0, 2.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.33606481552124, -7.108825206756592, -6.881585597991943, -6.654345989227295, -6.4271063804626465, -6.199866771697998, -5.97262716293335, -5.745387554168701, -5.518147945404053, -5.290908336639404, -5.063668727874756, -4.836429119110107, -4.609189510345459, -4.3819499015808105, -4.154710292816162, -3.9274706840515137, -3.7002310752868652, -3.472991466522217, -3.2457518577575684, -3.01851224899292, -2.7912726402282715, -2.564033031463623, -2.3367934226989746, -2.109553813934326, -1.8823142051696777, -1.6550745964050293, -1.4278349876403809, -1.2005953788757324, -0.973355770111084, -0.7461161613464355, -0.5188765525817871, -0.29163694381713867, -0.06439781188964844, 0.162841796875, 0.39008140563964844, 0.6173210144042969, 0.8445606231689453, 1.0718002319335938, 1.2990398406982422, 1.5262794494628906, 1.753519058227539, 1.9807586669921875, 2.207998275756836, 2.4352378845214844, 2.662477493286133, 2.8897171020507812, 3.1169567108154297, 3.344196319580078, 3.5714359283447266, 3.798675537109375, 4.025915145874023, 4.253154754638672, 4.48039436340332, 4.707633972167969, 4.934873580932617, 5.162113189697266, 5.389352798461914, 5.6165924072265625, 5.843832015991211, 6.071071624755859, 6.298311233520508, 6.525550842285156, 6.752790451049805, 6.980030059814453, 7.207269668579102]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 7.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 7.0, 5.0, 9.0, 13.0, 12.0, 16.0, 15.0, 19.0, 28.0, 22.0, 33.0, 33.0, 43.0, 34.0, 48.0, 45.0, 31.0, 39.0, 39.0, 36.0, 51.0, 54.0, 35.0, 42.0, 33.0, 50.0, 28.0, 25.0, 24.0, 22.0, 18.0, 9.0, 14.0, 10.0, 10.0, 7.0, 9.0, 5.0, 2.0, 6.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.09138822555542, -3.952510356903076, -3.8136324882507324, -3.6747546195983887, -3.535876750946045, -3.396998882293701, -3.2581212520599365, -3.1192433834075928, -2.980365514755249, -2.8414876461029053, -2.7026097774505615, -2.5637319087982178, -2.424854278564453, -2.2859764099121094, -2.1470985412597656, -2.008220672607422, -1.8693428039550781, -1.7304649353027344, -1.5915870666503906, -1.4527093172073364, -1.3138314485549927, -1.174953579902649, -1.0360758304595947, -0.897197961807251, -0.7583200931549072, -0.6194422245025635, -0.4805644154548645, -0.34168657660484314, -0.20280873775482178, -0.06393086910247803, 0.07494693994522095, 0.21382474899291992, 0.35270261764526367, 0.49158045649528503, 0.6304582953453064, 0.7693361043930054, 0.9082139730453491, 1.0470918416976929, 1.185969591140747, 1.3248474597930908, 1.4637253284454346, 1.6026031970977783, 1.741481065750122, 1.8803588151931763, 2.0192365646362305, 2.158114433288574, 2.296992301940918, 2.4358701705932617, 2.5747480392456055, 2.713625907897949, 2.852503776550293, 2.9913816452026367, 3.1302595138549805, 3.269137382507324, 3.408015012741089, 3.5468928813934326, 3.6857707500457764, 3.82464861869812, 3.963526487350464, 4.1024041175842285, 4.241281986236572, 4.380159854888916, 4.51903772354126, 4.6579155921936035, 4.796793460845947]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 9.0, 8.0, 7.0, 17.0, 20.0, 38.0, 58.0, 85.0, 113.0, 197.0, 351.0, 599.0, 986.0, 1737.0, 3114.0, 5682.0, 11209.0, 23273.0, 51247.0, 126649.0, 351821.0, 998785.0, 1463241.0, 732206.0, 250883.0, 94245.0, 39266.0, 18295.0, 9040.0, 4723.0, 2602.0, 1521.0, 875.0, 534.0, 319.0, 203.0, 114.0, 62.0, 44.0, 41.0, 18.0, 21.0, 9.0, 5.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0625, -7.7877197265625, -7.512939453125, -7.2381591796875, -6.96337890625, -6.6885986328125, -6.413818359375, -6.1390380859375, -5.8642578125, -5.5894775390625, -5.314697265625, -5.0399169921875, -4.76513671875, -4.4903564453125, -4.215576171875, -3.9407958984375, -3.666015625, -3.3912353515625, -3.116455078125, -2.8416748046875, -2.56689453125, -2.2921142578125, -2.017333984375, -1.7425537109375, -1.4677734375, -1.1929931640625, -0.918212890625, -0.6434326171875, -0.36865234375, -0.0938720703125, 0.180908203125, 0.4556884765625, 0.73046875, 1.0052490234375, 1.280029296875, 1.5548095703125, 1.82958984375, 2.1043701171875, 2.379150390625, 2.6539306640625, 2.9287109375, 3.2034912109375, 3.478271484375, 3.7530517578125, 4.02783203125, 4.3026123046875, 4.577392578125, 4.8521728515625, 5.126953125, 5.4017333984375, 5.676513671875, 5.9512939453125, 6.22607421875, 6.5008544921875, 6.775634765625, 7.0504150390625, 7.3251953125, 7.5999755859375, 7.874755859375, 8.1495361328125, 8.42431640625, 8.6990966796875, 8.973876953125, 9.2486572265625, 9.5234375]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 5.0, 7.0, 12.0, 11.0, 10.0, 12.0, 18.0, 30.0, 19.0, 22.0, 32.0, 32.0, 29.0, 44.0, 49.0, 35.0, 56.0, 39.0, 38.0, 37.0, 57.0, 42.0, 43.0, 42.0, 46.0, 33.0, 33.0, 26.0, 30.0, 16.0, 13.0, 16.0, 7.0, 8.0, 6.0, 9.0, 6.0, 5.0, 5.0, 4.0, 3.0, 1.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.537109375, -3.42144775390625, -3.3057861328125, -3.19012451171875, -3.074462890625, -2.95880126953125, -2.8431396484375, -2.72747802734375, -2.61181640625, -2.49615478515625, -2.3804931640625, -2.26483154296875, -2.149169921875, -2.03350830078125, -1.9178466796875, -1.80218505859375, -1.6865234375, -1.57086181640625, -1.4552001953125, -1.33953857421875, -1.223876953125, -1.10821533203125, -0.9925537109375, -0.87689208984375, -0.76123046875, -0.64556884765625, -0.5299072265625, -0.41424560546875, -0.298583984375, -0.18292236328125, -0.0672607421875, 0.04840087890625, 0.1640625, 0.27972412109375, 0.3953857421875, 0.51104736328125, 0.626708984375, 0.74237060546875, 0.8580322265625, 0.97369384765625, 1.08935546875, 1.20501708984375, 1.3206787109375, 1.43634033203125, 1.552001953125, 1.66766357421875, 1.7833251953125, 1.89898681640625, 2.0146484375, 2.13031005859375, 2.2459716796875, 2.36163330078125, 2.477294921875, 2.59295654296875, 2.7086181640625, 2.82427978515625, 2.93994140625, 3.05560302734375, 3.1712646484375, 3.28692626953125, 3.402587890625, 3.51824951171875, 3.6339111328125, 3.74957275390625, 3.865234375]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 13.0, 18.0, 27.0, 40.0, 57.0, 97.0, 144.0, 205.0, 367.0, 485.0, 786.0, 1259.0, 2056.0, 3430.0, 5569.0, 9677.0, 16949.0, 30777.0, 57183.0, 110769.0, 221618.0, 451364.0, 859243.0, 1060757.0, 674265.0, 336138.0, 165477.0, 84389.0, 43980.0, 24157.0, 13261.0, 7725.0, 4569.0, 2757.0, 1755.0, 1062.0, 647.0, 433.0, 258.0, 174.0, 114.0, 81.0, 54.0, 25.0, 26.0, 16.0, 8.0, 4.0, 5.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.30859375, -7.082275390625, -6.85595703125, -6.629638671875, -6.4033203125, -6.177001953125, -5.95068359375, -5.724365234375, -5.498046875, -5.271728515625, -5.04541015625, -4.819091796875, -4.5927734375, -4.366455078125, -4.14013671875, -3.913818359375, -3.6875, -3.461181640625, -3.23486328125, -3.008544921875, -2.7822265625, -2.555908203125, -2.32958984375, -2.103271484375, -1.876953125, -1.650634765625, -1.42431640625, -1.197998046875, -0.9716796875, -0.745361328125, -0.51904296875, -0.292724609375, -0.06640625, 0.159912109375, 0.38623046875, 0.612548828125, 0.8388671875, 1.065185546875, 1.29150390625, 1.517822265625, 1.744140625, 1.970458984375, 2.19677734375, 2.423095703125, 2.6494140625, 2.875732421875, 3.10205078125, 3.328369140625, 3.5546875, 3.781005859375, 4.00732421875, 4.233642578125, 4.4599609375, 4.686279296875, 4.91259765625, 5.138916015625, 5.365234375, 5.591552734375, 5.81787109375, 6.044189453125, 6.2705078125, 6.496826171875, 6.72314453125, 6.949462890625, 7.17578125]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 5.0, 2.0, 10.0, 8.0, 16.0, 12.0, 21.0, 38.0, 46.0, 54.0, 70.0, 79.0, 103.0, 129.0, 173.0, 213.0, 265.0, 304.0, 335.0, 350.0, 334.0, 307.0, 253.0, 219.0, 139.0, 130.0, 108.0, 85.0, 62.0, 65.0, 36.0, 23.0, 27.0, 9.0, 14.0, 7.0, 9.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.716796875, -2.64178466796875, -2.5667724609375, -2.49176025390625, -2.416748046875, -2.34173583984375, -2.2667236328125, -2.19171142578125, -2.11669921875, -2.04168701171875, -1.9666748046875, -1.89166259765625, -1.816650390625, -1.74163818359375, -1.6666259765625, -1.59161376953125, -1.5166015625, -1.44158935546875, -1.3665771484375, -1.29156494140625, -1.216552734375, -1.14154052734375, -1.0665283203125, -0.99151611328125, -0.91650390625, -0.84149169921875, -0.7664794921875, -0.69146728515625, -0.616455078125, -0.54144287109375, -0.4664306640625, -0.39141845703125, -0.31640625, -0.24139404296875, -0.1663818359375, -0.09136962890625, -0.016357421875, 0.05865478515625, 0.1336669921875, 0.20867919921875, 0.28369140625, 0.35870361328125, 0.4337158203125, 0.50872802734375, 0.583740234375, 0.65875244140625, 0.7337646484375, 0.80877685546875, 0.8837890625, 0.95880126953125, 1.0338134765625, 1.10882568359375, 1.183837890625, 1.25885009765625, 1.3338623046875, 1.40887451171875, 1.48388671875, 1.55889892578125, 1.6339111328125, 1.70892333984375, 1.783935546875, 1.85894775390625, 1.9339599609375, 2.00897216796875, 2.083984375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 7.0, 15.0, 10.0, 10.0, 12.0, 11.0, 16.0, 22.0, 30.0, 42.0, 45.0, 53.0, 66.0, 62.0, 51.0, 83.0, 60.0, 76.0, 57.0, 47.0, 37.0, 39.0, 31.0, 21.0, 18.0, 16.0, 14.0, 13.0, 10.0, 5.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-9.556941986083984, -9.307881355285645, -9.058820724487305, -8.809761047363281, -8.560700416564941, -8.311639785766602, -8.062579154968262, -7.81351900100708, -7.564458847045898, -7.315398216247559, -7.066338062286377, -6.817277431488037, -6.5682172775268555, -6.319156646728516, -6.070096015930176, -5.821035861968994, -5.571975231170654, -5.3229146003723145, -5.073854446411133, -4.824793815612793, -4.575733661651611, -4.3266730308532715, -4.07761287689209, -3.82855224609375, -3.5794918537139893, -3.3304314613342285, -3.0813710689544678, -2.832310676574707, -2.583250045776367, -2.3341898918151855, -2.0851292610168457, -1.836068868637085, -1.5870084762573242, -1.3379480838775635, -1.0888876914978027, -0.8398271799087524, -0.5907667875289917, -0.34170639514923096, -0.09264588356018066, 0.15641450881958008, 0.4054749011993408, 0.6545352935791016, 0.9035957455635071, 1.1526561975479126, 1.4017165899276733, 1.650776982307434, 1.8998374938964844, 2.148897886276245, 2.397958278656006, 2.6470186710357666, 2.8960790634155273, 3.145139694213867, 3.394199848175049, 3.6432604789733887, 3.8923208713531494, 4.14138126373291, 4.39044189453125, 4.63950252532959, 4.8885626792907715, 5.137623310089111, 5.386683464050293, 5.635744094848633, 5.884804725646973, 6.133864879608154, 6.382925033569336]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 3.0, 3.0, 4.0, 10.0, 14.0, 6.0, 11.0, 15.0, 16.0, 16.0, 25.0, 32.0, 29.0, 36.0, 42.0, 28.0, 34.0, 53.0, 53.0, 37.0, 48.0, 53.0, 46.0, 34.0, 43.0, 47.0, 44.0, 28.0, 29.0, 34.0, 22.0, 20.0, 16.0, 14.0, 15.0, 11.0, 9.0, 8.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.054889678955078, -4.903929710388184, -4.752969741821289, -4.6020097732543945, -4.4510498046875, -4.3000898361206055, -4.149129867553711, -3.9981696605682373, -3.8472096920013428, -3.6962497234344482, -3.5452897548675537, -3.394329786300659, -3.2433695793151855, -3.092409610748291, -2.9414496421813965, -2.790489673614502, -2.6395297050476074, -2.488569736480713, -2.3376097679138184, -2.186649799346924, -2.0356898307800293, -1.8847297430038452, -1.7337696552276611, -1.5828096866607666, -1.431849718093872, -1.2808897495269775, -1.129929780960083, -0.9789696931838989, -0.8280097246170044, -0.6770497560501099, -0.5260897278785706, -0.37512969970703125, -0.22416925430297852, -0.0732092559337616, 0.07775074243545532, 0.22871074080467224, 0.37967073917388916, 0.5306307077407837, 0.681590735912323, 0.8325507640838623, 0.9835107326507568, 1.1344707012176514, 1.285430669784546, 1.43639075756073, 1.5873507261276245, 1.738310694694519, 1.8892707824707031, 2.0402307510375977, 2.191190719604492, 2.3421506881713867, 2.4931106567382812, 2.644070625305176, 2.7950305938720703, 2.945990562438965, 3.0969507694244385, 3.247910737991333, 3.3988707065582275, 3.549830675125122, 3.7007906436920166, 3.851750612258911, 4.002710819244385, 4.153670787811279, 4.304630756378174, 4.455590724945068, 4.606550693511963]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 6.0, 17.0, 20.0, 26.0, 55.0, 97.0, 138.0, 209.0, 346.0, 544.0, 954.0, 1622.0, 3017.0, 6498.0, 16393.0, 48724.0, 155216.0, 346434.0, 296861.0, 112238.0, 35457.0, 12366.0, 5225.0, 2544.0, 1430.0, 856.0, 501.0, 328.0, 157.0, 112.0, 59.0, 41.0, 16.0, 17.0, 14.0, 6.0, 6.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.84375, -7.5975341796875, -7.351318359375, -7.1051025390625, -6.85888671875, -6.6126708984375, -6.366455078125, -6.1202392578125, -5.8740234375, -5.6278076171875, -5.381591796875, -5.1353759765625, -4.88916015625, -4.6429443359375, -4.396728515625, -4.1505126953125, -3.904296875, -3.6580810546875, -3.411865234375, -3.1656494140625, -2.91943359375, -2.6732177734375, -2.427001953125, -2.1807861328125, -1.9345703125, -1.6883544921875, -1.442138671875, -1.1959228515625, -0.94970703125, -0.7034912109375, -0.457275390625, -0.2110595703125, 0.03515625, 0.2813720703125, 0.527587890625, 0.7738037109375, 1.02001953125, 1.2662353515625, 1.512451171875, 1.7586669921875, 2.0048828125, 2.2510986328125, 2.497314453125, 2.7435302734375, 2.98974609375, 3.2359619140625, 3.482177734375, 3.7283935546875, 3.974609375, 4.2208251953125, 4.467041015625, 4.7132568359375, 4.95947265625, 5.2056884765625, 5.451904296875, 5.6981201171875, 5.9443359375, 6.1905517578125, 6.436767578125, 6.6829833984375, 6.92919921875, 7.1754150390625, 7.421630859375, 7.6678466796875, 7.9140625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 3.0, 6.0, 5.0, 6.0, 10.0, 12.0, 17.0, 18.0, 9.0, 15.0, 20.0, 28.0, 28.0, 29.0, 31.0, 28.0, 36.0, 35.0, 54.0, 44.0, 39.0, 35.0, 41.0, 55.0, 48.0, 39.0, 34.0, 36.0, 37.0, 32.0, 28.0, 27.0, 19.0, 12.0, 13.0, 17.0, 11.0, 9.0, 6.0, 12.0, 4.0, 11.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.23046875, -5.07958984375, -4.9287109375, -4.77783203125, -4.626953125, -4.47607421875, -4.3251953125, -4.17431640625, -4.0234375, -3.87255859375, -3.7216796875, -3.57080078125, -3.419921875, -3.26904296875, -3.1181640625, -2.96728515625, -2.81640625, -2.66552734375, -2.5146484375, -2.36376953125, -2.212890625, -2.06201171875, -1.9111328125, -1.76025390625, -1.609375, -1.45849609375, -1.3076171875, -1.15673828125, -1.005859375, -0.85498046875, -0.7041015625, -0.55322265625, -0.40234375, -0.25146484375, -0.1005859375, 0.05029296875, 0.201171875, 0.35205078125, 0.5029296875, 0.65380859375, 0.8046875, 0.95556640625, 1.1064453125, 1.25732421875, 1.408203125, 1.55908203125, 1.7099609375, 1.86083984375, 2.01171875, 2.16259765625, 2.3134765625, 2.46435546875, 2.615234375, 2.76611328125, 2.9169921875, 3.06787109375, 3.21875, 3.36962890625, 3.5205078125, 3.67138671875, 3.822265625, 3.97314453125, 4.1240234375, 4.27490234375, 4.42578125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 7.0, 6.0, 7.0, 10.0, 13.0, 14.0, 16.0, 26.0, 41.0, 45.0, 69.0, 93.0, 160.0, 218.0, 292.0, 526.0, 862.0, 1589.0, 3207.0, 7835.0, 27139.0, 129984.0, 494454.0, 297917.0, 59293.0, 14359.0, 5019.0, 2154.0, 1176.0, 678.0, 430.0, 270.0, 209.0, 133.0, 83.0, 50.0, 46.0, 31.0, 24.0, 19.0, 13.0, 15.0, 3.0, 6.0, 6.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.8828125, -11.5086669921875, -11.134521484375, -10.7603759765625, -10.38623046875, -10.0120849609375, -9.637939453125, -9.2637939453125, -8.8896484375, -8.5155029296875, -8.141357421875, -7.7672119140625, -7.39306640625, -7.0189208984375, -6.644775390625, -6.2706298828125, -5.896484375, -5.5223388671875, -5.148193359375, -4.7740478515625, -4.39990234375, -4.0257568359375, -3.651611328125, -3.2774658203125, -2.9033203125, -2.5291748046875, -2.155029296875, -1.7808837890625, -1.40673828125, -1.0325927734375, -0.658447265625, -0.2843017578125, 0.08984375, 0.4639892578125, 0.838134765625, 1.2122802734375, 1.58642578125, 1.9605712890625, 2.334716796875, 2.7088623046875, 3.0830078125, 3.4571533203125, 3.831298828125, 4.2054443359375, 4.57958984375, 4.9537353515625, 5.327880859375, 5.7020263671875, 6.076171875, 6.4503173828125, 6.824462890625, 7.1986083984375, 7.57275390625, 7.9468994140625, 8.321044921875, 8.6951904296875, 9.0693359375, 9.4434814453125, 9.817626953125, 10.1917724609375, 10.56591796875, 10.9400634765625, 11.314208984375, 11.6883544921875, 12.0625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 7.0, 6.0, 3.0, 7.0, 10.0, 3.0, 14.0, 15.0, 21.0, 16.0, 24.0, 28.0, 23.0, 26.0, 37.0, 30.0, 30.0, 51.0, 40.0, 39.0, 32.0, 46.0, 40.0, 42.0, 46.0, 38.0, 34.0, 33.0, 33.0, 29.0, 32.0, 26.0, 22.0, 23.0, 23.0, 17.0, 11.0, 15.0, 11.0, 3.0, 2.0, 6.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.849609375, -2.76300048828125, -2.6763916015625, -2.58978271484375, -2.503173828125, -2.41656494140625, -2.3299560546875, -2.24334716796875, -2.15673828125, -2.07012939453125, -1.9835205078125, -1.89691162109375, -1.810302734375, -1.72369384765625, -1.6370849609375, -1.55047607421875, -1.4638671875, -1.37725830078125, -1.2906494140625, -1.20404052734375, -1.117431640625, -1.03082275390625, -0.9442138671875, -0.85760498046875, -0.77099609375, -0.68438720703125, -0.5977783203125, -0.51116943359375, -0.424560546875, -0.33795166015625, -0.2513427734375, -0.16473388671875, -0.078125, 0.00848388671875, 0.0950927734375, 0.18170166015625, 0.268310546875, 0.35491943359375, 0.4415283203125, 0.52813720703125, 0.61474609375, 0.70135498046875, 0.7879638671875, 0.87457275390625, 0.961181640625, 1.04779052734375, 1.1343994140625, 1.22100830078125, 1.3076171875, 1.39422607421875, 1.4808349609375, 1.56744384765625, 1.654052734375, 1.74066162109375, 1.8272705078125, 1.91387939453125, 2.00048828125, 2.08709716796875, 2.1737060546875, 2.26031494140625, 2.346923828125, 2.43353271484375, 2.5201416015625, 2.60675048828125, 2.693359375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 5.0, 9.0, 13.0, 21.0, 20.0, 49.0, 51.0, 90.0, 122.0, 174.0, 237.0, 318.0, 418.0, 602.0, 884.0, 1235.0, 1923.0, 3001.0, 5226.0, 10858.0, 29419.0, 107388.0, 398762.0, 349485.0, 89227.0, 25670.0, 9736.0, 4894.0, 2743.0, 1846.0, 1216.0, 817.0, 601.0, 429.0, 322.0, 192.0, 153.0, 117.0, 89.0, 56.0, 40.0, 24.0, 25.0, 19.0, 11.0, 5.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0], "bins": [-6.20703125, -6.02935791015625, -5.8516845703125, -5.67401123046875, -5.496337890625, -5.31866455078125, -5.1409912109375, -4.96331787109375, -4.78564453125, -4.60797119140625, -4.4302978515625, -4.25262451171875, -4.074951171875, -3.89727783203125, -3.7196044921875, -3.54193115234375, -3.3642578125, -3.18658447265625, -3.0089111328125, -2.83123779296875, -2.653564453125, -2.47589111328125, -2.2982177734375, -2.12054443359375, -1.94287109375, -1.76519775390625, -1.5875244140625, -1.40985107421875, -1.232177734375, -1.05450439453125, -0.8768310546875, -0.69915771484375, -0.521484375, -0.34381103515625, -0.1661376953125, 0.01153564453125, 0.189208984375, 0.36688232421875, 0.5445556640625, 0.72222900390625, 0.89990234375, 1.07757568359375, 1.2552490234375, 1.43292236328125, 1.610595703125, 1.78826904296875, 1.9659423828125, 2.14361572265625, 2.3212890625, 2.49896240234375, 2.6766357421875, 2.85430908203125, 3.031982421875, 3.20965576171875, 3.3873291015625, 3.56500244140625, 3.74267578125, 3.92034912109375, 4.0980224609375, 4.27569580078125, 4.453369140625, 4.63104248046875, 4.8087158203125, 4.98638916015625, 5.1640625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 6.0, 7.0, 15.0, 19.0, 33.0, 39.0, 54.0, 89.0, 110.0, 132.0, 118.0, 105.0, 81.0, 64.0, 32.0, 26.0, 15.0, 14.0, 7.0, 6.0, 3.0, 6.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.00034308433532714844, -0.0003342684358358383, -0.0003254525363445282, -0.0003166366368532181, -0.00030782073736190796, -0.00029900483787059784, -0.0002901889383792877, -0.0002813730388879776, -0.0002725571393966675, -0.00026374123990535736, -0.00025492534041404724, -0.0002461094409227371, -0.000237293541431427, -0.00022847764194011688, -0.00021966174244880676, -0.00021084584295749664, -0.00020202994346618652, -0.0001932140439748764, -0.00018439814448356628, -0.00017558224499225616, -0.00016676634550094604, -0.00015795044600963593, -0.0001491345465183258, -0.00014031864702701569, -0.00013150274753570557, -0.00012268684804439545, -0.00011387094855308533, -0.00010505504906177521, -9.623914957046509e-05, -8.742325007915497e-05, -7.860735058784485e-05, -6.979145109653473e-05, -6.097555160522461e-05, -5.215965211391449e-05, -4.334375262260437e-05, -3.452785313129425e-05, -2.571195363998413e-05, -1.689605414867401e-05, -8.080154657363892e-06, 7.35744833946228e-07, 9.551644325256348e-06, 1.8367543816566467e-05, 2.7183443307876587e-05, 3.5999342799186707e-05, 4.4815242290496826e-05, 5.3631141781806946e-05, 6.244704127311707e-05, 7.126294076442719e-05, 8.00788402557373e-05, 8.889473974704742e-05, 9.771063923835754e-05, 0.00010652653872966766, 0.00011534243822097778, 0.0001241583377122879, 0.00013297423720359802, 0.00014179013669490814, 0.00015060603618621826, 0.00015942193567752838, 0.0001682378351688385, 0.00017705373466014862, 0.00018586963415145874, 0.00019468553364276886, 0.00020350143313407898, 0.0002123173326253891, 0.00022113323211669922]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 4.0, 6.0, 13.0, 10.0, 15.0, 18.0, 44.0, 37.0, 59.0, 84.0, 113.0, 165.0, 213.0, 301.0, 434.0, 634.0, 1002.0, 1339.0, 2153.0, 3734.0, 6883.0, 16796.0, 59535.0, 241888.0, 449083.0, 188816.0, 45819.0, 13897.0, 5975.0, 3303.0, 2034.0, 1297.0, 836.0, 599.0, 420.0, 289.0, 206.0, 123.0, 99.0, 85.0, 47.0, 33.0, 34.0, 18.0, 21.0, 17.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.25, -5.08282470703125, -4.9156494140625, -4.74847412109375, -4.581298828125, -4.41412353515625, -4.2469482421875, -4.07977294921875, -3.91259765625, -3.74542236328125, -3.5782470703125, -3.41107177734375, -3.243896484375, -3.07672119140625, -2.9095458984375, -2.74237060546875, -2.5751953125, -2.40802001953125, -2.2408447265625, -2.07366943359375, -1.906494140625, -1.73931884765625, -1.5721435546875, -1.40496826171875, -1.23779296875, -1.07061767578125, -0.9034423828125, -0.73626708984375, -0.569091796875, -0.40191650390625, -0.2347412109375, -0.06756591796875, 0.099609375, 0.26678466796875, 0.4339599609375, 0.60113525390625, 0.768310546875, 0.93548583984375, 1.1026611328125, 1.26983642578125, 1.43701171875, 1.60418701171875, 1.7713623046875, 1.93853759765625, 2.105712890625, 2.27288818359375, 2.4400634765625, 2.60723876953125, 2.7744140625, 2.94158935546875, 3.1087646484375, 3.27593994140625, 3.443115234375, 3.61029052734375, 3.7774658203125, 3.94464111328125, 4.11181640625, 4.27899169921875, 4.4461669921875, 4.61334228515625, 4.780517578125, 4.94769287109375, 5.1148681640625, 5.28204345703125, 5.44921875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 8.0, 8.0, 24.0, 41.0, 65.0, 121.0, 142.0, 161.0, 124.0, 110.0, 76.0, 42.0, 27.0, 19.0, 6.0, 5.0, 3.0, 3.0, 0.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3466796875, -1.296051025390625, -1.24542236328125, -1.194793701171875, -1.1441650390625, -1.093536376953125, -1.04290771484375, -0.992279052734375, -0.941650390625, -0.891021728515625, -0.84039306640625, -0.789764404296875, -0.7391357421875, -0.688507080078125, -0.63787841796875, -0.587249755859375, -0.53662109375, -0.485992431640625, -0.43536376953125, -0.384735107421875, -0.3341064453125, -0.283477783203125, -0.23284912109375, -0.182220458984375, -0.131591796875, -0.080963134765625, -0.03033447265625, 0.020294189453125, 0.0709228515625, 0.121551513671875, 0.17218017578125, 0.222808837890625, 0.2734375, 0.324066162109375, 0.37469482421875, 0.425323486328125, 0.4759521484375, 0.526580810546875, 0.57720947265625, 0.627838134765625, 0.678466796875, 0.729095458984375, 0.77972412109375, 0.830352783203125, 0.8809814453125, 0.931610107421875, 0.98223876953125, 1.032867431640625, 1.08349609375, 1.134124755859375, 1.18475341796875, 1.235382080078125, 1.2860107421875, 1.336639404296875, 1.38726806640625, 1.437896728515625, 1.488525390625, 1.539154052734375, 1.58978271484375, 1.640411376953125, 1.6910400390625, 1.741668701171875, 1.79229736328125, 1.842926025390625, 1.8935546875]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 13.0, 9.0, 9.0, 14.0, 7.0, 8.0, 24.0, 20.0, 34.0, 41.0, 59.0, 49.0, 52.0, 68.0, 65.0, 69.0, 73.0, 72.0, 55.0, 47.0, 40.0, 31.0, 25.0, 26.0, 17.0, 17.0, 13.0, 11.0, 14.0, 3.0, 4.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-9.574878692626953, -9.324416160583496, -9.073952674865723, -8.823490142822266, -8.573026657104492, -8.322564125061035, -8.072100639343262, -7.821638107299805, -7.5711750984191895, -7.320712089538574, -7.070249080657959, -6.819786071777344, -6.569323539733887, -6.318860054016113, -6.068397521972656, -5.817934513092041, -5.567471504211426, -5.3170084953308105, -5.066545486450195, -4.81608247756958, -4.565619468688965, -4.315156936645508, -4.064693927764893, -3.8142309188842773, -3.563767910003662, -3.313304901123047, -3.0628418922424316, -2.8123791217803955, -2.5619161128997803, -2.311453104019165, -2.060990333557129, -1.8105273246765137, -1.560063362121582, -1.3096003532409668, -1.0591374635696411, -0.8086745142936707, -0.5582115650177002, -0.30774855613708496, -0.05728566646575928, 0.1931772232055664, 0.44364023208618164, 0.6941031813621521, 0.9445661306381226, 1.1950290203094482, 1.4454920291900635, 1.6959550380706787, 1.9464179277420044, 2.19688081741333, 2.4473438262939453, 2.6978068351745605, 2.948269844055176, 3.198732614517212, 3.449195623397827, 3.6996586322784424, 3.9501214027404785, 4.200584411621094, 4.451047420501709, 4.701510429382324, 4.9519734382629395, 5.202436447143555, 5.452898979187012, 5.703362464904785, 5.953824996948242, 6.204288005828857, 6.454751014709473]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 5.0, 4.0, 7.0, 9.0, 9.0, 14.0, 9.0, 15.0, 18.0, 24.0, 25.0, 27.0, 40.0, 28.0, 29.0, 32.0, 50.0, 40.0, 56.0, 47.0, 47.0, 46.0, 38.0, 40.0, 40.0, 45.0, 29.0, 37.0, 34.0, 24.0, 25.0, 18.0, 18.0, 13.0, 13.0, 10.0, 11.0, 7.0, 9.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.813549041748047, -4.668715476989746, -4.523881912231445, -4.379047870635986, -4.2342143058776855, -4.089380741119385, -3.944546937942505, -3.799713134765625, -3.654879570007324, -3.5100460052490234, -3.3652122020721436, -3.2203783988952637, -3.075544834136963, -2.930711269378662, -2.7858774662017822, -2.6410436630249023, -2.4962100982666016, -2.351376533508301, -2.206542730331421, -2.061708927154541, -1.9168753623962402, -1.77204167842865, -1.6272079944610596, -1.4823743104934692, -1.337540626525879, -1.1927069425582886, -1.0478732585906982, -0.9030395746231079, -0.7582058906555176, -0.6133722066879272, -0.4685385227203369, -0.3237048387527466, -0.17887163162231445, -0.03403794765472412, 0.11079573631286621, 0.25562942028045654, 0.4004631042480469, 0.5452967882156372, 0.6901304721832275, 0.8349641561508179, 0.9797978401184082, 1.1246315240859985, 1.2694652080535889, 1.4142988920211792, 1.5591325759887695, 1.7039662599563599, 1.8487999439239502, 1.9936336278915405, 2.138467311859131, 2.2833008766174316, 2.4281346797943115, 2.5729684829711914, 2.717802047729492, 2.862635612487793, 3.007469415664673, 3.1523032188415527, 3.2971367835998535, 3.4419703483581543, 3.586804151535034, 3.731637954711914, 3.876471519470215, 4.021305084228516, 4.166138648986816, 4.310972690582275, 4.455806255340576]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 8.0, 13.0, 19.0, 23.0, 42.0, 59.0, 88.0, 151.0, 216.0, 388.0, 632.0, 1102.0, 1817.0, 3176.0, 5523.0, 9538.0, 16531.0, 28602.0, 48671.0, 79318.0, 119164.0, 156694.0, 167841.0, 144587.0, 103323.0, 66071.0, 39855.0, 23049.0, 13260.0, 7693.0, 4528.0, 2624.0, 1533.0, 941.0, 585.0, 343.0, 197.0, 140.0, 75.0, 48.0, 34.0, 16.0, 10.0, 8.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.92578125, -5.73651123046875, -5.5472412109375, -5.35797119140625, -5.168701171875, -4.97943115234375, -4.7901611328125, -4.60089111328125, -4.41162109375, -4.22235107421875, -4.0330810546875, -3.84381103515625, -3.654541015625, -3.46527099609375, -3.2760009765625, -3.08673095703125, -2.8974609375, -2.70819091796875, -2.5189208984375, -2.32965087890625, -2.140380859375, -1.95111083984375, -1.7618408203125, -1.57257080078125, -1.38330078125, -1.19403076171875, -1.0047607421875, -0.81549072265625, -0.626220703125, -0.43695068359375, -0.2476806640625, -0.05841064453125, 0.130859375, 0.32012939453125, 0.5093994140625, 0.69866943359375, 0.887939453125, 1.07720947265625, 1.2664794921875, 1.45574951171875, 1.64501953125, 1.83428955078125, 2.0235595703125, 2.21282958984375, 2.402099609375, 2.59136962890625, 2.7806396484375, 2.96990966796875, 3.1591796875, 3.34844970703125, 3.5377197265625, 3.72698974609375, 3.916259765625, 4.10552978515625, 4.2947998046875, 4.48406982421875, 4.67333984375, 4.86260986328125, 5.0518798828125, 5.24114990234375, 5.430419921875, 5.61968994140625, 5.8089599609375, 5.99822998046875, 6.1875]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 3.0, 5.0, 8.0, 6.0, 9.0, 12.0, 13.0, 14.0, 19.0, 20.0, 26.0, 47.0, 47.0, 30.0, 41.0, 49.0, 43.0, 46.0, 37.0, 51.0, 48.0, 48.0, 39.0, 49.0, 46.0, 37.0, 38.0, 41.0, 21.0, 16.0, 10.0, 16.0, 15.0, 8.0, 12.0, 7.0, 4.0, 6.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.0390625, -5.871826171875, -5.70458984375, -5.537353515625, -5.3701171875, -5.202880859375, -5.03564453125, -4.868408203125, -4.701171875, -4.533935546875, -4.36669921875, -4.199462890625, -4.0322265625, -3.864990234375, -3.69775390625, -3.530517578125, -3.36328125, -3.196044921875, -3.02880859375, -2.861572265625, -2.6943359375, -2.527099609375, -2.35986328125, -2.192626953125, -2.025390625, -1.858154296875, -1.69091796875, -1.523681640625, -1.3564453125, -1.189208984375, -1.02197265625, -0.854736328125, -0.6875, -0.520263671875, -0.35302734375, -0.185791015625, -0.0185546875, 0.148681640625, 0.31591796875, 0.483154296875, 0.650390625, 0.817626953125, 0.98486328125, 1.152099609375, 1.3193359375, 1.486572265625, 1.65380859375, 1.821044921875, 1.98828125, 2.155517578125, 2.32275390625, 2.489990234375, 2.6572265625, 2.824462890625, 2.99169921875, 3.158935546875, 3.326171875, 3.493408203125, 3.66064453125, 3.827880859375, 3.9951171875, 4.162353515625, 4.32958984375, 4.496826171875, 4.6640625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 9.0, 7.0, 20.0, 19.0, 31.0, 59.0, 87.0, 148.0, 206.0, 308.0, 525.0, 827.0, 1272.0, 2216.0, 3550.0, 5508.0, 9165.0, 15202.0, 24330.0, 39645.0, 61824.0, 91586.0, 125363.0, 148392.0, 147086.0, 123055.0, 89135.0, 59672.0, 37857.0, 23730.0, 14406.0, 8977.0, 5401.0, 3365.0, 2047.0, 1318.0, 825.0, 484.0, 313.0, 216.0, 137.0, 95.0, 41.0, 30.0, 19.0, 16.0, 11.0, 9.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.23828125, -5.069091796875, -4.89990234375, -4.730712890625, -4.5615234375, -4.392333984375, -4.22314453125, -4.053955078125, -3.884765625, -3.715576171875, -3.54638671875, -3.377197265625, -3.2080078125, -3.038818359375, -2.86962890625, -2.700439453125, -2.53125, -2.362060546875, -2.19287109375, -2.023681640625, -1.8544921875, -1.685302734375, -1.51611328125, -1.346923828125, -1.177734375, -1.008544921875, -0.83935546875, -0.670166015625, -0.5009765625, -0.331787109375, -0.16259765625, 0.006591796875, 0.17578125, 0.344970703125, 0.51416015625, 0.683349609375, 0.8525390625, 1.021728515625, 1.19091796875, 1.360107421875, 1.529296875, 1.698486328125, 1.86767578125, 2.036865234375, 2.2060546875, 2.375244140625, 2.54443359375, 2.713623046875, 2.8828125, 3.052001953125, 3.22119140625, 3.390380859375, 3.5595703125, 3.728759765625, 3.89794921875, 4.067138671875, 4.236328125, 4.405517578125, 4.57470703125, 4.743896484375, 4.9130859375, 5.082275390625, 5.25146484375, 5.420654296875, 5.58984375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 2.0, 10.0, 7.0, 7.0, 6.0, 11.0, 10.0, 20.0, 19.0, 17.0, 31.0, 16.0, 28.0, 37.0, 33.0, 35.0, 30.0, 39.0, 18.0, 58.0, 43.0, 51.0, 46.0, 42.0, 25.0, 33.0, 45.0, 28.0, 28.0, 25.0, 26.0, 28.0, 21.0, 27.0, 11.0, 21.0, 12.0, 12.0, 14.0, 13.0, 3.0, 3.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.404296875, -2.317108154296875, -2.22991943359375, -2.142730712890625, -2.0555419921875, -1.968353271484375, -1.88116455078125, -1.793975830078125, -1.706787109375, -1.619598388671875, -1.53240966796875, -1.445220947265625, -1.3580322265625, -1.270843505859375, -1.18365478515625, -1.096466064453125, -1.00927734375, -0.922088623046875, -0.83489990234375, -0.747711181640625, -0.6605224609375, -0.573333740234375, -0.48614501953125, -0.398956298828125, -0.311767578125, -0.224578857421875, -0.13739013671875, -0.050201416015625, 0.0369873046875, 0.124176025390625, 0.21136474609375, 0.298553466796875, 0.3857421875, 0.472930908203125, 0.56011962890625, 0.647308349609375, 0.7344970703125, 0.821685791015625, 0.90887451171875, 0.996063232421875, 1.083251953125, 1.170440673828125, 1.25762939453125, 1.344818115234375, 1.4320068359375, 1.519195556640625, 1.60638427734375, 1.693572998046875, 1.78076171875, 1.867950439453125, 1.95513916015625, 2.042327880859375, 2.1295166015625, 2.216705322265625, 2.30389404296875, 2.391082763671875, 2.478271484375, 2.565460205078125, 2.65264892578125, 2.739837646484375, 2.8270263671875, 2.914215087890625, 3.00140380859375, 3.088592529296875, 3.17578125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 8.0, 11.0, 16.0, 29.0, 36.0, 46.0, 54.0, 96.0, 126.0, 159.0, 264.0, 307.0, 502.0, 831.0, 1214.0, 1787.0, 2866.0, 4474.0, 7094.0, 11728.0, 20014.0, 33681.0, 58642.0, 100761.0, 161113.0, 202817.0, 171347.0, 110476.0, 64326.0, 37089.0, 21792.0, 12988.0, 7878.0, 4964.0, 3129.0, 1977.0, 1266.0, 832.0, 578.0, 384.0, 241.0, 170.0, 141.0, 80.0, 67.0, 46.0, 31.0, 24.0, 18.0, 8.0, 9.0, 7.0, 3.0, 5.0, 1.0, 3.0, 1.0], "bins": [-3.78515625, -3.66900634765625, -3.5528564453125, -3.43670654296875, -3.320556640625, -3.20440673828125, -3.0882568359375, -2.97210693359375, -2.85595703125, -2.73980712890625, -2.6236572265625, -2.50750732421875, -2.391357421875, -2.27520751953125, -2.1590576171875, -2.04290771484375, -1.9267578125, -1.81060791015625, -1.6944580078125, -1.57830810546875, -1.462158203125, -1.34600830078125, -1.2298583984375, -1.11370849609375, -0.99755859375, -0.88140869140625, -0.7652587890625, -0.64910888671875, -0.532958984375, -0.41680908203125, -0.3006591796875, -0.18450927734375, -0.068359375, 0.04779052734375, 0.1639404296875, 0.28009033203125, 0.396240234375, 0.51239013671875, 0.6285400390625, 0.74468994140625, 0.86083984375, 0.97698974609375, 1.0931396484375, 1.20928955078125, 1.325439453125, 1.44158935546875, 1.5577392578125, 1.67388916015625, 1.7900390625, 1.90618896484375, 2.0223388671875, 2.13848876953125, 2.254638671875, 2.37078857421875, 2.4869384765625, 2.60308837890625, 2.71923828125, 2.83538818359375, 2.9515380859375, 3.06768798828125, 3.183837890625, 3.29998779296875, 3.4161376953125, 3.53228759765625, 3.6484375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 4.0, 4.0, 6.0, 1.0, 11.0, 7.0, 14.0, 21.0, 26.0, 33.0, 40.0, 40.0, 53.0, 85.0, 78.0, 93.0, 98.0, 83.0, 66.0, 51.0, 33.0, 43.0, 28.0, 18.0, 11.0, 7.0, 10.0, 13.0, 6.0, 6.0, 0.0, 5.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005068778991699219, -0.0004900619387626648, -0.0004732459783554077, -0.00045643001794815063, -0.00043961405754089355, -0.0004227980971336365, -0.0004059821367263794, -0.0003891661763191223, -0.00037235021591186523, -0.00035553425550460815, -0.0003387182950973511, -0.000321902334690094, -0.0003050863742828369, -0.00028827041387557983, -0.00027145445346832275, -0.0002546384930610657, -0.0002378225326538086, -0.00022100657224655151, -0.00020419061183929443, -0.00018737465143203735, -0.00017055869102478027, -0.0001537427306175232, -0.0001369267702102661, -0.00012011080980300903, -0.00010329484939575195, -8.647888898849487e-05, -6.966292858123779e-05, -5.284696817398071e-05, -3.603100776672363e-05, -1.9215047359466553e-05, -2.3990869522094727e-06, 1.4416873455047607e-05, 3.123283386230469e-05, 4.804879426956177e-05, 6.486475467681885e-05, 8.168071508407593e-05, 9.849667549133301e-05, 0.00011531263589859009, 0.00013212859630584717, 0.00014894455671310425, 0.00016576051712036133, 0.0001825764775276184, 0.0001993924379348755, 0.00021620839834213257, 0.00023302435874938965, 0.00024984031915664673, 0.0002666562795639038, 0.0002834722399711609, 0.00030028820037841797, 0.00031710416078567505, 0.00033392012119293213, 0.0003507360816001892, 0.0003675520420074463, 0.00038436800241470337, 0.00040118396282196045, 0.00041799992322921753, 0.0004348158836364746, 0.0004516318440437317, 0.00046844780445098877, 0.00048526376485824585, 0.0005020797252655029, 0.00051889568567276, 0.0005357116460800171, 0.0005525276064872742, 0.0005693435668945312]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 6.0, 13.0, 24.0, 27.0, 44.0, 69.0, 87.0, 129.0, 184.0, 276.0, 417.0, 609.0, 866.0, 1274.0, 2065.0, 3136.0, 4814.0, 7663.0, 11909.0, 18932.0, 30810.0, 49512.0, 78120.0, 117995.0, 156701.0, 166455.0, 136771.0, 95694.0, 61203.0, 38085.0, 23580.0, 14794.0, 9219.0, 5823.0, 3700.0, 2502.0, 1580.0, 1103.0, 781.0, 479.0, 315.0, 245.0, 175.0, 101.0, 80.0, 56.0, 41.0, 23.0, 22.0, 15.0, 14.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.765625, -2.6798095703125, -2.593994140625, -2.5081787109375, -2.42236328125, -2.3365478515625, -2.250732421875, -2.1649169921875, -2.0791015625, -1.9932861328125, -1.907470703125, -1.8216552734375, -1.73583984375, -1.6500244140625, -1.564208984375, -1.4783935546875, -1.392578125, -1.3067626953125, -1.220947265625, -1.1351318359375, -1.04931640625, -0.9635009765625, -0.877685546875, -0.7918701171875, -0.7060546875, -0.6202392578125, -0.534423828125, -0.4486083984375, -0.36279296875, -0.2769775390625, -0.191162109375, -0.1053466796875, -0.01953125, 0.0662841796875, 0.152099609375, 0.2379150390625, 0.32373046875, 0.4095458984375, 0.495361328125, 0.5811767578125, 0.6669921875, 0.7528076171875, 0.838623046875, 0.9244384765625, 1.01025390625, 1.0960693359375, 1.181884765625, 1.2677001953125, 1.353515625, 1.4393310546875, 1.525146484375, 1.6109619140625, 1.69677734375, 1.7825927734375, 1.868408203125, 1.9542236328125, 2.0400390625, 2.1258544921875, 2.211669921875, 2.2974853515625, 2.38330078125, 2.4691162109375, 2.554931640625, 2.6407470703125, 2.7265625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 2.0, 4.0, 12.0, 13.0, 14.0, 10.0, 14.0, 16.0, 21.0, 21.0, 25.0, 32.0, 32.0, 21.0, 51.0, 59.0, 61.0, 54.0, 57.0, 56.0, 47.0, 50.0, 51.0, 49.0, 38.0, 32.0, 21.0, 18.0, 13.0, 21.0, 18.0, 14.0, 10.0, 10.0, 7.0, 5.0, 4.0, 6.0, 2.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.98486328125, -0.956817626953125, -0.92877197265625, -0.900726318359375, -0.8726806640625, -0.844635009765625, -0.81658935546875, -0.788543701171875, -0.760498046875, -0.732452392578125, -0.70440673828125, -0.676361083984375, -0.6483154296875, -0.620269775390625, -0.59222412109375, -0.564178466796875, -0.5361328125, -0.508087158203125, -0.48004150390625, -0.451995849609375, -0.4239501953125, -0.395904541015625, -0.36785888671875, -0.339813232421875, -0.311767578125, -0.283721923828125, -0.25567626953125, -0.227630615234375, -0.1995849609375, -0.171539306640625, -0.14349365234375, -0.115447998046875, -0.08740234375, -0.059356689453125, -0.03131103515625, -0.003265380859375, 0.0247802734375, 0.052825927734375, 0.08087158203125, 0.108917236328125, 0.136962890625, 0.165008544921875, 0.19305419921875, 0.221099853515625, 0.2491455078125, 0.277191162109375, 0.30523681640625, 0.333282470703125, 0.361328125, 0.389373779296875, 0.41741943359375, 0.445465087890625, 0.4735107421875, 0.501556396484375, 0.52960205078125, 0.557647705078125, 0.585693359375, 0.613739013671875, 0.64178466796875, 0.669830322265625, 0.6978759765625, 0.725921630859375, 0.75396728515625, 0.782012939453125, 0.81005859375]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 1.0, 6.0, 5.0, 8.0, 14.0, 11.0, 25.0, 17.0, 32.0, 28.0, 42.0, 42.0, 76.0, 69.0, 66.0, 78.0, 68.0, 65.0, 73.0, 50.0, 41.0, 43.0, 27.0, 28.0, 15.0, 16.0, 16.0, 10.0, 12.0, 7.0, 5.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.663951873779297, -9.392720222473145, -9.121489524841309, -8.850257873535156, -8.57902717590332, -8.307795524597168, -8.036564826965332, -7.76533317565918, -7.4941020011901855, -7.222870826721191, -6.951639652252197, -6.680408477783203, -6.409176826477051, -6.137946128845215, -5.8667144775390625, -5.595483303070068, -5.324252128601074, -5.05302095413208, -4.781789779663086, -4.510558605194092, -4.239327430725098, -3.9680960178375244, -3.696864604949951, -3.425633430480957, -3.154402256011963, -2.8831710815429688, -2.6119399070739746, -2.3407084941864014, -2.0694773197174072, -1.798246145248413, -1.5270148515701294, -1.2557835578918457, -0.9845523834228516, -0.7133211493492126, -0.44208991527557373, -0.17085868120193481, 0.1003725528717041, 0.37160372734069824, 0.6428350210189819, 0.9140663146972656, 1.1852974891662598, 1.456528663635254, 1.7277599573135376, 1.9989912509918213, 2.2702224254608154, 2.5414535999298096, 2.812685012817383, 3.083916187286377, 3.355147361755371, 3.6263785362243652, 3.8976097106933594, 4.1688408851623535, 4.440072059631348, 4.7113037109375, 4.982534885406494, 5.253766059875488, 5.524997234344482, 5.796228408813477, 6.067459583282471, 6.338690757751465, 6.609922409057617, 6.881153106689453, 7.1523847579956055, 7.4236159324646, 7.694847106933594]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 4.0, 4.0, 6.0, 9.0, 7.0, 9.0, 11.0, 13.0, 14.0, 20.0, 16.0, 28.0, 28.0, 19.0, 29.0, 25.0, 29.0, 24.0, 46.0, 33.0, 33.0, 47.0, 53.0, 48.0, 34.0, 43.0, 48.0, 37.0, 37.0, 44.0, 20.0, 30.0, 30.0, 22.0, 13.0, 19.0, 8.0, 13.0, 11.0, 5.0, 5.0, 8.0, 3.0, 2.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.654512405395508, -4.511689186096191, -4.368866443634033, -4.226043701171875, -4.083220481872559, -3.9403975009918213, -3.797574520111084, -3.6547515392303467, -3.5119285583496094, -3.369105577468872, -3.2262825965881348, -3.0834596157073975, -2.94063663482666, -2.797813653945923, -2.6549906730651855, -2.5121676921844482, -2.369344711303711, -2.2265217304229736, -2.0836987495422363, -1.940875768661499, -1.7980527877807617, -1.6552298069000244, -1.512406826019287, -1.3695838451385498, -1.2267608642578125, -1.0839378833770752, -0.9411149024963379, -0.7982919216156006, -0.6554689407348633, -0.512645959854126, -0.36982297897338867, -0.22699999809265137, -0.08417701721191406, 0.05864596366882324, 0.20146894454956055, 0.34429192543029785, 0.48711490631103516, 0.6299378871917725, 0.7727608680725098, 0.9155838489532471, 1.0584068298339844, 1.2012298107147217, 1.344052791595459, 1.4868757724761963, 1.6296987533569336, 1.772521734237671, 1.9153447151184082, 2.0581676959991455, 2.200990676879883, 2.34381365776062, 2.4866366386413574, 2.6294596195220947, 2.772282600402832, 2.9151055812835693, 3.0579285621643066, 3.200751543045044, 3.3435745239257812, 3.4863975048065186, 3.629220485687256, 3.772043466567993, 3.9148664474487305, 4.057689666748047, 4.200512409210205, 4.343335151672363, 4.48615837097168]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 4.0, 3.0, 13.0, 14.0, 14.0, 13.0, 25.0, 23.0, 44.0, 69.0, 103.0, 145.0, 241.0, 360.0, 555.0, 869.0, 1363.0, 2071.0, 3452.0, 6011.0, 10622.0, 19694.0, 38070.0, 80232.0, 181578.0, 438830.0, 983108.0, 1217101.0, 691316.0, 283790.0, 119806.0, 54357.0, 27003.0, 13981.0, 7842.0, 4333.0, 2708.0, 1544.0, 1049.0, 667.0, 435.0, 287.0, 188.0, 118.0, 74.0, 59.0, 37.0, 30.0, 15.0, 10.0, 7.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-8.5078125, -8.2664794921875, -8.025146484375, -7.7838134765625, -7.54248046875, -7.3011474609375, -7.059814453125, -6.8184814453125, -6.5771484375, -6.3358154296875, -6.094482421875, -5.8531494140625, -5.61181640625, -5.3704833984375, -5.129150390625, -4.8878173828125, -4.646484375, -4.4051513671875, -4.163818359375, -3.9224853515625, -3.68115234375, -3.4398193359375, -3.198486328125, -2.9571533203125, -2.7158203125, -2.4744873046875, -2.233154296875, -1.9918212890625, -1.75048828125, -1.5091552734375, -1.267822265625, -1.0264892578125, -0.78515625, -0.5438232421875, -0.302490234375, -0.0611572265625, 0.18017578125, 0.4215087890625, 0.662841796875, 0.9041748046875, 1.1455078125, 1.3868408203125, 1.628173828125, 1.8695068359375, 2.11083984375, 2.3521728515625, 2.593505859375, 2.8348388671875, 3.076171875, 3.3175048828125, 3.558837890625, 3.8001708984375, 4.04150390625, 4.2828369140625, 4.524169921875, 4.7655029296875, 5.0068359375, 5.2481689453125, 5.489501953125, 5.7308349609375, 5.97216796875, 6.2135009765625, 6.454833984375, 6.6961669921875, 6.9375]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 3.0, 3.0, 9.0, 6.0, 9.0, 12.0, 14.0, 12.0, 9.0, 21.0, 25.0, 20.0, 30.0, 23.0, 33.0, 38.0, 28.0, 42.0, 38.0, 46.0, 40.0, 37.0, 47.0, 45.0, 41.0, 49.0, 41.0, 41.0, 32.0, 34.0, 32.0, 19.0, 22.0, 20.0, 16.0, 17.0, 7.0, 7.0, 9.0, 5.0, 4.0, 3.0, 2.0, 2.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.859375, -3.742156982421875, -3.62493896484375, -3.507720947265625, -3.3905029296875, -3.273284912109375, -3.15606689453125, -3.038848876953125, -2.921630859375, -2.804412841796875, -2.68719482421875, -2.569976806640625, -2.4527587890625, -2.335540771484375, -2.21832275390625, -2.101104736328125, -1.98388671875, -1.866668701171875, -1.74945068359375, -1.632232666015625, -1.5150146484375, -1.397796630859375, -1.28057861328125, -1.163360595703125, -1.046142578125, -0.928924560546875, -0.81170654296875, -0.694488525390625, -0.5772705078125, -0.460052490234375, -0.34283447265625, -0.225616455078125, -0.1083984375, 0.008819580078125, 0.12603759765625, 0.243255615234375, 0.3604736328125, 0.477691650390625, 0.59490966796875, 0.712127685546875, 0.829345703125, 0.946563720703125, 1.06378173828125, 1.180999755859375, 1.2982177734375, 1.415435791015625, 1.53265380859375, 1.649871826171875, 1.76708984375, 1.884307861328125, 2.00152587890625, 2.118743896484375, 2.2359619140625, 2.353179931640625, 2.47039794921875, 2.587615966796875, 2.704833984375, 2.822052001953125, 2.93927001953125, 3.056488037109375, 3.1737060546875, 3.290924072265625, 3.40814208984375, 3.525360107421875, 3.642578125]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 5.0, 6.0, 10.0, 12.0, 18.0, 33.0, 50.0, 53.0, 86.0, 136.0, 176.0, 321.0, 443.0, 712.0, 1053.0, 1654.0, 2668.0, 4565.0, 7420.0, 12637.0, 22416.0, 40549.0, 74570.0, 142518.0, 280222.0, 551928.0, 940688.0, 945837.0, 560994.0, 285820.0, 145229.0, 75427.0, 40962.0, 22483.0, 12798.0, 7743.0, 4575.0, 2733.0, 1712.0, 1074.0, 668.0, 443.0, 278.0, 163.0, 135.0, 89.0, 64.0, 32.0, 35.0, 16.0, 17.0, 2.0, 6.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.8984375, -6.6685791015625, -6.438720703125, -6.2088623046875, -5.97900390625, -5.7491455078125, -5.519287109375, -5.2894287109375, -5.0595703125, -4.8297119140625, -4.599853515625, -4.3699951171875, -4.14013671875, -3.9102783203125, -3.680419921875, -3.4505615234375, -3.220703125, -2.9908447265625, -2.760986328125, -2.5311279296875, -2.30126953125, -2.0714111328125, -1.841552734375, -1.6116943359375, -1.3818359375, -1.1519775390625, -0.922119140625, -0.6922607421875, -0.46240234375, -0.2325439453125, -0.002685546875, 0.2271728515625, 0.45703125, 0.6868896484375, 0.916748046875, 1.1466064453125, 1.37646484375, 1.6063232421875, 1.836181640625, 2.0660400390625, 2.2958984375, 2.5257568359375, 2.755615234375, 2.9854736328125, 3.21533203125, 3.4451904296875, 3.675048828125, 3.9049072265625, 4.134765625, 4.3646240234375, 4.594482421875, 4.8243408203125, 5.05419921875, 5.2840576171875, 5.513916015625, 5.7437744140625, 5.9736328125, 6.2034912109375, 6.433349609375, 6.6632080078125, 6.89306640625, 7.1229248046875, 7.352783203125, 7.5826416015625, 7.8125]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 3.0, 6.0, 4.0, 6.0, 10.0, 12.0, 10.0, 13.0, 13.0, 32.0, 29.0, 36.0, 53.0, 68.0, 86.0, 101.0, 125.0, 160.0, 190.0, 247.0, 252.0, 272.0, 315.0, 312.0, 300.0, 255.0, 216.0, 232.0, 165.0, 114.0, 102.0, 92.0, 61.0, 46.0, 30.0, 26.0, 21.0, 17.0, 16.0, 11.0, 8.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.728515625, -2.654571533203125, -2.58062744140625, -2.506683349609375, -2.4327392578125, -2.358795166015625, -2.28485107421875, -2.210906982421875, -2.136962890625, -2.063018798828125, -1.98907470703125, -1.915130615234375, -1.8411865234375, -1.767242431640625, -1.69329833984375, -1.619354248046875, -1.54541015625, -1.471466064453125, -1.39752197265625, -1.323577880859375, -1.2496337890625, -1.175689697265625, -1.10174560546875, -1.027801513671875, -0.953857421875, -0.879913330078125, -0.80596923828125, -0.732025146484375, -0.6580810546875, -0.584136962890625, -0.51019287109375, -0.436248779296875, -0.3623046875, -0.288360595703125, -0.21441650390625, -0.140472412109375, -0.0665283203125, 0.007415771484375, 0.08135986328125, 0.155303955078125, 0.229248046875, 0.303192138671875, 0.37713623046875, 0.451080322265625, 0.5250244140625, 0.598968505859375, 0.67291259765625, 0.746856689453125, 0.82080078125, 0.894744873046875, 0.96868896484375, 1.042633056640625, 1.1165771484375, 1.190521240234375, 1.26446533203125, 1.338409423828125, 1.412353515625, 1.486297607421875, 1.56024169921875, 1.634185791015625, 1.7081298828125, 1.782073974609375, 1.85601806640625, 1.929962158203125, 2.00390625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 3.0, 9.0, 9.0, 10.0, 9.0, 17.0, 18.0, 17.0, 30.0, 30.0, 36.0, 38.0, 49.0, 67.0, 63.0, 66.0, 56.0, 68.0, 62.0, 58.0, 46.0, 40.0, 37.0, 41.0, 22.0, 22.0, 17.0, 13.0, 15.0, 12.0, 6.0, 5.0, 1.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.27569580078125, -8.019668579101562, -7.763640880584717, -7.507613182067871, -7.251585960388184, -6.995558261871338, -6.739530563354492, -6.483503341674805, -6.227475643157959, -5.971447944641113, -5.715420722961426, -5.45939302444458, -5.203365325927734, -4.947338104248047, -4.691310405731201, -4.4352827072143555, -4.179255485534668, -3.9232280254364014, -3.6672005653381348, -3.411172866821289, -3.1551454067230225, -2.899117946624756, -2.64309024810791, -2.3870627880096436, -2.131035327911377, -1.8750078678131104, -1.6189802885055542, -1.362952709197998, -1.1069252490997314, -0.8508977890014648, -0.5948702096939087, -0.33884263038635254, -0.08281517028808594, 0.17321234941482544, 0.4292398691177368, 0.6852673888206482, 0.9412949085235596, 1.1973223686218262, 1.4533499479293823, 1.7093775272369385, 1.965404987335205, 2.2214324474334717, 2.4774599075317383, 2.733487606048584, 2.9895150661468506, 3.245542526245117, 3.501570224761963, 3.7575976848602295, 4.013625144958496, 4.269652843475342, 4.525680065155029, 4.781707763671875, 5.0377349853515625, 5.293762683868408, 5.549790382385254, 5.805817604064941, 6.061845302581787, 6.317873001098633, 6.57390022277832, 6.829927921295166, 7.085955619812012, 7.341982841491699, 7.598010540008545, 7.854038238525391, 8.110065460205078]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 4.0, 1.0, 11.0, 8.0, 6.0, 8.0, 22.0, 15.0, 13.0, 25.0, 23.0, 27.0, 32.0, 30.0, 32.0, 28.0, 35.0, 48.0, 35.0, 41.0, 40.0, 51.0, 53.0, 45.0, 48.0, 36.0, 34.0, 33.0, 28.0, 36.0, 26.0, 18.0, 19.0, 13.0, 15.0, 12.0, 11.0, 12.0, 5.0, 5.0, 10.0, 6.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.571853160858154, -4.4191575050354, -4.266462326049805, -4.113766670227051, -3.961071252822876, -3.808375835418701, -3.6556801795959473, -3.5029847621917725, -3.3502893447875977, -3.197593927383423, -3.044898509979248, -2.892202854156494, -2.7395074367523193, -2.5868120193481445, -2.4341163635253906, -2.281420946121216, -2.128725528717041, -1.9760301113128662, -1.8233345746994019, -1.6706390380859375, -1.5179436206817627, -1.365248203277588, -1.2125526666641235, -1.0598571300506592, -0.9071617126464844, -0.7544662356376648, -0.6017707586288452, -0.44907528162002563, -0.29637980461120605, -0.14368432760238647, 0.009011149406433105, 0.16170668601989746, 0.31440258026123047, 0.46709805727005005, 0.6197935342788696, 0.7724890112876892, 0.9251844882965088, 1.0778799057006836, 1.230575442314148, 1.3832709789276123, 1.535966396331787, 1.688661813735962, 1.8413573503494263, 1.9940528869628906, 2.1467483043670654, 2.2994437217712402, 2.452139377593994, 2.604834794998169, 2.7575302124023438, 2.9102256298065186, 3.0629210472106934, 3.2156167030334473, 3.368312120437622, 3.521007537841797, 3.673703193664551, 3.8263986110687256, 3.9790940284729004, 4.131789684295654, 4.28448486328125, 4.437180519104004, 4.589876174926758, 4.7425713539123535, 4.895267009735107, 5.047962188720703, 5.200657844543457]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 9.0, 13.0, 15.0, 22.0, 40.0, 49.0, 58.0, 92.0, 167.0, 270.0, 420.0, 628.0, 957.0, 1567.0, 2494.0, 3882.0, 6499.0, 11057.0, 18145.0, 30641.0, 51060.0, 81917.0, 123701.0, 161614.0, 167993.0, 138177.0, 95608.0, 60284.0, 36460.0, 21583.0, 13006.0, 7619.0, 4753.0, 2874.0, 1745.0, 1089.0, 679.0, 450.0, 306.0, 195.0, 125.0, 103.0, 59.0, 54.0, 21.0, 21.0, 14.0, 8.0, 6.0, 2.0, 4.0, 2.0, 3.0], "bins": [-3.705078125, -3.5997314453125, -3.494384765625, -3.3890380859375, -3.28369140625, -3.1783447265625, -3.072998046875, -2.9676513671875, -2.8623046875, -2.7569580078125, -2.651611328125, -2.5462646484375, -2.44091796875, -2.3355712890625, -2.230224609375, -2.1248779296875, -2.01953125, -1.9141845703125, -1.808837890625, -1.7034912109375, -1.59814453125, -1.4927978515625, -1.387451171875, -1.2821044921875, -1.1767578125, -1.0714111328125, -0.966064453125, -0.8607177734375, -0.75537109375, -0.6500244140625, -0.544677734375, -0.4393310546875, -0.333984375, -0.2286376953125, -0.123291015625, -0.0179443359375, 0.08740234375, 0.1927490234375, 0.298095703125, 0.4034423828125, 0.5087890625, 0.6141357421875, 0.719482421875, 0.8248291015625, 0.93017578125, 1.0355224609375, 1.140869140625, 1.2462158203125, 1.3515625, 1.4569091796875, 1.562255859375, 1.6676025390625, 1.77294921875, 1.8782958984375, 1.983642578125, 2.0889892578125, 2.1943359375, 2.2996826171875, 2.405029296875, 2.5103759765625, 2.61572265625, 2.7210693359375, 2.826416015625, 2.9317626953125, 3.037109375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 4.0, 7.0, 8.0, 11.0, 10.0, 14.0, 14.0, 22.0, 20.0, 24.0, 30.0, 35.0, 30.0, 37.0, 45.0, 43.0, 42.0, 49.0, 49.0, 39.0, 40.0, 48.0, 47.0, 45.0, 42.0, 21.0, 33.0, 28.0, 30.0, 26.0, 24.0, 24.0, 9.0, 15.0, 6.0, 9.0, 9.0, 2.0, 5.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8828125, -4.7054443359375, -4.528076171875, -4.3507080078125, -4.17333984375, -3.9959716796875, -3.818603515625, -3.6412353515625, -3.4638671875, -3.2864990234375, -3.109130859375, -2.9317626953125, -2.75439453125, -2.5770263671875, -2.399658203125, -2.2222900390625, -2.044921875, -1.8675537109375, -1.690185546875, -1.5128173828125, -1.33544921875, -1.1580810546875, -0.980712890625, -0.8033447265625, -0.6259765625, -0.4486083984375, -0.271240234375, -0.0938720703125, 0.08349609375, 0.2608642578125, 0.438232421875, 0.6156005859375, 0.79296875, 0.9703369140625, 1.147705078125, 1.3250732421875, 1.50244140625, 1.6798095703125, 1.857177734375, 2.0345458984375, 2.2119140625, 2.3892822265625, 2.566650390625, 2.7440185546875, 2.92138671875, 3.0987548828125, 3.276123046875, 3.4534912109375, 3.630859375, 3.8082275390625, 3.985595703125, 4.1629638671875, 4.34033203125, 4.5177001953125, 4.695068359375, 4.8724365234375, 5.0498046875, 5.2271728515625, 5.404541015625, 5.5819091796875, 5.75927734375, 5.9366455078125, 6.114013671875, 6.2913818359375, 6.46875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 9.0, 13.0, 22.0, 20.0, 48.0, 53.0, 102.0, 121.0, 209.0, 307.0, 413.0, 652.0, 966.0, 1525.0, 2410.0, 3514.0, 5595.0, 9024.0, 14958.0, 24534.0, 40937.0, 67142.0, 110060.0, 165226.0, 191959.0, 153053.0, 99883.0, 61102.0, 36244.0, 21931.0, 13478.0, 8269.0, 5239.0, 3367.0, 2083.0, 1398.0, 894.0, 617.0, 390.0, 277.0, 164.0, 109.0, 87.0, 52.0, 37.0, 23.0, 20.0, 11.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.97265625, -3.85369873046875, -3.7347412109375, -3.61578369140625, -3.496826171875, -3.37786865234375, -3.2589111328125, -3.13995361328125, -3.02099609375, -2.90203857421875, -2.7830810546875, -2.66412353515625, -2.545166015625, -2.42620849609375, -2.3072509765625, -2.18829345703125, -2.0693359375, -1.95037841796875, -1.8314208984375, -1.71246337890625, -1.593505859375, -1.47454833984375, -1.3555908203125, -1.23663330078125, -1.11767578125, -0.99871826171875, -0.8797607421875, -0.76080322265625, -0.641845703125, -0.52288818359375, -0.4039306640625, -0.28497314453125, -0.166015625, -0.04705810546875, 0.0718994140625, 0.19085693359375, 0.309814453125, 0.42877197265625, 0.5477294921875, 0.66668701171875, 0.78564453125, 0.90460205078125, 1.0235595703125, 1.14251708984375, 1.261474609375, 1.38043212890625, 1.4993896484375, 1.61834716796875, 1.7373046875, 1.85626220703125, 1.9752197265625, 2.09417724609375, 2.213134765625, 2.33209228515625, 2.4510498046875, 2.57000732421875, 2.68896484375, 2.80792236328125, 2.9268798828125, 3.04583740234375, 3.164794921875, 3.28375244140625, 3.4027099609375, 3.52166748046875, 3.640625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 9.0, 6.0, 19.0, 9.0, 10.0, 17.0, 8.0, 18.0, 34.0, 28.0, 38.0, 30.0, 46.0, 39.0, 41.0, 44.0, 42.0, 47.0, 36.0, 45.0, 54.0, 38.0, 55.0, 31.0, 40.0, 32.0, 28.0, 29.0, 24.0, 16.0, 15.0, 12.0, 8.0, 10.0, 9.0, 14.0, 1.0, 8.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.068359375, -2.96612548828125, -2.8638916015625, -2.76165771484375, -2.659423828125, -2.55718994140625, -2.4549560546875, -2.35272216796875, -2.25048828125, -2.14825439453125, -2.0460205078125, -1.94378662109375, -1.841552734375, -1.73931884765625, -1.6370849609375, -1.53485107421875, -1.4326171875, -1.33038330078125, -1.2281494140625, -1.12591552734375, -1.023681640625, -0.92144775390625, -0.8192138671875, -0.71697998046875, -0.61474609375, -0.51251220703125, -0.4102783203125, -0.30804443359375, -0.205810546875, -0.10357666015625, -0.0013427734375, 0.10089111328125, 0.203125, 0.30535888671875, 0.4075927734375, 0.50982666015625, 0.612060546875, 0.71429443359375, 0.8165283203125, 0.91876220703125, 1.02099609375, 1.12322998046875, 1.2254638671875, 1.32769775390625, 1.429931640625, 1.53216552734375, 1.6343994140625, 1.73663330078125, 1.8388671875, 1.94110107421875, 2.0433349609375, 2.14556884765625, 2.247802734375, 2.35003662109375, 2.4522705078125, 2.55450439453125, 2.65673828125, 2.75897216796875, 2.8612060546875, 2.96343994140625, 3.065673828125, 3.16790771484375, 3.2701416015625, 3.37237548828125, 3.474609375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 5.0, 3.0, 10.0, 12.0, 16.0, 23.0, 24.0, 43.0, 55.0, 93.0, 146.0, 184.0, 298.0, 490.0, 729.0, 1107.0, 1737.0, 2975.0, 5097.0, 9182.0, 17139.0, 33595.0, 67557.0, 135720.0, 238815.0, 245294.0, 141273.0, 71002.0, 35255.0, 18033.0, 9504.0, 5172.0, 3009.0, 1806.0, 1072.0, 697.0, 472.0, 335.0, 180.0, 128.0, 74.0, 63.0, 46.0, 32.0, 17.0, 14.0, 8.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.27734375, -2.19610595703125, -2.1148681640625, -2.03363037109375, -1.952392578125, -1.87115478515625, -1.7899169921875, -1.70867919921875, -1.62744140625, -1.54620361328125, -1.4649658203125, -1.38372802734375, -1.302490234375, -1.22125244140625, -1.1400146484375, -1.05877685546875, -0.9775390625, -0.89630126953125, -0.8150634765625, -0.73382568359375, -0.652587890625, -0.57135009765625, -0.4901123046875, -0.40887451171875, -0.32763671875, -0.24639892578125, -0.1651611328125, -0.08392333984375, -0.002685546875, 0.07855224609375, 0.1597900390625, 0.24102783203125, 0.322265625, 0.40350341796875, 0.4847412109375, 0.56597900390625, 0.647216796875, 0.72845458984375, 0.8096923828125, 0.89093017578125, 0.97216796875, 1.05340576171875, 1.1346435546875, 1.21588134765625, 1.297119140625, 1.37835693359375, 1.4595947265625, 1.54083251953125, 1.6220703125, 1.70330810546875, 1.7845458984375, 1.86578369140625, 1.947021484375, 2.02825927734375, 2.1094970703125, 2.19073486328125, 2.27197265625, 2.35321044921875, 2.4344482421875, 2.51568603515625, 2.596923828125, 2.67816162109375, 2.7593994140625, 2.84063720703125, 2.921875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 5.0, 10.0, 12.0, 12.0, 11.0, 26.0, 28.0, 22.0, 39.0, 55.0, 63.0, 74.0, 74.0, 75.0, 75.0, 58.0, 50.0, 55.0, 47.0, 34.0, 32.0, 34.0, 24.0, 16.0, 12.0, 11.0, 8.0, 12.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013267993927001953, -0.00012789294123649597, -0.0001231059432029724, -0.00011831894516944885, -0.00011353194713592529, -0.00010874494910240173, -0.00010395795106887817, -9.917095303535461e-05, -9.438395500183105e-05, -8.95969569683075e-05, -8.480995893478394e-05, -8.002296090126038e-05, -7.523596286773682e-05, -7.044896483421326e-05, -6.56619668006897e-05, -6.087496876716614e-05, -5.608797073364258e-05, -5.130097270011902e-05, -4.651397466659546e-05, -4.17269766330719e-05, -3.693997859954834e-05, -3.215298056602478e-05, -2.736598253250122e-05, -2.257898449897766e-05, -1.77919864654541e-05, -1.3004988431930542e-05, -8.217990398406982e-06, -3.430992364883423e-06, 1.3560056686401367e-06, 6.143003702163696e-06, 1.0930001735687256e-05, 1.5716999769210815e-05, 2.0503997802734375e-05, 2.5290995836257935e-05, 3.0077993869781494e-05, 3.4864991903305054e-05, 3.965198993682861e-05, 4.443898797035217e-05, 4.922598600387573e-05, 5.401298403739929e-05, 5.879998207092285e-05, 6.358698010444641e-05, 6.837397813796997e-05, 7.316097617149353e-05, 7.794797420501709e-05, 8.273497223854065e-05, 8.752197027206421e-05, 9.230896830558777e-05, 9.709596633911133e-05, 0.00010188296437263489, 0.00010666996240615845, 0.00011145696043968201, 0.00011624395847320557, 0.00012103095650672913, 0.00012581795454025269, 0.00013060495257377625, 0.0001353919506072998, 0.00014017894864082336, 0.00014496594667434692, 0.00014975294470787048, 0.00015453994274139404, 0.0001593269407749176, 0.00016411393880844116, 0.00016890093684196472, 0.00017368793487548828]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 2.0, 7.0, 10.0, 17.0, 12.0, 29.0, 36.0, 42.0, 64.0, 93.0, 144.0, 168.0, 276.0, 383.0, 549.0, 853.0, 1226.0, 1873.0, 2643.0, 4191.0, 6610.0, 10626.0, 17140.0, 27704.0, 44665.0, 70140.0, 104546.0, 138210.0, 155042.0, 142816.0, 111204.0, 76369.0, 49083.0, 30480.0, 18779.0, 11618.0, 7274.0, 4494.0, 2913.0, 2002.0, 1335.0, 842.0, 592.0, 449.0, 303.0, 218.0, 149.0, 121.0, 71.0, 44.0, 31.0, 18.0, 16.0, 13.0, 9.0, 9.0, 6.0, 2.0, 1.0, 1.0, 4.0], "bins": [-1.6044921875, -1.5537109375, -1.5029296875, -1.4521484375, -1.4013671875, -1.3505859375, -1.2998046875, -1.2490234375, -1.1982421875, -1.1474609375, -1.0966796875, -1.0458984375, -0.9951171875, -0.9443359375, -0.8935546875, -0.8427734375, -0.7919921875, -0.7412109375, -0.6904296875, -0.6396484375, -0.5888671875, -0.5380859375, -0.4873046875, -0.4365234375, -0.3857421875, -0.3349609375, -0.2841796875, -0.2333984375, -0.1826171875, -0.1318359375, -0.0810546875, -0.0302734375, 0.0205078125, 0.0712890625, 0.1220703125, 0.1728515625, 0.2236328125, 0.2744140625, 0.3251953125, 0.3759765625, 0.4267578125, 0.4775390625, 0.5283203125, 0.5791015625, 0.6298828125, 0.6806640625, 0.7314453125, 0.7822265625, 0.8330078125, 0.8837890625, 0.9345703125, 0.9853515625, 1.0361328125, 1.0869140625, 1.1376953125, 1.1884765625, 1.2392578125, 1.2900390625, 1.3408203125, 1.3916015625, 1.4423828125, 1.4931640625, 1.5439453125, 1.5947265625, 1.6455078125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 6.0, 7.0, 7.0, 5.0, 10.0, 15.0, 21.0, 27.0, 27.0, 42.0, 47.0, 48.0, 59.0, 52.0, 78.0, 75.0, 84.0, 51.0, 65.0, 58.0, 54.0, 29.0, 31.0, 27.0, 23.0, 15.0, 11.0, 10.0, 8.0, 3.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.76025390625, -0.7388153076171875, -0.717376708984375, -0.6959381103515625, -0.67449951171875, -0.6530609130859375, -0.631622314453125, -0.6101837158203125, -0.5887451171875, -0.5673065185546875, -0.545867919921875, -0.5244293212890625, -0.50299072265625, -0.4815521240234375, -0.460113525390625, -0.4386749267578125, -0.417236328125, -0.3957977294921875, -0.374359130859375, -0.3529205322265625, -0.33148193359375, -0.3100433349609375, -0.288604736328125, -0.2671661376953125, -0.2457275390625, -0.2242889404296875, -0.202850341796875, -0.1814117431640625, -0.15997314453125, -0.1385345458984375, -0.117095947265625, -0.0956573486328125, -0.07421875, -0.0527801513671875, -0.031341552734375, -0.0099029541015625, 0.01153564453125, 0.0329742431640625, 0.054412841796875, 0.0758514404296875, 0.0972900390625, 0.1187286376953125, 0.140167236328125, 0.1616058349609375, 0.18304443359375, 0.2044830322265625, 0.225921630859375, 0.2473602294921875, 0.268798828125, 0.2902374267578125, 0.311676025390625, 0.3331146240234375, 0.35455322265625, 0.3759918212890625, 0.397430419921875, 0.4188690185546875, 0.4403076171875, 0.4617462158203125, 0.483184814453125, 0.5046234130859375, 0.52606201171875, 0.5475006103515625, 0.568939208984375, 0.5903778076171875, 0.61181640625]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 7.0, 6.0, 8.0, 9.0, 8.0, 23.0, 9.0, 21.0, 22.0, 26.0, 33.0, 41.0, 55.0, 53.0, 61.0, 54.0, 73.0, 61.0, 68.0, 66.0, 53.0, 46.0, 29.0, 31.0, 33.0, 21.0, 25.0, 11.0, 14.0, 10.0, 10.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.051548957824707, -7.797083854675293, -7.542618751525879, -7.288154125213623, -7.033689022064209, -6.779223918914795, -6.524759292602539, -6.270294189453125, -6.015829086303711, -5.761363983154297, -5.506898880004883, -5.252434253692627, -4.997969150543213, -4.743504047393799, -4.489039421081543, -4.234574317932129, -3.980109214782715, -3.725644111633301, -3.471179246902466, -3.216714382171631, -2.962249279022217, -2.7077841758728027, -2.4533193111419678, -2.198854446411133, -1.9443893432617188, -1.6899243593215942, -1.4354593753814697, -1.1809943914413452, -0.9265294075012207, -0.6720644235610962, -0.4175994396209717, -0.16313445568084717, 0.09133052825927734, 0.34579551219940186, 0.6002604961395264, 0.8547254800796509, 1.1091904640197754, 1.3636554479599, 1.6181204319000244, 1.872585415840149, 2.1270503997802734, 2.3815155029296875, 2.6359803676605225, 2.8904452323913574, 3.1449103355407715, 3.3993754386901855, 3.6538403034210205, 3.9083051681518555, 4.1627702713012695, 4.417235374450684, 4.671700477600098, 4.9261651039123535, 5.180630207061768, 5.435095310211182, 5.6895599365234375, 5.944025039672852, 6.198490142822266, 6.45295524597168, 6.707420349121094, 6.96188497543335, 7.216350078582764, 7.470815181732178, 7.725279808044434, 7.979744911193848, 8.234210014343262]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 2.0, 6.0, 7.0, 9.0, 8.0, 12.0, 19.0, 14.0, 22.0, 26.0, 26.0, 25.0, 26.0, 30.0, 36.0, 27.0, 41.0, 40.0, 37.0, 40.0, 49.0, 46.0, 48.0, 53.0, 36.0, 34.0, 33.0, 31.0, 31.0, 31.0, 26.0, 16.0, 20.0, 14.0, 12.0, 11.0, 14.0, 9.0, 5.0, 5.0, 7.0, 8.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.356161594390869, -4.208642482757568, -4.061123847961426, -3.913604736328125, -3.766085624694824, -3.6185667514801025, -3.471047878265381, -3.32352876663208, -3.1760098934173584, -3.0284910202026367, -2.880971908569336, -2.7334530353546143, -2.5859341621398926, -2.438415050506592, -2.29089617729187, -2.1433773040771484, -1.9958581924438477, -1.8483392000198364, -1.7008202075958252, -1.5533013343811035, -1.4057823419570923, -1.258263349533081, -1.1107444763183594, -0.9632254838943481, -0.8157064914703369, -0.6681874990463257, -0.5206685662269592, -0.3731496036052704, -0.22563064098358154, -0.07811164855957031, 0.06940728425979614, 0.2169262170791626, 0.36444568634033203, 0.5119646787643433, 0.6594836115837097, 0.8070025444030762, 0.9545215368270874, 1.1020405292510986, 1.2495594024658203, 1.3970783948898315, 1.5445973873138428, 1.692116379737854, 1.8396353721618652, 1.987154245376587, 2.1346731185913086, 2.2821922302246094, 2.429711103439331, 2.5772299766540527, 2.7247490882873535, 2.872267961502075, 3.019787073135376, 3.1673059463500977, 3.3148250579833984, 3.46234393119812, 3.609862804412842, 3.7573819160461426, 3.9049007892608643, 4.052419662475586, 4.199938774108887, 4.3474578857421875, 4.49497652053833, 4.642495632171631, 4.790014743804932, 4.937533378601074, 5.085052490234375]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 1.0, 9.0, 4.0, 10.0, 9.0, 15.0, 13.0, 31.0, 49.0, 56.0, 81.0, 103.0, 180.0, 215.0, 359.0, 471.0, 779.0, 1204.0, 1893.0, 2928.0, 4426.0, 7108.0, 11364.0, 18111.0, 29140.0, 45789.0, 70188.0, 101531.0, 133697.0, 149619.0, 139720.0, 109719.0, 78354.0, 52143.0, 33138.0, 20623.0, 13134.0, 8074.0, 5006.0, 3202.0, 2061.0, 1271.0, 887.0, 568.0, 417.0, 248.0, 190.0, 128.0, 89.0, 68.0, 41.0, 28.0, 23.0, 9.0, 14.0, 10.0, 5.0, 8.0, 3.0, 3.0], "bins": [-5.69921875, -5.52978515625, -5.3603515625, -5.19091796875, -5.021484375, -4.85205078125, -4.6826171875, -4.51318359375, -4.34375, -4.17431640625, -4.0048828125, -3.83544921875, -3.666015625, -3.49658203125, -3.3271484375, -3.15771484375, -2.98828125, -2.81884765625, -2.6494140625, -2.47998046875, -2.310546875, -2.14111328125, -1.9716796875, -1.80224609375, -1.6328125, -1.46337890625, -1.2939453125, -1.12451171875, -0.955078125, -0.78564453125, -0.6162109375, -0.44677734375, -0.27734375, -0.10791015625, 0.0615234375, 0.23095703125, 0.400390625, 0.56982421875, 0.7392578125, 0.90869140625, 1.078125, 1.24755859375, 1.4169921875, 1.58642578125, 1.755859375, 1.92529296875, 2.0947265625, 2.26416015625, 2.43359375, 2.60302734375, 2.7724609375, 2.94189453125, 3.111328125, 3.28076171875, 3.4501953125, 3.61962890625, 3.7890625, 3.95849609375, 4.1279296875, 4.29736328125, 4.466796875, 4.63623046875, 4.8056640625, 4.97509765625, 5.14453125]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 10.0, 7.0, 3.0, 13.0, 9.0, 24.0, 14.0, 23.0, 25.0, 31.0, 21.0, 31.0, 46.0, 42.0, 39.0, 48.0, 39.0, 55.0, 51.0, 55.0, 38.0, 40.0, 51.0, 37.0, 39.0, 27.0, 28.0, 27.0, 30.0, 19.0, 14.0, 14.0, 13.0, 4.0, 8.0, 6.0, 6.0, 5.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.13671875, -4.961181640625, -4.78564453125, -4.610107421875, -4.4345703125, -4.259033203125, -4.08349609375, -3.907958984375, -3.732421875, -3.556884765625, -3.38134765625, -3.205810546875, -3.0302734375, -2.854736328125, -2.67919921875, -2.503662109375, -2.328125, -2.152587890625, -1.97705078125, -1.801513671875, -1.6259765625, -1.450439453125, -1.27490234375, -1.099365234375, -0.923828125, -0.748291015625, -0.57275390625, -0.397216796875, -0.2216796875, -0.046142578125, 0.12939453125, 0.304931640625, 0.48046875, 0.656005859375, 0.83154296875, 1.007080078125, 1.1826171875, 1.358154296875, 1.53369140625, 1.709228515625, 1.884765625, 2.060302734375, 2.23583984375, 2.411376953125, 2.5869140625, 2.762451171875, 2.93798828125, 3.113525390625, 3.2890625, 3.464599609375, 3.64013671875, 3.815673828125, 3.9912109375, 4.166748046875, 4.34228515625, 4.517822265625, 4.693359375, 4.868896484375, 5.04443359375, 5.219970703125, 5.3955078125, 5.571044921875, 5.74658203125, 5.922119140625, 6.09765625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 10.0, 10.0, 20.0, 23.0, 40.0, 57.0, 84.0, 128.0, 167.0, 240.0, 380.0, 527.0, 819.0, 1302.0, 2015.0, 3237.0, 5202.0, 8228.0, 13724.0, 22218.0, 36377.0, 58258.0, 89542.0, 126907.0, 154503.0, 154224.0, 126667.0, 90235.0, 58372.0, 36324.0, 22340.0, 13677.0, 8393.0, 5175.0, 3251.0, 2072.0, 1279.0, 852.0, 575.0, 347.0, 223.0, 175.0, 106.0, 80.0, 51.0, 43.0, 21.0, 22.0, 15.0, 7.0, 3.0, 8.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.52734375, -5.34906005859375, -5.1707763671875, -4.99249267578125, -4.814208984375, -4.63592529296875, -4.4576416015625, -4.27935791015625, -4.10107421875, -3.92279052734375, -3.7445068359375, -3.56622314453125, -3.387939453125, -3.20965576171875, -3.0313720703125, -2.85308837890625, -2.6748046875, -2.49652099609375, -2.3182373046875, -2.13995361328125, -1.961669921875, -1.78338623046875, -1.6051025390625, -1.42681884765625, -1.24853515625, -1.07025146484375, -0.8919677734375, -0.71368408203125, -0.535400390625, -0.35711669921875, -0.1788330078125, -0.00054931640625, 0.177734375, 0.35601806640625, 0.5343017578125, 0.71258544921875, 0.890869140625, 1.06915283203125, 1.2474365234375, 1.42572021484375, 1.60400390625, 1.78228759765625, 1.9605712890625, 2.13885498046875, 2.317138671875, 2.49542236328125, 2.6737060546875, 2.85198974609375, 3.0302734375, 3.20855712890625, 3.3868408203125, 3.56512451171875, 3.743408203125, 3.92169189453125, 4.0999755859375, 4.27825927734375, 4.45654296875, 4.63482666015625, 4.8131103515625, 4.99139404296875, 5.169677734375, 5.34796142578125, 5.5262451171875, 5.70452880859375, 5.8828125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 7.0, 5.0, 17.0, 22.0, 21.0, 20.0, 17.0, 15.0, 20.0, 23.0, 40.0, 48.0, 42.0, 37.0, 43.0, 71.0, 52.0, 43.0, 36.0, 35.0, 47.0, 27.0, 41.0, 41.0, 32.0, 25.0, 32.0, 22.0, 18.0, 20.0, 17.0, 11.0, 6.0, 12.0, 7.0, 6.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.45703125, -3.3521728515625, -3.247314453125, -3.1424560546875, -3.03759765625, -2.9327392578125, -2.827880859375, -2.7230224609375, -2.6181640625, -2.5133056640625, -2.408447265625, -2.3035888671875, -2.19873046875, -2.0938720703125, -1.989013671875, -1.8841552734375, -1.779296875, -1.6744384765625, -1.569580078125, -1.4647216796875, -1.35986328125, -1.2550048828125, -1.150146484375, -1.0452880859375, -0.9404296875, -0.8355712890625, -0.730712890625, -0.6258544921875, -0.52099609375, -0.4161376953125, -0.311279296875, -0.2064208984375, -0.1015625, 0.0032958984375, 0.108154296875, 0.2130126953125, 0.31787109375, 0.4227294921875, 0.527587890625, 0.6324462890625, 0.7373046875, 0.8421630859375, 0.947021484375, 1.0518798828125, 1.15673828125, 1.2615966796875, 1.366455078125, 1.4713134765625, 1.576171875, 1.6810302734375, 1.785888671875, 1.8907470703125, 1.99560546875, 2.1004638671875, 2.205322265625, 2.3101806640625, 2.4150390625, 2.5198974609375, 2.624755859375, 2.7296142578125, 2.83447265625, 2.9393310546875, 3.044189453125, 3.1490478515625, 3.25390625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 6.0, 5.0, 6.0, 6.0, 7.0, 23.0, 18.0, 40.0, 39.0, 68.0, 112.0, 153.0, 234.0, 340.0, 556.0, 757.0, 1182.0, 1697.0, 2705.0, 4522.0, 7439.0, 12501.0, 22847.0, 43174.0, 86191.0, 171175.0, 255637.0, 206442.0, 109675.0, 54241.0, 27843.0, 15530.0, 8740.0, 5320.0, 3312.0, 2048.0, 1356.0, 878.0, 562.0, 393.0, 259.0, 177.0, 113.0, 71.0, 52.0, 35.0, 28.0, 14.0, 10.0, 10.0, 3.0, 6.0, 2.0, 3.0, 5.0], "bins": [-5.0703125, -4.92816162109375, -4.7860107421875, -4.64385986328125, -4.501708984375, -4.35955810546875, -4.2174072265625, -4.07525634765625, -3.93310546875, -3.79095458984375, -3.6488037109375, -3.50665283203125, -3.364501953125, -3.22235107421875, -3.0802001953125, -2.93804931640625, -2.7958984375, -2.65374755859375, -2.5115966796875, -2.36944580078125, -2.227294921875, -2.08514404296875, -1.9429931640625, -1.80084228515625, -1.65869140625, -1.51654052734375, -1.3743896484375, -1.23223876953125, -1.090087890625, -0.94793701171875, -0.8057861328125, -0.66363525390625, -0.521484375, -0.37933349609375, -0.2371826171875, -0.09503173828125, 0.047119140625, 0.18927001953125, 0.3314208984375, 0.47357177734375, 0.61572265625, 0.75787353515625, 0.9000244140625, 1.04217529296875, 1.184326171875, 1.32647705078125, 1.4686279296875, 1.61077880859375, 1.7529296875, 1.89508056640625, 2.0372314453125, 2.17938232421875, 2.321533203125, 2.46368408203125, 2.6058349609375, 2.74798583984375, 2.89013671875, 3.03228759765625, 3.1744384765625, 3.31658935546875, 3.458740234375, 3.60089111328125, 3.7430419921875, 3.88519287109375, 4.02734375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 6.0, 3.0, 10.0, 11.0, 11.0, 18.0, 13.0, 14.0, 29.0, 35.0, 36.0, 52.0, 64.0, 63.0, 81.0, 94.0, 65.0, 83.0, 57.0, 56.0, 48.0, 34.0, 27.0, 18.0, 11.0, 11.0, 17.0, 8.0, 2.0, 3.0, 4.0, 5.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.000507354736328125, -0.0004931129515171051, -0.0004788711667060852, -0.0004646293818950653, -0.0004503875970840454, -0.0004361458122730255, -0.0004219040274620056, -0.0004076622426509857, -0.0003934204578399658, -0.0003791786730289459, -0.000364936888217926, -0.00035069510340690613, -0.00033645331859588623, -0.00032221153378486633, -0.00030796974897384644, -0.00029372796416282654, -0.00027948617935180664, -0.00026524439454078674, -0.00025100260972976685, -0.00023676082491874695, -0.00022251904010772705, -0.00020827725529670715, -0.00019403547048568726, -0.00017979368567466736, -0.00016555190086364746, -0.00015131011605262756, -0.00013706833124160767, -0.00012282654643058777, -0.00010858476161956787, -9.434297680854797e-05, -8.010119199752808e-05, -6.585940718650818e-05, -5.161762237548828e-05, -3.7375837564468384e-05, -2.3134052753448486e-05, -8.892267942428589e-06, 5.349516868591309e-06, 1.9591301679611206e-05, 3.3833086490631104e-05, 4.8074871301651e-05, 6.23166561126709e-05, 7.65584409236908e-05, 9.08002257347107e-05, 0.00010504201054573059, 0.00011928379535675049, 0.00013352558016777039, 0.00014776736497879028, 0.00016200914978981018, 0.00017625093460083008, 0.00019049271941184998, 0.00020473450422286987, 0.00021897628903388977, 0.00023321807384490967, 0.00024745985865592957, 0.00026170164346694946, 0.00027594342827796936, 0.00029018521308898926, 0.00030442699790000916, 0.00031866878271102905, 0.00033291056752204895, 0.00034715235233306885, 0.00036139413714408875, 0.00037563592195510864, 0.00038987770676612854, 0.00040411949157714844]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 4.0, 9.0, 9.0, 14.0, 21.0, 25.0, 38.0, 54.0, 73.0, 130.0, 217.0, 382.0, 633.0, 1079.0, 2206.0, 4115.0, 8426.0, 17680.0, 39087.0, 86957.0, 188363.0, 287504.0, 217941.0, 105260.0, 46801.0, 21205.0, 9765.0, 4925.0, 2477.0, 1308.0, 724.0, 457.0, 251.0, 142.0, 85.0, 56.0, 40.0, 19.0, 21.0, 15.0, 9.0, 8.0, 5.0, 5.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.8671875, -4.71795654296875, -4.5687255859375, -4.41949462890625, -4.270263671875, -4.12103271484375, -3.9718017578125, -3.82257080078125, -3.67333984375, -3.52410888671875, -3.3748779296875, -3.22564697265625, -3.076416015625, -2.92718505859375, -2.7779541015625, -2.62872314453125, -2.4794921875, -2.33026123046875, -2.1810302734375, -2.03179931640625, -1.882568359375, -1.73333740234375, -1.5841064453125, -1.43487548828125, -1.28564453125, -1.13641357421875, -0.9871826171875, -0.83795166015625, -0.688720703125, -0.53948974609375, -0.3902587890625, -0.24102783203125, -0.091796875, 0.05743408203125, 0.2066650390625, 0.35589599609375, 0.505126953125, 0.65435791015625, 0.8035888671875, 0.95281982421875, 1.10205078125, 1.25128173828125, 1.4005126953125, 1.54974365234375, 1.698974609375, 1.84820556640625, 1.9974365234375, 2.14666748046875, 2.2958984375, 2.44512939453125, 2.5943603515625, 2.74359130859375, 2.892822265625, 3.04205322265625, 3.1912841796875, 3.34051513671875, 3.48974609375, 3.63897705078125, 3.7882080078125, 3.93743896484375, 4.086669921875, 4.23590087890625, 4.3851318359375, 4.53436279296875, 4.68359375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 9.0, 11.0, 10.0, 23.0, 32.0, 37.0, 42.0, 54.0, 68.0, 67.0, 89.0, 82.0, 99.0, 78.0, 72.0, 64.0, 30.0, 30.0, 21.0, 17.0, 17.0, 13.0, 13.0, 9.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.953125, -1.9080047607421875, -1.862884521484375, -1.8177642822265625, -1.77264404296875, -1.7275238037109375, -1.682403564453125, -1.6372833251953125, -1.5921630859375, -1.5470428466796875, -1.501922607421875, -1.4568023681640625, -1.41168212890625, -1.3665618896484375, -1.321441650390625, -1.2763214111328125, -1.231201171875, -1.1860809326171875, -1.140960693359375, -1.0958404541015625, -1.05072021484375, -1.0055999755859375, -0.960479736328125, -0.9153594970703125, -0.8702392578125, -0.8251190185546875, -0.779998779296875, -0.7348785400390625, -0.68975830078125, -0.6446380615234375, -0.599517822265625, -0.5543975830078125, -0.50927734375, -0.4641571044921875, -0.419036865234375, -0.3739166259765625, -0.32879638671875, -0.2836761474609375, -0.238555908203125, -0.1934356689453125, -0.1483154296875, -0.1031951904296875, -0.058074951171875, -0.0129547119140625, 0.03216552734375, 0.0772857666015625, 0.122406005859375, 0.1675262451171875, 0.212646484375, 0.2577667236328125, 0.302886962890625, 0.3480072021484375, 0.39312744140625, 0.4382476806640625, 0.483367919921875, 0.5284881591796875, 0.5736083984375, 0.6187286376953125, 0.663848876953125, 0.7089691162109375, 0.75408935546875, 0.7992095947265625, 0.844329833984375, 0.8894500732421875, 0.9345703125]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 4.0, 8.0, 6.0, 15.0, 15.0, 11.0, 23.0, 30.0, 19.0, 27.0, 40.0, 42.0, 51.0, 55.0, 53.0, 55.0, 43.0, 57.0, 40.0, 60.0, 48.0, 57.0, 43.0, 29.0, 33.0, 18.0, 13.0, 20.0, 16.0, 15.0, 7.0, 9.0, 6.0, 7.0, 9.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.334050178527832, -7.109960556030273, -6.885870933532715, -6.661780834197998, -6.4376912117004395, -6.213601589202881, -5.989511966705322, -5.7654218673706055, -5.541332244873047, -5.317242622375488, -5.09315299987793, -4.869062900543213, -4.644973278045654, -4.420883655548096, -4.196794033050537, -3.9727041721343994, -3.748614549636841, -3.5245249271392822, -3.3004350662231445, -3.076345443725586, -2.8522555828094482, -2.6281659603118896, -2.404076099395752, -2.1799864768981934, -1.9558967351913452, -1.731806993484497, -1.507717251777649, -1.2836275100708008, -1.0595378875732422, -0.835448145866394, -0.6113584041595459, -0.38726866245269775, -0.1631789207458496, 0.06091080605983734, 0.2850005328655243, 0.50909024477005, 0.7331799864768982, 0.9572696685791016, 1.1813594102859497, 1.4054491519927979, 1.629538893699646, 1.8536286354064941, 2.0777182579040527, 2.3018081188201904, 2.525897741317749, 2.7499876022338867, 2.9740772247314453, 3.198166847229004, 3.4222567081451416, 3.6463463306427, 3.870436191558838, 4.0945258140563965, 4.318615436553955, 4.542705535888672, 4.7667951583862305, 4.990884780883789, 5.214974403381348, 5.439064025878906, 5.663153648376465, 5.887243747711182, 6.11133337020874, 6.335422992706299, 6.559512615203857, 6.783602714538574, 7.007692337036133]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 0.0, 4.0, 4.0, 4.0, 7.0, 7.0, 12.0, 9.0, 14.0, 14.0, 17.0, 27.0, 24.0, 30.0, 29.0, 29.0, 38.0, 29.0, 38.0, 35.0, 36.0, 34.0, 32.0, 42.0, 38.0, 25.0, 36.0, 26.0, 42.0, 26.0, 28.0, 32.0, 31.0, 32.0, 25.0, 19.0, 25.0, 17.0, 19.0, 10.0, 8.0, 10.0, 6.0, 8.0, 4.0, 7.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.351051330566406, -4.2086663246154785, -4.066281795501709, -3.9238967895507812, -3.7815117835998535, -3.639127016067505, -3.4967422485351562, -3.3543572425842285, -3.21197247505188, -3.0695877075195312, -2.9272027015686035, -2.784817934036255, -2.6424331665039062, -2.5000481605529785, -2.35766339302063, -2.2152786254882812, -2.0728936195373535, -1.9305087327957153, -1.7881238460540771, -1.6457390785217285, -1.5033541917800903, -1.3609693050384521, -1.2185845375061035, -1.0761996507644653, -0.9338147640228271, -0.791429877281189, -0.6490450501441956, -0.5066602230072021, -0.36427533626556396, -0.22189044952392578, -0.07950562238693237, 0.06287920475006104, 0.20526361465454102, 0.3476484715938568, 0.4900333285331726, 0.632418155670166, 0.7748030424118042, 0.9171879291534424, 1.059572696685791, 1.2019575834274292, 1.3443424701690674, 1.4867273569107056, 1.6291122436523438, 1.7714970111846924, 1.9138818979263306, 2.0562667846679688, 2.1986515522003174, 2.341036319732666, 2.4834213256835938, 2.6258060932159424, 2.76819109916687, 2.9105758666992188, 3.0529608726501465, 3.195345640182495, 3.3377304077148438, 3.4801154136657715, 3.62250018119812, 3.7648849487304688, 3.9072699546813965, 4.049654960632324, 4.192039489746094, 4.3344244956970215, 4.476809501647949, 4.619194030761719, 4.7615790367126465]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 8.0, 7.0, 9.0, 9.0, 22.0, 29.0, 47.0, 57.0, 94.0, 138.0, 202.0, 341.0, 446.0, 711.0, 1128.0, 1748.0, 2856.0, 4546.0, 7858.0, 13728.0, 25106.0, 47634.0, 96610.0, 207904.0, 468327.0, 935488.0, 1110558.0, 678973.0, 306855.0, 138017.0, 65604.0, 33459.0, 18515.0, 10595.0, 6229.0, 3715.0, 2378.0, 1526.0, 955.0, 614.0, 405.0, 273.0, 187.0, 138.0, 89.0, 50.0, 37.0, 33.0, 14.0, 10.0, 5.0, 4.0, 1.0, 0.0, 2.0], "bins": [-8.6875, -8.44097900390625, -8.1944580078125, -7.94793701171875, -7.701416015625, -7.45489501953125, -7.2083740234375, -6.96185302734375, -6.71533203125, -6.46881103515625, -6.2222900390625, -5.97576904296875, -5.729248046875, -5.48272705078125, -5.2362060546875, -4.98968505859375, -4.7431640625, -4.49664306640625, -4.2501220703125, -4.00360107421875, -3.757080078125, -3.51055908203125, -3.2640380859375, -3.01751708984375, -2.77099609375, -2.52447509765625, -2.2779541015625, -2.03143310546875, -1.784912109375, -1.53839111328125, -1.2918701171875, -1.04534912109375, -0.798828125, -0.55230712890625, -0.3057861328125, -0.05926513671875, 0.187255859375, 0.43377685546875, 0.6802978515625, 0.92681884765625, 1.17333984375, 1.41986083984375, 1.6663818359375, 1.91290283203125, 2.159423828125, 2.40594482421875, 2.6524658203125, 2.89898681640625, 3.1455078125, 3.39202880859375, 3.6385498046875, 3.88507080078125, 4.131591796875, 4.37811279296875, 4.6246337890625, 4.87115478515625, 5.11767578125, 5.36419677734375, 5.6107177734375, 5.85723876953125, 6.103759765625, 6.35028076171875, 6.5968017578125, 6.84332275390625, 7.08984375]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 7.0, 12.0, 8.0, 14.0, 9.0, 13.0, 14.0, 16.0, 32.0, 34.0, 25.0, 22.0, 37.0, 34.0, 36.0, 45.0, 31.0, 32.0, 42.0, 47.0, 41.0, 32.0, 32.0, 35.0, 32.0, 34.0, 22.0, 33.0, 35.0, 22.0, 23.0, 25.0, 22.0, 27.0, 17.0, 11.0, 7.0, 9.0, 4.0, 3.0, 4.0, 0.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.541015625, -3.425140380859375, -3.30926513671875, -3.193389892578125, -3.0775146484375, -2.961639404296875, -2.84576416015625, -2.729888916015625, -2.614013671875, -2.498138427734375, -2.38226318359375, -2.266387939453125, -2.1505126953125, -2.034637451171875, -1.91876220703125, -1.802886962890625, -1.68701171875, -1.571136474609375, -1.45526123046875, -1.339385986328125, -1.2235107421875, -1.107635498046875, -0.99176025390625, -0.875885009765625, -0.760009765625, -0.644134521484375, -0.52825927734375, -0.412384033203125, -0.2965087890625, -0.180633544921875, -0.06475830078125, 0.051116943359375, 0.1669921875, 0.282867431640625, 0.39874267578125, 0.514617919921875, 0.6304931640625, 0.746368408203125, 0.86224365234375, 0.978118896484375, 1.093994140625, 1.209869384765625, 1.32574462890625, 1.441619873046875, 1.5574951171875, 1.673370361328125, 1.78924560546875, 1.905120849609375, 2.02099609375, 2.136871337890625, 2.25274658203125, 2.368621826171875, 2.4844970703125, 2.600372314453125, 2.71624755859375, 2.832122802734375, 2.947998046875, 3.063873291015625, 3.17974853515625, 3.295623779296875, 3.4114990234375, 3.527374267578125, 3.64324951171875, 3.759124755859375, 3.875]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 5.0, 13.0, 19.0, 31.0, 46.0, 62.0, 98.0, 153.0, 231.0, 336.0, 528.0, 813.0, 1304.0, 2159.0, 3647.0, 5961.0, 10324.0, 19014.0, 34706.0, 66860.0, 135621.0, 283078.0, 585841.0, 1007598.0, 970445.0, 543495.0, 261064.0, 124868.0, 62369.0, 31984.0, 17584.0, 9712.0, 5638.0, 3306.0, 1949.0, 1225.0, 780.0, 497.0, 338.0, 210.0, 127.0, 82.0, 45.0, 40.0, 30.0, 20.0, 12.0, 6.0, 3.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.8359375, -8.559326171875, -8.28271484375, -8.006103515625, -7.7294921875, -7.452880859375, -7.17626953125, -6.899658203125, -6.623046875, -6.346435546875, -6.06982421875, -5.793212890625, -5.5166015625, -5.239990234375, -4.96337890625, -4.686767578125, -4.41015625, -4.133544921875, -3.85693359375, -3.580322265625, -3.3037109375, -3.027099609375, -2.75048828125, -2.473876953125, -2.197265625, -1.920654296875, -1.64404296875, -1.367431640625, -1.0908203125, -0.814208984375, -0.53759765625, -0.260986328125, 0.015625, 0.292236328125, 0.56884765625, 0.845458984375, 1.1220703125, 1.398681640625, 1.67529296875, 1.951904296875, 2.228515625, 2.505126953125, 2.78173828125, 3.058349609375, 3.3349609375, 3.611572265625, 3.88818359375, 4.164794921875, 4.44140625, 4.718017578125, 4.99462890625, 5.271240234375, 5.5478515625, 5.824462890625, 6.10107421875, 6.377685546875, 6.654296875, 6.930908203125, 7.20751953125, 7.484130859375, 7.7607421875, 8.037353515625, 8.31396484375, 8.590576171875, 8.8671875]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 6.0, 8.0, 11.0, 14.0, 18.0, 22.0, 20.0, 45.0, 56.0, 76.0, 71.0, 98.0, 145.0, 200.0, 195.0, 269.0, 319.0, 329.0, 355.0, 324.0, 286.0, 266.0, 214.0, 177.0, 142.0, 104.0, 91.0, 53.0, 45.0, 40.0, 24.0, 10.0, 13.0, 5.0, 7.0, 6.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.501953125, -3.410186767578125, -3.31842041015625, -3.226654052734375, -3.1348876953125, -3.043121337890625, -2.95135498046875, -2.859588623046875, -2.767822265625, -2.676055908203125, -2.58428955078125, -2.492523193359375, -2.4007568359375, -2.308990478515625, -2.21722412109375, -2.125457763671875, -2.03369140625, -1.941925048828125, -1.85015869140625, -1.758392333984375, -1.6666259765625, -1.574859619140625, -1.48309326171875, -1.391326904296875, -1.299560546875, -1.207794189453125, -1.11602783203125, -1.024261474609375, -0.9324951171875, -0.840728759765625, -0.74896240234375, -0.657196044921875, -0.5654296875, -0.473663330078125, -0.38189697265625, -0.290130615234375, -0.1983642578125, -0.106597900390625, -0.01483154296875, 0.076934814453125, 0.168701171875, 0.260467529296875, 0.35223388671875, 0.444000244140625, 0.5357666015625, 0.627532958984375, 0.71929931640625, 0.811065673828125, 0.90283203125, 0.994598388671875, 1.08636474609375, 1.178131103515625, 1.2698974609375, 1.361663818359375, 1.45343017578125, 1.545196533203125, 1.636962890625, 1.728729248046875, 1.82049560546875, 1.912261962890625, 2.0040283203125, 2.095794677734375, 2.18756103515625, 2.279327392578125, 2.37109375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 2.0, 3.0, 6.0, 4.0, 9.0, 11.0, 16.0, 17.0, 14.0, 26.0, 33.0, 34.0, 45.0, 51.0, 44.0, 68.0, 60.0, 68.0, 70.0, 56.0, 58.0, 45.0, 47.0, 30.0, 28.0, 24.0, 26.0, 25.0, 14.0, 13.0, 8.0, 15.0, 9.0, 2.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6845011711120605, -7.41606330871582, -7.14762544631958, -6.87918758392334, -6.6107497215271, -6.342311859130859, -6.073873519897461, -5.805436134338379, -5.5369977951049805, -5.26855993270874, -5.0001220703125, -4.73168420791626, -4.4632463455200195, -4.194808483123779, -3.92637038230896, -3.6579325199127197, -3.3894948959350586, -3.1210570335388184, -2.852619171142578, -2.584181308746338, -2.3157434463500977, -2.0473055839538574, -1.778867483139038, -1.5104296207427979, -1.2419917583465576, -0.9735538959503174, -0.7051159739494324, -0.43667805194854736, -0.16824018955230713, 0.1001976728439331, 0.3686356544494629, 0.6370735168457031, 0.9055118560791016, 1.1739497184753418, 1.442387580871582, 1.7108255624771118, 1.979263424873352, 2.2477011680603027, 2.516139268875122, 2.7845771312713623, 3.0530149936676025, 3.3214528560638428, 3.589890718460083, 3.8583288192749023, 4.126766681671143, 4.395204544067383, 4.663642406463623, 4.932080268859863, 5.2005181312561035, 5.468955993652344, 5.737393856048584, 6.005831718444824, 6.2742695808410645, 6.542707443237305, 6.811145782470703, 7.079583168029785, 7.348021507263184, 7.616459369659424, 7.884897232055664, 8.153335571289062, 8.421772956848145, 8.690211296081543, 8.958648681640625, 9.227087020874023, 9.495524406433105]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 10.0, 7.0, 9.0, 5.0, 16.0, 19.0, 16.0, 26.0, 19.0, 23.0, 35.0, 50.0, 32.0, 28.0, 34.0, 40.0, 43.0, 36.0, 40.0, 33.0, 48.0, 44.0, 31.0, 32.0, 32.0, 40.0, 32.0, 37.0, 22.0, 24.0, 24.0, 20.0, 13.0, 18.0, 9.0, 13.0, 8.0, 6.0, 10.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.958791732788086, -4.799306392669678, -4.639821529388428, -4.4803361892700195, -4.320850849151611, -4.161365509033203, -4.001880645751953, -3.842395305633545, -3.682910203933716, -3.5234251022338867, -3.3639397621154785, -3.2044546604156494, -3.0449695587158203, -2.885484218597412, -2.725999116897583, -2.566514015197754, -2.4070286750793457, -2.2475435733795166, -2.0880582332611084, -1.9285731315612793, -1.7690879106521606, -1.609602689743042, -1.450117588043213, -1.2906323671340942, -1.1311471462249756, -0.9716619253158569, -0.8121767640113831, -0.6526916027069092, -0.4932063817977905, -0.3337211608886719, -0.174235999584198, -0.014750838279724121, 0.14473390579223633, 0.3042190968990326, 0.46370428800582886, 0.6231894493103027, 0.7826746702194214, 0.94215989112854, 1.1016449928283691, 1.2611302137374878, 1.4206154346466064, 1.580100655555725, 1.7395858764648438, 1.8990709781646729, 2.058556079864502, 2.21804141998291, 2.3775265216827393, 2.5370116233825684, 2.6964969635009766, 2.8559820652008057, 3.015467405319214, 3.174952507019043, 3.334437847137451, 3.4939229488372803, 3.6534080505371094, 3.8128933906555176, 3.9723784923553467, 4.131863594055176, 4.291348934173584, 4.450834274291992, 4.610319137573242, 4.76980447769165, 4.929289817810059, 5.088774681091309, 5.248260021209717]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 14.0, 16.0, 23.0, 28.0, 35.0, 58.0, 96.0, 153.0, 233.0, 350.0, 525.0, 913.0, 1454.0, 2445.0, 4507.0, 8860.0, 20761.0, 55647.0, 160287.0, 341175.0, 275929.0, 107328.0, 37057.0, 14958.0, 6854.0, 3544.0, 2021.0, 1209.0, 722.0, 495.0, 294.0, 174.0, 131.0, 84.0, 65.0, 50.0, 19.0, 17.0, 5.0, 4.0, 10.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.2890625, -10.9647216796875, -10.640380859375, -10.3160400390625, -9.99169921875, -9.6673583984375, -9.343017578125, -9.0186767578125, -8.6943359375, -8.3699951171875, -8.045654296875, -7.7213134765625, -7.39697265625, -7.0726318359375, -6.748291015625, -6.4239501953125, -6.099609375, -5.7752685546875, -5.450927734375, -5.1265869140625, -4.80224609375, -4.4779052734375, -4.153564453125, -3.8292236328125, -3.5048828125, -3.1805419921875, -2.856201171875, -2.5318603515625, -2.20751953125, -1.8831787109375, -1.558837890625, -1.2344970703125, -0.91015625, -0.5858154296875, -0.261474609375, 0.0628662109375, 0.38720703125, 0.7115478515625, 1.035888671875, 1.3602294921875, 1.6845703125, 2.0089111328125, 2.333251953125, 2.6575927734375, 2.98193359375, 3.3062744140625, 3.630615234375, 3.9549560546875, 4.279296875, 4.6036376953125, 4.927978515625, 5.2523193359375, 5.57666015625, 5.9010009765625, 6.225341796875, 6.5496826171875, 6.8740234375, 7.1983642578125, 7.522705078125, 7.8470458984375, 8.17138671875, 8.4957275390625, 8.820068359375, 9.1444091796875, 9.46875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 7.0, 3.0, 11.0, 6.0, 10.0, 15.0, 10.0, 11.0, 17.0, 19.0, 28.0, 28.0, 31.0, 32.0, 37.0, 31.0, 34.0, 37.0, 41.0, 42.0, 46.0, 37.0, 45.0, 50.0, 47.0, 33.0, 37.0, 43.0, 38.0, 27.0, 18.0, 28.0, 17.0, 16.0, 18.0, 11.0, 6.0, 5.0, 8.0, 8.0, 3.0, 8.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.44921875, -5.2689208984375, -5.088623046875, -4.9083251953125, -4.72802734375, -4.5477294921875, -4.367431640625, -4.1871337890625, -4.0068359375, -3.8265380859375, -3.646240234375, -3.4659423828125, -3.28564453125, -3.1053466796875, -2.925048828125, -2.7447509765625, -2.564453125, -2.3841552734375, -2.203857421875, -2.0235595703125, -1.84326171875, -1.6629638671875, -1.482666015625, -1.3023681640625, -1.1220703125, -0.9417724609375, -0.761474609375, -0.5811767578125, -0.40087890625, -0.2205810546875, -0.040283203125, 0.1400146484375, 0.3203125, 0.5006103515625, 0.680908203125, 0.8612060546875, 1.04150390625, 1.2218017578125, 1.402099609375, 1.5823974609375, 1.7626953125, 1.9429931640625, 2.123291015625, 2.3035888671875, 2.48388671875, 2.6641845703125, 2.844482421875, 3.0247802734375, 3.205078125, 3.3853759765625, 3.565673828125, 3.7459716796875, 3.92626953125, 4.1065673828125, 4.286865234375, 4.4671630859375, 4.6474609375, 4.8277587890625, 5.008056640625, 5.1883544921875, 5.36865234375, 5.5489501953125, 5.729248046875, 5.9095458984375, 6.08984375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 17.0, 4.0, 12.0, 17.0, 21.0, 28.0, 40.0, 58.0, 70.0, 96.0, 162.0, 177.0, 263.0, 453.0, 598.0, 775.0, 1255.0, 1890.0, 3094.0, 5245.0, 9902.0, 21532.0, 55637.0, 161638.0, 374045.0, 257902.0, 89783.0, 32189.0, 13833.0, 6867.0, 3852.0, 2350.0, 1459.0, 1038.0, 718.0, 447.0, 337.0, 204.0, 160.0, 116.0, 71.0, 63.0, 40.0, 31.0, 21.0, 14.0, 13.0, 6.0, 7.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-11.4375, -11.0880126953125, -10.738525390625, -10.3890380859375, -10.03955078125, -9.6900634765625, -9.340576171875, -8.9910888671875, -8.6416015625, -8.2921142578125, -7.942626953125, -7.5931396484375, -7.24365234375, -6.8941650390625, -6.544677734375, -6.1951904296875, -5.845703125, -5.4962158203125, -5.146728515625, -4.7972412109375, -4.44775390625, -4.0982666015625, -3.748779296875, -3.3992919921875, -3.0498046875, -2.7003173828125, -2.350830078125, -2.0013427734375, -1.65185546875, -1.3023681640625, -0.952880859375, -0.6033935546875, -0.25390625, 0.0955810546875, 0.445068359375, 0.7945556640625, 1.14404296875, 1.4935302734375, 1.843017578125, 2.1925048828125, 2.5419921875, 2.8914794921875, 3.240966796875, 3.5904541015625, 3.93994140625, 4.2894287109375, 4.638916015625, 4.9884033203125, 5.337890625, 5.6873779296875, 6.036865234375, 6.3863525390625, 6.73583984375, 7.0853271484375, 7.434814453125, 7.7843017578125, 8.1337890625, 8.4832763671875, 8.832763671875, 9.1822509765625, 9.53173828125, 9.8812255859375, 10.230712890625, 10.5802001953125, 10.9296875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 8.0, 9.0, 10.0, 8.0, 9.0, 9.0, 8.0, 20.0, 19.0, 21.0, 18.0, 21.0, 26.0, 34.0, 36.0, 37.0, 39.0, 43.0, 38.0, 44.0, 39.0, 42.0, 44.0, 30.0, 43.0, 40.0, 23.0, 39.0, 31.0, 31.0, 23.0, 22.0, 13.0, 20.0, 15.0, 15.0, 12.0, 7.0, 7.0, 12.0, 11.0, 7.0, 2.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.19140625, -3.089447021484375, -2.98748779296875, -2.885528564453125, -2.7835693359375, -2.681610107421875, -2.57965087890625, -2.477691650390625, -2.375732421875, -2.273773193359375, -2.17181396484375, -2.069854736328125, -1.9678955078125, -1.865936279296875, -1.76397705078125, -1.662017822265625, -1.56005859375, -1.458099365234375, -1.35614013671875, -1.254180908203125, -1.1522216796875, -1.050262451171875, -0.94830322265625, -0.846343994140625, -0.744384765625, -0.642425537109375, -0.54046630859375, -0.438507080078125, -0.3365478515625, -0.234588623046875, -0.13262939453125, -0.030670166015625, 0.0712890625, 0.173248291015625, 0.27520751953125, 0.377166748046875, 0.4791259765625, 0.581085205078125, 0.68304443359375, 0.785003662109375, 0.886962890625, 0.988922119140625, 1.09088134765625, 1.192840576171875, 1.2947998046875, 1.396759033203125, 1.49871826171875, 1.600677490234375, 1.70263671875, 1.804595947265625, 1.90655517578125, 2.008514404296875, 2.1104736328125, 2.212432861328125, 2.31439208984375, 2.416351318359375, 2.518310546875, 2.620269775390625, 2.72222900390625, 2.824188232421875, 2.9261474609375, 3.028106689453125, 3.13006591796875, 3.232025146484375, 3.333984375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 6.0, 5.0, 8.0, 10.0, 13.0, 21.0, 27.0, 26.0, 35.0, 71.0, 81.0, 125.0, 187.0, 204.0, 351.0, 441.0, 630.0, 952.0, 1342.0, 2052.0, 3313.0, 5376.0, 9763.0, 19692.0, 47347.0, 140143.0, 383240.0, 277912.0, 88283.0, 32321.0, 14374.0, 7415.0, 4364.0, 2733.0, 1780.0, 1175.0, 761.0, 556.0, 420.0, 291.0, 213.0, 157.0, 114.0, 75.0, 55.0, 30.0, 20.0, 11.0, 10.0, 11.0, 4.0, 5.0, 6.0, 4.0, 4.0, 0.0, 0.0, 3.0], "bins": [-5.93359375, -5.752685546875, -5.57177734375, -5.390869140625, -5.2099609375, -5.029052734375, -4.84814453125, -4.667236328125, -4.486328125, -4.305419921875, -4.12451171875, -3.943603515625, -3.7626953125, -3.581787109375, -3.40087890625, -3.219970703125, -3.0390625, -2.858154296875, -2.67724609375, -2.496337890625, -2.3154296875, -2.134521484375, -1.95361328125, -1.772705078125, -1.591796875, -1.410888671875, -1.22998046875, -1.049072265625, -0.8681640625, -0.687255859375, -0.50634765625, -0.325439453125, -0.14453125, 0.036376953125, 0.21728515625, 0.398193359375, 0.5791015625, 0.760009765625, 0.94091796875, 1.121826171875, 1.302734375, 1.483642578125, 1.66455078125, 1.845458984375, 2.0263671875, 2.207275390625, 2.38818359375, 2.569091796875, 2.75, 2.930908203125, 3.11181640625, 3.292724609375, 3.4736328125, 3.654541015625, 3.83544921875, 4.016357421875, 4.197265625, 4.378173828125, 4.55908203125, 4.739990234375, 4.9208984375, 5.101806640625, 5.28271484375, 5.463623046875, 5.64453125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 11.0, 9.0, 17.0, 33.0, 32.0, 53.0, 81.0, 144.0, 151.0, 141.0, 116.0, 72.0, 54.0, 26.0, 19.0, 12.0, 9.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004987716674804688, -0.00048445165157318115, -0.00047013163566589355, -0.00045581161975860596, -0.00044149160385131836, -0.00042717158794403076, -0.00041285157203674316, -0.00039853155612945557, -0.00038421154022216797, -0.00036989152431488037, -0.0003555715084075928, -0.0003412514925003052, -0.0003269314765930176, -0.00031261146068573, -0.0002982914447784424, -0.0002839714288711548, -0.0002696514129638672, -0.0002553313970565796, -0.000241011381149292, -0.0002266913652420044, -0.0002123713493347168, -0.0001980513334274292, -0.0001837313175201416, -0.000169411301612854, -0.0001550912857055664, -0.0001407712697982788, -0.0001264512538909912, -0.00011213123798370361, -9.781122207641602e-05, -8.349120616912842e-05, -6.917119026184082e-05, -5.485117435455322e-05, -4.0531158447265625e-05, -2.6211142539978027e-05, -1.189112663269043e-05, 2.428889274597168e-06, 1.6748905181884766e-05, 3.106892108917236e-05, 4.538893699645996e-05, 5.970895290374756e-05, 7.402896881103516e-05, 8.834898471832275e-05, 0.00010266900062561035, 0.00011698901653289795, 0.00013130903244018555, 0.00014562904834747314, 0.00015994906425476074, 0.00017426908016204834, 0.00018858909606933594, 0.00020290911197662354, 0.00021722912788391113, 0.00023154914379119873, 0.00024586915969848633, 0.0002601891756057739, 0.0002745091915130615, 0.0002888292074203491, 0.0003031492233276367, 0.0003174692392349243, 0.0003317892551422119, 0.0003461092710494995, 0.0003604292869567871, 0.0003747493028640747, 0.0003890693187713623, 0.0004033893346786499, 0.0004177093505859375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 6.0, 11.0, 10.0, 11.0, 12.0, 12.0, 20.0, 33.0, 62.0, 73.0, 74.0, 107.0, 162.0, 217.0, 317.0, 414.0, 597.0, 898.0, 1281.0, 1960.0, 3116.0, 4969.0, 8034.0, 15431.0, 36008.0, 127885.0, 397060.0, 307750.0, 83420.0, 26727.0, 12438.0, 6976.0, 4152.0, 2712.0, 1743.0, 1111.0, 784.0, 571.0, 388.0, 281.0, 218.0, 146.0, 98.0, 71.0, 52.0, 43.0, 29.0, 19.0, 11.0, 16.0, 8.0, 4.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 4.0], "bins": [-6.828125, -6.61370849609375, -6.3992919921875, -6.18487548828125, -5.970458984375, -5.75604248046875, -5.5416259765625, -5.32720947265625, -5.11279296875, -4.89837646484375, -4.6839599609375, -4.46954345703125, -4.255126953125, -4.04071044921875, -3.8262939453125, -3.61187744140625, -3.3974609375, -3.18304443359375, -2.9686279296875, -2.75421142578125, -2.539794921875, -2.32537841796875, -2.1109619140625, -1.89654541015625, -1.68212890625, -1.46771240234375, -1.2532958984375, -1.03887939453125, -0.824462890625, -0.61004638671875, -0.3956298828125, -0.18121337890625, 0.033203125, 0.24761962890625, 0.4620361328125, 0.67645263671875, 0.890869140625, 1.10528564453125, 1.3197021484375, 1.53411865234375, 1.74853515625, 1.96295166015625, 2.1773681640625, 2.39178466796875, 2.606201171875, 2.82061767578125, 3.0350341796875, 3.24945068359375, 3.4638671875, 3.67828369140625, 3.8927001953125, 4.10711669921875, 4.321533203125, 4.53594970703125, 4.7503662109375, 4.96478271484375, 5.17919921875, 5.39361572265625, 5.6080322265625, 5.82244873046875, 6.036865234375, 6.25128173828125, 6.4656982421875, 6.68011474609375, 6.89453125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 3.0, 1.0, 3.0, 3.0, 6.0, 6.0, 7.0, 6.0, 10.0, 28.0, 53.0, 75.0, 110.0, 161.0, 157.0, 126.0, 93.0, 59.0, 23.0, 17.0, 9.0, 5.0, 8.0, 4.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.50390625, -2.428131103515625, -2.35235595703125, -2.276580810546875, -2.2008056640625, -2.125030517578125, -2.04925537109375, -1.973480224609375, -1.897705078125, -1.821929931640625, -1.74615478515625, -1.670379638671875, -1.5946044921875, -1.518829345703125, -1.44305419921875, -1.367279052734375, -1.29150390625, -1.215728759765625, -1.13995361328125, -1.064178466796875, -0.9884033203125, -0.912628173828125, -0.83685302734375, -0.761077880859375, -0.685302734375, -0.609527587890625, -0.53375244140625, -0.457977294921875, -0.3822021484375, -0.306427001953125, -0.23065185546875, -0.154876708984375, -0.0791015625, -0.003326416015625, 0.07244873046875, 0.148223876953125, 0.2239990234375, 0.299774169921875, 0.37554931640625, 0.451324462890625, 0.527099609375, 0.602874755859375, 0.67864990234375, 0.754425048828125, 0.8302001953125, 0.905975341796875, 0.98175048828125, 1.057525634765625, 1.13330078125, 1.209075927734375, 1.28485107421875, 1.360626220703125, 1.4364013671875, 1.512176513671875, 1.58795166015625, 1.663726806640625, 1.739501953125, 1.815277099609375, 1.89105224609375, 1.966827392578125, 2.0426025390625, 2.118377685546875, 2.19415283203125, 2.269927978515625, 2.345703125]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 4.0, 4.0, 5.0, 5.0, 15.0, 8.0, 12.0, 17.0, 16.0, 24.0, 32.0, 28.0, 52.0, 47.0, 63.0, 53.0, 66.0, 74.0, 67.0, 55.0, 53.0, 50.0, 38.0, 38.0, 24.0, 29.0, 18.0, 23.0, 18.0, 12.0, 11.0, 10.0, 6.0, 7.0, 6.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.132872581481934, -7.867674827575684, -7.602477073669434, -7.337279319763184, -7.072081565856934, -6.806883811950684, -6.541686058044434, -6.276488304138184, -6.011290550231934, -5.746092796325684, -5.480895042419434, -5.215697288513184, -4.950499534606934, -4.685301780700684, -4.420104026794434, -4.154906272888184, -3.8897085189819336, -3.6245107650756836, -3.3593130111694336, -3.0941152572631836, -2.8289175033569336, -2.5637197494506836, -2.2985219955444336, -2.0333242416381836, -1.7681264877319336, -1.5029287338256836, -1.2377309799194336, -0.9725332260131836, -0.7073354721069336, -0.4421377182006836, -0.1769399642944336, 0.0882577896118164, 0.35345458984375, 0.61865234375, 0.88385009765625, 1.1490478515625, 1.41424560546875, 1.679443359375, 1.94464111328125, 2.2098388671875, 2.47503662109375, 2.740234375, 3.00543212890625, 3.2706298828125, 3.53582763671875, 3.801025390625, 4.06622314453125, 4.3314208984375, 4.59661865234375, 4.86181640625, 5.12701416015625, 5.3922119140625, 5.65740966796875, 5.922607421875, 6.18780517578125, 6.4530029296875, 6.71820068359375, 6.9833984375, 7.24859619140625, 7.5137939453125, 7.77899169921875, 8.044189453125, 8.30938720703125, 8.5745849609375, 8.83978271484375]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 9.0, 5.0, 9.0, 5.0, 12.0, 10.0, 14.0, 19.0, 20.0, 34.0, 30.0, 39.0, 40.0, 28.0, 34.0, 48.0, 45.0, 36.0, 37.0, 51.0, 38.0, 34.0, 43.0, 35.0, 41.0, 38.0, 38.0, 36.0, 28.0, 24.0, 21.0, 20.0, 12.0, 21.0, 14.0, 9.0, 8.0, 6.0, 8.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.453555583953857, -5.281481742858887, -5.109408378601074, -4.9373345375061035, -4.765260696411133, -4.59318733215332, -4.42111349105835, -4.249039649963379, -4.076966285705566, -3.904892683029175, -3.732818841934204, -3.5607452392578125, -3.388671398162842, -3.21659779548645, -3.0445241928100586, -2.872450351715088, -2.700376510620117, -2.5283029079437256, -2.356229066848755, -2.1841554641723633, -2.0120816230773926, -1.840008020401001, -1.6679344177246094, -1.4958606958389282, -1.323786973953247, -1.151713252067566, -0.9796395897865295, -0.8075659275054932, -0.635492205619812, -0.46341848373413086, -0.29134488105773926, -0.1192711591720581, 0.052802085876464844, 0.2248757779598236, 0.3969494700431824, 0.5690231323242188, 0.7410968542098999, 0.913170576095581, 1.0852441787719727, 1.2573179006576538, 1.429391622543335, 1.6014653444290161, 1.7735390663146973, 1.9456126689910889, 2.1176862716674805, 2.289760112762451, 2.4618337154388428, 2.6339073181152344, 2.805981159210205, 2.9780547618865967, 3.1501286029815674, 3.322202205657959, 3.4942760467529297, 3.6663496494293213, 3.838423252105713, 4.010497093200684, 4.182570457458496, 4.354644298553467, 4.526717662811279, 4.69879150390625, 4.870865345001221, 5.042939186096191, 5.215012550354004, 5.387086391448975, 5.559160232543945]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 10.0, 17.0, 25.0, 29.0, 57.0, 80.0, 128.0, 172.0, 262.0, 431.0, 680.0, 977.0, 1457.0, 2184.0, 3408.0, 5228.0, 8280.0, 12882.0, 19690.0, 30020.0, 45526.0, 66635.0, 92278.0, 118062.0, 133793.0, 131177.0, 111668.0, 85161.0, 60277.0, 40980.0, 27048.0, 17563.0, 11342.0, 7371.0, 4691.0, 3133.0, 1981.0, 1354.0, 849.0, 549.0, 366.0, 255.0, 168.0, 104.0, 66.0, 40.0, 38.0, 18.0, 12.0, 8.0, 7.0, 6.0, 5.0, 6.0, 1.0, 2.0], "bins": [-4.65625, -4.51458740234375, -4.3729248046875, -4.23126220703125, -4.089599609375, -3.94793701171875, -3.8062744140625, -3.66461181640625, -3.52294921875, -3.38128662109375, -3.2396240234375, -3.09796142578125, -2.956298828125, -2.81463623046875, -2.6729736328125, -2.53131103515625, -2.3896484375, -2.24798583984375, -2.1063232421875, -1.96466064453125, -1.822998046875, -1.68133544921875, -1.5396728515625, -1.39801025390625, -1.25634765625, -1.11468505859375, -0.9730224609375, -0.83135986328125, -0.689697265625, -0.54803466796875, -0.4063720703125, -0.26470947265625, -0.123046875, 0.01861572265625, 0.1602783203125, 0.30194091796875, 0.443603515625, 0.58526611328125, 0.7269287109375, 0.86859130859375, 1.01025390625, 1.15191650390625, 1.2935791015625, 1.43524169921875, 1.576904296875, 1.71856689453125, 1.8602294921875, 2.00189208984375, 2.1435546875, 2.28521728515625, 2.4268798828125, 2.56854248046875, 2.710205078125, 2.85186767578125, 2.9935302734375, 3.13519287109375, 3.27685546875, 3.41851806640625, 3.5601806640625, 3.70184326171875, 3.843505859375, 3.98516845703125, 4.1268310546875, 4.26849365234375, 4.41015625]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 7.0, 7.0, 12.0, 13.0, 13.0, 15.0, 14.0, 20.0, 28.0, 32.0, 37.0, 28.0, 22.0, 34.0, 37.0, 36.0, 36.0, 43.0, 38.0, 43.0, 47.0, 37.0, 35.0, 37.0, 31.0, 48.0, 36.0, 36.0, 24.0, 31.0, 14.0, 16.0, 24.0, 13.0, 16.0, 8.0, 6.0, 7.0, 8.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.74609375, -5.568603515625, -5.39111328125, -5.213623046875, -5.0361328125, -4.858642578125, -4.68115234375, -4.503662109375, -4.326171875, -4.148681640625, -3.97119140625, -3.793701171875, -3.6162109375, -3.438720703125, -3.26123046875, -3.083740234375, -2.90625, -2.728759765625, -2.55126953125, -2.373779296875, -2.1962890625, -2.018798828125, -1.84130859375, -1.663818359375, -1.486328125, -1.308837890625, -1.13134765625, -0.953857421875, -0.7763671875, -0.598876953125, -0.42138671875, -0.243896484375, -0.06640625, 0.111083984375, 0.28857421875, 0.466064453125, 0.6435546875, 0.821044921875, 0.99853515625, 1.176025390625, 1.353515625, 1.531005859375, 1.70849609375, 1.885986328125, 2.0634765625, 2.240966796875, 2.41845703125, 2.595947265625, 2.7734375, 2.950927734375, 3.12841796875, 3.305908203125, 3.4833984375, 3.660888671875, 3.83837890625, 4.015869140625, 4.193359375, 4.370849609375, 4.54833984375, 4.725830078125, 4.9033203125, 5.080810546875, 5.25830078125, 5.435791015625, 5.61328125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 15.0, 22.0, 33.0, 40.0, 80.0, 124.0, 177.0, 316.0, 492.0, 802.0, 1291.0, 2049.0, 3342.0, 5220.0, 8876.0, 14198.0, 23525.0, 38527.0, 60949.0, 93313.0, 129610.0, 154645.0, 151654.0, 123304.0, 87577.0, 57186.0, 35251.0, 21445.0, 13308.0, 8075.0, 4936.0, 3091.0, 1984.0, 1175.0, 744.0, 469.0, 275.0, 159.0, 116.0, 69.0, 27.0, 24.0, 18.0, 9.0, 9.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.5859375, -5.42596435546875, -5.2659912109375, -5.10601806640625, -4.946044921875, -4.78607177734375, -4.6260986328125, -4.46612548828125, -4.30615234375, -4.14617919921875, -3.9862060546875, -3.82623291015625, -3.666259765625, -3.50628662109375, -3.3463134765625, -3.18634033203125, -3.0263671875, -2.86639404296875, -2.7064208984375, -2.54644775390625, -2.386474609375, -2.22650146484375, -2.0665283203125, -1.90655517578125, -1.74658203125, -1.58660888671875, -1.4266357421875, -1.26666259765625, -1.106689453125, -0.94671630859375, -0.7867431640625, -0.62677001953125, -0.466796875, -0.30682373046875, -0.1468505859375, 0.01312255859375, 0.173095703125, 0.33306884765625, 0.4930419921875, 0.65301513671875, 0.81298828125, 0.97296142578125, 1.1329345703125, 1.29290771484375, 1.452880859375, 1.61285400390625, 1.7728271484375, 1.93280029296875, 2.0927734375, 2.25274658203125, 2.4127197265625, 2.57269287109375, 2.732666015625, 2.89263916015625, 3.0526123046875, 3.21258544921875, 3.37255859375, 3.53253173828125, 3.6925048828125, 3.85247802734375, 4.012451171875, 4.17242431640625, 4.3323974609375, 4.49237060546875, 4.65234375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 5.0, 3.0, 5.0, 7.0, 6.0, 10.0, 14.0, 14.0, 13.0, 17.0, 17.0, 29.0, 26.0, 24.0, 28.0, 21.0, 31.0, 48.0, 50.0, 42.0, 51.0, 42.0, 39.0, 51.0, 51.0, 49.0, 35.0, 36.0, 37.0, 35.0, 33.0, 21.0, 16.0, 17.0, 15.0, 9.0, 14.0, 7.0, 3.0, 11.0, 6.0, 8.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.546875, -3.442413330078125, -3.33795166015625, -3.233489990234375, -3.1290283203125, -3.024566650390625, -2.92010498046875, -2.815643310546875, -2.711181640625, -2.606719970703125, -2.50225830078125, -2.397796630859375, -2.2933349609375, -2.188873291015625, -2.08441162109375, -1.979949951171875, -1.87548828125, -1.771026611328125, -1.66656494140625, -1.562103271484375, -1.4576416015625, -1.353179931640625, -1.24871826171875, -1.144256591796875, -1.039794921875, -0.935333251953125, -0.83087158203125, -0.726409912109375, -0.6219482421875, -0.517486572265625, -0.41302490234375, -0.308563232421875, -0.2041015625, -0.099639892578125, 0.00482177734375, 0.109283447265625, 0.2137451171875, 0.318206787109375, 0.42266845703125, 0.527130126953125, 0.631591796875, 0.736053466796875, 0.84051513671875, 0.944976806640625, 1.0494384765625, 1.153900146484375, 1.25836181640625, 1.362823486328125, 1.46728515625, 1.571746826171875, 1.67620849609375, 1.780670166015625, 1.8851318359375, 1.989593505859375, 2.09405517578125, 2.198516845703125, 2.302978515625, 2.407440185546875, 2.51190185546875, 2.616363525390625, 2.7208251953125, 2.825286865234375, 2.92974853515625, 3.034210205078125, 3.138671875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 13.0, 5.0, 15.0, 20.0, 38.0, 50.0, 83.0, 120.0, 204.0, 279.0, 458.0, 689.0, 1109.0, 1859.0, 3049.0, 4974.0, 8279.0, 14246.0, 24046.0, 40489.0, 66289.0, 103157.0, 144125.0, 167947.0, 154708.0, 116696.0, 77523.0, 47560.0, 28645.0, 16925.0, 9933.0, 5881.0, 3519.0, 2111.0, 1305.0, 828.0, 494.0, 331.0, 188.0, 133.0, 83.0, 56.0, 38.0, 33.0, 13.0, 7.0, 6.0, 6.0, 3.0, 1.0, 2.0], "bins": [-2.98046875, -2.899169921875, -2.81787109375, -2.736572265625, -2.6552734375, -2.573974609375, -2.49267578125, -2.411376953125, -2.330078125, -2.248779296875, -2.16748046875, -2.086181640625, -2.0048828125, -1.923583984375, -1.84228515625, -1.760986328125, -1.6796875, -1.598388671875, -1.51708984375, -1.435791015625, -1.3544921875, -1.273193359375, -1.19189453125, -1.110595703125, -1.029296875, -0.947998046875, -0.86669921875, -0.785400390625, -0.7041015625, -0.622802734375, -0.54150390625, -0.460205078125, -0.37890625, -0.297607421875, -0.21630859375, -0.135009765625, -0.0537109375, 0.027587890625, 0.10888671875, 0.190185546875, 0.271484375, 0.352783203125, 0.43408203125, 0.515380859375, 0.5966796875, 0.677978515625, 0.75927734375, 0.840576171875, 0.921875, 1.003173828125, 1.08447265625, 1.165771484375, 1.2470703125, 1.328369140625, 1.40966796875, 1.490966796875, 1.572265625, 1.653564453125, 1.73486328125, 1.816162109375, 1.8974609375, 1.978759765625, 2.06005859375, 2.141357421875, 2.22265625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 2.0, 7.0, 9.0, 16.0, 14.0, 8.0, 18.0, 24.0, 28.0, 42.0, 32.0, 35.0, 52.0, 62.0, 50.0, 61.0, 56.0, 53.0, 58.0, 57.0, 55.0, 36.0, 40.0, 26.0, 35.0, 21.0, 20.0, 16.0, 12.0, 8.0, 8.0, 6.0, 5.0, 7.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00025463104248046875, -0.00024595484137535095, -0.00023727864027023315, -0.00022860243916511536, -0.00021992623805999756, -0.00021125003695487976, -0.00020257383584976196, -0.00019389763474464417, -0.00018522143363952637, -0.00017654523253440857, -0.00016786903142929077, -0.00015919283032417297, -0.00015051662921905518, -0.00014184042811393738, -0.00013316422700881958, -0.00012448802590370178, -0.00011581182479858398, -0.00010713562369346619, -9.845942258834839e-05, -8.978322148323059e-05, -8.110702037811279e-05, -7.2430819272995e-05, -6.37546181678772e-05, -5.50784170627594e-05, -4.64022159576416e-05, -3.7726014852523804e-05, -2.9049813747406006e-05, -2.0373612642288208e-05, -1.169741153717041e-05, -3.0212104320526123e-06, 5.6549906730651855e-06, 1.4331191778182983e-05, 2.300739288330078e-05, 3.168359398841858e-05, 4.035979509353638e-05, 4.9035996198654175e-05, 5.771219730377197e-05, 6.638839840888977e-05, 7.506459951400757e-05, 8.374080061912537e-05, 9.241700172424316e-05, 0.00010109320282936096, 0.00010976940393447876, 0.00011844560503959656, 0.00012712180614471436, 0.00013579800724983215, 0.00014447420835494995, 0.00015315040946006775, 0.00016182661056518555, 0.00017050281167030334, 0.00017917901277542114, 0.00018785521388053894, 0.00019653141498565674, 0.00020520761609077454, 0.00021388381719589233, 0.00022256001830101013, 0.00023123621940612793, 0.00023991242051124573, 0.0002485886216163635, 0.0002572648227214813, 0.0002659410238265991, 0.0002746172249317169, 0.0002832934260368347, 0.0002919696271419525, 0.0003006458282470703]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 8.0, 13.0, 15.0, 21.0, 37.0, 44.0, 67.0, 85.0, 129.0, 211.0, 305.0, 458.0, 734.0, 1002.0, 1626.0, 2447.0, 3831.0, 5974.0, 9619.0, 14687.0, 23432.0, 36353.0, 56283.0, 83807.0, 115182.0, 141511.0, 145498.0, 126369.0, 94989.0, 65391.0, 42784.0, 27299.0, 17497.0, 11059.0, 7032.0, 4435.0, 2915.0, 1864.0, 1165.0, 823.0, 495.0, 331.0, 234.0, 163.0, 109.0, 72.0, 42.0, 39.0, 22.0, 15.0, 12.0, 6.0, 5.0, 7.0, 3.0, 4.0, 1.0, 2.0], "bins": [-2.3046875, -2.233062744140625, -2.16143798828125, -2.089813232421875, -2.0181884765625, -1.946563720703125, -1.87493896484375, -1.803314208984375, -1.731689453125, -1.660064697265625, -1.58843994140625, -1.516815185546875, -1.4451904296875, -1.373565673828125, -1.30194091796875, -1.230316162109375, -1.15869140625, -1.087066650390625, -1.01544189453125, -0.943817138671875, -0.8721923828125, -0.800567626953125, -0.72894287109375, -0.657318115234375, -0.585693359375, -0.514068603515625, -0.44244384765625, -0.370819091796875, -0.2991943359375, -0.227569580078125, -0.15594482421875, -0.084320068359375, -0.0126953125, 0.058929443359375, 0.13055419921875, 0.202178955078125, 0.2738037109375, 0.345428466796875, 0.41705322265625, 0.488677978515625, 0.560302734375, 0.631927490234375, 0.70355224609375, 0.775177001953125, 0.8468017578125, 0.918426513671875, 0.99005126953125, 1.061676025390625, 1.13330078125, 1.204925537109375, 1.27655029296875, 1.348175048828125, 1.4197998046875, 1.491424560546875, 1.56304931640625, 1.634674072265625, 1.706298828125, 1.777923583984375, 1.84954833984375, 1.921173095703125, 1.9927978515625, 2.064422607421875, 2.13604736328125, 2.207672119140625, 2.279296875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 8.0, 3.0, 3.0, 9.0, 5.0, 4.0, 11.0, 13.0, 16.0, 7.0, 23.0, 32.0, 25.0, 34.0, 32.0, 39.0, 49.0, 41.0, 47.0, 55.0, 36.0, 40.0, 47.0, 50.0, 51.0, 49.0, 38.0, 29.0, 35.0, 30.0, 21.0, 28.0, 17.0, 12.0, 11.0, 11.0, 12.0, 8.0, 5.0, 3.0, 5.0, 3.0, 8.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.63720703125, -0.615447998046875, -0.59368896484375, -0.571929931640625, -0.5501708984375, -0.528411865234375, -0.50665283203125, -0.484893798828125, -0.463134765625, -0.441375732421875, -0.41961669921875, -0.397857666015625, -0.3760986328125, -0.354339599609375, -0.33258056640625, -0.310821533203125, -0.2890625, -0.267303466796875, -0.24554443359375, -0.223785400390625, -0.2020263671875, -0.180267333984375, -0.15850830078125, -0.136749267578125, -0.114990234375, -0.093231201171875, -0.07147216796875, -0.049713134765625, -0.0279541015625, -0.006195068359375, 0.01556396484375, 0.037322998046875, 0.05908203125, 0.080841064453125, 0.10260009765625, 0.124359130859375, 0.1461181640625, 0.167877197265625, 0.18963623046875, 0.211395263671875, 0.233154296875, 0.254913330078125, 0.27667236328125, 0.298431396484375, 0.3201904296875, 0.341949462890625, 0.36370849609375, 0.385467529296875, 0.4072265625, 0.428985595703125, 0.45074462890625, 0.472503662109375, 0.4942626953125, 0.516021728515625, 0.53778076171875, 0.559539794921875, 0.581298828125, 0.603057861328125, 0.62481689453125, 0.646575927734375, 0.6683349609375, 0.690093994140625, 0.71185302734375, 0.733612060546875, 0.75537109375]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 7.0, 9.0, 10.0, 9.0, 4.0, 18.0, 14.0, 31.0, 32.0, 34.0, 37.0, 47.0, 60.0, 64.0, 53.0, 75.0, 63.0, 47.0, 58.0, 48.0, 49.0, 35.0, 38.0, 33.0, 17.0, 14.0, 23.0, 10.0, 7.0, 7.0, 12.0, 6.0, 3.0, 3.0, 6.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.54723072052002, -8.286473274230957, -8.025716781616211, -7.764959335327148, -7.504201889038086, -7.243444442749023, -6.982687473297119, -6.721930503845215, -6.461173057556152, -6.20041561126709, -5.9396586418151855, -5.678901672363281, -5.418144226074219, -5.157386779785156, -4.896629810333252, -4.635872840881348, -4.375115394592285, -4.114357948303223, -3.8536009788513184, -3.592843770980835, -3.3320865631103516, -3.071329355239868, -2.8105721473693848, -2.5498149394989014, -2.289057731628418, -2.0283005237579346, -1.7675433158874512, -1.5067861080169678, -1.2460289001464844, -0.985271692276001, -0.7245144844055176, -0.4637572765350342, -0.20299911499023438, 0.05775809288024902, 0.3185153007507324, 0.5792725086212158, 0.8400297164916992, 1.1007869243621826, 1.361544132232666, 1.6223013401031494, 1.8830585479736328, 2.143815755844116, 2.4045729637145996, 2.665330171585083, 2.9260873794555664, 3.18684458732605, 3.447601795196533, 3.7083590030670166, 3.9691162109375, 4.2298736572265625, 4.490630626678467, 4.751387596130371, 5.012145042419434, 5.272902488708496, 5.5336594581604, 5.794416427612305, 6.055173873901367, 6.31593132019043, 6.576688289642334, 6.837445259094238, 7.098202705383301, 7.358960151672363, 7.619717121124268, 7.880474090576172, 8.141231536865234]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 6.0, 4.0, 3.0, 3.0, 5.0, 13.0, 10.0, 4.0, 13.0, 20.0, 8.0, 19.0, 28.0, 33.0, 29.0, 27.0, 38.0, 23.0, 41.0, 34.0, 33.0, 42.0, 43.0, 36.0, 41.0, 29.0, 39.0, 33.0, 47.0, 32.0, 37.0, 32.0, 20.0, 20.0, 25.0, 34.0, 17.0, 15.0, 15.0, 6.0, 15.0, 11.0, 6.0, 6.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.270878791809082, -5.108799934387207, -4.946721076965332, -4.784642696380615, -4.62256383895874, -4.460484981536865, -4.29840612411499, -4.136327266693115, -3.9742486476898193, -3.8121697902679443, -3.6500911712646484, -3.4880123138427734, -3.3259334564208984, -3.1638548374176025, -3.0017759799957275, -2.8396973609924316, -2.6776185035705566, -2.5155396461486816, -2.3534610271453857, -2.1913821697235107, -2.029303550720215, -1.8672246932983398, -1.7051458358764648, -1.5430670976638794, -1.380988359451294, -1.2189096212387085, -1.056830883026123, -0.894752025604248, -0.7326732873916626, -0.5705945491790771, -0.4085157513618469, -0.2464369535446167, -0.08435773849487305, 0.07772102952003479, 0.23979979753494263, 0.40187856554985046, 0.5639573335647583, 0.7260360717773438, 0.888114869594574, 1.0501936674118042, 1.2122724056243896, 1.374351143836975, 1.5364298820495605, 1.6985087394714355, 1.860587477684021, 2.0226662158966064, 2.1847450733184814, 2.3468236923217773, 2.5089025497436523, 2.6709814071655273, 2.8330600261688232, 2.9951388835906982, 3.157217502593994, 3.319296360015869, 3.481375217437744, 3.643454074859619, 3.805532693862915, 3.96761155128479, 4.129690170288086, 4.291769027709961, 4.453847885131836, 4.615926742553711, 4.778005123138428, 4.940083980560303, 5.102162837982178]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 5.0, 7.0, 8.0, 11.0, 13.0, 34.0, 47.0, 66.0, 117.0, 163.0, 278.0, 393.0, 670.0, 1072.0, 1888.0, 3306.0, 5885.0, 10399.0, 20285.0, 41019.0, 90970.0, 218605.0, 553826.0, 1147926.0, 1151243.0, 556718.0, 216571.0, 88194.0, 40015.0, 19913.0, 10384.0, 5698.0, 3407.0, 1891.0, 1208.0, 756.0, 442.0, 302.0, 185.0, 123.0, 83.0, 59.0, 35.0, 25.0, 12.0, 11.0, 5.0, 4.0, 3.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.03125, -9.7177734375, -9.404296875, -9.0908203125, -8.77734375, -8.4638671875, -8.150390625, -7.8369140625, -7.5234375, -7.2099609375, -6.896484375, -6.5830078125, -6.26953125, -5.9560546875, -5.642578125, -5.3291015625, -5.015625, -4.7021484375, -4.388671875, -4.0751953125, -3.76171875, -3.4482421875, -3.134765625, -2.8212890625, -2.5078125, -2.1943359375, -1.880859375, -1.5673828125, -1.25390625, -0.9404296875, -0.626953125, -0.3134765625, 0.0, 0.3134765625, 0.626953125, 0.9404296875, 1.25390625, 1.5673828125, 1.880859375, 2.1943359375, 2.5078125, 2.8212890625, 3.134765625, 3.4482421875, 3.76171875, 4.0751953125, 4.388671875, 4.7021484375, 5.015625, 5.3291015625, 5.642578125, 5.9560546875, 6.26953125, 6.5830078125, 6.896484375, 7.2099609375, 7.5234375, 7.8369140625, 8.150390625, 8.4638671875, 8.77734375, 9.0908203125, 9.404296875, 9.7177734375, 10.03125]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 5.0, 5.0, 8.0, 10.0, 11.0, 18.0, 15.0, 18.0, 21.0, 25.0, 31.0, 26.0, 34.0, 32.0, 29.0, 42.0, 39.0, 33.0, 39.0, 41.0, 34.0, 35.0, 46.0, 34.0, 43.0, 27.0, 33.0, 36.0, 24.0, 29.0, 25.0, 21.0, 14.0, 21.0, 19.0, 15.0, 8.0, 11.0, 12.0, 7.0, 8.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.33984375, -4.208984375, -4.078125, -3.947265625, -3.81640625, -3.685546875, -3.5546875, -3.423828125, -3.29296875, -3.162109375, -3.03125, -2.900390625, -2.76953125, -2.638671875, -2.5078125, -2.376953125, -2.24609375, -2.115234375, -1.984375, -1.853515625, -1.72265625, -1.591796875, -1.4609375, -1.330078125, -1.19921875, -1.068359375, -0.9375, -0.806640625, -0.67578125, -0.544921875, -0.4140625, -0.283203125, -0.15234375, -0.021484375, 0.109375, 0.240234375, 0.37109375, 0.501953125, 0.6328125, 0.763671875, 0.89453125, 1.025390625, 1.15625, 1.287109375, 1.41796875, 1.548828125, 1.6796875, 1.810546875, 1.94140625, 2.072265625, 2.203125, 2.333984375, 2.46484375, 2.595703125, 2.7265625, 2.857421875, 2.98828125, 3.119140625, 3.25, 3.380859375, 3.51171875, 3.642578125, 3.7734375, 3.904296875, 4.03515625]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 3.0, 5.0, 6.0, 10.0, 7.0, 15.0, 33.0, 49.0, 66.0, 113.0, 133.0, 203.0, 327.0, 499.0, 700.0, 1098.0, 1592.0, 2490.0, 3782.0, 6051.0, 9608.0, 15788.0, 25943.0, 43763.0, 75909.0, 136455.0, 251503.0, 458018.0, 747012.0, 881119.0, 663363.0, 383922.0, 209589.0, 114571.0, 64441.0, 36977.0, 22079.0, 13452.0, 8188.0, 5282.0, 3443.0, 2202.0, 1489.0, 937.0, 650.0, 485.0, 284.0, 225.0, 141.0, 91.0, 67.0, 29.0, 37.0, 19.0, 11.0, 11.0, 2.0, 4.0, 3.0, 0.0, 2.0], "bins": [-8.0859375, -7.83599853515625, -7.5860595703125, -7.33612060546875, -7.086181640625, -6.83624267578125, -6.5863037109375, -6.33636474609375, -6.08642578125, -5.83648681640625, -5.5865478515625, -5.33660888671875, -5.086669921875, -4.83673095703125, -4.5867919921875, -4.33685302734375, -4.0869140625, -3.83697509765625, -3.5870361328125, -3.33709716796875, -3.087158203125, -2.83721923828125, -2.5872802734375, -2.33734130859375, -2.08740234375, -1.83746337890625, -1.5875244140625, -1.33758544921875, -1.087646484375, -0.83770751953125, -0.5877685546875, -0.33782958984375, -0.087890625, 0.16204833984375, 0.4119873046875, 0.66192626953125, 0.911865234375, 1.16180419921875, 1.4117431640625, 1.66168212890625, 1.91162109375, 2.16156005859375, 2.4114990234375, 2.66143798828125, 2.911376953125, 3.16131591796875, 3.4112548828125, 3.66119384765625, 3.9111328125, 4.16107177734375, 4.4110107421875, 4.66094970703125, 4.910888671875, 5.16082763671875, 5.4107666015625, 5.66070556640625, 5.91064453125, 6.16058349609375, 6.4105224609375, 6.66046142578125, 6.910400390625, 7.16033935546875, 7.4102783203125, 7.66021728515625, 7.91015625]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 8.0, 5.0, 8.0, 9.0, 10.0, 21.0, 19.0, 24.0, 25.0, 31.0, 54.0, 61.0, 62.0, 89.0, 104.0, 142.0, 180.0, 216.0, 221.0, 256.0, 296.0, 288.0, 306.0, 259.0, 274.0, 199.0, 182.0, 159.0, 122.0, 98.0, 72.0, 67.0, 49.0, 39.0, 24.0, 25.0, 14.0, 19.0, 11.0, 5.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.04296875, -2.954254150390625, -2.86553955078125, -2.776824951171875, -2.6881103515625, -2.599395751953125, -2.51068115234375, -2.421966552734375, -2.333251953125, -2.244537353515625, -2.15582275390625, -2.067108154296875, -1.9783935546875, -1.889678955078125, -1.80096435546875, -1.712249755859375, -1.62353515625, -1.534820556640625, -1.44610595703125, -1.357391357421875, -1.2686767578125, -1.179962158203125, -1.09124755859375, -1.002532958984375, -0.913818359375, -0.825103759765625, -0.73638916015625, -0.647674560546875, -0.5589599609375, -0.470245361328125, -0.38153076171875, -0.292816162109375, -0.2041015625, -0.115386962890625, -0.02667236328125, 0.062042236328125, 0.1507568359375, 0.239471435546875, 0.32818603515625, 0.416900634765625, 0.505615234375, 0.594329833984375, 0.68304443359375, 0.771759033203125, 0.8604736328125, 0.949188232421875, 1.03790283203125, 1.126617431640625, 1.21533203125, 1.304046630859375, 1.39276123046875, 1.481475830078125, 1.5701904296875, 1.658905029296875, 1.74761962890625, 1.836334228515625, 1.925048828125, 2.013763427734375, 2.10247802734375, 2.191192626953125, 2.2799072265625, 2.368621826171875, 2.45733642578125, 2.546051025390625, 2.634765625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 5.0, 3.0, 10.0, 4.0, 15.0, 14.0, 17.0, 29.0, 17.0, 31.0, 41.0, 39.0, 76.0, 62.0, 75.0, 70.0, 74.0, 64.0, 57.0, 42.0, 57.0, 50.0, 28.0, 28.0, 14.0, 23.0, 11.0, 11.0, 9.0, 3.0, 9.0, 5.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.641690254211426, -11.29724407196045, -10.952796936035156, -10.60835075378418, -10.263903617858887, -9.91945743560791, -9.575010299682617, -9.23056411743164, -8.886117935180664, -8.541671752929688, -8.197224617004395, -7.852778434753418, -7.508331298828125, -7.163885116577148, -6.819438457489014, -6.474991798400879, -6.130544662475586, -5.786098003387451, -5.441651344299316, -5.09720516204834, -4.752758026123047, -4.40831184387207, -4.0638651847839355, -3.719418525695801, -3.374971866607666, -3.0305252075195312, -2.6860785484313965, -2.341632127761841, -1.997185468673706, -1.6527388095855713, -1.3082923889160156, -0.9638457298278809, -0.6193981170654297, -0.2749515175819397, 0.06949508190155029, 0.4139416217803955, 0.7583882808685303, 1.102834939956665, 1.4472813606262207, 1.7917280197143555, 2.1361746788024902, 2.480621337890625, 2.8250679969787598, 3.1695144176483154, 3.51396107673645, 3.858407735824585, 4.202854156494141, 4.547300815582275, 4.89174747467041, 5.236194133758545, 5.58064079284668, 5.925086975097656, 6.269534111022949, 6.613980293273926, 6.9584269523620605, 7.302873611450195, 7.64732027053833, 7.991766929626465, 8.336213111877441, 8.680660247802734, 9.025106430053711, 9.369553565979004, 9.71399974822998, 10.058446884155273, 10.40289306640625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 6.0, 10.0, 12.0, 15.0, 10.0, 14.0, 18.0, 14.0, 29.0, 24.0, 29.0, 25.0, 31.0, 31.0, 39.0, 35.0, 37.0, 49.0, 47.0, 45.0, 35.0, 40.0, 30.0, 34.0, 36.0, 31.0, 40.0, 40.0, 29.0, 20.0, 20.0, 25.0, 20.0, 9.0, 14.0, 12.0, 13.0, 9.0, 4.0, 6.0, 2.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.996007442474365, -5.813138484954834, -5.630269527435303, -5.447400093078613, -5.264531135559082, -5.081662178039551, -4.8987932205200195, -4.715924263000488, -4.533055305480957, -4.350186347961426, -4.1673173904418945, -3.984448194503784, -3.801579236984253, -3.6187100410461426, -3.4358410835266113, -3.25297212600708, -3.0701029300689697, -2.8872339725494385, -2.704364776611328, -2.521495819091797, -2.3386268615722656, -2.1557579040527344, -1.972888708114624, -1.7900197505950928, -1.607150673866272, -1.4242815971374512, -1.24141263961792, -1.0585435628890991, -0.8756745457649231, -0.6928055286407471, -0.5099364519119263, -0.327067494392395, -0.14419841766357422, 0.038670614361763, 0.22153964638710022, 0.40440869331359863, 0.5872777104377747, 0.7701467275619507, 0.9530158042907715, 1.1358847618103027, 1.3187538385391235, 1.5016229152679443, 1.6844918727874756, 1.8673609495162964, 2.050230026245117, 2.2330989837646484, 2.4159679412841797, 2.598836898803711, 2.7817060947418213, 2.9645750522613525, 3.147444248199463, 3.330313205718994, 3.5131821632385254, 3.6960511207580566, 3.878920316696167, 4.061789512634277, 4.244658470153809, 4.42752742767334, 4.610396385192871, 4.793265342712402, 4.976134777069092, 5.159003734588623, 5.341872692108154, 5.5247416496276855, 5.707610607147217]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 7.0, 8.0, 29.0, 16.0, 28.0, 59.0, 81.0, 132.0, 215.0, 283.0, 453.0, 687.0, 1127.0, 1780.0, 2699.0, 4572.0, 7536.0, 12563.0, 21458.0, 35885.0, 59743.0, 96527.0, 141020.0, 172421.0, 163778.0, 123172.0, 80934.0, 48651.0, 28903.0, 17122.0, 10405.0, 6106.0, 3736.0, 2368.0, 1418.0, 934.0, 561.0, 376.0, 267.0, 154.0, 105.0, 81.0, 56.0, 29.0, 28.0, 15.0, 6.0, 8.0, 4.0, 7.0, 5.0, 0.0, 2.0, 1.0], "bins": [-4.65625, -4.51849365234375, -4.3807373046875, -4.24298095703125, -4.105224609375, -3.96746826171875, -3.8297119140625, -3.69195556640625, -3.55419921875, -3.41644287109375, -3.2786865234375, -3.14093017578125, -3.003173828125, -2.86541748046875, -2.7276611328125, -2.58990478515625, -2.4521484375, -2.31439208984375, -2.1766357421875, -2.03887939453125, -1.901123046875, -1.76336669921875, -1.6256103515625, -1.48785400390625, -1.35009765625, -1.21234130859375, -1.0745849609375, -0.93682861328125, -0.799072265625, -0.66131591796875, -0.5235595703125, -0.38580322265625, -0.248046875, -0.11029052734375, 0.0274658203125, 0.16522216796875, 0.302978515625, 0.44073486328125, 0.5784912109375, 0.71624755859375, 0.85400390625, 0.99176025390625, 1.1295166015625, 1.26727294921875, 1.405029296875, 1.54278564453125, 1.6805419921875, 1.81829833984375, 1.9560546875, 2.09381103515625, 2.2315673828125, 2.36932373046875, 2.507080078125, 2.64483642578125, 2.7825927734375, 2.92034912109375, 3.05810546875, 3.19586181640625, 3.3336181640625, 3.47137451171875, 3.609130859375, 3.74688720703125, 3.8846435546875, 4.02239990234375, 4.16015625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 9.0, 10.0, 11.0, 11.0, 13.0, 18.0, 15.0, 17.0, 22.0, 16.0, 17.0, 21.0, 24.0, 23.0, 19.0, 39.0, 42.0, 41.0, 43.0, 40.0, 42.0, 32.0, 27.0, 35.0, 32.0, 34.0, 31.0, 30.0, 36.0, 30.0, 29.0, 18.0, 28.0, 21.0, 10.0, 18.0, 12.0, 10.0, 18.0, 9.0, 6.0, 9.0, 7.0, 9.0, 3.0, 3.0, 1.0, 2.0, 3.0, 6.0, 1.0], "bins": [-5.9453125, -5.7720947265625, -5.598876953125, -5.4256591796875, -5.25244140625, -5.0792236328125, -4.906005859375, -4.7327880859375, -4.5595703125, -4.3863525390625, -4.213134765625, -4.0399169921875, -3.86669921875, -3.6934814453125, -3.520263671875, -3.3470458984375, -3.173828125, -3.0006103515625, -2.827392578125, -2.6541748046875, -2.48095703125, -2.3077392578125, -2.134521484375, -1.9613037109375, -1.7880859375, -1.6148681640625, -1.441650390625, -1.2684326171875, -1.09521484375, -0.9219970703125, -0.748779296875, -0.5755615234375, -0.40234375, -0.2291259765625, -0.055908203125, 0.1173095703125, 0.29052734375, 0.4637451171875, 0.636962890625, 0.8101806640625, 0.9833984375, 1.1566162109375, 1.329833984375, 1.5030517578125, 1.67626953125, 1.8494873046875, 2.022705078125, 2.1959228515625, 2.369140625, 2.5423583984375, 2.715576171875, 2.8887939453125, 3.06201171875, 3.2352294921875, 3.408447265625, 3.5816650390625, 3.7548828125, 3.9281005859375, 4.101318359375, 4.2745361328125, 4.44775390625, 4.6209716796875, 4.794189453125, 4.9674072265625, 5.140625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 6.0, 10.0, 14.0, 9.0, 21.0, 29.0, 27.0, 43.0, 68.0, 95.0, 136.0, 233.0, 369.0, 516.0, 905.0, 1526.0, 2657.0, 4736.0, 9143.0, 18226.0, 37078.0, 77481.0, 155263.0, 251213.0, 231105.0, 130367.0, 64044.0, 30582.0, 15010.0, 7715.0, 4041.0, 2309.0, 1273.0, 804.0, 503.0, 308.0, 204.0, 159.0, 113.0, 57.0, 44.0, 27.0, 24.0, 18.0, 16.0, 9.0, 6.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.57421875, -7.3505859375, -7.126953125, -6.9033203125, -6.6796875, -6.4560546875, -6.232421875, -6.0087890625, -5.78515625, -5.5615234375, -5.337890625, -5.1142578125, -4.890625, -4.6669921875, -4.443359375, -4.2197265625, -3.99609375, -3.7724609375, -3.548828125, -3.3251953125, -3.1015625, -2.8779296875, -2.654296875, -2.4306640625, -2.20703125, -1.9833984375, -1.759765625, -1.5361328125, -1.3125, -1.0888671875, -0.865234375, -0.6416015625, -0.41796875, -0.1943359375, 0.029296875, 0.2529296875, 0.4765625, 0.7001953125, 0.923828125, 1.1474609375, 1.37109375, 1.5947265625, 1.818359375, 2.0419921875, 2.265625, 2.4892578125, 2.712890625, 2.9365234375, 3.16015625, 3.3837890625, 3.607421875, 3.8310546875, 4.0546875, 4.2783203125, 4.501953125, 4.7255859375, 4.94921875, 5.1728515625, 5.396484375, 5.6201171875, 5.84375, 6.0673828125, 6.291015625, 6.5146484375, 6.73828125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 2.0, 5.0, 12.0, 5.0, 11.0, 16.0, 15.0, 13.0, 21.0, 25.0, 24.0, 35.0, 18.0, 23.0, 39.0, 30.0, 33.0, 34.0, 28.0, 36.0, 40.0, 39.0, 45.0, 32.0, 42.0, 36.0, 32.0, 29.0, 27.0, 19.0, 30.0, 34.0, 26.0, 19.0, 20.0, 19.0, 24.0, 12.0, 9.0, 10.0, 4.0, 7.0, 5.0, 5.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.16796875, -3.063690185546875, -2.95941162109375, -2.855133056640625, -2.7508544921875, -2.646575927734375, -2.54229736328125, -2.438018798828125, -2.333740234375, -2.229461669921875, -2.12518310546875, -2.020904541015625, -1.9166259765625, -1.812347412109375, -1.70806884765625, -1.603790283203125, -1.49951171875, -1.395233154296875, -1.29095458984375, -1.186676025390625, -1.0823974609375, -0.978118896484375, -0.87384033203125, -0.769561767578125, -0.665283203125, -0.561004638671875, -0.45672607421875, -0.352447509765625, -0.2481689453125, -0.143890380859375, -0.03961181640625, 0.064666748046875, 0.1689453125, 0.273223876953125, 0.37750244140625, 0.481781005859375, 0.5860595703125, 0.690338134765625, 0.79461669921875, 0.898895263671875, 1.003173828125, 1.107452392578125, 1.21173095703125, 1.316009521484375, 1.4202880859375, 1.524566650390625, 1.62884521484375, 1.733123779296875, 1.83740234375, 1.941680908203125, 2.04595947265625, 2.150238037109375, 2.2545166015625, 2.358795166015625, 2.46307373046875, 2.567352294921875, 2.671630859375, 2.775909423828125, 2.88018798828125, 2.984466552734375, 3.0887451171875, 3.193023681640625, 3.29730224609375, 3.401580810546875, 3.505859375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 3.0, 12.0, 11.0, 10.0, 28.0, 38.0, 51.0, 76.0, 101.0, 165.0, 297.0, 477.0, 770.0, 1237.0, 2091.0, 3840.0, 7309.0, 14701.0, 30860.0, 69290.0, 160030.0, 300929.0, 246790.0, 113532.0, 49501.0, 22575.0, 10852.0, 5555.0, 3103.0, 1708.0, 991.0, 580.0, 365.0, 218.0, 172.0, 87.0, 70.0, 42.0, 22.0, 23.0, 18.0, 9.0, 3.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.51171875, -4.3741455078125, -4.236572265625, -4.0989990234375, -3.96142578125, -3.8238525390625, -3.686279296875, -3.5487060546875, -3.4111328125, -3.2735595703125, -3.135986328125, -2.9984130859375, -2.86083984375, -2.7232666015625, -2.585693359375, -2.4481201171875, -2.310546875, -2.1729736328125, -2.035400390625, -1.8978271484375, -1.76025390625, -1.6226806640625, -1.485107421875, -1.3475341796875, -1.2099609375, -1.0723876953125, -0.934814453125, -0.7972412109375, -0.65966796875, -0.5220947265625, -0.384521484375, -0.2469482421875, -0.109375, 0.0281982421875, 0.165771484375, 0.3033447265625, 0.44091796875, 0.5784912109375, 0.716064453125, 0.8536376953125, 0.9912109375, 1.1287841796875, 1.266357421875, 1.4039306640625, 1.54150390625, 1.6790771484375, 1.816650390625, 1.9542236328125, 2.091796875, 2.2293701171875, 2.366943359375, 2.5045166015625, 2.64208984375, 2.7796630859375, 2.917236328125, 3.0548095703125, 3.1923828125, 3.3299560546875, 3.467529296875, 3.6051025390625, 3.74267578125, 3.8802490234375, 4.017822265625, 4.1553955078125, 4.29296875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 4.0, 6.0, 3.0, 12.0, 15.0, 34.0, 35.0, 61.0, 73.0, 104.0, 99.0, 129.0, 108.0, 76.0, 74.0, 47.0, 40.0, 29.0, 20.0, 11.0, 6.0, 11.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023627281188964844, -0.0002266019582748413, -0.00021693110466003418, -0.00020726025104522705, -0.00019758939743041992, -0.0001879185438156128, -0.00017824769020080566, -0.00016857683658599854, -0.0001589059829711914, -0.00014923512935638428, -0.00013956427574157715, -0.00012989342212677002, -0.00012022256851196289, -0.00011055171489715576, -0.00010088086128234863, -9.12100076675415e-05, -8.153915405273438e-05, -7.186830043792725e-05, -6.219744682312012e-05, -5.252659320831299e-05, -4.285573959350586e-05, -3.318488597869873e-05, -2.35140323638916e-05, -1.3843178749084473e-05, -4.172325134277344e-06, 5.498528480529785e-06, 1.5169382095336914e-05, 2.4840235710144043e-05, 3.451108932495117e-05, 4.41819429397583e-05, 5.385279655456543e-05, 6.352365016937256e-05, 7.319450378417969e-05, 8.286535739898682e-05, 9.253621101379395e-05, 0.00010220706462860107, 0.0001118779182434082, 0.00012154877185821533, 0.00013121962547302246, 0.0001408904790878296, 0.00015056133270263672, 0.00016023218631744385, 0.00016990303993225098, 0.0001795738935470581, 0.00018924474716186523, 0.00019891560077667236, 0.0002085864543914795, 0.00021825730800628662, 0.00022792816162109375, 0.00023759901523590088, 0.000247269868850708, 0.00025694072246551514, 0.00026661157608032227, 0.0002762824296951294, 0.0002859532833099365, 0.00029562413692474365, 0.0003052949905395508, 0.0003149658441543579, 0.00032463669776916504, 0.00033430755138397217, 0.0003439784049987793, 0.0003536492586135864, 0.00036332011222839355, 0.0003729909658432007, 0.0003826618194580078]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 7.0, 9.0, 11.0, 13.0, 27.0, 39.0, 56.0, 68.0, 107.0, 145.0, 232.0, 323.0, 571.0, 976.0, 1572.0, 2621.0, 4733.0, 8641.0, 16461.0, 31093.0, 61286.0, 117472.0, 195105.0, 230628.0, 172535.0, 97414.0, 50344.0, 25480.0, 13263.0, 7278.0, 4134.0, 2350.0, 1395.0, 761.0, 470.0, 320.0, 177.0, 121.0, 87.0, 74.0, 45.0, 26.0, 28.0, 21.0, 9.0, 10.0, 7.0, 3.0, 0.0, 6.0, 1.0, 1.0, 3.0], "bins": [-4.09375, -3.974578857421875, -3.85540771484375, -3.736236572265625, -3.6170654296875, -3.497894287109375, -3.37872314453125, -3.259552001953125, -3.140380859375, -3.021209716796875, -2.90203857421875, -2.782867431640625, -2.6636962890625, -2.544525146484375, -2.42535400390625, -2.306182861328125, -2.18701171875, -2.067840576171875, -1.94866943359375, -1.829498291015625, -1.7103271484375, -1.591156005859375, -1.47198486328125, -1.352813720703125, -1.233642578125, -1.114471435546875, -0.99530029296875, -0.876129150390625, -0.7569580078125, -0.637786865234375, -0.51861572265625, -0.399444580078125, -0.2802734375, -0.161102294921875, -0.04193115234375, 0.077239990234375, 0.1964111328125, 0.315582275390625, 0.43475341796875, 0.553924560546875, 0.673095703125, 0.792266845703125, 0.91143798828125, 1.030609130859375, 1.1497802734375, 1.268951416015625, 1.38812255859375, 1.507293701171875, 1.62646484375, 1.745635986328125, 1.86480712890625, 1.983978271484375, 2.1031494140625, 2.222320556640625, 2.34149169921875, 2.460662841796875, 2.579833984375, 2.699005126953125, 2.81817626953125, 2.937347412109375, 3.0565185546875, 3.175689697265625, 3.29486083984375, 3.414031982421875, 3.533203125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 7.0, 8.0, 6.0, 6.0, 20.0, 14.0, 19.0, 16.0, 32.0, 30.0, 31.0, 48.0, 57.0, 57.0, 53.0, 75.0, 66.0, 57.0, 63.0, 58.0, 52.0, 46.0, 37.0, 30.0, 20.0, 19.0, 13.0, 19.0, 12.0, 8.0, 9.0, 4.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-1.1826171875, -1.1511459350585938, -1.1196746826171875, -1.0882034301757812, -1.056732177734375, -1.0252609252929688, -0.9937896728515625, -0.9623184204101562, -0.93084716796875, -0.8993759155273438, -0.8679046630859375, -0.8364334106445312, -0.804962158203125, -0.7734909057617188, -0.7420196533203125, -0.7105484008789062, -0.6790771484375, -0.6476058959960938, -0.6161346435546875, -0.5846633911132812, -0.553192138671875, -0.5217208862304688, -0.4902496337890625, -0.45877838134765625, -0.42730712890625, -0.39583587646484375, -0.3643646240234375, -0.33289337158203125, -0.301422119140625, -0.26995086669921875, -0.2384796142578125, -0.20700836181640625, -0.175537109375, -0.14406585693359375, -0.1125946044921875, -0.08112335205078125, -0.049652099609375, -0.01818084716796875, 0.0132904052734375, 0.04476165771484375, 0.07623291015625, 0.10770416259765625, 0.1391754150390625, 0.17064666748046875, 0.202117919921875, 0.23358917236328125, 0.2650604248046875, 0.29653167724609375, 0.3280029296875, 0.35947418212890625, 0.3909454345703125, 0.42241668701171875, 0.453887939453125, 0.48535919189453125, 0.5168304443359375, 0.5483016967773438, 0.57977294921875, 0.6112442016601562, 0.6427154541015625, 0.6741867065429688, 0.705657958984375, 0.7371292114257812, 0.7686004638671875, 0.8000717163085938, 0.83154296875]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 7.0, 6.0, 6.0, 6.0, 11.0, 9.0, 12.0, 26.0, 20.0, 25.0, 38.0, 34.0, 49.0, 61.0, 71.0, 89.0, 78.0, 79.0, 59.0, 48.0, 50.0, 52.0, 40.0, 36.0, 20.0, 13.0, 13.0, 14.0, 7.0, 12.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.844240188598633, -11.490038871765137, -11.135836601257324, -10.781635284423828, -10.427433013916016, -10.07323169708252, -9.719030380249023, -9.364828109741211, -9.010625839233398, -8.656424522399902, -8.30222225189209, -7.948020935058594, -7.593818664550781, -7.239617347717285, -6.885415554046631, -6.531213760375977, -6.1770124435424805, -5.822810649871826, -5.468608856201172, -5.114407539367676, -4.760205268859863, -4.406003952026367, -4.051802158355713, -3.6976003646850586, -3.3433985710144043, -2.98919677734375, -2.6349949836730957, -2.2807934284210205, -1.9265916347503662, -1.572389841079712, -1.2181882858276367, -0.8639864921569824, -0.5097856521606445, -0.155583918094635, 0.1986178159713745, 0.5528194904327393, 0.9070212841033936, 1.2612230777740479, 1.615424633026123, 1.9696264266967773, 2.3238282203674316, 2.678030014038086, 3.0322318077087402, 3.3864333629608154, 3.7406351566314697, 4.094837188720703, 4.449038505554199, 4.8032402992248535, 5.157442092895508, 5.511643886566162, 5.865845680236816, 6.2200469970703125, 6.574249267578125, 6.928450584411621, 7.282652378082275, 7.63685417175293, 7.991055965423584, 8.345257759094238, 8.699459075927734, 9.053661346435547, 9.407862663269043, 9.762064933776855, 10.116266250610352, 10.470468521118164, 10.82466983795166]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 9.0, 18.0, 12.0, 8.0, 20.0, 15.0, 30.0, 28.0, 25.0, 27.0, 28.0, 30.0, 34.0, 34.0, 41.0, 50.0, 35.0, 59.0, 40.0, 29.0, 40.0, 26.0, 35.0, 39.0, 38.0, 34.0, 36.0, 19.0, 20.0, 19.0, 18.0, 20.0, 11.0, 16.0, 12.0, 11.0, 3.0, 3.0, 4.0, 4.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.831948280334473, -5.648662090301514, -5.4653754234313965, -5.2820892333984375, -5.09880256652832, -4.915516376495361, -4.732230186462402, -4.548943519592285, -4.365656852722168, -4.182370662689209, -3.999083995819092, -3.815797805786133, -3.6325111389160156, -3.4492249488830566, -3.2659385204315186, -3.0826520919799805, -2.8993659019470215, -2.7160794734954834, -2.5327930450439453, -2.3495068550109863, -2.166220188140869, -1.9829338788986206, -1.799647569656372, -1.616361141204834, -1.433074712753296, -1.2497882843017578, -1.0665018558502197, -0.8832155466079712, -0.6999291181564331, -0.516642689704895, -0.3333563804626465, -0.1500699520111084, 0.033215999603271484, 0.21650239825248718, 0.3997887969017029, 0.5830751657485962, 0.7663615942001343, 0.9496480226516724, 1.132934331893921, 1.316220760345459, 1.499507188796997, 1.6827936172485352, 1.8660800457000732, 2.0493664741516113, 2.2326526641845703, 2.4159393310546875, 2.5992255210876465, 2.7825119495391846, 2.9657983779907227, 3.1490848064422607, 3.332371234893799, 3.515657424926758, 3.698944091796875, 3.882230281829834, 4.065516471862793, 4.24880313873291, 4.432089805603027, 4.615375995635986, 4.7986626625061035, 4.9819488525390625, 5.16523551940918, 5.348521709442139, 5.531807899475098, 5.715094566345215, 5.898380756378174]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 8.0, 9.0, 12.0, 22.0, 37.0, 42.0, 77.0, 118.0, 173.0, 241.0, 394.0, 620.0, 1013.0, 1602.0, 2787.0, 4515.0, 7272.0, 12239.0, 20649.0, 34321.0, 54779.0, 85272.0, 121978.0, 152267.0, 157236.0, 132279.0, 95638.0, 63164.0, 39182.0, 24161.0, 14363.0, 8644.0, 5179.0, 3030.0, 1978.0, 1182.0, 727.0, 492.0, 291.0, 203.0, 124.0, 86.0, 53.0, 36.0, 17.0, 19.0, 7.0, 7.0, 6.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0], "bins": [-5.75, -5.5765380859375, -5.403076171875, -5.2296142578125, -5.05615234375, -4.8826904296875, -4.709228515625, -4.5357666015625, -4.3623046875, -4.1888427734375, -4.015380859375, -3.8419189453125, -3.66845703125, -3.4949951171875, -3.321533203125, -3.1480712890625, -2.974609375, -2.8011474609375, -2.627685546875, -2.4542236328125, -2.28076171875, -2.1072998046875, -1.933837890625, -1.7603759765625, -1.5869140625, -1.4134521484375, -1.239990234375, -1.0665283203125, -0.89306640625, -0.7196044921875, -0.546142578125, -0.3726806640625, -0.19921875, -0.0257568359375, 0.147705078125, 0.3211669921875, 0.49462890625, 0.6680908203125, 0.841552734375, 1.0150146484375, 1.1884765625, 1.3619384765625, 1.535400390625, 1.7088623046875, 1.88232421875, 2.0557861328125, 2.229248046875, 2.4027099609375, 2.576171875, 2.7496337890625, 2.923095703125, 3.0965576171875, 3.27001953125, 3.4434814453125, 3.616943359375, 3.7904052734375, 3.9638671875, 4.1373291015625, 4.310791015625, 4.4842529296875, 4.65771484375, 4.8311767578125, 5.004638671875, 5.1781005859375, 5.3515625]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 1.0, 4.0, 6.0, 3.0, 9.0, 4.0, 11.0, 14.0, 14.0, 14.0, 14.0, 19.0, 24.0, 28.0, 31.0, 24.0, 37.0, 36.0, 43.0, 39.0, 44.0, 46.0, 44.0, 39.0, 35.0, 34.0, 40.0, 33.0, 38.0, 31.0, 28.0, 25.0, 31.0, 13.0, 29.0, 24.0, 16.0, 13.0, 14.0, 12.0, 10.0, 3.0, 10.0, 4.0, 2.0, 3.0, 0.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.30859375, -6.117431640625, -5.92626953125, -5.735107421875, -5.5439453125, -5.352783203125, -5.16162109375, -4.970458984375, -4.779296875, -4.588134765625, -4.39697265625, -4.205810546875, -4.0146484375, -3.823486328125, -3.63232421875, -3.441162109375, -3.25, -3.058837890625, -2.86767578125, -2.676513671875, -2.4853515625, -2.294189453125, -2.10302734375, -1.911865234375, -1.720703125, -1.529541015625, -1.33837890625, -1.147216796875, -0.9560546875, -0.764892578125, -0.57373046875, -0.382568359375, -0.19140625, -0.000244140625, 0.19091796875, 0.382080078125, 0.5732421875, 0.764404296875, 0.95556640625, 1.146728515625, 1.337890625, 1.529052734375, 1.72021484375, 1.911376953125, 2.1025390625, 2.293701171875, 2.48486328125, 2.676025390625, 2.8671875, 3.058349609375, 3.24951171875, 3.440673828125, 3.6318359375, 3.822998046875, 4.01416015625, 4.205322265625, 4.396484375, 4.587646484375, 4.77880859375, 4.969970703125, 5.1611328125, 5.352294921875, 5.54345703125, 5.734619140625, 5.92578125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 5.0, 10.0, 18.0, 41.0, 63.0, 99.0, 149.0, 242.0, 383.0, 768.0, 1195.0, 2040.0, 3637.0, 6121.0, 10578.0, 18146.0, 30587.0, 51259.0, 80724.0, 118069.0, 150908.0, 161304.0, 139403.0, 103427.0, 67639.0, 41702.0, 24992.0, 14642.0, 8435.0, 5019.0, 2877.0, 1658.0, 1011.0, 566.0, 322.0, 205.0, 145.0, 71.0, 35.0, 32.0, 16.0, 7.0, 6.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-6.40625, -6.219482421875, -6.03271484375, -5.845947265625, -5.6591796875, -5.472412109375, -5.28564453125, -5.098876953125, -4.912109375, -4.725341796875, -4.53857421875, -4.351806640625, -4.1650390625, -3.978271484375, -3.79150390625, -3.604736328125, -3.41796875, -3.231201171875, -3.04443359375, -2.857666015625, -2.6708984375, -2.484130859375, -2.29736328125, -2.110595703125, -1.923828125, -1.737060546875, -1.55029296875, -1.363525390625, -1.1767578125, -0.989990234375, -0.80322265625, -0.616455078125, -0.4296875, -0.242919921875, -0.05615234375, 0.130615234375, 0.3173828125, 0.504150390625, 0.69091796875, 0.877685546875, 1.064453125, 1.251220703125, 1.43798828125, 1.624755859375, 1.8115234375, 1.998291015625, 2.18505859375, 2.371826171875, 2.55859375, 2.745361328125, 2.93212890625, 3.118896484375, 3.3056640625, 3.492431640625, 3.67919921875, 3.865966796875, 4.052734375, 4.239501953125, 4.42626953125, 4.613037109375, 4.7998046875, 4.986572265625, 5.17333984375, 5.360107421875, 5.546875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 13.0, 9.0, 17.0, 12.0, 15.0, 12.0, 18.0, 21.0, 26.0, 27.0, 32.0, 50.0, 54.0, 33.0, 37.0, 34.0, 33.0, 33.0, 46.0, 49.0, 40.0, 49.0, 36.0, 29.0, 34.0, 36.0, 36.0, 32.0, 25.0, 21.0, 15.0, 19.0, 18.0, 5.0, 9.0, 8.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.55078125, -4.41961669921875, -4.2884521484375, -4.15728759765625, -4.026123046875, -3.89495849609375, -3.7637939453125, -3.63262939453125, -3.50146484375, -3.37030029296875, -3.2391357421875, -3.10797119140625, -2.976806640625, -2.84564208984375, -2.7144775390625, -2.58331298828125, -2.4521484375, -2.32098388671875, -2.1898193359375, -2.05865478515625, -1.927490234375, -1.79632568359375, -1.6651611328125, -1.53399658203125, -1.40283203125, -1.27166748046875, -1.1405029296875, -1.00933837890625, -0.878173828125, -0.74700927734375, -0.6158447265625, -0.48468017578125, -0.353515625, -0.22235107421875, -0.0911865234375, 0.03997802734375, 0.171142578125, 0.30230712890625, 0.4334716796875, 0.56463623046875, 0.69580078125, 0.82696533203125, 0.9581298828125, 1.08929443359375, 1.220458984375, 1.35162353515625, 1.4827880859375, 1.61395263671875, 1.7451171875, 1.87628173828125, 2.0074462890625, 2.13861083984375, 2.269775390625, 2.40093994140625, 2.5321044921875, 2.66326904296875, 2.79443359375, 2.92559814453125, 3.0567626953125, 3.18792724609375, 3.319091796875, 3.45025634765625, 3.5814208984375, 3.71258544921875, 3.84375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 8.0, 8.0, 5.0, 8.0, 19.0, 35.0, 38.0, 58.0, 80.0, 127.0, 203.0, 283.0, 488.0, 722.0, 1037.0, 1604.0, 2572.0, 3905.0, 6243.0, 10024.0, 15712.0, 25242.0, 39452.0, 60695.0, 89752.0, 121665.0, 145975.0, 145479.0, 120830.0, 89059.0, 60220.0, 39241.0, 25060.0, 15801.0, 9978.0, 6187.0, 3707.0, 2456.0, 1574.0, 1017.0, 679.0, 414.0, 293.0, 194.0, 120.0, 96.0, 75.0, 36.0, 35.0, 21.0, 16.0, 6.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.57421875, -2.496185302734375, -2.41815185546875, -2.340118408203125, -2.2620849609375, -2.184051513671875, -2.10601806640625, -2.027984619140625, -1.949951171875, -1.871917724609375, -1.79388427734375, -1.715850830078125, -1.6378173828125, -1.559783935546875, -1.48175048828125, -1.403717041015625, -1.32568359375, -1.247650146484375, -1.16961669921875, -1.091583251953125, -1.0135498046875, -0.935516357421875, -0.85748291015625, -0.779449462890625, -0.701416015625, -0.623382568359375, -0.54534912109375, -0.467315673828125, -0.3892822265625, -0.311248779296875, -0.23321533203125, -0.155181884765625, -0.0771484375, 0.000885009765625, 0.07891845703125, 0.156951904296875, 0.2349853515625, 0.313018798828125, 0.39105224609375, 0.469085693359375, 0.547119140625, 0.625152587890625, 0.70318603515625, 0.781219482421875, 0.8592529296875, 0.937286376953125, 1.01531982421875, 1.093353271484375, 1.17138671875, 1.249420166015625, 1.32745361328125, 1.405487060546875, 1.4835205078125, 1.561553955078125, 1.63958740234375, 1.717620849609375, 1.795654296875, 1.873687744140625, 1.95172119140625, 2.029754638671875, 2.1077880859375, 2.185821533203125, 2.26385498046875, 2.341888427734375, 2.419921875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 9.0, 5.0, 11.0, 8.0, 24.0, 22.0, 24.0, 21.0, 30.0, 29.0, 47.0, 50.0, 47.0, 55.0, 65.0, 54.0, 48.0, 57.0, 57.0, 37.0, 33.0, 42.0, 33.0, 32.0, 31.0, 25.0, 16.0, 17.0, 14.0, 8.0, 7.0, 7.0, 14.0, 1.0, 0.0, 2.0, 4.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024080276489257812, -0.00023199990391731262, -0.00022319704294204712, -0.00021439418196678162, -0.0002055913209915161, -0.0001967884600162506, -0.0001879855990409851, -0.0001791827380657196, -0.0001703798770904541, -0.0001615770161151886, -0.0001527741551399231, -0.0001439712941646576, -0.0001351684331893921, -0.0001263655722141266, -0.00011756271123886108, -0.00010875985026359558, -9.995698928833008e-05, -9.115412831306458e-05, -8.235126733779907e-05, -7.354840636253357e-05, -6.474554538726807e-05, -5.5942684412002563e-05, -4.713982343673706e-05, -3.833696246147156e-05, -2.9534101486206055e-05, -2.0731240510940552e-05, -1.1928379535675049e-05, -3.125518560409546e-06, 5.677342414855957e-06, 1.448020339012146e-05, 2.3283064365386963e-05, 3.2085925340652466e-05, 4.088878631591797e-05, 4.969164729118347e-05, 5.8494508266448975e-05, 6.729736924171448e-05, 7.610023021697998e-05, 8.490309119224548e-05, 9.370595216751099e-05, 0.00010250881314277649, 0.00011131167411804199, 0.0001201145350933075, 0.000128917396068573, 0.0001377202570438385, 0.000146523118019104, 0.0001553259789943695, 0.000164128839969635, 0.0001729317009449005, 0.00018173456192016602, 0.00019053742289543152, 0.00019934028387069702, 0.00020814314484596252, 0.00021694600582122803, 0.00022574886679649353, 0.00023455172777175903, 0.00024335458874702454, 0.00025215744972229004, 0.00026096031069755554, 0.00026976317167282104, 0.00027856603264808655, 0.00028736889362335205, 0.00029617175459861755, 0.00030497461557388306, 0.00031377747654914856, 0.00032258033752441406]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 6.0, 12.0, 21.0, 30.0, 37.0, 54.0, 90.0, 144.0, 179.0, 290.0, 360.0, 594.0, 924.0, 1439.0, 2237.0, 3462.0, 5522.0, 8957.0, 14636.0, 24499.0, 40140.0, 65154.0, 101411.0, 139918.0, 164559.0, 153050.0, 116864.0, 78119.0, 48827.0, 29832.0, 17758.0, 11150.0, 6713.0, 4084.0, 2562.0, 1709.0, 1094.0, 723.0, 485.0, 294.0, 217.0, 110.0, 95.0, 60.0, 46.0, 36.0, 23.0, 15.0, 6.0, 3.0, 7.0, 2.0, 2.0, 3.0, 1.0], "bins": [-3.064453125, -2.9735107421875, -2.882568359375, -2.7916259765625, -2.70068359375, -2.6097412109375, -2.518798828125, -2.4278564453125, -2.3369140625, -2.2459716796875, -2.155029296875, -2.0640869140625, -1.97314453125, -1.8822021484375, -1.791259765625, -1.7003173828125, -1.609375, -1.5184326171875, -1.427490234375, -1.3365478515625, -1.24560546875, -1.1546630859375, -1.063720703125, -0.9727783203125, -0.8818359375, -0.7908935546875, -0.699951171875, -0.6090087890625, -0.51806640625, -0.4271240234375, -0.336181640625, -0.2452392578125, -0.154296875, -0.0633544921875, 0.027587890625, 0.1185302734375, 0.20947265625, 0.3004150390625, 0.391357421875, 0.4822998046875, 0.5732421875, 0.6641845703125, 0.755126953125, 0.8460693359375, 0.93701171875, 1.0279541015625, 1.118896484375, 1.2098388671875, 1.30078125, 1.3917236328125, 1.482666015625, 1.5736083984375, 1.66455078125, 1.7554931640625, 1.846435546875, 1.9373779296875, 2.0283203125, 2.1192626953125, 2.210205078125, 2.3011474609375, 2.39208984375, 2.4830322265625, 2.573974609375, 2.6649169921875, 2.755859375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 9.0, 5.0, 2.0, 11.0, 6.0, 12.0, 16.0, 18.0, 22.0, 28.0, 27.0, 25.0, 29.0, 41.0, 44.0, 45.0, 48.0, 46.0, 48.0, 47.0, 41.0, 51.0, 48.0, 48.0, 34.0, 24.0, 38.0, 21.0, 32.0, 26.0, 17.0, 14.0, 19.0, 15.0, 14.0, 7.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.80126953125, -0.7725753784179688, -0.7438812255859375, -0.7151870727539062, -0.686492919921875, -0.6577987670898438, -0.6291046142578125, -0.6004104614257812, -0.57171630859375, -0.5430221557617188, -0.5143280029296875, -0.48563385009765625, -0.456939697265625, -0.42824554443359375, -0.3995513916015625, -0.37085723876953125, -0.3421630859375, -0.31346893310546875, -0.2847747802734375, -0.25608062744140625, -0.227386474609375, -0.19869232177734375, -0.1699981689453125, -0.14130401611328125, -0.11260986328125, -0.08391571044921875, -0.0552215576171875, -0.02652740478515625, 0.002166748046875, 0.03086090087890625, 0.0595550537109375, 0.08824920654296875, 0.116943359375, 0.14563751220703125, 0.1743316650390625, 0.20302581787109375, 0.231719970703125, 0.26041412353515625, 0.2891082763671875, 0.31780242919921875, 0.34649658203125, 0.37519073486328125, 0.4038848876953125, 0.43257904052734375, 0.461273193359375, 0.48996734619140625, 0.5186614990234375, 0.5473556518554688, 0.5760498046875, 0.6047439575195312, 0.6334381103515625, 0.6621322631835938, 0.690826416015625, 0.7195205688476562, 0.7482147216796875, 0.7769088745117188, 0.80560302734375, 0.8342971801757812, 0.8629913330078125, 0.8916854858398438, 0.920379638671875, 0.9490737915039062, 0.9777679443359375, 1.0064620971679688, 1.03515625]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 1.0, 2.0, 5.0, 6.0, 2.0, 8.0, 10.0, 9.0, 22.0, 27.0, 19.0, 32.0, 41.0, 45.0, 77.0, 61.0, 76.0, 81.0, 81.0, 65.0, 62.0, 60.0, 47.0, 38.0, 34.0, 32.0, 17.0, 11.0, 9.0, 7.0, 8.0, 4.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.307778358459473, -11.931976318359375, -11.556175231933594, -11.180374145507812, -10.804572105407715, -10.428770065307617, -10.052968978881836, -9.677167892456055, -9.301365852355957, -8.92556381225586, -8.549762725830078, -8.173961639404297, -7.798159599304199, -7.42235803604126, -7.04655647277832, -6.670754909515381, -6.294953346252441, -5.919151782989502, -5.5433502197265625, -5.167548656463623, -4.791747093200684, -4.415945529937744, -4.040143966674805, -3.6643424034118652, -3.288540840148926, -2.9127392768859863, -2.536937713623047, -2.1611361503601074, -1.785334587097168, -1.4095330238342285, -1.033731460571289, -0.6579298973083496, -0.28212928771972656, 0.09367227554321289, 0.46947383880615234, 0.8452754020690918, 1.2210769653320312, 1.5968785285949707, 1.9726800918579102, 2.3484816551208496, 2.724283218383789, 3.1000847816467285, 3.475886344909668, 3.8516879081726074, 4.227489471435547, 4.603291034698486, 4.979092597961426, 5.354894161224365, 5.730695724487305, 6.106497287750244, 6.482298851013184, 6.858100414276123, 7.2339019775390625, 7.609703540802002, 7.985505104064941, 8.361307144165039, 8.73710823059082, 9.112909317016602, 9.4887113571167, 9.864513397216797, 10.240314483642578, 10.61611557006836, 10.991917610168457, 11.367719650268555, 11.743520736694336]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 2.0, 5.0, 6.0, 3.0, 4.0, 11.0, 9.0, 10.0, 16.0, 9.0, 18.0, 25.0, 27.0, 25.0, 29.0, 25.0, 26.0, 33.0, 38.0, 46.0, 38.0, 33.0, 52.0, 47.0, 39.0, 32.0, 48.0, 43.0, 38.0, 29.0, 34.0, 27.0, 26.0, 24.0, 21.0, 17.0, 17.0, 15.0, 13.0, 9.0, 8.0, 7.0, 6.0, 7.0, 4.0, 3.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.901891231536865, -5.707763671875, -5.513636589050293, -5.319509029388428, -5.1253814697265625, -4.931253910064697, -4.737126350402832, -4.542999267578125, -4.34887170791626, -4.1547441482543945, -3.9606168270111084, -3.7664895057678223, -3.572361946105957, -3.378234386444092, -3.1841070652008057, -2.9899797439575195, -2.7958521842956543, -2.601724624633789, -2.407597303390503, -2.213469982147217, -2.0193424224853516, -1.8252149820327759, -1.6310875415802002, -1.4369601011276245, -1.2428326606750488, -1.0487052202224731, -0.8545777797698975, -0.6604503393173218, -0.4663228988647461, -0.2721954584121704, -0.07806801795959473, 0.11605942249298096, 0.31018686294555664, 0.5043143033981323, 0.698441743850708, 0.8925691843032837, 1.0866966247558594, 1.280824065208435, 1.4749515056610107, 1.6690789461135864, 1.863206386566162, 2.0573339462280273, 2.2514612674713135, 2.4455885887145996, 2.639716148376465, 2.83384370803833, 3.027971029281616, 3.2220983505249023, 3.4162259101867676, 3.610353469848633, 3.804480791091919, 3.998608112335205, 4.19273567199707, 4.3868632316589355, 4.580990791320801, 4.775117874145508, 4.969245433807373, 5.163372993469238, 5.357500076293945, 5.5516276359558105, 5.745755195617676, 5.939882755279541, 6.134010314941406, 6.328137397766113, 6.5222649574279785]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 5.0, 8.0, 8.0, 12.0, 24.0, 43.0, 61.0, 100.0, 159.0, 261.0, 381.0, 640.0, 1049.0, 1769.0, 2985.0, 5087.0, 9567.0, 18421.0, 37909.0, 83114.0, 205924.0, 530090.0, 1127762.0, 1185023.0, 581553.0, 226937.0, 91372.0, 40778.0, 19547.0, 10264.0, 5598.0, 3145.0, 1809.0, 1090.0, 669.0, 420.0, 271.0, 139.0, 108.0, 54.0, 44.0, 34.0, 16.0, 11.0, 12.0, 5.0, 4.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.6015625, -9.2330322265625, -8.864501953125, -8.4959716796875, -8.12744140625, -7.7589111328125, -7.390380859375, -7.0218505859375, -6.6533203125, -6.2847900390625, -5.916259765625, -5.5477294921875, -5.17919921875, -4.8106689453125, -4.442138671875, -4.0736083984375, -3.705078125, -3.3365478515625, -2.968017578125, -2.5994873046875, -2.23095703125, -1.8624267578125, -1.493896484375, -1.1253662109375, -0.7568359375, -0.3883056640625, -0.019775390625, 0.3487548828125, 0.71728515625, 1.0858154296875, 1.454345703125, 1.8228759765625, 2.19140625, 2.5599365234375, 2.928466796875, 3.2969970703125, 3.66552734375, 4.0340576171875, 4.402587890625, 4.7711181640625, 5.1396484375, 5.5081787109375, 5.876708984375, 6.2452392578125, 6.61376953125, 6.9822998046875, 7.350830078125, 7.7193603515625, 8.087890625, 8.4564208984375, 8.824951171875, 9.1934814453125, 9.56201171875, 9.9305419921875, 10.299072265625, 10.6676025390625, 11.0361328125, 11.4046630859375, 11.773193359375, 12.1417236328125, 12.51025390625, 12.8787841796875, 13.247314453125, 13.6158447265625, 13.984375]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 5.0, 5.0, 11.0, 12.0, 7.0, 12.0, 20.0, 21.0, 24.0, 21.0, 25.0, 26.0, 29.0, 30.0, 32.0, 36.0, 32.0, 45.0, 43.0, 41.0, 40.0, 42.0, 40.0, 52.0, 31.0, 38.0, 32.0, 38.0, 30.0, 29.0, 18.0, 24.0, 17.0, 11.0, 14.0, 12.0, 7.0, 10.0, 8.0, 13.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.26953125, -5.1148681640625, -4.960205078125, -4.8055419921875, -4.65087890625, -4.4962158203125, -4.341552734375, -4.1868896484375, -4.0322265625, -3.8775634765625, -3.722900390625, -3.5682373046875, -3.41357421875, -3.2589111328125, -3.104248046875, -2.9495849609375, -2.794921875, -2.6402587890625, -2.485595703125, -2.3309326171875, -2.17626953125, -2.0216064453125, -1.866943359375, -1.7122802734375, -1.5576171875, -1.4029541015625, -1.248291015625, -1.0936279296875, -0.93896484375, -0.7843017578125, -0.629638671875, -0.4749755859375, -0.3203125, -0.1656494140625, -0.010986328125, 0.1436767578125, 0.29833984375, 0.4530029296875, 0.607666015625, 0.7623291015625, 0.9169921875, 1.0716552734375, 1.226318359375, 1.3809814453125, 1.53564453125, 1.6903076171875, 1.844970703125, 1.9996337890625, 2.154296875, 2.3089599609375, 2.463623046875, 2.6182861328125, 2.77294921875, 2.9276123046875, 3.082275390625, 3.2369384765625, 3.3916015625, 3.5462646484375, 3.700927734375, 3.8555908203125, 4.01025390625, 4.1649169921875, 4.319580078125, 4.4742431640625, 4.62890625]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 9.0, 12.0, 25.0, 22.0, 30.0, 60.0, 73.0, 113.0, 139.0, 230.0, 333.0, 499.0, 681.0, 1096.0, 1807.0, 2751.0, 4323.0, 7270.0, 12328.0, 21468.0, 38459.0, 71287.0, 136756.0, 272232.0, 532521.0, 888364.0, 941793.0, 604150.0, 313011.0, 157590.0, 81353.0, 43795.0, 24192.0, 13644.0, 8178.0, 5093.0, 3042.0, 1885.0, 1185.0, 787.0, 527.0, 362.0, 265.0, 167.0, 111.0, 72.0, 55.0, 42.0, 30.0, 21.0, 9.0, 14.0, 7.0, 5.0, 6.0, 3.0, 6.0, 4.0], "bins": [-10.8671875, -10.5286865234375, -10.190185546875, -9.8516845703125, -9.51318359375, -9.1746826171875, -8.836181640625, -8.4976806640625, -8.1591796875, -7.8206787109375, -7.482177734375, -7.1436767578125, -6.80517578125, -6.4666748046875, -6.128173828125, -5.7896728515625, -5.451171875, -5.1126708984375, -4.774169921875, -4.4356689453125, -4.09716796875, -3.7586669921875, -3.420166015625, -3.0816650390625, -2.7431640625, -2.4046630859375, -2.066162109375, -1.7276611328125, -1.38916015625, -1.0506591796875, -0.712158203125, -0.3736572265625, -0.03515625, 0.3033447265625, 0.641845703125, 0.9803466796875, 1.31884765625, 1.6573486328125, 1.995849609375, 2.3343505859375, 2.6728515625, 3.0113525390625, 3.349853515625, 3.6883544921875, 4.02685546875, 4.3653564453125, 4.703857421875, 5.0423583984375, 5.380859375, 5.7193603515625, 6.057861328125, 6.3963623046875, 6.73486328125, 7.0733642578125, 7.411865234375, 7.7503662109375, 8.0888671875, 8.4273681640625, 8.765869140625, 9.1043701171875, 9.44287109375, 9.7813720703125, 10.119873046875, 10.4583740234375, 10.796875]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 1.0, 3.0, 10.0, 13.0, 14.0, 10.0, 15.0, 26.0, 40.0, 47.0, 55.0, 58.0, 81.0, 95.0, 131.0, 185.0, 211.0, 244.0, 279.0, 326.0, 308.0, 349.0, 315.0, 280.0, 208.0, 185.0, 133.0, 102.0, 98.0, 76.0, 43.0, 27.0, 35.0, 19.0, 15.0, 8.0, 14.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.837890625, -3.719329833984375, -3.60076904296875, -3.482208251953125, -3.3636474609375, -3.245086669921875, -3.12652587890625, -3.007965087890625, -2.889404296875, -2.770843505859375, -2.65228271484375, -2.533721923828125, -2.4151611328125, -2.296600341796875, -2.17803955078125, -2.059478759765625, -1.94091796875, -1.822357177734375, -1.70379638671875, -1.585235595703125, -1.4666748046875, -1.348114013671875, -1.22955322265625, -1.110992431640625, -0.992431640625, -0.873870849609375, -0.75531005859375, -0.636749267578125, -0.5181884765625, -0.399627685546875, -0.28106689453125, -0.162506103515625, -0.0439453125, 0.074615478515625, 0.19317626953125, 0.311737060546875, 0.4302978515625, 0.548858642578125, 0.66741943359375, 0.785980224609375, 0.904541015625, 1.023101806640625, 1.14166259765625, 1.260223388671875, 1.3787841796875, 1.497344970703125, 1.61590576171875, 1.734466552734375, 1.85302734375, 1.971588134765625, 2.09014892578125, 2.208709716796875, 2.3272705078125, 2.445831298828125, 2.56439208984375, 2.682952880859375, 2.801513671875, 2.920074462890625, 3.03863525390625, 3.157196044921875, 3.2757568359375, 3.394317626953125, 3.51287841796875, 3.631439208984375, 3.75]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 11.0, 5.0, 5.0, 12.0, 14.0, 18.0, 22.0, 31.0, 39.0, 41.0, 44.0, 53.0, 68.0, 68.0, 78.0, 93.0, 88.0, 60.0, 50.0, 46.0, 35.0, 31.0, 20.0, 12.0, 11.0, 11.0, 10.0, 4.0, 1.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.259316444396973, -10.833648681640625, -10.407981872558594, -9.982314109802246, -9.556647300720215, -9.130979537963867, -8.705312728881836, -8.279644966125488, -7.853978157043457, -7.428310871124268, -7.002643585205078, -6.576976299285889, -6.151309013366699, -5.725641250610352, -5.29997444152832, -4.874306678771973, -4.448639392852783, -4.022972106933594, -3.5973048210144043, -3.171637535095215, -2.7459702491760254, -2.320302724838257, -1.8946354389190674, -1.468968152999878, -1.0433008670806885, -0.617633581161499, -0.1919662356376648, 0.23370110988616943, 0.6593683958053589, 1.085035800933838, 1.5107030868530273, 1.9363703727722168, 2.3620376586914062, 2.7877049446105957, 3.213372230529785, 3.6390395164489746, 4.064706802368164, 4.490374565124512, 4.916041374206543, 5.341709136962891, 5.767375946044922, 6.193043231964111, 6.618710517883301, 7.04437780380249, 7.47004508972168, 7.895712852478027, 8.321379661560059, 8.747047424316406, 9.172714233398438, 9.598381996154785, 10.024048805236816, 10.449716567993164, 10.875383377075195, 11.301051139831543, 11.726717948913574, 12.152385711669922, 12.57805347442627, 13.003721237182617, 13.429388046264648, 13.855055809020996, 14.280722618103027, 14.706390380859375, 15.132057189941406, 15.557724952697754, 15.983391761779785]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 8.0, 1.0, 2.0, 3.0, 13.0, 9.0, 12.0, 15.0, 12.0, 19.0, 22.0, 20.0, 31.0, 16.0, 28.0, 41.0, 36.0, 37.0, 44.0, 44.0, 33.0, 37.0, 38.0, 50.0, 40.0, 34.0, 31.0, 37.0, 37.0, 33.0, 32.0, 26.0, 26.0, 29.0, 23.0, 13.0, 9.0, 15.0, 12.0, 11.0, 10.0, 3.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.2488226890563965, -7.030524730682373, -6.812226295471191, -6.593928337097168, -6.375629901885986, -6.157331943511963, -5.939033508300781, -5.720735549926758, -5.502437591552734, -5.284139633178711, -5.065841197967529, -4.847543239593506, -4.629244804382324, -4.410946846008301, -4.192648887634277, -3.9743504524230957, -3.756052017211914, -3.5377538204193115, -3.319455623626709, -3.1011576652526855, -2.882859230041504, -2.6645612716674805, -2.446263074874878, -2.2279648780822754, -2.009666681289673, -1.7913684844970703, -1.5730702877044678, -1.3547722101211548, -1.1364740133285522, -0.9181758165359497, -0.6998777389526367, -0.4815795421600342, -0.26328182220458984, -0.04498365521430969, 0.17331451177597046, 0.3916126489639282, 0.6099108457565308, 0.8282090425491333, 1.0465071201324463, 1.2648053169250488, 1.4831035137176514, 1.701401710510254, 1.9196999073028564, 2.137998104095459, 2.3562960624694824, 2.574594497680664, 2.7928924560546875, 3.01119065284729, 3.2294888496398926, 3.447787046432495, 3.6660852432250977, 3.884383201599121, 4.102681636810303, 4.320979595184326, 4.539278030395508, 4.757575988769531, 4.975873947143555, 5.194171905517578, 5.41247034072876, 5.630768299102783, 5.849066734313965, 6.067364692687988, 6.285662651062012, 6.503961086273193, 6.722259521484375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 8.0, 7.0, 11.0, 20.0, 22.0, 35.0, 62.0, 87.0, 141.0, 223.0, 322.0, 563.0, 964.0, 1482.0, 2529.0, 4242.0, 7246.0, 12255.0, 21100.0, 36597.0, 61748.0, 99979.0, 144932.0, 174543.0, 163429.0, 121806.0, 79133.0, 47760.0, 28074.0, 16029.0, 9462.0, 5453.0, 3194.0, 1983.0, 1204.0, 731.0, 422.0, 275.0, 155.0, 117.0, 68.0, 48.0, 38.0, 21.0, 8.0, 12.0, 3.0, 4.0, 4.0, 3.0, 4.0, 1.0, 4.0], "bins": [-5.87890625, -5.709716796875, -5.54052734375, -5.371337890625, -5.2021484375, -5.032958984375, -4.86376953125, -4.694580078125, -4.525390625, -4.356201171875, -4.18701171875, -4.017822265625, -3.8486328125, -3.679443359375, -3.51025390625, -3.341064453125, -3.171875, -3.002685546875, -2.83349609375, -2.664306640625, -2.4951171875, -2.325927734375, -2.15673828125, -1.987548828125, -1.818359375, -1.649169921875, -1.47998046875, -1.310791015625, -1.1416015625, -0.972412109375, -0.80322265625, -0.634033203125, -0.46484375, -0.295654296875, -0.12646484375, 0.042724609375, 0.2119140625, 0.381103515625, 0.55029296875, 0.719482421875, 0.888671875, 1.057861328125, 1.22705078125, 1.396240234375, 1.5654296875, 1.734619140625, 1.90380859375, 2.072998046875, 2.2421875, 2.411376953125, 2.58056640625, 2.749755859375, 2.9189453125, 3.088134765625, 3.25732421875, 3.426513671875, 3.595703125, 3.764892578125, 3.93408203125, 4.103271484375, 4.2724609375, 4.441650390625, 4.61083984375, 4.780029296875, 4.94921875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 3.0, 2.0, 8.0, 13.0, 8.0, 12.0, 10.0, 10.0, 16.0, 10.0, 30.0, 21.0, 19.0, 24.0, 36.0, 40.0, 34.0, 42.0, 28.0, 43.0, 50.0, 32.0, 39.0, 44.0, 47.0, 42.0, 41.0, 41.0, 37.0, 27.0, 25.0, 22.0, 20.0, 25.0, 20.0, 13.0, 12.0, 15.0, 7.0, 11.0, 7.0, 4.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.203125, -6.968994140625, -6.73486328125, -6.500732421875, -6.2666015625, -6.032470703125, -5.79833984375, -5.564208984375, -5.330078125, -5.095947265625, -4.86181640625, -4.627685546875, -4.3935546875, -4.159423828125, -3.92529296875, -3.691162109375, -3.45703125, -3.222900390625, -2.98876953125, -2.754638671875, -2.5205078125, -2.286376953125, -2.05224609375, -1.818115234375, -1.583984375, -1.349853515625, -1.11572265625, -0.881591796875, -0.6474609375, -0.413330078125, -0.17919921875, 0.054931640625, 0.2890625, 0.523193359375, 0.75732421875, 0.991455078125, 1.2255859375, 1.459716796875, 1.69384765625, 1.927978515625, 2.162109375, 2.396240234375, 2.63037109375, 2.864501953125, 3.0986328125, 3.332763671875, 3.56689453125, 3.801025390625, 4.03515625, 4.269287109375, 4.50341796875, 4.737548828125, 4.9716796875, 5.205810546875, 5.43994140625, 5.674072265625, 5.908203125, 6.142333984375, 6.37646484375, 6.610595703125, 6.8447265625, 7.078857421875, 7.31298828125, 7.547119140625, 7.78125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 8.0, 7.0, 13.0, 17.0, 32.0, 45.0, 73.0, 111.0, 224.0, 421.0, 702.0, 1312.0, 2610.0, 5559.0, 13335.0, 33418.0, 90433.0, 234836.0, 354039.0, 192960.0, 71501.0, 26534.0, 10798.0, 4718.0, 2245.0, 1112.0, 610.0, 341.0, 219.0, 123.0, 74.0, 45.0, 22.0, 17.0, 15.0, 6.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1640625, -11.7884521484375, -11.412841796875, -11.0372314453125, -10.66162109375, -10.2860107421875, -9.910400390625, -9.5347900390625, -9.1591796875, -8.7835693359375, -8.407958984375, -8.0323486328125, -7.65673828125, -7.2811279296875, -6.905517578125, -6.5299072265625, -6.154296875, -5.7786865234375, -5.403076171875, -5.0274658203125, -4.65185546875, -4.2762451171875, -3.900634765625, -3.5250244140625, -3.1494140625, -2.7738037109375, -2.398193359375, -2.0225830078125, -1.64697265625, -1.2713623046875, -0.895751953125, -0.5201416015625, -0.14453125, 0.2310791015625, 0.606689453125, 0.9822998046875, 1.35791015625, 1.7335205078125, 2.109130859375, 2.4847412109375, 2.8603515625, 3.2359619140625, 3.611572265625, 3.9871826171875, 4.36279296875, 4.7384033203125, 5.114013671875, 5.4896240234375, 5.865234375, 6.2408447265625, 6.616455078125, 6.9920654296875, 7.36767578125, 7.7432861328125, 8.118896484375, 8.4945068359375, 8.8701171875, 9.2457275390625, 9.621337890625, 9.9969482421875, 10.37255859375, 10.7481689453125, 11.123779296875, 11.4993896484375, 11.875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 2.0, 5.0, 12.0, 5.0, 16.0, 20.0, 18.0, 20.0, 24.0, 27.0, 30.0, 29.0, 34.0, 40.0, 35.0, 49.0, 41.0, 34.0, 38.0, 42.0, 57.0, 48.0, 47.0, 38.0, 25.0, 39.0, 38.0, 19.0, 28.0, 18.0, 22.0, 14.0, 19.0, 10.0, 6.0, 8.0, 17.0, 11.0, 4.0, 2.0, 5.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.44921875, -4.3017578125, -4.154296875, -4.0068359375, -3.859375, -3.7119140625, -3.564453125, -3.4169921875, -3.26953125, -3.1220703125, -2.974609375, -2.8271484375, -2.6796875, -2.5322265625, -2.384765625, -2.2373046875, -2.08984375, -1.9423828125, -1.794921875, -1.6474609375, -1.5, -1.3525390625, -1.205078125, -1.0576171875, -0.91015625, -0.7626953125, -0.615234375, -0.4677734375, -0.3203125, -0.1728515625, -0.025390625, 0.1220703125, 0.26953125, 0.4169921875, 0.564453125, 0.7119140625, 0.859375, 1.0068359375, 1.154296875, 1.3017578125, 1.44921875, 1.5966796875, 1.744140625, 1.8916015625, 2.0390625, 2.1865234375, 2.333984375, 2.4814453125, 2.62890625, 2.7763671875, 2.923828125, 3.0712890625, 3.21875, 3.3662109375, 3.513671875, 3.6611328125, 3.80859375, 3.9560546875, 4.103515625, 4.2509765625, 4.3984375, 4.5458984375, 4.693359375, 4.8408203125, 4.98828125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 9.0, 7.0, 2.0, 8.0, 11.0, 16.0, 37.0, 43.0, 45.0, 88.0, 137.0, 197.0, 258.0, 432.0, 649.0, 1049.0, 1509.0, 2620.0, 4333.0, 7538.0, 13213.0, 24600.0, 47617.0, 93880.0, 178856.0, 261632.0, 193948.0, 102004.0, 52155.0, 27041.0, 14465.0, 7872.0, 4742.0, 2763.0, 1700.0, 1057.0, 713.0, 423.0, 288.0, 195.0, 131.0, 102.0, 41.0, 36.0, 36.0, 18.0, 14.0, 18.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.5390625, -4.38555908203125, -4.2320556640625, -4.07855224609375, -3.925048828125, -3.77154541015625, -3.6180419921875, -3.46453857421875, -3.31103515625, -3.15753173828125, -3.0040283203125, -2.85052490234375, -2.697021484375, -2.54351806640625, -2.3900146484375, -2.23651123046875, -2.0830078125, -1.92950439453125, -1.7760009765625, -1.62249755859375, -1.468994140625, -1.31549072265625, -1.1619873046875, -1.00848388671875, -0.85498046875, -0.70147705078125, -0.5479736328125, -0.39447021484375, -0.240966796875, -0.08746337890625, 0.0660400390625, 0.21954345703125, 0.373046875, 0.52655029296875, 0.6800537109375, 0.83355712890625, 0.987060546875, 1.14056396484375, 1.2940673828125, 1.44757080078125, 1.60107421875, 1.75457763671875, 1.9080810546875, 2.06158447265625, 2.215087890625, 2.36859130859375, 2.5220947265625, 2.67559814453125, 2.8291015625, 2.98260498046875, 3.1361083984375, 3.28961181640625, 3.443115234375, 3.59661865234375, 3.7501220703125, 3.90362548828125, 4.05712890625, 4.21063232421875, 4.3641357421875, 4.51763916015625, 4.671142578125, 4.82464599609375, 4.9781494140625, 5.13165283203125, 5.28515625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 3.0, 4.0, 7.0, 7.0, 7.0, 12.0, 10.0, 21.0, 24.0, 23.0, 32.0, 40.0, 68.0, 47.0, 56.0, 56.0, 84.0, 61.0, 66.0, 49.0, 55.0, 49.0, 45.0, 34.0, 29.0, 32.0, 18.0, 20.0, 10.0, 10.0, 3.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00023734569549560547, -0.000229736790060997, -0.00022212788462638855, -0.0002145189791917801, -0.00020691007375717163, -0.00019930116832256317, -0.0001916922628879547, -0.00018408335745334625, -0.0001764744520187378, -0.00016886554658412933, -0.00016125664114952087, -0.00015364773571491241, -0.00014603883028030396, -0.0001384299248456955, -0.00013082101941108704, -0.00012321211397647858, -0.00011560320854187012, -0.00010799430310726166, -0.0001003853976726532, -9.277649223804474e-05, -8.516758680343628e-05, -7.755868136882782e-05, -6.994977593421936e-05, -6.23408704996109e-05, -5.473196506500244e-05, -4.712305963039398e-05, -3.951415419578552e-05, -3.190524876117706e-05, -2.4296343326568604e-05, -1.6687437891960144e-05, -9.078532457351685e-06, -1.469627022743225e-06, 6.139278411865234e-06, 1.3748183846473694e-05, 2.1357089281082153e-05, 2.8965994715690613e-05, 3.657490015029907e-05, 4.418380558490753e-05, 5.179271101951599e-05, 5.940161645412445e-05, 6.701052188873291e-05, 7.461942732334137e-05, 8.222833275794983e-05, 8.983723819255829e-05, 9.744614362716675e-05, 0.00010505504906177521, 0.00011266395449638367, 0.00012027285993099213, 0.00012788176536560059, 0.00013549067080020905, 0.0001430995762348175, 0.00015070848166942596, 0.00015831738710403442, 0.00016592629253864288, 0.00017353519797325134, 0.0001811441034078598, 0.00018875300884246826, 0.00019636191427707672, 0.00020397081971168518, 0.00021157972514629364, 0.0002191886305809021, 0.00022679753601551056, 0.00023440644145011902, 0.00024201534688472748, 0.00024962425231933594]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 6.0, 1.0, 7.0, 11.0, 16.0, 18.0, 26.0, 26.0, 47.0, 65.0, 87.0, 148.0, 182.0, 293.0, 484.0, 773.0, 1259.0, 2098.0, 3562.0, 5931.0, 10574.0, 19179.0, 34697.0, 62326.0, 107824.0, 168342.0, 204030.0, 171236.0, 110049.0, 64093.0, 35204.0, 19673.0, 10925.0, 6121.0, 3654.0, 2074.0, 1264.0, 793.0, 510.0, 326.0, 215.0, 120.0, 96.0, 61.0, 45.0, 22.0, 18.0, 18.0, 14.0, 9.0, 5.0, 4.0, 6.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.4921875, -4.34967041015625, -4.2071533203125, -4.06463623046875, -3.922119140625, -3.77960205078125, -3.6370849609375, -3.49456787109375, -3.35205078125, -3.20953369140625, -3.0670166015625, -2.92449951171875, -2.781982421875, -2.63946533203125, -2.4969482421875, -2.35443115234375, -2.2119140625, -2.06939697265625, -1.9268798828125, -1.78436279296875, -1.641845703125, -1.49932861328125, -1.3568115234375, -1.21429443359375, -1.07177734375, -0.92926025390625, -0.7867431640625, -0.64422607421875, -0.501708984375, -0.35919189453125, -0.2166748046875, -0.07415771484375, 0.068359375, 0.21087646484375, 0.3533935546875, 0.49591064453125, 0.638427734375, 0.78094482421875, 0.9234619140625, 1.06597900390625, 1.20849609375, 1.35101318359375, 1.4935302734375, 1.63604736328125, 1.778564453125, 1.92108154296875, 2.0635986328125, 2.20611572265625, 2.3486328125, 2.49114990234375, 2.6336669921875, 2.77618408203125, 2.918701171875, 3.06121826171875, 3.2037353515625, 3.34625244140625, 3.48876953125, 3.63128662109375, 3.7738037109375, 3.91632080078125, 4.058837890625, 4.20135498046875, 4.3438720703125, 4.48638916015625, 4.62890625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 11.0, 12.0, 19.0, 19.0, 27.0, 29.0, 48.0, 58.0, 86.0, 76.0, 93.0, 83.0, 76.0, 82.0, 72.0, 64.0, 40.0, 36.0, 32.0, 14.0, 7.0, 9.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.130859375, -2.065185546875, -1.99951171875, -1.933837890625, -1.8681640625, -1.802490234375, -1.73681640625, -1.671142578125, -1.60546875, -1.539794921875, -1.47412109375, -1.408447265625, -1.3427734375, -1.277099609375, -1.21142578125, -1.145751953125, -1.080078125, -1.014404296875, -0.94873046875, -0.883056640625, -0.8173828125, -0.751708984375, -0.68603515625, -0.620361328125, -0.5546875, -0.489013671875, -0.42333984375, -0.357666015625, -0.2919921875, -0.226318359375, -0.16064453125, -0.094970703125, -0.029296875, 0.036376953125, 0.10205078125, 0.167724609375, 0.2333984375, 0.299072265625, 0.36474609375, 0.430419921875, 0.49609375, 0.561767578125, 0.62744140625, 0.693115234375, 0.7587890625, 0.824462890625, 0.89013671875, 0.955810546875, 1.021484375, 1.087158203125, 1.15283203125, 1.218505859375, 1.2841796875, 1.349853515625, 1.41552734375, 1.481201171875, 1.546875, 1.612548828125, 1.67822265625, 1.743896484375, 1.8095703125, 1.875244140625, 1.94091796875, 2.006591796875, 2.072265625]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 8.0, 4.0, 7.0, 18.0, 11.0, 23.0, 25.0, 30.0, 39.0, 42.0, 53.0, 61.0, 71.0, 65.0, 96.0, 85.0, 87.0, 62.0, 36.0, 47.0, 37.0, 23.0, 14.0, 9.0, 13.0, 11.0, 3.0, 3.0, 3.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.542037010192871, -11.099223136901855, -10.656408309936523, -10.213594436645508, -9.770779609680176, -9.32796573638916, -8.885150909423828, -8.442337036132812, -7.999522686004639, -7.556708335876465, -7.113893985748291, -6.671079635620117, -6.228265762329102, -5.7854509353637695, -5.342637062072754, -4.89982271194458, -4.457008361816406, -4.014194011688232, -3.5713796615600586, -3.128565549850464, -2.68575119972229, -2.242936849594116, -1.8001227378845215, -1.3573083877563477, -0.9144940376281738, -0.4716797471046448, -0.028865456581115723, 0.41394877433776855, 0.8567631244659424, 1.2995774745941162, 1.742391586303711, 2.1852059364318848, 2.628021240234375, 3.070835590362549, 3.5136499404907227, 3.9564640522003174, 4.39927864074707, 4.842092514038086, 5.28490686416626, 5.727721214294434, 6.170535564422607, 6.613349914550781, 7.056164264678955, 7.498978614807129, 7.9417924880981445, 8.384607315063477, 8.827421188354492, 9.270235061645508, 9.71304988861084, 10.155863761901855, 10.598678588867188, 11.041492462158203, 11.484307289123535, 11.92712116241455, 12.369935989379883, 12.812749862670898, 13.255563735961914, 13.69837760925293, 14.141192436218262, 14.584006309509277, 15.02682113647461, 15.469635009765625, 15.91244888305664, 16.355262756347656, 16.798078536987305]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 2.0, 0.0, 4.0, 13.0, 18.0, 10.0, 21.0, 14.0, 23.0, 17.0, 19.0, 27.0, 22.0, 32.0, 36.0, 44.0, 35.0, 44.0, 41.0, 42.0, 29.0, 45.0, 38.0, 47.0, 33.0, 39.0, 29.0, 27.0, 38.0, 29.0, 26.0, 29.0, 25.0, 17.0, 9.0, 19.0, 12.0, 16.0, 5.0, 5.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.177400588989258, -6.958394527435303, -6.739388942718506, -6.520382881164551, -6.301377296447754, -6.082371234893799, -5.863365650177002, -5.644359588623047, -5.42535400390625, -5.206347942352295, -4.987342357635498, -4.768336296081543, -4.549330711364746, -4.330324649810791, -4.111319065093994, -3.892313003540039, -3.673307180404663, -3.454301357269287, -3.235295534133911, -3.016289710998535, -2.797283887863159, -2.578278064727783, -2.359272003173828, -2.1402664184570312, -1.9212604761123657, -1.7022546529769897, -1.4832488298416138, -1.2642428874969482, -1.0452370643615723, -0.8262312412261963, -0.6072254180908203, -0.38821959495544434, -0.16921377182006836, 0.04979206621646881, 0.268797904253006, 0.48780375719070435, 0.7068095803260803, 0.9258154630661011, 1.144821286201477, 1.363827109336853, 1.582832932472229, 1.801838755607605, 2.0208446979522705, 2.2398505210876465, 2.4588563442230225, 2.6778621673583984, 2.8968679904937744, 3.1158738136291504, 3.3348796367645264, 3.5538854598999023, 3.7728912830352783, 3.9918971061706543, 4.210903167724609, 4.429908752441406, 4.648914813995361, 4.867920398712158, 5.086926460266113, 5.305932521820068, 5.524938106536865, 5.74394416809082, 5.962949752807617, 6.181955814361572, 6.400961399078369, 6.619967460632324, 6.838973045349121]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 10.0, 19.0, 28.0, 43.0, 66.0, 86.0, 162.0, 231.0, 398.0, 596.0, 1096.0, 1836.0, 3340.0, 5801.0, 10948.0, 20256.0, 37763.0, 69428.0, 117214.0, 170115.0, 193186.0, 164650.0, 110617.0, 64139.0, 34958.0, 18660.0, 10064.0, 5533.0, 2991.0, 1751.0, 1006.0, 601.0, 326.0, 223.0, 144.0, 82.0, 61.0, 37.0, 26.0, 20.0, 9.0, 13.0, 7.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.3671875, -8.116943359375, -7.86669921875, -7.616455078125, -7.3662109375, -7.115966796875, -6.86572265625, -6.615478515625, -6.365234375, -6.114990234375, -5.86474609375, -5.614501953125, -5.3642578125, -5.114013671875, -4.86376953125, -4.613525390625, -4.36328125, -4.113037109375, -3.86279296875, -3.612548828125, -3.3623046875, -3.112060546875, -2.86181640625, -2.611572265625, -2.361328125, -2.111083984375, -1.86083984375, -1.610595703125, -1.3603515625, -1.110107421875, -0.85986328125, -0.609619140625, -0.359375, -0.109130859375, 0.14111328125, 0.391357421875, 0.6416015625, 0.891845703125, 1.14208984375, 1.392333984375, 1.642578125, 1.892822265625, 2.14306640625, 2.393310546875, 2.6435546875, 2.893798828125, 3.14404296875, 3.394287109375, 3.64453125, 3.894775390625, 4.14501953125, 4.395263671875, 4.6455078125, 4.895751953125, 5.14599609375, 5.396240234375, 5.646484375, 5.896728515625, 6.14697265625, 6.397216796875, 6.6474609375, 6.897705078125, 7.14794921875, 7.398193359375, 7.6484375]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 7.0, 7.0, 8.0, 12.0, 9.0, 18.0, 16.0, 13.0, 23.0, 21.0, 26.0, 27.0, 27.0, 36.0, 43.0, 26.0, 27.0, 40.0, 33.0, 57.0, 54.0, 59.0, 38.0, 35.0, 43.0, 39.0, 29.0, 24.0, 26.0, 19.0, 29.0, 16.0, 16.0, 27.0, 16.0, 12.0, 8.0, 11.0, 7.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2890625, -7.0545654296875, -6.820068359375, -6.5855712890625, -6.35107421875, -6.1165771484375, -5.882080078125, -5.6475830078125, -5.4130859375, -5.1785888671875, -4.944091796875, -4.7095947265625, -4.47509765625, -4.2406005859375, -4.006103515625, -3.7716064453125, -3.537109375, -3.3026123046875, -3.068115234375, -2.8336181640625, -2.59912109375, -2.3646240234375, -2.130126953125, -1.8956298828125, -1.6611328125, -1.4266357421875, -1.192138671875, -0.9576416015625, -0.72314453125, -0.4886474609375, -0.254150390625, -0.0196533203125, 0.21484375, 0.4493408203125, 0.683837890625, 0.9183349609375, 1.15283203125, 1.3873291015625, 1.621826171875, 1.8563232421875, 2.0908203125, 2.3253173828125, 2.559814453125, 2.7943115234375, 3.02880859375, 3.2633056640625, 3.497802734375, 3.7322998046875, 3.966796875, 4.2012939453125, 4.435791015625, 4.6702880859375, 4.90478515625, 5.1392822265625, 5.373779296875, 5.6082763671875, 5.8427734375, 6.0772705078125, 6.311767578125, 6.5462646484375, 6.78076171875, 7.0152587890625, 7.249755859375, 7.4842529296875, 7.71875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 6.0, 8.0, 12.0, 16.0, 27.0, 27.0, 62.0, 70.0, 116.0, 173.0, 266.0, 362.0, 576.0, 824.0, 1247.0, 1896.0, 3022.0, 4640.0, 7211.0, 11128.0, 17493.0, 26946.0, 40706.0, 59588.0, 83335.0, 109600.0, 128889.0, 132564.0, 118090.0, 94292.0, 68292.0, 47107.0, 31419.0, 20851.0, 13329.0, 8509.0, 5473.0, 3559.0, 2334.0, 1511.0, 986.0, 650.0, 410.0, 306.0, 213.0, 131.0, 90.0, 66.0, 51.0, 35.0, 22.0, 15.0, 6.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.51953125, -5.33673095703125, -5.1539306640625, -4.97113037109375, -4.788330078125, -4.60552978515625, -4.4227294921875, -4.23992919921875, -4.05712890625, -3.87432861328125, -3.6915283203125, -3.50872802734375, -3.325927734375, -3.14312744140625, -2.9603271484375, -2.77752685546875, -2.5947265625, -2.41192626953125, -2.2291259765625, -2.04632568359375, -1.863525390625, -1.68072509765625, -1.4979248046875, -1.31512451171875, -1.13232421875, -0.94952392578125, -0.7667236328125, -0.58392333984375, -0.401123046875, -0.21832275390625, -0.0355224609375, 0.14727783203125, 0.330078125, 0.51287841796875, 0.6956787109375, 0.87847900390625, 1.061279296875, 1.24407958984375, 1.4268798828125, 1.60968017578125, 1.79248046875, 1.97528076171875, 2.1580810546875, 2.34088134765625, 2.523681640625, 2.70648193359375, 2.8892822265625, 3.07208251953125, 3.2548828125, 3.43768310546875, 3.6204833984375, 3.80328369140625, 3.986083984375, 4.16888427734375, 4.3516845703125, 4.53448486328125, 4.71728515625, 4.90008544921875, 5.0828857421875, 5.26568603515625, 5.448486328125, 5.63128662109375, 5.8140869140625, 5.99688720703125, 6.1796875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 6.0, 1.0, 5.0, 4.0, 9.0, 8.0, 14.0, 24.0, 12.0, 27.0, 22.0, 24.0, 27.0, 25.0, 28.0, 31.0, 37.0, 50.0, 37.0, 40.0, 35.0, 44.0, 52.0, 33.0, 41.0, 50.0, 43.0, 37.0, 28.0, 24.0, 33.0, 19.0, 26.0, 23.0, 18.0, 19.0, 11.0, 7.0, 14.0, 5.0, 1.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-5.34765625, -5.19378662109375, -5.0399169921875, -4.88604736328125, -4.732177734375, -4.57830810546875, -4.4244384765625, -4.27056884765625, -4.11669921875, -3.96282958984375, -3.8089599609375, -3.65509033203125, -3.501220703125, -3.34735107421875, -3.1934814453125, -3.03961181640625, -2.8857421875, -2.73187255859375, -2.5780029296875, -2.42413330078125, -2.270263671875, -2.11639404296875, -1.9625244140625, -1.80865478515625, -1.65478515625, -1.50091552734375, -1.3470458984375, -1.19317626953125, -1.039306640625, -0.88543701171875, -0.7315673828125, -0.57769775390625, -0.423828125, -0.26995849609375, -0.1160888671875, 0.03778076171875, 0.191650390625, 0.34552001953125, 0.4993896484375, 0.65325927734375, 0.80712890625, 0.96099853515625, 1.1148681640625, 1.26873779296875, 1.422607421875, 1.57647705078125, 1.7303466796875, 1.88421630859375, 2.0380859375, 2.19195556640625, 2.3458251953125, 2.49969482421875, 2.653564453125, 2.80743408203125, 2.9613037109375, 3.11517333984375, 3.26904296875, 3.42291259765625, 3.5767822265625, 3.73065185546875, 3.884521484375, 4.03839111328125, 4.1922607421875, 4.34613037109375, 4.5]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 3.0, 7.0, 6.0, 8.0, 19.0, 22.0, 21.0, 35.0, 59.0, 86.0, 125.0, 175.0, 264.0, 438.0, 584.0, 970.0, 1532.0, 2652.0, 4272.0, 7632.0, 13321.0, 23713.0, 42913.0, 76230.0, 129399.0, 183105.0, 195849.0, 150093.0, 93301.0, 53373.0, 29082.0, 16446.0, 9183.0, 5382.0, 3203.0, 1935.0, 1106.0, 702.0, 437.0, 264.0, 195.0, 121.0, 100.0, 58.0, 34.0, 34.0, 20.0, 14.0, 14.0, 8.0, 7.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-4.23046875, -4.10296630859375, -3.9754638671875, -3.84796142578125, -3.720458984375, -3.59295654296875, -3.4654541015625, -3.33795166015625, -3.21044921875, -3.08294677734375, -2.9554443359375, -2.82794189453125, -2.700439453125, -2.57293701171875, -2.4454345703125, -2.31793212890625, -2.1904296875, -2.06292724609375, -1.9354248046875, -1.80792236328125, -1.680419921875, -1.55291748046875, -1.4254150390625, -1.29791259765625, -1.17041015625, -1.04290771484375, -0.9154052734375, -0.78790283203125, -0.660400390625, -0.53289794921875, -0.4053955078125, -0.27789306640625, -0.150390625, -0.02288818359375, 0.1046142578125, 0.23211669921875, 0.359619140625, 0.48712158203125, 0.6146240234375, 0.74212646484375, 0.86962890625, 0.99713134765625, 1.1246337890625, 1.25213623046875, 1.379638671875, 1.50714111328125, 1.6346435546875, 1.76214599609375, 1.8896484375, 2.01715087890625, 2.1446533203125, 2.27215576171875, 2.399658203125, 2.52716064453125, 2.6546630859375, 2.78216552734375, 2.90966796875, 3.03717041015625, 3.1646728515625, 3.29217529296875, 3.419677734375, 3.54718017578125, 3.6746826171875, 3.80218505859375, 3.9296875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 4.0, 3.0, 2.0, 8.0, 11.0, 17.0, 15.0, 17.0, 19.0, 34.0, 30.0, 33.0, 54.0, 53.0, 67.0, 59.0, 56.0, 71.0, 76.0, 61.0, 50.0, 46.0, 46.0, 31.0, 28.0, 27.0, 20.0, 11.0, 10.0, 8.0, 7.0, 4.0, 6.0, 4.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0004611015319824219, -0.0004482269287109375, -0.0004353523254394531, -0.00042247772216796875, -0.0004096031188964844, -0.000396728515625, -0.0003838539123535156, -0.00037097930908203125, -0.0003581047058105469, -0.0003452301025390625, -0.0003323554992675781, -0.00031948089599609375, -0.0003066062927246094, -0.000293731689453125, -0.0002808570861816406, -0.00026798248291015625, -0.0002551078796386719, -0.0002422332763671875, -0.00022935867309570312, -0.00021648406982421875, -0.00020360946655273438, -0.00019073486328125, -0.00017786026000976562, -0.00016498565673828125, -0.00015211105346679688, -0.0001392364501953125, -0.00012636184692382812, -0.00011348724365234375, -0.00010061264038085938, -8.7738037109375e-05, -7.486343383789062e-05, -6.198883056640625e-05, -4.9114227294921875e-05, -3.62396240234375e-05, -2.3365020751953125e-05, -1.049041748046875e-05, 2.384185791015625e-06, 1.52587890625e-05, 2.8133392333984375e-05, 4.100799560546875e-05, 5.3882598876953125e-05, 6.67572021484375e-05, 7.963180541992188e-05, 9.250640869140625e-05, 0.00010538101196289062, 0.000118255615234375, 0.00013113021850585938, 0.00014400482177734375, 0.00015687942504882812, 0.0001697540283203125, 0.00018262863159179688, 0.00019550323486328125, 0.00020837783813476562, 0.00022125244140625, 0.00023412704467773438, 0.00024700164794921875, 0.0002598762512207031, 0.0002727508544921875, 0.0002856254577636719, 0.00029850006103515625, 0.0003113746643066406, 0.000324249267578125, 0.0003371238708496094, 0.00034999847412109375, 0.0003628730773925781]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 6.0, 5.0, 7.0, 17.0, 29.0, 38.0, 56.0, 81.0, 164.0, 239.0, 354.0, 574.0, 1017.0, 1624.0, 2774.0, 4682.0, 7992.0, 14269.0, 25248.0, 44975.0, 77732.0, 126985.0, 177567.0, 189559.0, 147692.0, 95119.0, 55922.0, 31587.0, 17922.0, 10088.0, 5691.0, 3307.0, 2011.0, 1234.0, 765.0, 461.0, 275.0, 172.0, 118.0, 78.0, 41.0, 26.0, 9.0, 17.0, 7.0, 4.0, 6.0, 6.0, 2.0, 1.0, 4.0, 0.0, 2.0], "bins": [-4.45703125, -4.326690673828125, -4.19635009765625, -4.066009521484375, -3.9356689453125, -3.805328369140625, -3.67498779296875, -3.544647216796875, -3.414306640625, -3.283966064453125, -3.15362548828125, -3.023284912109375, -2.8929443359375, -2.762603759765625, -2.63226318359375, -2.501922607421875, -2.37158203125, -2.241241455078125, -2.11090087890625, -1.980560302734375, -1.8502197265625, -1.719879150390625, -1.58953857421875, -1.459197998046875, -1.328857421875, -1.198516845703125, -1.06817626953125, -0.937835693359375, -0.8074951171875, -0.677154541015625, -0.54681396484375, -0.416473388671875, -0.2861328125, -0.155792236328125, -0.02545166015625, 0.104888916015625, 0.2352294921875, 0.365570068359375, 0.49591064453125, 0.626251220703125, 0.756591796875, 0.886932373046875, 1.01727294921875, 1.147613525390625, 1.2779541015625, 1.408294677734375, 1.53863525390625, 1.668975830078125, 1.79931640625, 1.929656982421875, 2.05999755859375, 2.190338134765625, 2.3206787109375, 2.451019287109375, 2.58135986328125, 2.711700439453125, 2.842041015625, 2.972381591796875, 3.10272216796875, 3.233062744140625, 3.3634033203125, 3.493743896484375, 3.62408447265625, 3.754425048828125, 3.884765625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 3.0, 7.0, 6.0, 9.0, 13.0, 18.0, 28.0, 26.0, 24.0, 23.0, 28.0, 41.0, 44.0, 47.0, 42.0, 51.0, 64.0, 52.0, 52.0, 49.0, 56.0, 43.0, 47.0, 32.0, 23.0, 31.0, 25.0, 17.0, 26.0, 12.0, 19.0, 7.0, 10.0, 9.0, 2.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.341796875, -1.3036651611328125, -1.265533447265625, -1.2274017333984375, -1.18927001953125, -1.1511383056640625, -1.113006591796875, -1.0748748779296875, -1.0367431640625, -0.9986114501953125, -0.960479736328125, -0.9223480224609375, -0.88421630859375, -0.8460845947265625, -0.807952880859375, -0.7698211669921875, -0.731689453125, -0.6935577392578125, -0.655426025390625, -0.6172943115234375, -0.57916259765625, -0.5410308837890625, -0.502899169921875, -0.4647674560546875, -0.4266357421875, -0.3885040283203125, -0.350372314453125, -0.3122406005859375, -0.27410888671875, -0.2359771728515625, -0.197845458984375, -0.1597137451171875, -0.12158203125, -0.0834503173828125, -0.045318603515625, -0.0071868896484375, 0.03094482421875, 0.0690765380859375, 0.107208251953125, 0.1453399658203125, 0.1834716796875, 0.2216033935546875, 0.259735107421875, 0.2978668212890625, 0.33599853515625, 0.3741302490234375, 0.412261962890625, 0.4503936767578125, 0.488525390625, 0.5266571044921875, 0.564788818359375, 0.6029205322265625, 0.64105224609375, 0.6791839599609375, 0.717315673828125, 0.7554473876953125, 0.7935791015625, 0.8317108154296875, 0.869842529296875, 0.9079742431640625, 0.94610595703125, 0.9842376708984375, 1.022369384765625, 1.0605010986328125, 1.0986328125]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 7.0, 6.0, 8.0, 12.0, 16.0, 12.0, 20.0, 38.0, 35.0, 47.0, 53.0, 61.0, 73.0, 76.0, 84.0, 91.0, 76.0, 49.0, 59.0, 36.0, 38.0, 29.0, 18.0, 16.0, 14.0, 7.0, 5.0, 4.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.42067813873291, -11.963934898376465, -11.507190704345703, -11.050447463989258, -10.593703269958496, -10.13696002960205, -9.680215835571289, -9.223472595214844, -8.766729354858398, -8.309986114501953, -7.853241920471191, -7.396498680114746, -6.939754486083984, -6.483011245727539, -6.0262675285339355, -5.569523811340332, -5.11277961730957, -4.656035900115967, -4.199292182922363, -3.742548704147339, -3.2858049869537354, -2.829061269760132, -2.3723177909851074, -1.915574073791504, -1.4588303565979004, -1.0020866394042969, -0.5453430414199829, -0.08859944343566895, 0.36814427375793457, 0.8248879909515381, 1.2816314697265625, 1.738375186920166, 2.195117950439453, 2.6518616676330566, 3.10860538482666, 3.5653488636016846, 4.022092819213867, 4.4788360595703125, 4.935579776763916, 5.3923234939575195, 5.849067211151123, 6.305810928344727, 6.76255464553833, 7.219298362731934, 7.676041603088379, 8.13278579711914, 8.589529037475586, 9.046272277832031, 9.503016471862793, 9.959759712219238, 10.41650390625, 10.873247146606445, 11.329991340637207, 11.786734580993652, 12.243478775024414, 12.70022201538086, 13.156965255737305, 13.61370849609375, 14.070452690124512, 14.527195930480957, 14.983940124511719, 15.440683364868164, 15.89742660522461, 16.354171752929688, 16.810914993286133]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 4.0, 5.0, 6.0, 6.0, 5.0, 12.0, 7.0, 5.0, 12.0, 16.0, 18.0, 19.0, 17.0, 18.0, 28.0, 28.0, 30.0, 34.0, 35.0, 34.0, 40.0, 39.0, 39.0, 46.0, 41.0, 28.0, 37.0, 43.0, 36.0, 36.0, 32.0, 33.0, 29.0, 18.0, 15.0, 19.0, 17.0, 24.0, 13.0, 10.0, 12.0, 11.0, 12.0, 7.0, 5.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0], "bins": [-6.598753452301025, -6.39119291305542, -6.1836323738098145, -5.976071834564209, -5.7685112953186035, -5.560950756072998, -5.353390216827393, -5.145829677581787, -4.938269138336182, -4.730708599090576, -4.523148059844971, -4.315587520599365, -4.10802698135376, -3.9004664421081543, -3.692905902862549, -3.4853453636169434, -3.277784824371338, -3.0702242851257324, -2.862663745880127, -2.6551032066345215, -2.447542667388916, -2.2399821281433105, -2.032421588897705, -1.8248610496520996, -1.6173005104064941, -1.4097399711608887, -1.2021794319152832, -0.9946188926696777, -0.7870583534240723, -0.5794978141784668, -0.37193727493286133, -0.16437673568725586, 0.04318428039550781, 0.2507448196411133, 0.45830535888671875, 0.6658658981323242, 0.8734264373779297, 1.0809869766235352, 1.2885475158691406, 1.496108055114746, 1.7036685943603516, 1.911229133605957, 2.1187896728515625, 2.326350212097168, 2.5339107513427734, 2.741471290588379, 2.9490318298339844, 3.15659236907959, 3.3641529083251953, 3.571713447570801, 3.7792739868164062, 3.9868345260620117, 4.194395065307617, 4.401955604553223, 4.609516143798828, 4.817076683044434, 5.024637222290039, 5.2321977615356445, 5.43975830078125, 5.6473188400268555, 5.854879379272461, 6.062439918518066, 6.270000457763672, 6.477560997009277, 6.685121536254883]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 4.0, 1.0, 4.0, 11.0, 11.0, 9.0, 12.0, 19.0, 28.0, 64.0, 64.0, 116.0, 143.0, 219.0, 369.0, 545.0, 848.0, 1339.0, 2163.0, 3636.0, 5952.0, 10694.0, 19535.0, 37997.0, 78719.0, 176883.0, 408992.0, 856629.0, 1145658.0, 780916.0, 362146.0, 157189.0, 70476.0, 33767.0, 17291.0, 9206.0, 5105.0, 2958.0, 1658.0, 1065.0, 678.0, 406.0, 255.0, 178.0, 127.0, 74.0, 49.0, 28.0, 21.0, 9.0, 10.0, 11.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-12.8828125, -12.4854736328125, -12.088134765625, -11.6907958984375, -11.29345703125, -10.8961181640625, -10.498779296875, -10.1014404296875, -9.7041015625, -9.3067626953125, -8.909423828125, -8.5120849609375, -8.11474609375, -7.7174072265625, -7.320068359375, -6.9227294921875, -6.525390625, -6.1280517578125, -5.730712890625, -5.3333740234375, -4.93603515625, -4.5386962890625, -4.141357421875, -3.7440185546875, -3.3466796875, -2.9493408203125, -2.552001953125, -2.1546630859375, -1.75732421875, -1.3599853515625, -0.962646484375, -0.5653076171875, -0.16796875, 0.2293701171875, 0.626708984375, 1.0240478515625, 1.42138671875, 1.8187255859375, 2.216064453125, 2.6134033203125, 3.0107421875, 3.4080810546875, 3.805419921875, 4.2027587890625, 4.60009765625, 4.9974365234375, 5.394775390625, 5.7921142578125, 6.189453125, 6.5867919921875, 6.984130859375, 7.3814697265625, 7.77880859375, 8.1761474609375, 8.573486328125, 8.9708251953125, 9.3681640625, 9.7655029296875, 10.162841796875, 10.5601806640625, 10.95751953125, 11.3548583984375, 11.752197265625, 12.1495361328125, 12.546875]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 5.0, 6.0, 15.0, 11.0, 9.0, 12.0, 18.0, 16.0, 15.0, 16.0, 26.0, 30.0, 27.0, 23.0, 33.0, 28.0, 46.0, 52.0, 43.0, 35.0, 35.0, 31.0, 39.0, 46.0, 39.0, 33.0, 37.0, 30.0, 19.0, 25.0, 27.0, 16.0, 21.0, 17.0, 24.0, 15.0, 17.0, 5.0, 10.0, 7.0, 8.0, 4.0, 2.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0], "bins": [-6.2578125, -6.0767822265625, -5.895751953125, -5.7147216796875, -5.53369140625, -5.3526611328125, -5.171630859375, -4.9906005859375, -4.8095703125, -4.6285400390625, -4.447509765625, -4.2664794921875, -4.08544921875, -3.9044189453125, -3.723388671875, -3.5423583984375, -3.361328125, -3.1802978515625, -2.999267578125, -2.8182373046875, -2.63720703125, -2.4561767578125, -2.275146484375, -2.0941162109375, -1.9130859375, -1.7320556640625, -1.551025390625, -1.3699951171875, -1.18896484375, -1.0079345703125, -0.826904296875, -0.6458740234375, -0.46484375, -0.2838134765625, -0.102783203125, 0.0782470703125, 0.25927734375, 0.4403076171875, 0.621337890625, 0.8023681640625, 0.9833984375, 1.1644287109375, 1.345458984375, 1.5264892578125, 1.70751953125, 1.8885498046875, 2.069580078125, 2.2506103515625, 2.431640625, 2.6126708984375, 2.793701171875, 2.9747314453125, 3.15576171875, 3.3367919921875, 3.517822265625, 3.6988525390625, 3.8798828125, 4.0609130859375, 4.241943359375, 4.4229736328125, 4.60400390625, 4.7850341796875, 4.966064453125, 5.1470947265625, 5.328125]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 11.0, 16.0, 33.0, 50.0, 78.0, 90.0, 171.0, 250.0, 389.0, 610.0, 1047.0, 1547.0, 2594.0, 4318.0, 7203.0, 12934.0, 22607.0, 41164.0, 78132.0, 151681.0, 303542.0, 590991.0, 942975.0, 908417.0, 545912.0, 277196.0, 139572.0, 72206.0, 38485.0, 20711.0, 11839.0, 6935.0, 3937.0, 2503.0, 1503.0, 943.0, 589.0, 396.0, 243.0, 153.0, 118.0, 89.0, 30.0, 16.0, 19.0, 12.0, 15.0, 6.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.8828125, -13.4481201171875, -13.013427734375, -12.5787353515625, -12.14404296875, -11.7093505859375, -11.274658203125, -10.8399658203125, -10.4052734375, -9.9705810546875, -9.535888671875, -9.1011962890625, -8.66650390625, -8.2318115234375, -7.797119140625, -7.3624267578125, -6.927734375, -6.4930419921875, -6.058349609375, -5.6236572265625, -5.18896484375, -4.7542724609375, -4.319580078125, -3.8848876953125, -3.4501953125, -3.0155029296875, -2.580810546875, -2.1461181640625, -1.71142578125, -1.2767333984375, -0.842041015625, -0.4073486328125, 0.02734375, 0.4620361328125, 0.896728515625, 1.3314208984375, 1.76611328125, 2.2008056640625, 2.635498046875, 3.0701904296875, 3.5048828125, 3.9395751953125, 4.374267578125, 4.8089599609375, 5.24365234375, 5.6783447265625, 6.113037109375, 6.5477294921875, 6.982421875, 7.4171142578125, 7.851806640625, 8.2864990234375, 8.72119140625, 9.1558837890625, 9.590576171875, 10.0252685546875, 10.4599609375, 10.8946533203125, 11.329345703125, 11.7640380859375, 12.19873046875, 12.6334228515625, 13.068115234375, 13.5028076171875, 13.9375]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 2.0, 8.0, 1.0, 3.0, 2.0, 8.0, 13.0, 11.0, 10.0, 10.0, 19.0, 30.0, 39.0, 43.0, 48.0, 66.0, 79.0, 123.0, 145.0, 167.0, 225.0, 233.0, 308.0, 263.0, 296.0, 280.0, 282.0, 264.0, 213.0, 165.0, 164.0, 120.0, 92.0, 78.0, 59.0, 49.0, 42.0, 27.0, 23.0, 16.0, 13.0, 8.0, 10.0, 9.0, 2.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.69140625, -4.55560302734375, -4.4197998046875, -4.28399658203125, -4.148193359375, -4.01239013671875, -3.8765869140625, -3.74078369140625, -3.60498046875, -3.46917724609375, -3.3333740234375, -3.19757080078125, -3.061767578125, -2.92596435546875, -2.7901611328125, -2.65435791015625, -2.5185546875, -2.38275146484375, -2.2469482421875, -2.11114501953125, -1.975341796875, -1.83953857421875, -1.7037353515625, -1.56793212890625, -1.43212890625, -1.29632568359375, -1.1605224609375, -1.02471923828125, -0.888916015625, -0.75311279296875, -0.6173095703125, -0.48150634765625, -0.345703125, -0.20989990234375, -0.0740966796875, 0.06170654296875, 0.197509765625, 0.33331298828125, 0.4691162109375, 0.60491943359375, 0.74072265625, 0.87652587890625, 1.0123291015625, 1.14813232421875, 1.283935546875, 1.41973876953125, 1.5555419921875, 1.69134521484375, 1.8271484375, 1.96295166015625, 2.0987548828125, 2.23455810546875, 2.370361328125, 2.50616455078125, 2.6419677734375, 2.77777099609375, 2.91357421875, 3.04937744140625, 3.1851806640625, 3.32098388671875, 3.456787109375, 3.59259033203125, 3.7283935546875, 3.86419677734375, 4.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 3.0, 4.0, 7.0, 12.0, 18.0, 25.0, 26.0, 17.0, 36.0, 39.0, 34.0, 45.0, 61.0, 67.0, 56.0, 65.0, 62.0, 53.0, 62.0, 54.0, 43.0, 35.0, 22.0, 32.0, 35.0, 23.0, 15.0, 10.0, 10.0, 10.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.131260871887207, -11.676679611206055, -11.222098350524902, -10.76751708984375, -10.312935829162598, -9.858354568481445, -9.403772354125977, -8.94919204711914, -8.494609832763672, -8.04002857208252, -7.585447311401367, -7.130866050720215, -6.6762847900390625, -6.22170352935791, -5.7671217918396, -5.312540531158447, -4.857959747314453, -4.403378486633301, -3.9487972259521484, -3.494215726852417, -3.0396344661712646, -2.5850532054901123, -2.130471706390381, -1.6758904457092285, -1.2213091850280762, -0.766727864742279, -0.31214654445648193, 0.14243483543395996, 0.5970160961151123, 1.0515973567962646, 1.506178855895996, 1.9607601165771484, 2.415342330932617, 2.8699235916137695, 3.324504852294922, 3.7790863513946533, 4.233667373657227, 4.688248634338379, 5.1428303718566895, 5.597411632537842, 6.051992893218994, 6.5065741539001465, 6.961155414581299, 7.415737152099609, 7.870318412780762, 8.324899673461914, 8.779480934143066, 9.234062194824219, 9.688643455505371, 10.143224716186523, 10.597805976867676, 11.052387237548828, 11.50696849822998, 11.961549758911133, 12.416131973266602, 12.870712280273438, 13.325294494628906, 13.779875755310059, 14.234457015991211, 14.689038276672363, 15.143619537353516, 15.598200798034668, 16.05278205871582, 16.50736427307129, 16.961944580078125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 3.0, 5.0, 5.0, 10.0, 7.0, 17.0, 6.0, 16.0, 12.0, 16.0, 22.0, 18.0, 29.0, 36.0, 33.0, 38.0, 48.0, 41.0, 44.0, 44.0, 45.0, 33.0, 40.0, 54.0, 24.0, 46.0, 41.0, 24.0, 28.0, 40.0, 31.0, 22.0, 19.0, 18.0, 12.0, 13.0, 19.0, 13.0, 7.0, 8.0, 6.0, 1.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.43345832824707, -9.149964332580566, -8.866470336914062, -8.582977294921875, -8.299483299255371, -8.015989303588867, -7.732495307922363, -7.449001312255859, -7.165507793426514, -6.88201379776001, -6.598520278930664, -6.31502628326416, -6.031532287597656, -5.7480387687683105, -5.464544773101807, -5.181051254272461, -4.897557258605957, -4.614063262939453, -4.330569744110107, -4.0470757484436035, -3.7635819911956787, -3.480088233947754, -3.19659423828125, -2.913100481033325, -2.6296067237854004, -2.3461129665374756, -2.062619209289551, -1.7791252136230469, -1.495631456375122, -1.2121376991271973, -0.9286438226699829, -0.6451499462127686, -0.36165618896484375, -0.07816237211227417, 0.2053314447402954, 0.488825261592865, 0.7723190784454346, 1.0558128356933594, 1.3393067121505737, 1.622800588607788, 1.906294345855713, 2.1897881031036377, 2.4732818603515625, 2.7567758560180664, 3.040269613265991, 3.323763370513916, 3.60725736618042, 3.8907511234283447, 4.1742448806762695, 4.457738876342773, 4.741232395172119, 5.024726390838623, 5.308219909667969, 5.591713905334473, 5.875207901000977, 6.1587018966674805, 6.442195415496826, 6.72568941116333, 7.009182929992676, 7.29267692565918, 7.576170921325684, 7.859664440155029, 8.143157958984375, 8.426651954650879, 8.710145950317383]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 6.0, 6.0, 5.0, 5.0, 12.0, 21.0, 24.0, 40.0, 64.0, 88.0, 110.0, 184.0, 255.0, 407.0, 590.0, 984.0, 1510.0, 2510.0, 3745.0, 6143.0, 10231.0, 16670.0, 28084.0, 46879.0, 77675.0, 122588.0, 167851.0, 178076.0, 142943.0, 94622.0, 57504.0, 34640.0, 21190.0, 12551.0, 7485.0, 4697.0, 3000.0, 1857.0, 1127.0, 745.0, 452.0, 306.0, 225.0, 138.0, 99.0, 73.0, 47.0, 37.0, 20.0, 17.0, 7.0, 7.0, 4.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.76171875, -7.51300048828125, -7.2642822265625, -7.01556396484375, -6.766845703125, -6.51812744140625, -6.2694091796875, -6.02069091796875, -5.77197265625, -5.52325439453125, -5.2745361328125, -5.02581787109375, -4.777099609375, -4.52838134765625, -4.2796630859375, -4.03094482421875, -3.7822265625, -3.53350830078125, -3.2847900390625, -3.03607177734375, -2.787353515625, -2.53863525390625, -2.2899169921875, -2.04119873046875, -1.79248046875, -1.54376220703125, -1.2950439453125, -1.04632568359375, -0.797607421875, -0.54888916015625, -0.3001708984375, -0.05145263671875, 0.197265625, 0.44598388671875, 0.6947021484375, 0.94342041015625, 1.192138671875, 1.44085693359375, 1.6895751953125, 1.93829345703125, 2.18701171875, 2.43572998046875, 2.6844482421875, 2.93316650390625, 3.181884765625, 3.43060302734375, 3.6793212890625, 3.92803955078125, 4.1767578125, 4.42547607421875, 4.6741943359375, 4.92291259765625, 5.171630859375, 5.42034912109375, 5.6690673828125, 5.91778564453125, 6.16650390625, 6.41522216796875, 6.6639404296875, 6.91265869140625, 7.161376953125, 7.41009521484375, 7.6588134765625, 7.90753173828125, 8.15625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 2.0, 6.0, 12.0, 4.0, 9.0, 14.0, 17.0, 11.0, 18.0, 21.0, 28.0, 20.0, 38.0, 41.0, 35.0, 42.0, 42.0, 48.0, 45.0, 44.0, 40.0, 52.0, 42.0, 31.0, 42.0, 37.0, 35.0, 36.0, 31.0, 19.0, 17.0, 23.0, 17.0, 14.0, 15.0, 10.0, 11.0, 4.0, 5.0, 5.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.96875, -8.6590576171875, -8.349365234375, -8.0396728515625, -7.72998046875, -7.4202880859375, -7.110595703125, -6.8009033203125, -6.4912109375, -6.1815185546875, -5.871826171875, -5.5621337890625, -5.25244140625, -4.9427490234375, -4.633056640625, -4.3233642578125, -4.013671875, -3.7039794921875, -3.394287109375, -3.0845947265625, -2.77490234375, -2.4652099609375, -2.155517578125, -1.8458251953125, -1.5361328125, -1.2264404296875, -0.916748046875, -0.6070556640625, -0.29736328125, 0.0123291015625, 0.322021484375, 0.6317138671875, 0.94140625, 1.2510986328125, 1.560791015625, 1.8704833984375, 2.18017578125, 2.4898681640625, 2.799560546875, 3.1092529296875, 3.4189453125, 3.7286376953125, 4.038330078125, 4.3480224609375, 4.65771484375, 4.9674072265625, 5.277099609375, 5.5867919921875, 5.896484375, 6.2061767578125, 6.515869140625, 6.8255615234375, 7.13525390625, 7.4449462890625, 7.754638671875, 8.0643310546875, 8.3740234375, 8.6837158203125, 8.993408203125, 9.3031005859375, 9.61279296875, 9.9224853515625, 10.232177734375, 10.5418701171875, 10.8515625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 4.0, 5.0, 10.0, 10.0, 8.0, 14.0, 19.0, 27.0, 41.0, 47.0, 79.0, 114.0, 192.0, 276.0, 428.0, 669.0, 1233.0, 2074.0, 3807.0, 7820.0, 17326.0, 43573.0, 115734.0, 284676.0, 325558.0, 148159.0, 54883.0, 21754.0, 9537.0, 4580.0, 2395.0, 1323.0, 754.0, 496.0, 297.0, 192.0, 117.0, 94.0, 62.0, 49.0, 27.0, 24.0, 11.0, 12.0, 10.0, 9.0, 5.0, 2.0, 7.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0], "bins": [-17.515625, -16.98681640625, -16.4580078125, -15.92919921875, -15.400390625, -14.87158203125, -14.3427734375, -13.81396484375, -13.28515625, -12.75634765625, -12.2275390625, -11.69873046875, -11.169921875, -10.64111328125, -10.1123046875, -9.58349609375, -9.0546875, -8.52587890625, -7.9970703125, -7.46826171875, -6.939453125, -6.41064453125, -5.8818359375, -5.35302734375, -4.82421875, -4.29541015625, -3.7666015625, -3.23779296875, -2.708984375, -2.18017578125, -1.6513671875, -1.12255859375, -0.59375, -0.06494140625, 0.4638671875, 0.99267578125, 1.521484375, 2.05029296875, 2.5791015625, 3.10791015625, 3.63671875, 4.16552734375, 4.6943359375, 5.22314453125, 5.751953125, 6.28076171875, 6.8095703125, 7.33837890625, 7.8671875, 8.39599609375, 8.9248046875, 9.45361328125, 9.982421875, 10.51123046875, 11.0400390625, 11.56884765625, 12.09765625, 12.62646484375, 13.1552734375, 13.68408203125, 14.212890625, 14.74169921875, 15.2705078125, 15.79931640625, 16.328125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 6.0, 5.0, 5.0, 5.0, 12.0, 9.0, 6.0, 15.0, 19.0, 18.0, 18.0, 24.0, 26.0, 30.0, 28.0, 38.0, 20.0, 41.0, 37.0, 42.0, 38.0, 37.0, 48.0, 32.0, 45.0, 36.0, 38.0, 29.0, 28.0, 34.0, 30.0, 35.0, 22.0, 23.0, 12.0, 19.0, 19.0, 13.0, 14.0, 12.0, 4.0, 12.0, 6.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.5234375, -5.3529052734375, -5.182373046875, -5.0118408203125, -4.84130859375, -4.6707763671875, -4.500244140625, -4.3297119140625, -4.1591796875, -3.9886474609375, -3.818115234375, -3.6475830078125, -3.47705078125, -3.3065185546875, -3.135986328125, -2.9654541015625, -2.794921875, -2.6243896484375, -2.453857421875, -2.2833251953125, -2.11279296875, -1.9422607421875, -1.771728515625, -1.6011962890625, -1.4306640625, -1.2601318359375, -1.089599609375, -0.9190673828125, -0.74853515625, -0.5780029296875, -0.407470703125, -0.2369384765625, -0.06640625, 0.1041259765625, 0.274658203125, 0.4451904296875, 0.61572265625, 0.7862548828125, 0.956787109375, 1.1273193359375, 1.2978515625, 1.4683837890625, 1.638916015625, 1.8094482421875, 1.97998046875, 2.1505126953125, 2.321044921875, 2.4915771484375, 2.662109375, 2.8326416015625, 3.003173828125, 3.1737060546875, 3.34423828125, 3.5147705078125, 3.685302734375, 3.8558349609375, 4.0263671875, 4.1968994140625, 4.367431640625, 4.5379638671875, 4.70849609375, 4.8790283203125, 5.049560546875, 5.2200927734375, 5.390625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 11.0, 12.0, 22.0, 39.0, 61.0, 98.0, 161.0, 262.0, 458.0, 764.0, 1325.0, 2279.0, 4277.0, 8420.0, 17622.0, 40722.0, 102550.0, 260103.0, 340926.0, 158217.0, 60431.0, 25138.0, 11720.0, 5752.0, 3061.0, 1642.0, 968.0, 557.0, 383.0, 200.0, 139.0, 82.0, 47.0, 33.0, 21.0, 23.0, 5.0, 5.0, 8.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5859375, -9.2884521484375, -8.990966796875, -8.6934814453125, -8.39599609375, -8.0985107421875, -7.801025390625, -7.5035400390625, -7.2060546875, -6.9085693359375, -6.611083984375, -6.3135986328125, -6.01611328125, -5.7186279296875, -5.421142578125, -5.1236572265625, -4.826171875, -4.5286865234375, -4.231201171875, -3.9337158203125, -3.63623046875, -3.3387451171875, -3.041259765625, -2.7437744140625, -2.4462890625, -2.1488037109375, -1.851318359375, -1.5538330078125, -1.25634765625, -0.9588623046875, -0.661376953125, -0.3638916015625, -0.06640625, 0.2310791015625, 0.528564453125, 0.8260498046875, 1.12353515625, 1.4210205078125, 1.718505859375, 2.0159912109375, 2.3134765625, 2.6109619140625, 2.908447265625, 3.2059326171875, 3.50341796875, 3.8009033203125, 4.098388671875, 4.3958740234375, 4.693359375, 4.9908447265625, 5.288330078125, 5.5858154296875, 5.88330078125, 6.1807861328125, 6.478271484375, 6.7757568359375, 7.0732421875, 7.3707275390625, 7.668212890625, 7.9656982421875, 8.26318359375, 8.5606689453125, 8.858154296875, 9.1556396484375, 9.453125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 11.0, 13.0, 11.0, 22.0, 14.0, 34.0, 30.0, 42.0, 52.0, 60.0, 61.0, 54.0, 71.0, 73.0, 66.0, 59.0, 54.0, 55.0, 39.0, 30.0, 28.0, 22.0, 20.0, 10.0, 11.0, 9.0, 8.0, 12.0, 8.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00039005279541015625, -0.0003794766962528229, -0.0003689005970954895, -0.00035832449793815613, -0.00034774839878082275, -0.0003371722996234894, -0.000326596200466156, -0.00031602010130882263, -0.00030544400215148926, -0.0002948679029941559, -0.0002842918038368225, -0.00027371570467948914, -0.00026313960552215576, -0.0002525635063648224, -0.00024198740720748901, -0.00023141130805015564, -0.00022083520889282227, -0.0002102591097354889, -0.00019968301057815552, -0.00018910691142082214, -0.00017853081226348877, -0.0001679547131061554, -0.00015737861394882202, -0.00014680251479148865, -0.00013622641563415527, -0.0001256503164768219, -0.00011507421731948853, -0.00010449811816215515, -9.392201900482178e-05, -8.33459198474884e-05, -7.276982069015503e-05, -6.219372153282166e-05, -5.161762237548828e-05, -4.104152321815491e-05, -3.0465424060821533e-05, -1.988932490348816e-05, -9.313225746154785e-06, 1.2628734111785889e-06, 1.1838972568511963e-05, 2.2415071725845337e-05, 3.299117088317871e-05, 4.3567270040512085e-05, 5.414336919784546e-05, 6.471946835517883e-05, 7.529556751251221e-05, 8.587166666984558e-05, 9.644776582717896e-05, 0.00010702386498451233, 0.0001175999641418457, 0.00012817606329917908, 0.00013875216245651245, 0.00014932826161384583, 0.0001599043607711792, 0.00017048045992851257, 0.00018105655908584595, 0.00019163265824317932, 0.0002022087574005127, 0.00021278485655784607, 0.00022336095571517944, 0.00023393705487251282, 0.0002445131540298462, 0.00025508925318717957, 0.00026566535234451294, 0.0002762414515018463, 0.0002868175506591797]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 7.0, 12.0, 20.0, 24.0, 25.0, 41.0, 54.0, 64.0, 96.0, 169.0, 224.0, 329.0, 475.0, 743.0, 1094.0, 1656.0, 2583.0, 3973.0, 6329.0, 9845.0, 16816.0, 28510.0, 49808.0, 87376.0, 143634.0, 196489.0, 186728.0, 128485.0, 75587.0, 42901.0, 24887.0, 14834.0, 8819.0, 5514.0, 3602.0, 2223.0, 1512.0, 1043.0, 636.0, 456.0, 280.0, 190.0, 127.0, 114.0, 60.0, 44.0, 28.0, 26.0, 18.0, 15.0, 9.0, 9.0, 5.0, 1.0, 7.0, 3.0, 1.0], "bins": [-6.921875, -6.7113037109375, -6.500732421875, -6.2901611328125, -6.07958984375, -5.8690185546875, -5.658447265625, -5.4478759765625, -5.2373046875, -5.0267333984375, -4.816162109375, -4.6055908203125, -4.39501953125, -4.1844482421875, -3.973876953125, -3.7633056640625, -3.552734375, -3.3421630859375, -3.131591796875, -2.9210205078125, -2.71044921875, -2.4998779296875, -2.289306640625, -2.0787353515625, -1.8681640625, -1.6575927734375, -1.447021484375, -1.2364501953125, -1.02587890625, -0.8153076171875, -0.604736328125, -0.3941650390625, -0.18359375, 0.0269775390625, 0.237548828125, 0.4481201171875, 0.65869140625, 0.8692626953125, 1.079833984375, 1.2904052734375, 1.5009765625, 1.7115478515625, 1.922119140625, 2.1326904296875, 2.34326171875, 2.5538330078125, 2.764404296875, 2.9749755859375, 3.185546875, 3.3961181640625, 3.606689453125, 3.8172607421875, 4.02783203125, 4.2384033203125, 4.448974609375, 4.6595458984375, 4.8701171875, 5.0806884765625, 5.291259765625, 5.5018310546875, 5.71240234375, 5.9229736328125, 6.133544921875, 6.3441162109375, 6.5546875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 9.0, 5.0, 6.0, 7.0, 5.0, 15.0, 11.0, 20.0, 23.0, 35.0, 40.0, 52.0, 72.0, 77.0, 91.0, 87.0, 92.0, 81.0, 69.0, 46.0, 44.0, 25.0, 19.0, 12.0, 13.0, 12.0, 10.0, 7.0, 2.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.669921875, -2.574920654296875, -2.47991943359375, -2.384918212890625, -2.2899169921875, -2.194915771484375, -2.09991455078125, -2.004913330078125, -1.909912109375, -1.814910888671875, -1.71990966796875, -1.624908447265625, -1.5299072265625, -1.434906005859375, -1.33990478515625, -1.244903564453125, -1.14990234375, -1.054901123046875, -0.95989990234375, -0.864898681640625, -0.7698974609375, -0.674896240234375, -0.57989501953125, -0.484893798828125, -0.389892578125, -0.294891357421875, -0.19989013671875, -0.104888916015625, -0.0098876953125, 0.085113525390625, 0.18011474609375, 0.275115966796875, 0.3701171875, 0.465118408203125, 0.56011962890625, 0.655120849609375, 0.7501220703125, 0.845123291015625, 0.94012451171875, 1.035125732421875, 1.130126953125, 1.225128173828125, 1.32012939453125, 1.415130615234375, 1.5101318359375, 1.605133056640625, 1.70013427734375, 1.795135498046875, 1.89013671875, 1.985137939453125, 2.08013916015625, 2.175140380859375, 2.2701416015625, 2.365142822265625, 2.46014404296875, 2.555145263671875, 2.650146484375, 2.745147705078125, 2.84014892578125, 2.935150146484375, 3.0301513671875, 3.125152587890625, 3.22015380859375, 3.315155029296875, 3.41015625]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 6.0, 4.0, 4.0, 10.0, 21.0, 17.0, 23.0, 31.0, 22.0, 54.0, 42.0, 48.0, 71.0, 63.0, 52.0, 69.0, 68.0, 63.0, 67.0, 47.0, 42.0, 35.0, 29.0, 37.0, 20.0, 19.0, 4.0, 14.0, 5.0, 4.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.911978721618652, -12.421529769897461, -11.93108081817627, -11.440631866455078, -10.950182914733887, -10.459733963012695, -9.96928596496582, -9.478836059570312, -8.988388061523438, -8.497939109802246, -8.007490158081055, -7.517041206359863, -7.026592254638672, -6.5361433029174805, -6.045694828033447, -5.555245876312256, -5.064796447753906, -4.574347496032715, -4.083898544311523, -3.593449831008911, -3.1030008792877197, -2.6125519275665283, -2.122103214263916, -1.6316542625427246, -1.1412053108215332, -0.6507564187049866, -0.16030752658843994, 0.3301413059234619, 0.8205902576446533, 1.3110392093658447, 1.801487922668457, 2.2919368743896484, 2.7823848724365234, 3.272833824157715, 3.7632827758789062, 4.253731727600098, 4.744180679321289, 5.2346296310424805, 5.725078105926514, 6.215527057647705, 6.7059760093688965, 7.196424961090088, 7.686873912811279, 8.177322387695312, 8.667771339416504, 9.158220291137695, 9.648669242858887, 10.139118194580078, 10.62956714630127, 11.120016098022461, 11.610465049743652, 12.100914001464844, 12.591362953186035, 13.081811904907227, 13.572259902954102, 14.06270980834961, 14.553157806396484, 15.043606758117676, 15.534055709838867, 16.024503707885742, 16.51495361328125, 17.005401611328125, 17.495851516723633, 17.986299514770508, 18.476749420166016]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 3.0, 7.0, 5.0, 12.0, 11.0, 10.0, 7.0, 22.0, 18.0, 24.0, 20.0, 26.0, 41.0, 30.0, 39.0, 47.0, 41.0, 52.0, 48.0, 43.0, 41.0, 48.0, 41.0, 42.0, 33.0, 33.0, 38.0, 33.0, 27.0, 31.0, 26.0, 18.0, 15.0, 15.0, 13.0, 12.0, 14.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.819650650024414, -9.521260261535645, -9.222870826721191, -8.924480438232422, -8.626090049743652, -8.327699661254883, -8.02931022644043, -7.73091983795166, -7.432529926300049, -7.1341400146484375, -6.835749626159668, -6.537359714508057, -6.238969802856445, -5.940579414367676, -5.6421895027160645, -5.343799591064453, -5.045409202575684, -4.747019290924072, -4.448628902435303, -4.150238990783691, -3.851848840713501, -3.5534586906433105, -3.255068778991699, -2.956678628921509, -2.6582884788513184, -2.359898328781128, -2.0615081787109375, -1.7631182670593262, -1.4647281169891357, -1.1663379669189453, -0.8679479360580444, -0.5695579051971436, -0.2711668014526367, 0.027223289012908936, 0.3256133794784546, 0.6240034699440002, 0.9223935604095459, 1.2207837104797363, 1.5191737413406372, 1.817563772201538, 2.1159539222717285, 2.414344072341919, 2.7127342224121094, 3.0111241340637207, 3.309514284133911, 3.6079044342041016, 3.906294345855713, 4.204684257507324, 4.503074645996094, 4.801464557647705, 5.099854946136475, 5.398244857788086, 5.6966352462768555, 5.995025157928467, 6.293415069580078, 6.591805458068848, 6.890195369720459, 7.18858528137207, 7.48697566986084, 7.785365581512451, 8.083755493164062, 8.382145881652832, 8.680536270141602, 8.978925704956055, 9.277316093444824]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 20.0, 11.0, 25.0, 42.0, 54.0, 79.0, 148.0, 181.0, 317.0, 458.0, 674.0, 1081.0, 1595.0, 2605.0, 4193.0, 6472.0, 10389.0, 16519.0, 26047.0, 40650.0, 62421.0, 91461.0, 122403.0, 142722.0, 142144.0, 119889.0, 88653.0, 60291.0, 39058.0, 25007.0, 15830.0, 9821.0, 6225.0, 3886.0, 2608.0, 1578.0, 1081.0, 605.0, 424.0, 288.0, 201.0, 132.0, 98.0, 54.0, 38.0, 31.0, 22.0, 8.0, 6.0, 4.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.11328125, -6.88348388671875, -6.6536865234375, -6.42388916015625, -6.194091796875, -5.96429443359375, -5.7344970703125, -5.50469970703125, -5.27490234375, -5.04510498046875, -4.8153076171875, -4.58551025390625, -4.355712890625, -4.12591552734375, -3.8961181640625, -3.66632080078125, -3.4365234375, -3.20672607421875, -2.9769287109375, -2.74713134765625, -2.517333984375, -2.28753662109375, -2.0577392578125, -1.82794189453125, -1.59814453125, -1.36834716796875, -1.1385498046875, -0.90875244140625, -0.678955078125, -0.44915771484375, -0.2193603515625, 0.01043701171875, 0.240234375, 0.47003173828125, 0.6998291015625, 0.92962646484375, 1.159423828125, 1.38922119140625, 1.6190185546875, 1.84881591796875, 2.07861328125, 2.30841064453125, 2.5382080078125, 2.76800537109375, 2.997802734375, 3.22760009765625, 3.4573974609375, 3.68719482421875, 3.9169921875, 4.14678955078125, 4.3765869140625, 4.60638427734375, 4.836181640625, 5.06597900390625, 5.2957763671875, 5.52557373046875, 5.75537109375, 5.98516845703125, 6.2149658203125, 6.44476318359375, 6.674560546875, 6.90435791015625, 7.1341552734375, 7.36395263671875, 7.59375]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 2.0, 5.0, 5.0, 7.0, 10.0, 4.0, 13.0, 19.0, 16.0, 16.0, 12.0, 21.0, 29.0, 37.0, 26.0, 21.0, 40.0, 47.0, 42.0, 45.0, 47.0, 45.0, 41.0, 30.0, 33.0, 37.0, 38.0, 38.0, 31.0, 27.0, 31.0, 25.0, 24.0, 20.0, 18.0, 20.0, 21.0, 9.0, 12.0, 5.0, 7.0, 5.0, 8.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.2265625, -8.9312744140625, -8.635986328125, -8.3406982421875, -8.04541015625, -7.7501220703125, -7.454833984375, -7.1595458984375, -6.8642578125, -6.5689697265625, -6.273681640625, -5.9783935546875, -5.68310546875, -5.3878173828125, -5.092529296875, -4.7972412109375, -4.501953125, -4.2066650390625, -3.911376953125, -3.6160888671875, -3.32080078125, -3.0255126953125, -2.730224609375, -2.4349365234375, -2.1396484375, -1.8443603515625, -1.549072265625, -1.2537841796875, -0.95849609375, -0.6632080078125, -0.367919921875, -0.0726318359375, 0.22265625, 0.5179443359375, 0.813232421875, 1.1085205078125, 1.40380859375, 1.6990966796875, 1.994384765625, 2.2896728515625, 2.5849609375, 2.8802490234375, 3.175537109375, 3.4708251953125, 3.76611328125, 4.0614013671875, 4.356689453125, 4.6519775390625, 4.947265625, 5.2425537109375, 5.537841796875, 5.8331298828125, 6.12841796875, 6.4237060546875, 6.718994140625, 7.0142822265625, 7.3095703125, 7.6048583984375, 7.900146484375, 8.1954345703125, 8.49072265625, 8.7860107421875, 9.081298828125, 9.3765869140625, 9.671875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 10.0, 6.0, 17.0, 20.0, 31.0, 65.0, 85.0, 128.0, 186.0, 277.0, 384.0, 621.0, 924.0, 1350.0, 2172.0, 3384.0, 5307.0, 8233.0, 13080.0, 20131.0, 31417.0, 47837.0, 70902.0, 99867.0, 126972.0, 142246.0, 132654.0, 107561.0, 78701.0, 53877.0, 36026.0, 23091.0, 14579.0, 9338.0, 6048.0, 3826.0, 2473.0, 1633.0, 1022.0, 706.0, 454.0, 304.0, 198.0, 142.0, 85.0, 58.0, 41.0, 42.0, 14.0, 16.0, 6.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0], "bins": [-7.640625, -7.399169921875, -7.15771484375, -6.916259765625, -6.6748046875, -6.433349609375, -6.19189453125, -5.950439453125, -5.708984375, -5.467529296875, -5.22607421875, -4.984619140625, -4.7431640625, -4.501708984375, -4.26025390625, -4.018798828125, -3.77734375, -3.535888671875, -3.29443359375, -3.052978515625, -2.8115234375, -2.570068359375, -2.32861328125, -2.087158203125, -1.845703125, -1.604248046875, -1.36279296875, -1.121337890625, -0.8798828125, -0.638427734375, -0.39697265625, -0.155517578125, 0.0859375, 0.327392578125, 0.56884765625, 0.810302734375, 1.0517578125, 1.293212890625, 1.53466796875, 1.776123046875, 2.017578125, 2.259033203125, 2.50048828125, 2.741943359375, 2.9833984375, 3.224853515625, 3.46630859375, 3.707763671875, 3.94921875, 4.190673828125, 4.43212890625, 4.673583984375, 4.9150390625, 5.156494140625, 5.39794921875, 5.639404296875, 5.880859375, 6.122314453125, 6.36376953125, 6.605224609375, 6.8466796875, 7.088134765625, 7.32958984375, 7.571044921875, 7.8125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 6.0, 6.0, 8.0, 5.0, 12.0, 20.0, 12.0, 19.0, 21.0, 12.0, 32.0, 36.0, 33.0, 36.0, 43.0, 39.0, 42.0, 41.0, 29.0, 44.0, 46.0, 40.0, 27.0, 34.0, 35.0, 36.0, 30.0, 41.0, 31.0, 29.0, 19.0, 19.0, 22.0, 23.0, 24.0, 11.0, 10.0, 5.0, 7.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.33203125, -6.13580322265625, -5.9395751953125, -5.74334716796875, -5.547119140625, -5.35089111328125, -5.1546630859375, -4.95843505859375, -4.76220703125, -4.56597900390625, -4.3697509765625, -4.17352294921875, -3.977294921875, -3.78106689453125, -3.5848388671875, -3.38861083984375, -3.1923828125, -2.99615478515625, -2.7999267578125, -2.60369873046875, -2.407470703125, -2.21124267578125, -2.0150146484375, -1.81878662109375, -1.62255859375, -1.42633056640625, -1.2301025390625, -1.03387451171875, -0.837646484375, -0.64141845703125, -0.4451904296875, -0.24896240234375, -0.052734375, 0.14349365234375, 0.3397216796875, 0.53594970703125, 0.732177734375, 0.92840576171875, 1.1246337890625, 1.32086181640625, 1.51708984375, 1.71331787109375, 1.9095458984375, 2.10577392578125, 2.302001953125, 2.49822998046875, 2.6944580078125, 2.89068603515625, 3.0869140625, 3.28314208984375, 3.4793701171875, 3.67559814453125, 3.871826171875, 4.06805419921875, 4.2642822265625, 4.46051025390625, 4.65673828125, 4.85296630859375, 5.0491943359375, 5.24542236328125, 5.441650390625, 5.63787841796875, 5.8341064453125, 6.03033447265625, 6.2265625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 7.0, 11.0, 12.0, 17.0, 32.0, 38.0, 76.0, 103.0, 150.0, 249.0, 387.0, 583.0, 850.0, 1316.0, 2146.0, 3423.0, 5654.0, 10243.0, 18308.0, 36437.0, 72005.0, 139573.0, 217800.0, 224226.0, 149260.0, 79334.0, 39438.0, 20207.0, 10801.0, 6002.0, 3694.0, 2200.0, 1383.0, 897.0, 576.0, 384.0, 249.0, 161.0, 114.0, 66.0, 42.0, 34.0, 28.0, 17.0, 9.0, 10.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.26953125, -6.06097412109375, -5.8524169921875, -5.64385986328125, -5.435302734375, -5.22674560546875, -5.0181884765625, -4.80963134765625, -4.60107421875, -4.39251708984375, -4.1839599609375, -3.97540283203125, -3.766845703125, -3.55828857421875, -3.3497314453125, -3.14117431640625, -2.9326171875, -2.72406005859375, -2.5155029296875, -2.30694580078125, -2.098388671875, -1.88983154296875, -1.6812744140625, -1.47271728515625, -1.26416015625, -1.05560302734375, -0.8470458984375, -0.63848876953125, -0.429931640625, -0.22137451171875, -0.0128173828125, 0.19573974609375, 0.404296875, 0.61285400390625, 0.8214111328125, 1.02996826171875, 1.238525390625, 1.44708251953125, 1.6556396484375, 1.86419677734375, 2.07275390625, 2.28131103515625, 2.4898681640625, 2.69842529296875, 2.906982421875, 3.11553955078125, 3.3240966796875, 3.53265380859375, 3.7412109375, 3.94976806640625, 4.1583251953125, 4.36688232421875, 4.575439453125, 4.78399658203125, 4.9925537109375, 5.20111083984375, 5.40966796875, 5.61822509765625, 5.8267822265625, 6.03533935546875, 6.243896484375, 6.45245361328125, 6.6610107421875, 6.86956787109375, 7.078125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 4.0, 2.0, 5.0, 7.0, 4.0, 10.0, 11.0, 20.0, 16.0, 37.0, 41.0, 49.0, 65.0, 107.0, 136.0, 121.0, 106.0, 77.0, 59.0, 45.0, 26.0, 20.0, 12.0, 8.0, 7.0, 0.0, 5.0, 3.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007772445678710938, -0.0007472783327102661, -0.0007173120975494385, -0.0006873458623886108, -0.0006573796272277832, -0.0006274133920669556, -0.0005974471569061279, -0.0005674809217453003, -0.0005375146865844727, -0.000507548451423645, -0.0004775822162628174, -0.00044761598110198975, -0.0004176497459411621, -0.00038768351078033447, -0.00035771727561950684, -0.0003277510404586792, -0.00029778480529785156, -0.0002678185701370239, -0.0002378523349761963, -0.00020788609981536865, -0.00017791986465454102, -0.00014795362949371338, -0.00011798739433288574, -8.80211591720581e-05, -5.805492401123047e-05, -2.8088688850402832e-05, 1.8775463104248047e-06, 3.184378147125244e-05, 6.181001663208008e-05, 9.177625179290771e-05, 0.00012174248695373535, 0.000151708722114563, 0.00018167495727539062, 0.00021164119243621826, 0.0002416074275970459, 0.00027157366275787354, 0.00030153989791870117, 0.0003315061330795288, 0.00036147236824035645, 0.0003914386034011841, 0.0004214048385620117, 0.00045137107372283936, 0.000481337308883667, 0.0005113035440444946, 0.0005412697792053223, 0.0005712360143661499, 0.0006012022495269775, 0.0006311684846878052, 0.0006611347198486328, 0.0006911009550094604, 0.0007210671901702881, 0.0007510334253311157, 0.0007809996604919434, 0.000810965895652771, 0.0008409321308135986, 0.0008708983659744263, 0.0009008646011352539, 0.0009308308362960815, 0.0009607970714569092, 0.0009907633066177368, 0.0010207295417785645, 0.001050695776939392, 0.0010806620121002197, 0.0011106282472610474, 0.001140594482421875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 9.0, 9.0, 7.0, 21.0, 33.0, 40.0, 49.0, 89.0, 115.0, 170.0, 207.0, 278.0, 475.0, 642.0, 865.0, 1248.0, 1902.0, 2615.0, 4073.0, 6118.0, 9525.0, 14695.0, 23134.0, 37534.0, 59805.0, 93722.0, 134896.0, 161987.0, 155917.0, 119559.0, 80109.0, 50257.0, 31976.0, 19619.0, 12548.0, 7905.0, 5251.0, 3453.0, 2415.0, 1605.0, 1109.0, 744.0, 581.0, 379.0, 248.0, 181.0, 123.0, 98.0, 83.0, 43.0, 37.0, 14.0, 14.0, 14.0, 7.0, 2.0, 4.0, 5.0, 1.0, 3.0], "bins": [-4.7421875, -4.5931396484375, -4.444091796875, -4.2950439453125, -4.14599609375, -3.9969482421875, -3.847900390625, -3.6988525390625, -3.5498046875, -3.4007568359375, -3.251708984375, -3.1026611328125, -2.95361328125, -2.8045654296875, -2.655517578125, -2.5064697265625, -2.357421875, -2.2083740234375, -2.059326171875, -1.9102783203125, -1.76123046875, -1.6121826171875, -1.463134765625, -1.3140869140625, -1.1650390625, -1.0159912109375, -0.866943359375, -0.7178955078125, -0.56884765625, -0.4197998046875, -0.270751953125, -0.1217041015625, 0.02734375, 0.1763916015625, 0.325439453125, 0.4744873046875, 0.62353515625, 0.7725830078125, 0.921630859375, 1.0706787109375, 1.2197265625, 1.3687744140625, 1.517822265625, 1.6668701171875, 1.81591796875, 1.9649658203125, 2.114013671875, 2.2630615234375, 2.412109375, 2.5611572265625, 2.710205078125, 2.8592529296875, 3.00830078125, 3.1573486328125, 3.306396484375, 3.4554443359375, 3.6044921875, 3.7535400390625, 3.902587890625, 4.0516357421875, 4.20068359375, 4.3497314453125, 4.498779296875, 4.6478271484375, 4.796875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 8.0, 16.0, 16.0, 17.0, 20.0, 20.0, 29.0, 32.0, 36.0, 45.0, 57.0, 45.0, 56.0, 74.0, 70.0, 56.0, 59.0, 50.0, 39.0, 43.0, 28.0, 28.0, 28.0, 18.0, 17.0, 9.0, 12.0, 9.0, 11.0, 8.0, 12.0, 4.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.7685546875, -1.713287353515625, -1.65802001953125, -1.602752685546875, -1.5474853515625, -1.492218017578125, -1.43695068359375, -1.381683349609375, -1.326416015625, -1.271148681640625, -1.21588134765625, -1.160614013671875, -1.1053466796875, -1.050079345703125, -0.99481201171875, -0.939544677734375, -0.88427734375, -0.829010009765625, -0.77374267578125, -0.718475341796875, -0.6632080078125, -0.607940673828125, -0.55267333984375, -0.497406005859375, -0.442138671875, -0.386871337890625, -0.33160400390625, -0.276336669921875, -0.2210693359375, -0.165802001953125, -0.11053466796875, -0.055267333984375, 0.0, 0.055267333984375, 0.11053466796875, 0.165802001953125, 0.2210693359375, 0.276336669921875, 0.33160400390625, 0.386871337890625, 0.442138671875, 0.497406005859375, 0.55267333984375, 0.607940673828125, 0.6632080078125, 0.718475341796875, 0.77374267578125, 0.829010009765625, 0.88427734375, 0.939544677734375, 0.99481201171875, 1.050079345703125, 1.1053466796875, 1.160614013671875, 1.21588134765625, 1.271148681640625, 1.326416015625, 1.381683349609375, 1.43695068359375, 1.492218017578125, 1.5474853515625, 1.602752685546875, 1.65802001953125, 1.713287353515625, 1.7685546875]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 6.0, 7.0, 7.0, 11.0, 13.0, 18.0, 21.0, 37.0, 21.0, 33.0, 40.0, 45.0, 48.0, 70.0, 53.0, 61.0, 55.0, 66.0, 63.0, 55.0, 46.0, 42.0, 34.0, 25.0, 23.0, 26.0, 21.0, 21.0, 9.0, 5.0, 9.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.75258731842041, -13.276729583740234, -12.800870895385742, -12.32501220703125, -11.849154472351074, -11.373296737670898, -10.897438049316406, -10.421579360961914, -9.945721626281738, -9.469863891601562, -8.99400520324707, -8.518146514892578, -8.042288780212402, -7.566430568695068, -7.090572357177734, -6.6147141456604, -6.138855934143066, -5.662997722625732, -5.187139511108398, -4.7112812995910645, -4.2354230880737305, -3.7595648765563965, -3.2837066650390625, -2.8078484535217285, -2.3319902420043945, -1.8561320304870605, -1.3802738189697266, -0.9044156074523926, -0.4285573959350586, 0.04730081558227539, 0.5231590270996094, 0.9990172386169434, 1.4748764038085938, 1.9507346153259277, 2.4265928268432617, 2.9024510383605957, 3.3783092498779297, 3.8541674613952637, 4.330025672912598, 4.805883884429932, 5.281742095947266, 5.7576003074646, 6.233458518981934, 6.709316730499268, 7.185174942016602, 7.6610331535339355, 8.13689136505127, 8.612749099731445, 9.088607788085938, 9.56446647644043, 10.040324211120605, 10.516181945800781, 10.992040634155273, 11.467899322509766, 11.943757057189941, 12.419614791870117, 12.89547348022461, 13.371332168579102, 13.847189903259277, 14.323047637939453, 14.798906326293945, 15.274765014648438, 15.750622749328613, 16.22648048400879, 16.70233917236328]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 10.0, 7.0, 12.0, 11.0, 13.0, 16.0, 13.0, 24.0, 22.0, 21.0, 33.0, 37.0, 34.0, 37.0, 40.0, 34.0, 54.0, 35.0, 46.0, 59.0, 38.0, 36.0, 38.0, 43.0, 43.0, 34.0, 26.0, 22.0, 29.0, 23.0, 22.0, 14.0, 14.0, 12.0, 11.0, 5.0, 6.0, 10.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.46254825592041, -9.14201545715332, -8.82148265838623, -8.500950813293457, -8.180418014526367, -7.859885215759277, -7.5393524169921875, -7.218819618225098, -6.898287296295166, -6.577754497528076, -6.2572221755981445, -5.936689376831055, -5.616156578063965, -5.295624256134033, -4.975091457366943, -4.654559135437012, -4.334026336669922, -4.013493537902832, -3.6929612159729004, -3.3724284172058105, -3.0518958568573, -2.731363296508789, -2.410830497741699, -2.0902979373931885, -1.7697653770446777, -1.449232816696167, -1.1287001371383667, -0.8081675171852112, -0.48763489723205566, -0.16710233688354492, 0.15343034267425537, 0.47396302223205566, 0.7944965362548828, 1.1150290966033936, 1.4355617761611938, 1.7560944557189941, 2.076627016067505, 2.3971595764160156, 2.7176923751831055, 3.038224935531616, 3.358757495880127, 3.6792900562286377, 3.9998226165771484, 4.320355415344238, 4.640888214111328, 4.96142053604126, 5.28195333480835, 5.602485656738281, 5.923018455505371, 6.243551254272461, 6.564083576202393, 6.884616374969482, 7.205148696899414, 7.525681495666504, 7.846214294433594, 8.166747093200684, 8.487279891967773, 8.807812690734863, 9.128345489501953, 9.448877334594727, 9.769410133361816, 10.089942932128906, 10.410475730895996, 10.731008529663086, 11.05154037475586]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 8.0, 10.0, 12.0, 21.0, 30.0, 50.0, 84.0, 104.0, 164.0, 229.0, 383.0, 563.0, 849.0, 1345.0, 2115.0, 3398.0, 5708.0, 9424.0, 16976.0, 31351.0, 61446.0, 127985.0, 280279.0, 598047.0, 1006224.0, 980716.0, 563688.0, 262340.0, 118864.0, 56039.0, 28789.0, 15238.0, 8478.0, 4958.0, 2971.0, 1809.0, 1201.0, 747.0, 531.0, 362.0, 224.0, 152.0, 124.0, 72.0, 54.0, 38.0, 36.0, 17.0, 12.0, 9.0, 9.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-14.5546875, -14.08447265625, -13.6142578125, -13.14404296875, -12.673828125, -12.20361328125, -11.7333984375, -11.26318359375, -10.79296875, -10.32275390625, -9.8525390625, -9.38232421875, -8.912109375, -8.44189453125, -7.9716796875, -7.50146484375, -7.03125, -6.56103515625, -6.0908203125, -5.62060546875, -5.150390625, -4.68017578125, -4.2099609375, -3.73974609375, -3.26953125, -2.79931640625, -2.3291015625, -1.85888671875, -1.388671875, -0.91845703125, -0.4482421875, 0.02197265625, 0.4921875, 0.96240234375, 1.4326171875, 1.90283203125, 2.373046875, 2.84326171875, 3.3134765625, 3.78369140625, 4.25390625, 4.72412109375, 5.1943359375, 5.66455078125, 6.134765625, 6.60498046875, 7.0751953125, 7.54541015625, 8.015625, 8.48583984375, 8.9560546875, 9.42626953125, 9.896484375, 10.36669921875, 10.8369140625, 11.30712890625, 11.77734375, 12.24755859375, 12.7177734375, 13.18798828125, 13.658203125, 14.12841796875, 14.5986328125, 15.06884765625, 15.5390625]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 6.0, 8.0, 8.0, 14.0, 9.0, 16.0, 19.0, 15.0, 18.0, 13.0, 29.0, 38.0, 37.0, 30.0, 33.0, 35.0, 48.0, 40.0, 56.0, 54.0, 49.0, 33.0, 41.0, 39.0, 44.0, 38.0, 37.0, 31.0, 22.0, 28.0, 20.0, 15.0, 14.0, 9.0, 13.0, 14.0, 6.0, 8.0, 4.0, 4.0, 0.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.2109375, -8.928466796875, -8.64599609375, -8.363525390625, -8.0810546875, -7.798583984375, -7.51611328125, -7.233642578125, -6.951171875, -6.668701171875, -6.38623046875, -6.103759765625, -5.8212890625, -5.538818359375, -5.25634765625, -4.973876953125, -4.69140625, -4.408935546875, -4.12646484375, -3.843994140625, -3.5615234375, -3.279052734375, -2.99658203125, -2.714111328125, -2.431640625, -2.149169921875, -1.86669921875, -1.584228515625, -1.3017578125, -1.019287109375, -0.73681640625, -0.454345703125, -0.171875, 0.110595703125, 0.39306640625, 0.675537109375, 0.9580078125, 1.240478515625, 1.52294921875, 1.805419921875, 2.087890625, 2.370361328125, 2.65283203125, 2.935302734375, 3.2177734375, 3.500244140625, 3.78271484375, 4.065185546875, 4.34765625, 4.630126953125, 4.91259765625, 5.195068359375, 5.4775390625, 5.760009765625, 6.04248046875, 6.324951171875, 6.607421875, 6.889892578125, 7.17236328125, 7.454833984375, 7.7373046875, 8.019775390625, 8.30224609375, 8.584716796875, 8.8671875]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 6.0, 5.0, 8.0, 23.0, 21.0, 28.0, 42.0, 63.0, 98.0, 136.0, 228.0, 287.0, 387.0, 654.0, 969.0, 1512.0, 2106.0, 3286.0, 4928.0, 7638.0, 12014.0, 19088.0, 30690.0, 50803.0, 83565.0, 141096.0, 238625.0, 394770.0, 605324.0, 758746.0, 672638.0, 459994.0, 282319.0, 167193.0, 98806.0, 58852.0, 35864.0, 22115.0, 13829.0, 8836.0, 5646.0, 3624.0, 2397.0, 1645.0, 1041.0, 718.0, 507.0, 354.0, 226.0, 180.0, 112.0, 82.0, 60.0, 43.0, 33.0, 10.0, 15.0, 9.0, 4.0, 2.0, 2.0], "bins": [-14.109375, -13.6773681640625, -13.245361328125, -12.8133544921875, -12.38134765625, -11.9493408203125, -11.517333984375, -11.0853271484375, -10.6533203125, -10.2213134765625, -9.789306640625, -9.3572998046875, -8.92529296875, -8.4932861328125, -8.061279296875, -7.6292724609375, -7.197265625, -6.7652587890625, -6.333251953125, -5.9012451171875, -5.46923828125, -5.0372314453125, -4.605224609375, -4.1732177734375, -3.7412109375, -3.3092041015625, -2.877197265625, -2.4451904296875, -2.01318359375, -1.5811767578125, -1.149169921875, -0.7171630859375, -0.28515625, 0.1468505859375, 0.578857421875, 1.0108642578125, 1.44287109375, 1.8748779296875, 2.306884765625, 2.7388916015625, 3.1708984375, 3.6029052734375, 4.034912109375, 4.4669189453125, 4.89892578125, 5.3309326171875, 5.762939453125, 6.1949462890625, 6.626953125, 7.0589599609375, 7.490966796875, 7.9229736328125, 8.35498046875, 8.7869873046875, 9.218994140625, 9.6510009765625, 10.0830078125, 10.5150146484375, 10.947021484375, 11.3790283203125, 11.81103515625, 12.2430419921875, 12.675048828125, 13.1070556640625, 13.5390625]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 4.0, 7.0, 10.0, 8.0, 7.0, 14.0, 16.0, 23.0, 29.0, 31.0, 43.0, 50.0, 68.0, 99.0, 99.0, 139.0, 112.0, 196.0, 223.0, 233.0, 256.0, 257.0, 262.0, 247.0, 244.0, 220.0, 208.0, 204.0, 154.0, 123.0, 97.0, 97.0, 68.0, 48.0, 45.0, 35.0, 17.0, 20.0, 17.0, 12.0, 10.0, 7.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.3671875, -5.20074462890625, -5.0343017578125, -4.86785888671875, -4.701416015625, -4.53497314453125, -4.3685302734375, -4.20208740234375, -4.03564453125, -3.86920166015625, -3.7027587890625, -3.53631591796875, -3.369873046875, -3.20343017578125, -3.0369873046875, -2.87054443359375, -2.7041015625, -2.53765869140625, -2.3712158203125, -2.20477294921875, -2.038330078125, -1.87188720703125, -1.7054443359375, -1.53900146484375, -1.37255859375, -1.20611572265625, -1.0396728515625, -0.87322998046875, -0.706787109375, -0.54034423828125, -0.3739013671875, -0.20745849609375, -0.041015625, 0.12542724609375, 0.2918701171875, 0.45831298828125, 0.624755859375, 0.79119873046875, 0.9576416015625, 1.12408447265625, 1.29052734375, 1.45697021484375, 1.6234130859375, 1.78985595703125, 1.956298828125, 2.12274169921875, 2.2891845703125, 2.45562744140625, 2.6220703125, 2.78851318359375, 2.9549560546875, 3.12139892578125, 3.287841796875, 3.45428466796875, 3.6207275390625, 3.78717041015625, 3.95361328125, 4.12005615234375, 4.2864990234375, 4.45294189453125, 4.619384765625, 4.78582763671875, 4.9522705078125, 5.11871337890625, 5.28515625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 9.0, 2.0, 4.0, 6.0, 11.0, 10.0, 10.0, 10.0, 18.0, 26.0, 32.0, 29.0, 35.0, 46.0, 50.0, 33.0, 57.0, 43.0, 53.0, 58.0, 41.0, 64.0, 53.0, 34.0, 31.0, 34.0, 27.0, 32.0, 25.0, 24.0, 18.0, 19.0, 13.0, 13.0, 7.0, 6.0, 8.0, 4.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.737723350524902, -15.2180757522583, -14.698427200317383, -14.178779602050781, -13.65913200378418, -13.139483451843262, -12.61983585357666, -12.100187301635742, -11.58053970336914, -11.060892105102539, -10.541243553161621, -10.02159595489502, -9.501947402954102, -8.9822998046875, -8.462652206420898, -7.943004131317139, -7.423356056213379, -6.903707981109619, -6.384059906005859, -5.864412307739258, -5.344764232635498, -4.825116157531738, -4.305468559265137, -3.785820484161377, -3.266172409057617, -2.7465243339538574, -2.2268764972686768, -1.7072285413742065, -1.1875805854797363, -0.6679325103759766, -0.1482846736907959, 0.37136316299438477, 0.8910102844238281, 1.4106582403182983, 1.9303061962127686, 2.449954032897949, 2.969602108001709, 3.4892501831054688, 4.00889778137207, 4.52854585647583, 5.04819393157959, 5.56784200668335, 6.087490081787109, 6.607137680053711, 7.126785755157471, 7.6464338302612305, 8.166081428527832, 8.68572998046875, 9.205377578735352, 9.725025177001953, 10.244673728942871, 10.764321327209473, 11.28396987915039, 11.803617477416992, 12.323265075683594, 12.842912673950195, 13.362561225891113, 13.882208824157715, 14.401857376098633, 14.921504974365234, 15.441152572631836, 15.960801124572754, 16.480449676513672, 17.000097274780273, 17.519744873046875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 4.0, 7.0, 4.0, 5.0, 10.0, 9.0, 14.0, 16.0, 24.0, 22.0, 19.0, 26.0, 34.0, 20.0, 31.0, 28.0, 37.0, 37.0, 28.0, 55.0, 45.0, 47.0, 43.0, 45.0, 36.0, 32.0, 37.0, 41.0, 26.0, 21.0, 23.0, 33.0, 25.0, 28.0, 21.0, 11.0, 14.0, 11.0, 7.0, 11.0, 6.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.929536819458008, -10.570655822753906, -10.211775779724121, -9.852895736694336, -9.494014739990234, -9.135133743286133, -8.776253700256348, -8.417373657226562, -8.058492660522461, -7.699612140655518, -7.340731620788574, -6.981851100921631, -6.6229705810546875, -6.264090061187744, -5.905209541320801, -5.546329021453857, -5.187448501586914, -4.828567981719971, -4.469687461853027, -4.110806941986084, -3.7519264221191406, -3.3930459022521973, -3.034165382385254, -2.6752848625183105, -2.316404342651367, -1.9575238227844238, -1.5986433029174805, -1.239762783050537, -0.8808822631835938, -0.5220017433166504, -0.16312122344970703, 0.19575929641723633, 0.5546388626098633, 0.9135193824768066, 1.27239990234375, 1.6312804222106934, 1.9901609420776367, 2.34904146194458, 2.7079219818115234, 3.066802501678467, 3.42568302154541, 3.7845635414123535, 4.143444061279297, 4.50232458114624, 4.861205101013184, 5.220085620880127, 5.57896614074707, 5.937846660614014, 6.296727180480957, 6.6556077003479, 7.014488220214844, 7.373368740081787, 7.7322492599487305, 8.091129302978516, 8.450010299682617, 8.808891296386719, 9.167771339416504, 9.526651382446289, 9.88553237915039, 10.244413375854492, 10.603293418884277, 10.962173461914062, 11.321054458618164, 11.679935455322266, 12.03881549835205]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 11.0, 12.0, 12.0, 25.0, 27.0, 41.0, 68.0, 99.0, 122.0, 214.0, 324.0, 484.0, 756.0, 1237.0, 2129.0, 3589.0, 6114.0, 10877.0, 19935.0, 35607.0, 62420.0, 104786.0, 157879.0, 190791.0, 169648.0, 117184.0, 71038.0, 40797.0, 22650.0, 12516.0, 7133.0, 3886.0, 2297.0, 1403.0, 920.0, 518.0, 353.0, 219.0, 135.0, 85.0, 69.0, 48.0, 30.0, 22.0, 10.0, 13.0, 8.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.6796875, -9.363525390625, -9.04736328125, -8.731201171875, -8.4150390625, -8.098876953125, -7.78271484375, -7.466552734375, -7.150390625, -6.834228515625, -6.51806640625, -6.201904296875, -5.8857421875, -5.569580078125, -5.25341796875, -4.937255859375, -4.62109375, -4.304931640625, -3.98876953125, -3.672607421875, -3.3564453125, -3.040283203125, -2.72412109375, -2.407958984375, -2.091796875, -1.775634765625, -1.45947265625, -1.143310546875, -0.8271484375, -0.510986328125, -0.19482421875, 0.121337890625, 0.4375, 0.753662109375, 1.06982421875, 1.385986328125, 1.7021484375, 2.018310546875, 2.33447265625, 2.650634765625, 2.966796875, 3.282958984375, 3.59912109375, 3.915283203125, 4.2314453125, 4.547607421875, 4.86376953125, 5.179931640625, 5.49609375, 5.812255859375, 6.12841796875, 6.444580078125, 6.7607421875, 7.076904296875, 7.39306640625, 7.709228515625, 8.025390625, 8.341552734375, 8.65771484375, 8.973876953125, 9.2900390625, 9.606201171875, 9.92236328125, 10.238525390625, 10.5546875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 6.0, 6.0, 11.0, 16.0, 10.0, 14.0, 24.0, 22.0, 22.0, 28.0, 23.0, 32.0, 27.0, 33.0, 41.0, 47.0, 39.0, 52.0, 39.0, 29.0, 41.0, 43.0, 42.0, 45.0, 35.0, 46.0, 33.0, 23.0, 25.0, 20.0, 27.0, 22.0, 19.0, 12.0, 9.0, 7.0, 11.0, 4.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.96875, -11.5711669921875, -11.173583984375, -10.7760009765625, -10.37841796875, -9.9808349609375, -9.583251953125, -9.1856689453125, -8.7880859375, -8.3905029296875, -7.992919921875, -7.5953369140625, -7.19775390625, -6.8001708984375, -6.402587890625, -6.0050048828125, -5.607421875, -5.2098388671875, -4.812255859375, -4.4146728515625, -4.01708984375, -3.6195068359375, -3.221923828125, -2.8243408203125, -2.4267578125, -2.0291748046875, -1.631591796875, -1.2340087890625, -0.83642578125, -0.4388427734375, -0.041259765625, 0.3563232421875, 0.75390625, 1.1514892578125, 1.549072265625, 1.9466552734375, 2.34423828125, 2.7418212890625, 3.139404296875, 3.5369873046875, 3.9345703125, 4.3321533203125, 4.729736328125, 5.1273193359375, 5.52490234375, 5.9224853515625, 6.320068359375, 6.7176513671875, 7.115234375, 7.5128173828125, 7.910400390625, 8.3079833984375, 8.70556640625, 9.1031494140625, 9.500732421875, 9.8983154296875, 10.2958984375, 10.6934814453125, 11.091064453125, 11.4886474609375, 11.88623046875, 12.2838134765625, 12.681396484375, 13.0789794921875, 13.4765625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 7.0, 4.0, 9.0, 25.0, 29.0, 46.0, 57.0, 71.0, 94.0, 147.0, 199.0, 263.0, 397.0, 546.0, 895.0, 1376.0, 2256.0, 3742.0, 6904.0, 13263.0, 27013.0, 59433.0, 130989.0, 251628.0, 269468.0, 148486.0, 67273.0, 30415.0, 14717.0, 7671.0, 4248.0, 2354.0, 1555.0, 939.0, 635.0, 434.0, 272.0, 187.0, 153.0, 118.0, 72.0, 53.0, 37.0, 23.0, 18.0, 9.0, 4.0, 6.0, 5.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-17.078125, -16.5618896484375, -16.045654296875, -15.5294189453125, -15.01318359375, -14.4969482421875, -13.980712890625, -13.4644775390625, -12.9482421875, -12.4320068359375, -11.915771484375, -11.3995361328125, -10.88330078125, -10.3670654296875, -9.850830078125, -9.3345947265625, -8.818359375, -8.3021240234375, -7.785888671875, -7.2696533203125, -6.75341796875, -6.2371826171875, -5.720947265625, -5.2047119140625, -4.6884765625, -4.1722412109375, -3.656005859375, -3.1397705078125, -2.62353515625, -2.1072998046875, -1.591064453125, -1.0748291015625, -0.55859375, -0.0423583984375, 0.473876953125, 0.9901123046875, 1.50634765625, 2.0225830078125, 2.538818359375, 3.0550537109375, 3.5712890625, 4.0875244140625, 4.603759765625, 5.1199951171875, 5.63623046875, 6.1524658203125, 6.668701171875, 7.1849365234375, 7.701171875, 8.2174072265625, 8.733642578125, 9.2498779296875, 9.76611328125, 10.2823486328125, 10.798583984375, 11.3148193359375, 11.8310546875, 12.3472900390625, 12.863525390625, 13.3797607421875, 13.89599609375, 14.4122314453125, 14.928466796875, 15.4447021484375, 15.9609375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 7.0, 2.0, 4.0, 9.0, 10.0, 5.0, 8.0, 17.0, 14.0, 16.0, 18.0, 22.0, 33.0, 36.0, 27.0, 31.0, 26.0, 45.0, 29.0, 29.0, 49.0, 28.0, 44.0, 44.0, 42.0, 42.0, 34.0, 47.0, 27.0, 26.0, 39.0, 27.0, 23.0, 24.0, 19.0, 16.0, 17.0, 24.0, 11.0, 6.0, 5.0, 3.0, 3.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.1953125, -6.96746826171875, -6.7396240234375, -6.51177978515625, -6.283935546875, -6.05609130859375, -5.8282470703125, -5.60040283203125, -5.37255859375, -5.14471435546875, -4.9168701171875, -4.68902587890625, -4.461181640625, -4.23333740234375, -4.0054931640625, -3.77764892578125, -3.5498046875, -3.32196044921875, -3.0941162109375, -2.86627197265625, -2.638427734375, -2.41058349609375, -2.1827392578125, -1.95489501953125, -1.72705078125, -1.49920654296875, -1.2713623046875, -1.04351806640625, -0.815673828125, -0.58782958984375, -0.3599853515625, -0.13214111328125, 0.095703125, 0.32354736328125, 0.5513916015625, 0.77923583984375, 1.007080078125, 1.23492431640625, 1.4627685546875, 1.69061279296875, 1.91845703125, 2.14630126953125, 2.3741455078125, 2.60198974609375, 2.829833984375, 3.05767822265625, 3.2855224609375, 3.51336669921875, 3.7412109375, 3.96905517578125, 4.1968994140625, 4.42474365234375, 4.652587890625, 4.88043212890625, 5.1082763671875, 5.33612060546875, 5.56396484375, 5.79180908203125, 6.0196533203125, 6.24749755859375, 6.475341796875, 6.70318603515625, 6.9310302734375, 7.15887451171875, 7.38671875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 9.0, 15.0, 23.0, 33.0, 61.0, 87.0, 113.0, 153.0, 257.0, 370.0, 606.0, 899.0, 1450.0, 2319.0, 3905.0, 6788.0, 12162.0, 22542.0, 42815.0, 84211.0, 159953.0, 250112.0, 211567.0, 117733.0, 60276.0, 31072.0, 16448.0, 9134.0, 5256.0, 3073.0, 1831.0, 1219.0, 717.0, 450.0, 304.0, 193.0, 139.0, 65.0, 59.0, 43.0, 29.0, 26.0, 13.0, 6.0, 7.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.8359375, -8.566162109375, -8.29638671875, -8.026611328125, -7.7568359375, -7.487060546875, -7.21728515625, -6.947509765625, -6.677734375, -6.407958984375, -6.13818359375, -5.868408203125, -5.5986328125, -5.328857421875, -5.05908203125, -4.789306640625, -4.51953125, -4.249755859375, -3.97998046875, -3.710205078125, -3.4404296875, -3.170654296875, -2.90087890625, -2.631103515625, -2.361328125, -2.091552734375, -1.82177734375, -1.552001953125, -1.2822265625, -1.012451171875, -0.74267578125, -0.472900390625, -0.203125, 0.066650390625, 0.33642578125, 0.606201171875, 0.8759765625, 1.145751953125, 1.41552734375, 1.685302734375, 1.955078125, 2.224853515625, 2.49462890625, 2.764404296875, 3.0341796875, 3.303955078125, 3.57373046875, 3.843505859375, 4.11328125, 4.383056640625, 4.65283203125, 4.922607421875, 5.1923828125, 5.462158203125, 5.73193359375, 6.001708984375, 6.271484375, 6.541259765625, 6.81103515625, 7.080810546875, 7.3505859375, 7.620361328125, 7.89013671875, 8.159912109375, 8.4296875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 6.0, 10.0, 8.0, 11.0, 13.0, 13.0, 8.0, 20.0, 25.0, 28.0, 25.0, 41.0, 52.0, 58.0, 53.0, 56.0, 52.0, 57.0, 45.0, 60.0, 44.0, 51.0, 43.0, 27.0, 25.0, 30.0, 22.0, 30.0, 13.0, 8.0, 10.0, 7.0, 9.0, 8.0, 3.0, 8.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003669261932373047, -0.0003559477627277374, -0.00034496933221817017, -0.0003339909017086029, -0.00032301247119903564, -0.0003120340406894684, -0.0003010556101799011, -0.00029007717967033386, -0.0002790987491607666, -0.00026812031865119934, -0.0002571418881416321, -0.0002461634576320648, -0.00023518502712249756, -0.0002242065966129303, -0.00021322816610336304, -0.00020224973559379578, -0.00019127130508422852, -0.00018029287457466125, -0.000169314444065094, -0.00015833601355552673, -0.00014735758304595947, -0.0001363791525363922, -0.00012540072202682495, -0.00011442229151725769, -0.00010344386100769043, -9.246543049812317e-05, -8.148699998855591e-05, -7.050856947898865e-05, -5.953013896942139e-05, -4.8551708459854126e-05, -3.7573277950286865e-05, -2.6594847440719604e-05, -1.5616416931152344e-05, -4.637986421585083e-06, 6.340444087982178e-06, 1.731887459754944e-05, 2.82973051071167e-05, 3.927573561668396e-05, 5.025416612625122e-05, 6.123259663581848e-05, 7.221102714538574e-05, 8.3189457654953e-05, 9.416788816452026e-05, 0.00010514631867408752, 0.00011612474918365479, 0.00012710317969322205, 0.0001380816102027893, 0.00014906004071235657, 0.00016003847122192383, 0.0001710169017314911, 0.00018199533224105835, 0.0001929737627506256, 0.00020395219326019287, 0.00021493062376976013, 0.0002259090542793274, 0.00023688748478889465, 0.0002478659152984619, 0.0002588443458080292, 0.00026982277631759644, 0.0002808012068271637, 0.00029177963733673096, 0.0003027580678462982, 0.0003137364983558655, 0.00032471492886543274, 0.000335693359375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 0.0, 4.0, 5.0, 6.0, 12.0, 16.0, 28.0, 43.0, 48.0, 58.0, 98.0, 148.0, 251.0, 345.0, 511.0, 717.0, 1091.0, 1677.0, 2530.0, 3900.0, 6081.0, 9485.0, 14656.0, 22544.0, 35184.0, 54383.0, 81787.0, 115935.0, 146723.0, 152256.0, 127303.0, 92739.0, 62729.0, 40810.0, 26251.0, 16824.0, 10860.0, 7131.0, 4617.0, 2939.0, 2034.0, 1266.0, 783.0, 522.0, 368.0, 289.0, 171.0, 123.0, 93.0, 65.0, 45.0, 23.0, 17.0, 16.0, 8.0, 5.0, 7.0, 3.0, 1.0, 1.0, 2.0], "bins": [-6.7109375, -6.5023193359375, -6.293701171875, -6.0850830078125, -5.87646484375, -5.6678466796875, -5.459228515625, -5.2506103515625, -5.0419921875, -4.8333740234375, -4.624755859375, -4.4161376953125, -4.20751953125, -3.9989013671875, -3.790283203125, -3.5816650390625, -3.373046875, -3.1644287109375, -2.955810546875, -2.7471923828125, -2.53857421875, -2.3299560546875, -2.121337890625, -1.9127197265625, -1.7041015625, -1.4954833984375, -1.286865234375, -1.0782470703125, -0.86962890625, -0.6610107421875, -0.452392578125, -0.2437744140625, -0.03515625, 0.1734619140625, 0.382080078125, 0.5906982421875, 0.79931640625, 1.0079345703125, 1.216552734375, 1.4251708984375, 1.6337890625, 1.8424072265625, 2.051025390625, 2.2596435546875, 2.46826171875, 2.6768798828125, 2.885498046875, 3.0941162109375, 3.302734375, 3.5113525390625, 3.719970703125, 3.9285888671875, 4.13720703125, 4.3458251953125, 4.554443359375, 4.7630615234375, 4.9716796875, 5.1802978515625, 5.388916015625, 5.5975341796875, 5.80615234375, 6.0147705078125, 6.223388671875, 6.4320068359375, 6.640625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 7.0, 6.0, 12.0, 7.0, 20.0, 15.0, 18.0, 33.0, 37.0, 50.0, 49.0, 54.0, 81.0, 74.0, 75.0, 80.0, 71.0, 58.0, 54.0, 51.0, 30.0, 36.0, 23.0, 16.0, 17.0, 4.0, 6.0, 5.0, 5.0, 8.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7265625, -2.624664306640625, -2.52276611328125, -2.420867919921875, -2.3189697265625, -2.217071533203125, -2.11517333984375, -2.013275146484375, -1.911376953125, -1.809478759765625, -1.70758056640625, -1.605682373046875, -1.5037841796875, -1.401885986328125, -1.29998779296875, -1.198089599609375, -1.09619140625, -0.994293212890625, -0.89239501953125, -0.790496826171875, -0.6885986328125, -0.586700439453125, -0.48480224609375, -0.382904052734375, -0.281005859375, -0.179107666015625, -0.07720947265625, 0.024688720703125, 0.1265869140625, 0.228485107421875, 0.33038330078125, 0.432281494140625, 0.5341796875, 0.636077880859375, 0.73797607421875, 0.839874267578125, 0.9417724609375, 1.043670654296875, 1.14556884765625, 1.247467041015625, 1.349365234375, 1.451263427734375, 1.55316162109375, 1.655059814453125, 1.7569580078125, 1.858856201171875, 1.96075439453125, 2.062652587890625, 2.16455078125, 2.266448974609375, 2.36834716796875, 2.470245361328125, 2.5721435546875, 2.674041748046875, 2.77593994140625, 2.877838134765625, 2.979736328125, 3.081634521484375, 3.18353271484375, 3.285430908203125, 3.3873291015625, 3.489227294921875, 3.59112548828125, 3.693023681640625, 3.794921875]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 7.0, 7.0, 7.0, 8.0, 8.0, 16.0, 23.0, 25.0, 33.0, 38.0, 27.0, 43.0, 51.0, 48.0, 40.0, 64.0, 57.0, 57.0, 51.0, 63.0, 53.0, 33.0, 39.0, 21.0, 30.0, 27.0, 26.0, 22.0, 22.0, 15.0, 8.0, 7.0, 8.0, 5.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.555696487426758, -16.001737594604492, -15.44778060913086, -14.89382266998291, -14.339864730834961, -13.785905838012695, -13.231947898864746, -12.677989959716797, -12.124032020568848, -11.570074081420898, -11.01611614227295, -10.462158203125, -9.908199310302734, -9.354242324829102, -8.800283432006836, -8.246325492858887, -7.6923675537109375, -7.138409614562988, -6.584451675415039, -6.030493259429932, -5.476535320281982, -4.922577381134033, -4.368618965148926, -3.8146610260009766, -3.2607030868530273, -2.706745147705078, -2.15278697013855, -1.598828911781311, -1.0448708534240723, -0.49091291427612305, 0.06304526329040527, 0.6170034408569336, 1.1709613800048828, 1.7249194383621216, 2.2788774967193604, 2.8328356742858887, 3.386793613433838, 3.940751552581787, 4.4947099685668945, 5.048667907714844, 5.602625846862793, 6.156583786010742, 6.710541725158691, 7.264500141143799, 7.818458080291748, 8.372415542602539, 8.926374435424805, 9.480332374572754, 10.034290313720703, 10.588248252868652, 11.142206192016602, 11.69616413116455, 12.2501220703125, 12.804080963134766, 13.358038902282715, 13.911996841430664, 14.465954780578613, 15.019912719726562, 15.573870658874512, 16.12782859802246, 16.681787490844727, 17.23574447631836, 17.789703369140625, 18.34366226196289, 18.897619247436523]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 5.0, 7.0, 7.0, 5.0, 9.0, 17.0, 15.0, 12.0, 21.0, 23.0, 29.0, 23.0, 20.0, 33.0, 26.0, 36.0, 37.0, 25.0, 37.0, 47.0, 31.0, 48.0, 48.0, 40.0, 47.0, 27.0, 30.0, 47.0, 30.0, 17.0, 27.0, 20.0, 28.0, 27.0, 24.0, 15.0, 14.0, 9.0, 7.0, 10.0, 6.0, 6.0, 2.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.247703552246094, -9.898707389831543, -9.549710273742676, -9.200714111328125, -8.851716995239258, -8.502720832824707, -8.153724670410156, -7.804727554321289, -7.45573091506958, -7.106734275817871, -6.757737636566162, -6.408740997314453, -6.059744834899902, -5.710747718811035, -5.361751556396484, -5.012754917144775, -4.663758277893066, -4.314761638641357, -3.9657649993896484, -3.6167685985565186, -3.2677719593048096, -2.9187753200531006, -2.5697789192199707, -2.2207822799682617, -1.8717856407165527, -1.5227890014648438, -1.1737924814224243, -0.8247959613800049, -0.4757993221282959, -0.12680268287658691, 0.22219371795654297, 0.571190357208252, 0.9201879501342773, 1.2691845893859863, 1.6181811094284058, 1.9671776294708252, 2.316174268722534, 2.665170907974243, 3.014167308807373, 3.363163948059082, 3.712160587310791, 4.0611572265625, 4.410153865814209, 4.759150505065918, 5.108146667480469, 5.457143783569336, 5.806139945983887, 6.155136585235596, 6.504133224487305, 6.853129863739014, 7.202126502990723, 7.551122665405273, 7.900119781494141, 8.249115943908691, 8.598112106323242, 8.94710922241211, 9.296106338500977, 9.645102500915527, 9.994099617004395, 10.343095779418945, 10.692092895507812, 11.041089057922363, 11.390085220336914, 11.739082336425781, 12.088078498840332]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 8.0, 10.0, 20.0, 19.0, 34.0, 50.0, 74.0, 96.0, 164.0, 219.0, 329.0, 476.0, 666.0, 1045.0, 1485.0, 2261.0, 3399.0, 5284.0, 8337.0, 13116.0, 20766.0, 32776.0, 50739.0, 77192.0, 107672.0, 135619.0, 145180.0, 131824.0, 103735.0, 73095.0, 47753.0, 30643.0, 19375.0, 12319.0, 7819.0, 5022.0, 3309.0, 2133.0, 1519.0, 978.0, 596.0, 438.0, 309.0, 219.0, 122.0, 110.0, 64.0, 41.0, 34.0, 15.0, 12.0, 14.0, 15.0, 8.0, 4.0, 8.0, 2.0], "bins": [-9.953125, -9.6553955078125, -9.357666015625, -9.0599365234375, -8.76220703125, -8.4644775390625, -8.166748046875, -7.8690185546875, -7.5712890625, -7.2735595703125, -6.975830078125, -6.6781005859375, -6.38037109375, -6.0826416015625, -5.784912109375, -5.4871826171875, -5.189453125, -4.8917236328125, -4.593994140625, -4.2962646484375, -3.99853515625, -3.7008056640625, -3.403076171875, -3.1053466796875, -2.8076171875, -2.5098876953125, -2.212158203125, -1.9144287109375, -1.61669921875, -1.3189697265625, -1.021240234375, -0.7235107421875, -0.42578125, -0.1280517578125, 0.169677734375, 0.4674072265625, 0.76513671875, 1.0628662109375, 1.360595703125, 1.6583251953125, 1.9560546875, 2.2537841796875, 2.551513671875, 2.8492431640625, 3.14697265625, 3.4447021484375, 3.742431640625, 4.0401611328125, 4.337890625, 4.6356201171875, 4.933349609375, 5.2310791015625, 5.52880859375, 5.8265380859375, 6.124267578125, 6.4219970703125, 6.7197265625, 7.0174560546875, 7.315185546875, 7.6129150390625, 7.91064453125, 8.2083740234375, 8.506103515625, 8.8038330078125, 9.1015625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 6.0, 2.0, 7.0, 4.0, 4.0, 11.0, 10.0, 13.0, 13.0, 13.0, 16.0, 24.0, 19.0, 20.0, 27.0, 29.0, 43.0, 31.0, 29.0, 37.0, 41.0, 44.0, 32.0, 47.0, 38.0, 44.0, 37.0, 43.0, 31.0, 34.0, 24.0, 30.0, 37.0, 21.0, 18.0, 34.0, 13.0, 17.0, 15.0, 8.0, 4.0, 12.0, 3.0, 5.0, 8.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4609375, -11.095458984375, -10.72998046875, -10.364501953125, -9.9990234375, -9.633544921875, -9.26806640625, -8.902587890625, -8.537109375, -8.171630859375, -7.80615234375, -7.440673828125, -7.0751953125, -6.709716796875, -6.34423828125, -5.978759765625, -5.61328125, -5.247802734375, -4.88232421875, -4.516845703125, -4.1513671875, -3.785888671875, -3.42041015625, -3.054931640625, -2.689453125, -2.323974609375, -1.95849609375, -1.593017578125, -1.2275390625, -0.862060546875, -0.49658203125, -0.131103515625, 0.234375, 0.599853515625, 0.96533203125, 1.330810546875, 1.6962890625, 2.061767578125, 2.42724609375, 2.792724609375, 3.158203125, 3.523681640625, 3.88916015625, 4.254638671875, 4.6201171875, 4.985595703125, 5.35107421875, 5.716552734375, 6.08203125, 6.447509765625, 6.81298828125, 7.178466796875, 7.5439453125, 7.909423828125, 8.27490234375, 8.640380859375, 9.005859375, 9.371337890625, 9.73681640625, 10.102294921875, 10.4677734375, 10.833251953125, 11.19873046875, 11.564208984375, 11.9296875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 1.0, 7.0, 5.0, 15.0, 27.0, 31.0, 45.0, 46.0, 78.0, 101.0, 160.0, 232.0, 348.0, 477.0, 768.0, 1110.0, 1716.0, 2714.0, 4450.0, 7117.0, 12344.0, 20384.0, 34516.0, 58501.0, 93953.0, 138192.0, 169249.0, 163897.0, 126900.0, 84158.0, 51128.0, 30288.0, 17785.0, 10431.0, 6251.0, 3929.0, 2496.0, 1542.0, 1066.0, 690.0, 456.0, 295.0, 198.0, 146.0, 93.0, 81.0, 51.0, 34.0, 24.0, 11.0, 10.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.8203125, -12.405029296875, -11.98974609375, -11.574462890625, -11.1591796875, -10.743896484375, -10.32861328125, -9.913330078125, -9.498046875, -9.082763671875, -8.66748046875, -8.252197265625, -7.8369140625, -7.421630859375, -7.00634765625, -6.591064453125, -6.17578125, -5.760498046875, -5.34521484375, -4.929931640625, -4.5146484375, -4.099365234375, -3.68408203125, -3.268798828125, -2.853515625, -2.438232421875, -2.02294921875, -1.607666015625, -1.1923828125, -0.777099609375, -0.36181640625, 0.053466796875, 0.46875, 0.884033203125, 1.29931640625, 1.714599609375, 2.1298828125, 2.545166015625, 2.96044921875, 3.375732421875, 3.791015625, 4.206298828125, 4.62158203125, 5.036865234375, 5.4521484375, 5.867431640625, 6.28271484375, 6.697998046875, 7.11328125, 7.528564453125, 7.94384765625, 8.359130859375, 8.7744140625, 9.189697265625, 9.60498046875, 10.020263671875, 10.435546875, 10.850830078125, 11.26611328125, 11.681396484375, 12.0966796875, 12.511962890625, 12.92724609375, 13.342529296875, 13.7578125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 6.0, 2.0, 7.0, 5.0, 7.0, 9.0, 13.0, 10.0, 13.0, 9.0, 22.0, 21.0, 20.0, 25.0, 24.0, 28.0, 28.0, 37.0, 33.0, 30.0, 35.0, 37.0, 41.0, 44.0, 37.0, 44.0, 36.0, 40.0, 47.0, 30.0, 28.0, 32.0, 29.0, 26.0, 19.0, 24.0, 14.0, 14.0, 11.0, 14.0, 10.0, 8.0, 9.0, 7.0, 4.0, 6.0, 3.0, 7.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-8.4609375, -8.2200927734375, -7.979248046875, -7.7384033203125, -7.49755859375, -7.2567138671875, -7.015869140625, -6.7750244140625, -6.5341796875, -6.2933349609375, -6.052490234375, -5.8116455078125, -5.57080078125, -5.3299560546875, -5.089111328125, -4.8482666015625, -4.607421875, -4.3665771484375, -4.125732421875, -3.8848876953125, -3.64404296875, -3.4031982421875, -3.162353515625, -2.9215087890625, -2.6806640625, -2.4398193359375, -2.198974609375, -1.9581298828125, -1.71728515625, -1.4764404296875, -1.235595703125, -0.9947509765625, -0.75390625, -0.5130615234375, -0.272216796875, -0.0313720703125, 0.20947265625, 0.4503173828125, 0.691162109375, 0.9320068359375, 1.1728515625, 1.4136962890625, 1.654541015625, 1.8953857421875, 2.13623046875, 2.3770751953125, 2.617919921875, 2.8587646484375, 3.099609375, 3.3404541015625, 3.581298828125, 3.8221435546875, 4.06298828125, 4.3038330078125, 4.544677734375, 4.7855224609375, 5.0263671875, 5.2672119140625, 5.508056640625, 5.7489013671875, 5.98974609375, 6.2305908203125, 6.471435546875, 6.7122802734375, 6.953125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 8.0, 2.0, 8.0, 10.0, 17.0, 22.0, 26.0, 42.0, 57.0, 87.0, 101.0, 172.0, 205.0, 399.0, 543.0, 831.0, 1358.0, 2066.0, 3471.0, 6099.0, 11566.0, 24178.0, 55334.0, 134284.0, 267148.0, 277911.0, 146796.0, 60966.0, 25854.0, 12401.0, 6531.0, 3805.0, 2380.0, 1369.0, 834.0, 570.0, 330.0, 242.0, 191.0, 121.0, 70.0, 49.0, 28.0, 22.0, 17.0, 9.0, 6.0, 8.0, 9.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.09375, -11.7164306640625, -11.339111328125, -10.9617919921875, -10.58447265625, -10.2071533203125, -9.829833984375, -9.4525146484375, -9.0751953125, -8.6978759765625, -8.320556640625, -7.9432373046875, -7.56591796875, -7.1885986328125, -6.811279296875, -6.4339599609375, -6.056640625, -5.6793212890625, -5.302001953125, -4.9246826171875, -4.54736328125, -4.1700439453125, -3.792724609375, -3.4154052734375, -3.0380859375, -2.6607666015625, -2.283447265625, -1.9061279296875, -1.52880859375, -1.1514892578125, -0.774169921875, -0.3968505859375, -0.01953125, 0.3577880859375, 0.735107421875, 1.1124267578125, 1.48974609375, 1.8670654296875, 2.244384765625, 2.6217041015625, 2.9990234375, 3.3763427734375, 3.753662109375, 4.1309814453125, 4.50830078125, 4.8856201171875, 5.262939453125, 5.6402587890625, 6.017578125, 6.3948974609375, 6.772216796875, 7.1495361328125, 7.52685546875, 7.9041748046875, 8.281494140625, 8.6588134765625, 9.0361328125, 9.4134521484375, 9.790771484375, 10.1680908203125, 10.54541015625, 10.9227294921875, 11.300048828125, 11.6773681640625, 12.0546875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 6.0, 4.0, 11.0, 11.0, 27.0, 37.0, 73.0, 114.0, 150.0, 163.0, 127.0, 91.0, 67.0, 37.0, 21.0, 19.0, 11.0, 13.0, 4.0, 7.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001922607421875, -0.0018632113933563232, -0.0018038153648376465, -0.0017444193363189697, -0.001685023307800293, -0.0016256272792816162, -0.0015662312507629395, -0.0015068352222442627, -0.001447439193725586, -0.0013880431652069092, -0.0013286471366882324, -0.0012692511081695557, -0.001209855079650879, -0.0011504590511322021, -0.0010910630226135254, -0.0010316669940948486, -0.0009722709655761719, -0.0009128749370574951, -0.0008534789085388184, -0.0007940828800201416, -0.0007346868515014648, -0.0006752908229827881, -0.0006158947944641113, -0.0005564987659454346, -0.0004971027374267578, -0.00043770670890808105, -0.0003783106803894043, -0.00031891465187072754, -0.0002595186233520508, -0.00020012259483337402, -0.00014072656631469727, -8.133053779602051e-05, -2.193450927734375e-05, 3.746151924133301e-05, 9.685754776000977e-05, 0.00015625357627868652, 0.00021564960479736328, 0.00027504563331604004, 0.0003344416618347168, 0.00039383769035339355, 0.0004532337188720703, 0.0005126297473907471, 0.0005720257759094238, 0.0006314218044281006, 0.0006908178329467773, 0.0007502138614654541, 0.0008096098899841309, 0.0008690059185028076, 0.0009284019470214844, 0.0009877979755401611, 0.0010471940040588379, 0.0011065900325775146, 0.0011659860610961914, 0.0012253820896148682, 0.001284778118133545, 0.0013441741466522217, 0.0014035701751708984, 0.0014629662036895752, 0.001522362232208252, 0.0015817582607269287, 0.0016411542892456055, 0.0017005503177642822, 0.001759946346282959, 0.0018193423748016357, 0.0018787384033203125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 11.0, 12.0, 22.0, 20.0, 40.0, 83.0, 116.0, 169.0, 267.0, 377.0, 586.0, 966.0, 1442.0, 2272.0, 3472.0, 5558.0, 9366.0, 16246.0, 30954.0, 63120.0, 129424.0, 220829.0, 240451.0, 157999.0, 78078.0, 38363.0, 19617.0, 10934.0, 6535.0, 3902.0, 2570.0, 1605.0, 1032.0, 747.0, 442.0, 328.0, 198.0, 148.0, 89.0, 60.0, 31.0, 31.0, 21.0, 8.0, 3.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.515625, -9.189208984375, -8.86279296875, -8.536376953125, -8.2099609375, -7.883544921875, -7.55712890625, -7.230712890625, -6.904296875, -6.577880859375, -6.25146484375, -5.925048828125, -5.5986328125, -5.272216796875, -4.94580078125, -4.619384765625, -4.29296875, -3.966552734375, -3.64013671875, -3.313720703125, -2.9873046875, -2.660888671875, -2.33447265625, -2.008056640625, -1.681640625, -1.355224609375, -1.02880859375, -0.702392578125, -0.3759765625, -0.049560546875, 0.27685546875, 0.603271484375, 0.9296875, 1.256103515625, 1.58251953125, 1.908935546875, 2.2353515625, 2.561767578125, 2.88818359375, 3.214599609375, 3.541015625, 3.867431640625, 4.19384765625, 4.520263671875, 4.8466796875, 5.173095703125, 5.49951171875, 5.825927734375, 6.15234375, 6.478759765625, 6.80517578125, 7.131591796875, 7.4580078125, 7.784423828125, 8.11083984375, 8.437255859375, 8.763671875, 9.090087890625, 9.41650390625, 9.742919921875, 10.0693359375, 10.395751953125, 10.72216796875, 11.048583984375, 11.375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 4.0, 2.0, 5.0, 6.0, 9.0, 14.0, 12.0, 27.0, 17.0, 30.0, 20.0, 43.0, 63.0, 54.0, 68.0, 73.0, 71.0, 75.0, 90.0, 61.0, 54.0, 38.0, 39.0, 29.0, 13.0, 27.0, 13.0, 5.0, 6.0, 7.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.171875, -3.070404052734375, -2.96893310546875, -2.867462158203125, -2.7659912109375, -2.664520263671875, -2.56304931640625, -2.461578369140625, -2.360107421875, -2.258636474609375, -2.15716552734375, -2.055694580078125, -1.9542236328125, -1.852752685546875, -1.75128173828125, -1.649810791015625, -1.54833984375, -1.446868896484375, -1.34539794921875, -1.243927001953125, -1.1424560546875, -1.040985107421875, -0.93951416015625, -0.838043212890625, -0.736572265625, -0.635101318359375, -0.53363037109375, -0.432159423828125, -0.3306884765625, -0.229217529296875, -0.12774658203125, -0.026275634765625, 0.0751953125, 0.176666259765625, 0.27813720703125, 0.379608154296875, 0.4810791015625, 0.582550048828125, 0.68402099609375, 0.785491943359375, 0.886962890625, 0.988433837890625, 1.08990478515625, 1.191375732421875, 1.2928466796875, 1.394317626953125, 1.49578857421875, 1.597259521484375, 1.69873046875, 1.800201416015625, 1.90167236328125, 2.003143310546875, 2.1046142578125, 2.206085205078125, 2.30755615234375, 2.409027099609375, 2.510498046875, 2.611968994140625, 2.71343994140625, 2.814910888671875, 2.9163818359375, 3.017852783203125, 3.11932373046875, 3.220794677734375, 3.322265625]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 5.0, 3.0, 10.0, 8.0, 15.0, 14.0, 15.0, 20.0, 38.0, 23.0, 31.0, 45.0, 37.0, 58.0, 46.0, 42.0, 53.0, 55.0, 67.0, 62.0, 52.0, 42.0, 33.0, 32.0, 21.0, 34.0, 23.0, 24.0, 25.0, 18.0, 13.0, 6.0, 7.0, 3.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.171552658081055, -17.60867691040039, -17.045801162719727, -16.48292350769043, -15.920047760009766, -15.357172012329102, -14.794296264648438, -14.231420516967773, -13.668543815612793, -13.105668067932129, -12.542791366577148, -11.979915618896484, -11.41703987121582, -10.85416316986084, -10.291287422180176, -9.728410720825195, -9.165534973144531, -8.602659225463867, -8.039782524108887, -7.476906776428223, -6.9140305519104, -6.351154327392578, -5.788278579711914, -5.225402355194092, -4.6625261306762695, -4.099649906158447, -3.536773920059204, -2.973897933959961, -2.4110217094421387, -1.8481454849243164, -1.2852694988250732, -0.7223935127258301, -0.159515380859375, 0.4033607244491577, 0.9662368297576904, 1.5291129350662231, 2.091989040374756, 2.654865264892578, 3.2177412509918213, 3.7806172370910645, 4.343493461608887, 4.906369686126709, 5.469245910644531, 6.032121658325195, 6.594997882843018, 7.15787410736084, 7.720749855041504, 8.283626556396484, 8.846502304077148, 9.409378051757812, 9.972254753112793, 10.535130500793457, 11.098007202148438, 11.660882949829102, 12.223758697509766, 12.78663444519043, 13.34951114654541, 13.912386894226074, 14.475263595581055, 15.038139343261719, 15.601015090942383, 16.163890838623047, 16.726768493652344, 17.289644241333008, 17.852519989013672]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 5.0, 4.0, 6.0, 6.0, 10.0, 8.0, 14.0, 18.0, 25.0, 21.0, 19.0, 30.0, 29.0, 28.0, 27.0, 31.0, 34.0, 32.0, 34.0, 27.0, 45.0, 48.0, 28.0, 45.0, 41.0, 40.0, 30.0, 50.0, 29.0, 42.0, 23.0, 22.0, 19.0, 15.0, 18.0, 14.0, 17.0, 10.0, 19.0, 13.0, 11.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.908498764038086, -11.512176513671875, -11.115854263305664, -10.719532012939453, -10.323209762573242, -9.926887512207031, -9.53056526184082, -9.13424301147461, -8.737920761108398, -8.341598510742188, -7.945276260375977, -7.548954010009766, -7.152631759643555, -6.756309509277344, -6.359987258911133, -5.963665008544922, -5.567342758178711, -5.1710205078125, -4.774698257446289, -4.378376007080078, -3.982053756713867, -3.5857315063476562, -3.1894092559814453, -2.7930870056152344, -2.3967647552490234, -2.0004425048828125, -1.6041202545166016, -1.2077980041503906, -0.8114757537841797, -0.41515350341796875, -0.018831253051757812, 0.3774909973144531, 0.7738142013549805, 1.1701364517211914, 1.5664587020874023, 1.9627809524536133, 2.359103202819824, 2.755425453186035, 3.151747703552246, 3.548069953918457, 3.944392204284668, 4.340714454650879, 4.73703670501709, 5.133358955383301, 5.529681205749512, 5.926003456115723, 6.322325706481934, 6.7186479568481445, 7.1149702072143555, 7.511292457580566, 7.907614707946777, 8.303936958312988, 8.7002592086792, 9.09658145904541, 9.492903709411621, 9.889225959777832, 10.285548210144043, 10.681870460510254, 11.078192710876465, 11.474514961242676, 11.870837211608887, 12.267159461975098, 12.663481712341309, 13.05980396270752, 13.45612621307373]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 4.0, 7.0, 7.0, 14.0, 25.0, 30.0, 55.0, 68.0, 155.0, 196.0, 294.0, 429.0, 713.0, 1069.0, 1683.0, 2682.0, 4394.0, 7126.0, 12801.0, 22412.0, 41338.0, 80805.0, 164102.0, 343773.0, 683686.0, 1000824.0, 865037.0, 490337.0, 234620.0, 113411.0, 56122.0, 28498.0, 15488.0, 8759.0, 5179.0, 2945.0, 1799.0, 1182.0, 697.0, 461.0, 339.0, 237.0, 143.0, 112.0, 67.0, 51.0, 41.0, 33.0, 15.0, 5.0, 6.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.125, -16.529052734375, -15.93310546875, -15.337158203125, -14.7412109375, -14.145263671875, -13.54931640625, -12.953369140625, -12.357421875, -11.761474609375, -11.16552734375, -10.569580078125, -9.9736328125, -9.377685546875, -8.78173828125, -8.185791015625, -7.58984375, -6.993896484375, -6.39794921875, -5.802001953125, -5.2060546875, -4.610107421875, -4.01416015625, -3.418212890625, -2.822265625, -2.226318359375, -1.63037109375, -1.034423828125, -0.4384765625, 0.157470703125, 0.75341796875, 1.349365234375, 1.9453125, 2.541259765625, 3.13720703125, 3.733154296875, 4.3291015625, 4.925048828125, 5.52099609375, 6.116943359375, 6.712890625, 7.308837890625, 7.90478515625, 8.500732421875, 9.0966796875, 9.692626953125, 10.28857421875, 10.884521484375, 11.48046875, 12.076416015625, 12.67236328125, 13.268310546875, 13.8642578125, 14.460205078125, 15.05615234375, 15.652099609375, 16.248046875, 16.843994140625, 17.43994140625, 18.035888671875, 18.6318359375, 19.227783203125, 19.82373046875, 20.419677734375, 21.015625]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 11.0, 9.0, 8.0, 3.0, 12.0, 9.0, 15.0, 19.0, 21.0, 19.0, 26.0, 19.0, 28.0, 20.0, 20.0, 34.0, 23.0, 31.0, 28.0, 34.0, 31.0, 25.0, 46.0, 35.0, 36.0, 45.0, 41.0, 31.0, 30.0, 30.0, 25.0, 32.0, 29.0, 19.0, 22.0, 10.0, 17.0, 19.0, 12.0, 11.0, 15.0, 10.0, 15.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 3.0], "bins": [-11.5, -11.157958984375, -10.81591796875, -10.473876953125, -10.1318359375, -9.789794921875, -9.44775390625, -9.105712890625, -8.763671875, -8.421630859375, -8.07958984375, -7.737548828125, -7.3955078125, -7.053466796875, -6.71142578125, -6.369384765625, -6.02734375, -5.685302734375, -5.34326171875, -5.001220703125, -4.6591796875, -4.317138671875, -3.97509765625, -3.633056640625, -3.291015625, -2.948974609375, -2.60693359375, -2.264892578125, -1.9228515625, -1.580810546875, -1.23876953125, -0.896728515625, -0.5546875, -0.212646484375, 0.12939453125, 0.471435546875, 0.8134765625, 1.155517578125, 1.49755859375, 1.839599609375, 2.181640625, 2.523681640625, 2.86572265625, 3.207763671875, 3.5498046875, 3.891845703125, 4.23388671875, 4.575927734375, 4.91796875, 5.260009765625, 5.60205078125, 5.944091796875, 6.2861328125, 6.628173828125, 6.97021484375, 7.312255859375, 7.654296875, 7.996337890625, 8.33837890625, 8.680419921875, 9.0224609375, 9.364501953125, 9.70654296875, 10.048583984375, 10.390625]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 8.0, 16.0, 19.0, 25.0, 38.0, 61.0, 86.0, 112.0, 156.0, 236.0, 371.0, 517.0, 733.0, 1106.0, 1642.0, 2596.0, 4040.0, 6301.0, 10265.0, 17178.0, 28939.0, 52278.0, 95136.0, 182114.0, 351225.0, 648021.0, 938282.0, 819632.0, 482482.0, 253379.0, 131293.0, 69913.0, 38614.0, 22114.0, 13019.0, 7988.0, 4921.0, 3176.0, 2064.0, 1361.0, 911.0, 613.0, 405.0, 289.0, 206.0, 119.0, 80.0, 67.0, 42.0, 35.0, 21.0, 17.0, 11.0, 6.0, 6.0, 1.0, 3.0, 2.0, 2.0], "bins": [-24.625, -23.849365234375, -23.07373046875, -22.298095703125, -21.5224609375, -20.746826171875, -19.97119140625, -19.195556640625, -18.419921875, -17.644287109375, -16.86865234375, -16.093017578125, -15.3173828125, -14.541748046875, -13.76611328125, -12.990478515625, -12.21484375, -11.439208984375, -10.66357421875, -9.887939453125, -9.1123046875, -8.336669921875, -7.56103515625, -6.785400390625, -6.009765625, -5.234130859375, -4.45849609375, -3.682861328125, -2.9072265625, -2.131591796875, -1.35595703125, -0.580322265625, 0.1953125, 0.970947265625, 1.74658203125, 2.522216796875, 3.2978515625, 4.073486328125, 4.84912109375, 5.624755859375, 6.400390625, 7.176025390625, 7.95166015625, 8.727294921875, 9.5029296875, 10.278564453125, 11.05419921875, 11.829833984375, 12.60546875, 13.381103515625, 14.15673828125, 14.932373046875, 15.7080078125, 16.483642578125, 17.25927734375, 18.034912109375, 18.810546875, 19.586181640625, 20.36181640625, 21.137451171875, 21.9130859375, 22.688720703125, 23.46435546875, 24.239990234375, 25.015625]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 4.0, 9.0, 9.0, 10.0, 5.0, 13.0, 17.0, 23.0, 42.0, 30.0, 39.0, 47.0, 62.0, 78.0, 89.0, 108.0, 121.0, 157.0, 196.0, 211.0, 253.0, 279.0, 273.0, 301.0, 238.0, 211.0, 212.0, 201.0, 162.0, 137.0, 102.0, 72.0, 87.0, 60.0, 35.0, 33.0, 26.0, 25.0, 32.0, 18.0, 10.0, 9.0, 8.0, 7.0, 4.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.6015625, -7.3621826171875, -7.122802734375, -6.8834228515625, -6.64404296875, -6.4046630859375, -6.165283203125, -5.9259033203125, -5.6865234375, -5.4471435546875, -5.207763671875, -4.9683837890625, -4.72900390625, -4.4896240234375, -4.250244140625, -4.0108642578125, -3.771484375, -3.5321044921875, -3.292724609375, -3.0533447265625, -2.81396484375, -2.5745849609375, -2.335205078125, -2.0958251953125, -1.8564453125, -1.6170654296875, -1.377685546875, -1.1383056640625, -0.89892578125, -0.6595458984375, -0.420166015625, -0.1807861328125, 0.05859375, 0.2979736328125, 0.537353515625, 0.7767333984375, 1.01611328125, 1.2554931640625, 1.494873046875, 1.7342529296875, 1.9736328125, 2.2130126953125, 2.452392578125, 2.6917724609375, 2.93115234375, 3.1705322265625, 3.409912109375, 3.6492919921875, 3.888671875, 4.1280517578125, 4.367431640625, 4.6068115234375, 4.84619140625, 5.0855712890625, 5.324951171875, 5.5643310546875, 5.8037109375, 6.0430908203125, 6.282470703125, 6.5218505859375, 6.76123046875, 7.0006103515625, 7.239990234375, 7.4793701171875, 7.71875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 3.0, 6.0, 4.0, 6.0, 16.0, 5.0, 12.0, 17.0, 8.0, 21.0, 25.0, 32.0, 37.0, 31.0, 33.0, 53.0, 46.0, 44.0, 62.0, 56.0, 46.0, 66.0, 45.0, 43.0, 41.0, 34.0, 37.0, 31.0, 19.0, 26.0, 23.0, 16.0, 14.0, 9.0, 4.0, 6.0, 3.0, 3.0, 6.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-26.721359252929688, -25.900625228881836, -25.079891204833984, -24.259157180786133, -23.43842315673828, -22.617687225341797, -21.796953201293945, -20.976219177246094, -20.155485153198242, -19.33475112915039, -18.51401710510254, -17.693283081054688, -16.872547149658203, -16.051815032958984, -15.2310791015625, -14.410345077514648, -13.589611053466797, -12.768877029418945, -11.948143005371094, -11.127408027648926, -10.306674003601074, -9.485939979553223, -8.665205001831055, -7.844470977783203, -7.023736953735352, -6.2030029296875, -5.38226842880249, -4.5615339279174805, -3.740799903869629, -2.9200658798217773, -2.0993313789367676, -1.2785968780517578, -0.45786285400390625, 0.3628714084625244, 1.183605670928955, 2.0043399333953857, 2.8250741958618164, 3.645808219909668, 4.466542720794678, 5.2872772216796875, 6.108011245727539, 6.928745269775391, 7.7494797706604, 8.57021427154541, 9.390948295593262, 10.211682319641113, 11.032417297363281, 11.853151321411133, 12.673885345458984, 13.494619369506836, 14.315353393554688, 15.136088371276855, 15.956822395324707, 16.777557373046875, 17.598291397094727, 18.419025421142578, 19.23975944519043, 20.06049346923828, 20.881227493286133, 21.701961517333984, 22.52269744873047, 23.343429565429688, 24.164165496826172, 24.984899520874023, 25.805633544921875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 7.0, 12.0, 12.0, 14.0, 14.0, 10.0, 18.0, 18.0, 21.0, 27.0, 21.0, 37.0, 29.0, 38.0, 33.0, 41.0, 41.0, 40.0, 47.0, 36.0, 26.0, 47.0, 37.0, 35.0, 41.0, 32.0, 29.0, 31.0, 26.0, 31.0, 22.0, 13.0, 24.0, 14.0, 16.0, 12.0, 5.0, 10.0, 10.0, 10.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-17.098608016967773, -16.550521850585938, -16.002437591552734, -15.454351425170898, -14.906265258789062, -14.358179092407227, -13.810093879699707, -13.262008666992188, -12.713922500610352, -12.165836334228516, -11.617751121520996, -11.069665908813477, -10.52157974243164, -9.973493576049805, -9.425408363342285, -8.877323150634766, -8.32923698425293, -7.781151294708252, -7.233065605163574, -6.6849799156188965, -6.136894226074219, -5.588808536529541, -5.040722846984863, -4.4926371574401855, -3.944551467895508, -3.39646577835083, -2.8483800888061523, -2.3002943992614746, -1.7522087097167969, -1.2041230201721191, -0.6560373306274414, -0.10795164108276367, 0.44013214111328125, 0.988217830657959, 1.5363035202026367, 2.0843892097473145, 2.632474899291992, 3.18056058883667, 3.7286462783813477, 4.276731967926025, 4.824817657470703, 5.372903347015381, 5.920989036560059, 6.469074726104736, 7.017160415649414, 7.565246105194092, 8.11333179473877, 8.661417007446289, 9.209503173828125, 9.757589340209961, 10.30567455291748, 10.853759765625, 11.401845932006836, 11.949932098388672, 12.498017311096191, 13.046102523803711, 13.594188690185547, 14.142274856567383, 14.690360069274902, 15.238445281982422, 15.786531448364258, 16.334617614746094, 16.882701873779297, 17.430788040161133, 17.97887420654297]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 10.0, 14.0, 25.0, 26.0, 39.0, 71.0, 105.0, 154.0, 259.0, 389.0, 604.0, 976.0, 1442.0, 2207.0, 3323.0, 5461.0, 8373.0, 14036.0, 22228.0, 35270.0, 56033.0, 86307.0, 122638.0, 152794.0, 155249.0, 128102.0, 90629.0, 59992.0, 38055.0, 23512.0, 14734.0, 9241.0, 5808.0, 3751.0, 2413.0, 1525.0, 943.0, 612.0, 405.0, 284.0, 174.0, 112.0, 89.0, 61.0, 41.0, 15.0, 14.0, 5.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-11.6953125, -11.3416748046875, -10.988037109375, -10.6343994140625, -10.28076171875, -9.9271240234375, -9.573486328125, -9.2198486328125, -8.8662109375, -8.5125732421875, -8.158935546875, -7.8052978515625, -7.45166015625, -7.0980224609375, -6.744384765625, -6.3907470703125, -6.037109375, -5.6834716796875, -5.329833984375, -4.9761962890625, -4.62255859375, -4.2689208984375, -3.915283203125, -3.5616455078125, -3.2080078125, -2.8543701171875, -2.500732421875, -2.1470947265625, -1.79345703125, -1.4398193359375, -1.086181640625, -0.7325439453125, -0.37890625, -0.0252685546875, 0.328369140625, 0.6820068359375, 1.03564453125, 1.3892822265625, 1.742919921875, 2.0965576171875, 2.4501953125, 2.8038330078125, 3.157470703125, 3.5111083984375, 3.86474609375, 4.2183837890625, 4.572021484375, 4.9256591796875, 5.279296875, 5.6329345703125, 5.986572265625, 6.3402099609375, 6.69384765625, 7.0474853515625, 7.401123046875, 7.7547607421875, 8.1083984375, 8.4620361328125, 8.815673828125, 9.1693115234375, 9.52294921875, 9.8765869140625, 10.230224609375, 10.5838623046875, 10.9375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 3.0, 5.0, 10.0, 11.0, 15.0, 11.0, 8.0, 13.0, 27.0, 22.0, 30.0, 27.0, 35.0, 49.0, 35.0, 36.0, 40.0, 41.0, 48.0, 40.0, 40.0, 47.0, 40.0, 36.0, 44.0, 29.0, 43.0, 37.0, 26.0, 20.0, 25.0, 10.0, 26.0, 11.0, 13.0, 12.0, 9.0, 11.0, 4.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-20.671875, -20.0234375, -19.375, -18.7265625, -18.078125, -17.4296875, -16.78125, -16.1328125, -15.484375, -14.8359375, -14.1875, -13.5390625, -12.890625, -12.2421875, -11.59375, -10.9453125, -10.296875, -9.6484375, -9.0, -8.3515625, -7.703125, -7.0546875, -6.40625, -5.7578125, -5.109375, -4.4609375, -3.8125, -3.1640625, -2.515625, -1.8671875, -1.21875, -0.5703125, 0.078125, 0.7265625, 1.375, 2.0234375, 2.671875, 3.3203125, 3.96875, 4.6171875, 5.265625, 5.9140625, 6.5625, 7.2109375, 7.859375, 8.5078125, 9.15625, 9.8046875, 10.453125, 11.1015625, 11.75, 12.3984375, 13.046875, 13.6953125, 14.34375, 14.9921875, 15.640625, 16.2890625, 16.9375, 17.5859375, 18.234375, 18.8828125, 19.53125, 20.1796875, 20.828125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 6.0, 1.0, 8.0, 8.0, 14.0, 32.0, 30.0, 44.0, 89.0, 110.0, 197.0, 266.0, 437.0, 630.0, 1031.0, 1642.0, 2553.0, 4254.0, 7335.0, 12598.0, 22364.0, 40679.0, 73417.0, 127462.0, 194710.0, 209206.0, 148469.0, 88331.0, 48846.0, 26923.0, 15050.0, 8636.0, 4999.0, 3035.0, 1823.0, 1120.0, 744.0, 508.0, 316.0, 231.0, 135.0, 90.0, 50.0, 39.0, 32.0, 26.0, 7.0, 7.0, 6.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-16.125, -15.62353515625, -15.1220703125, -14.62060546875, -14.119140625, -13.61767578125, -13.1162109375, -12.61474609375, -12.11328125, -11.61181640625, -11.1103515625, -10.60888671875, -10.107421875, -9.60595703125, -9.1044921875, -8.60302734375, -8.1015625, -7.60009765625, -7.0986328125, -6.59716796875, -6.095703125, -5.59423828125, -5.0927734375, -4.59130859375, -4.08984375, -3.58837890625, -3.0869140625, -2.58544921875, -2.083984375, -1.58251953125, -1.0810546875, -0.57958984375, -0.078125, 0.42333984375, 0.9248046875, 1.42626953125, 1.927734375, 2.42919921875, 2.9306640625, 3.43212890625, 3.93359375, 4.43505859375, 4.9365234375, 5.43798828125, 5.939453125, 6.44091796875, 6.9423828125, 7.44384765625, 7.9453125, 8.44677734375, 8.9482421875, 9.44970703125, 9.951171875, 10.45263671875, 10.9541015625, 11.45556640625, 11.95703125, 12.45849609375, 12.9599609375, 13.46142578125, 13.962890625, 14.46435546875, 14.9658203125, 15.46728515625, 15.96875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 3.0, 5.0, 9.0, 14.0, 13.0, 8.0, 17.0, 16.0, 21.0, 18.0, 27.0, 21.0, 34.0, 42.0, 44.0, 47.0, 43.0, 48.0, 47.0, 46.0, 51.0, 47.0, 39.0, 42.0, 43.0, 51.0, 32.0, 27.0, 26.0, 20.0, 13.0, 21.0, 18.0, 9.0, 10.0, 11.0, 5.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.2734375, -12.87109375, -12.46875, -12.06640625, -11.6640625, -11.26171875, -10.859375, -10.45703125, -10.0546875, -9.65234375, -9.25, -8.84765625, -8.4453125, -8.04296875, -7.640625, -7.23828125, -6.8359375, -6.43359375, -6.03125, -5.62890625, -5.2265625, -4.82421875, -4.421875, -4.01953125, -3.6171875, -3.21484375, -2.8125, -2.41015625, -2.0078125, -1.60546875, -1.203125, -0.80078125, -0.3984375, 0.00390625, 0.40625, 0.80859375, 1.2109375, 1.61328125, 2.015625, 2.41796875, 2.8203125, 3.22265625, 3.625, 4.02734375, 4.4296875, 4.83203125, 5.234375, 5.63671875, 6.0390625, 6.44140625, 6.84375, 7.24609375, 7.6484375, 8.05078125, 8.453125, 8.85546875, 9.2578125, 9.66015625, 10.0625, 10.46484375, 10.8671875, 11.26953125, 11.671875, 12.07421875, 12.4765625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 2.0, 10.0, 24.0, 29.0, 19.0, 43.0, 79.0, 67.0, 148.0, 230.0, 297.0, 551.0, 805.0, 1313.0, 2093.0, 3484.0, 6017.0, 10396.0, 18709.0, 35221.0, 65856.0, 122654.0, 202921.0, 229910.0, 156782.0, 87305.0, 46229.0, 24589.0, 13573.0, 7657.0, 4432.0, 2635.0, 1652.0, 1003.0, 640.0, 405.0, 273.0, 185.0, 112.0, 79.0, 40.0, 31.0, 18.0, 13.0, 12.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-9.6328125, -9.351318359375, -9.06982421875, -8.788330078125, -8.5068359375, -8.225341796875, -7.94384765625, -7.662353515625, -7.380859375, -7.099365234375, -6.81787109375, -6.536376953125, -6.2548828125, -5.973388671875, -5.69189453125, -5.410400390625, -5.12890625, -4.847412109375, -4.56591796875, -4.284423828125, -4.0029296875, -3.721435546875, -3.43994140625, -3.158447265625, -2.876953125, -2.595458984375, -2.31396484375, -2.032470703125, -1.7509765625, -1.469482421875, -1.18798828125, -0.906494140625, -0.625, -0.343505859375, -0.06201171875, 0.219482421875, 0.5009765625, 0.782470703125, 1.06396484375, 1.345458984375, 1.626953125, 1.908447265625, 2.18994140625, 2.471435546875, 2.7529296875, 3.034423828125, 3.31591796875, 3.597412109375, 3.87890625, 4.160400390625, 4.44189453125, 4.723388671875, 5.0048828125, 5.286376953125, 5.56787109375, 5.849365234375, 6.130859375, 6.412353515625, 6.69384765625, 6.975341796875, 7.2568359375, 7.538330078125, 7.81982421875, 8.101318359375, 8.3828125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 2.0, 5.0, 8.0, 9.0, 7.0, 10.0, 16.0, 11.0, 17.0, 25.0, 27.0, 31.0, 36.0, 31.0, 59.0, 44.0, 47.0, 56.0, 59.0, 78.0, 54.0, 48.0, 47.0, 44.0, 34.0, 36.0, 34.0, 23.0, 23.0, 13.0, 12.0, 15.0, 13.0, 4.0, 7.0, 6.0, 5.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0003979206085205078, -0.00038359686732292175, -0.0003692731261253357, -0.00035494938492774963, -0.0003406256437301636, -0.0003263019025325775, -0.00031197816133499146, -0.0002976544201374054, -0.00028333067893981934, -0.0002690069377422333, -0.0002546831965446472, -0.00024035945534706116, -0.0002260357141494751, -0.00021171197295188904, -0.00019738823175430298, -0.00018306449055671692, -0.00016874074935913086, -0.0001544170081615448, -0.00014009326696395874, -0.00012576952576637268, -0.00011144578456878662, -9.712204337120056e-05, -8.27983021736145e-05, -6.847456097602844e-05, -5.415081977844238e-05, -3.982707858085632e-05, -2.5503337383270264e-05, -1.1179596185684204e-05, 3.1441450119018555e-06, 1.7467886209487915e-05, 3.1791627407073975e-05, 4.6115368604660034e-05, 6.0439109802246094e-05, 7.476285099983215e-05, 8.908659219741821e-05, 0.00010341033339500427, 0.00011773407459259033, 0.0001320578157901764, 0.00014638155698776245, 0.0001607052981853485, 0.00017502903938293457, 0.00018935278058052063, 0.0002036765217781067, 0.00021800026297569275, 0.0002323240041732788, 0.00024664774537086487, 0.00026097148656845093, 0.000275295227766037, 0.00028961896896362305, 0.0003039427101612091, 0.00031826645135879517, 0.0003325901925563812, 0.0003469139337539673, 0.00036123767495155334, 0.0003755614161491394, 0.00038988515734672546, 0.0004042088985443115, 0.0004185326397418976, 0.00043285638093948364, 0.0004471801221370697, 0.00046150386333465576, 0.0004758276045322418, 0.0004901513457298279, 0.0005044750869274139, 0.000518798828125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 13.0, 7.0, 8.0, 18.0, 26.0, 38.0, 59.0, 90.0, 107.0, 193.0, 253.0, 366.0, 530.0, 823.0, 1203.0, 1880.0, 2895.0, 4636.0, 7194.0, 11724.0, 19485.0, 33313.0, 55735.0, 91587.0, 138687.0, 174663.0, 168636.0, 126644.0, 81877.0, 49852.0, 29701.0, 17675.0, 10609.0, 6437.0, 3928.0, 2534.0, 1666.0, 1115.0, 700.0, 504.0, 365.0, 256.0, 153.0, 111.0, 87.0, 59.0, 39.0, 25.0, 20.0, 7.0, 9.0, 5.0, 6.0, 1.0, 3.0, 3.0, 1.0], "bins": [-8.7109375, -8.446044921875, -8.18115234375, -7.916259765625, -7.6513671875, -7.386474609375, -7.12158203125, -6.856689453125, -6.591796875, -6.326904296875, -6.06201171875, -5.797119140625, -5.5322265625, -5.267333984375, -5.00244140625, -4.737548828125, -4.47265625, -4.207763671875, -3.94287109375, -3.677978515625, -3.4130859375, -3.148193359375, -2.88330078125, -2.618408203125, -2.353515625, -2.088623046875, -1.82373046875, -1.558837890625, -1.2939453125, -1.029052734375, -0.76416015625, -0.499267578125, -0.234375, 0.030517578125, 0.29541015625, 0.560302734375, 0.8251953125, 1.090087890625, 1.35498046875, 1.619873046875, 1.884765625, 2.149658203125, 2.41455078125, 2.679443359375, 2.9443359375, 3.209228515625, 3.47412109375, 3.739013671875, 4.00390625, 4.268798828125, 4.53369140625, 4.798583984375, 5.0634765625, 5.328369140625, 5.59326171875, 5.858154296875, 6.123046875, 6.387939453125, 6.65283203125, 6.917724609375, 7.1826171875, 7.447509765625, 7.71240234375, 7.977294921875, 8.2421875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 0.0, 5.0, 2.0, 4.0, 3.0, 6.0, 5.0, 8.0, 6.0, 9.0, 11.0, 14.0, 27.0, 35.0, 26.0, 29.0, 37.0, 43.0, 51.0, 60.0, 56.0, 67.0, 55.0, 56.0, 59.0, 60.0, 33.0, 34.0, 34.0, 33.0, 36.0, 19.0, 18.0, 17.0, 8.0, 6.0, 12.0, 11.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.36328125, -3.27142333984375, -3.1795654296875, -3.08770751953125, -2.995849609375, -2.90399169921875, -2.8121337890625, -2.72027587890625, -2.62841796875, -2.53656005859375, -2.4447021484375, -2.35284423828125, -2.260986328125, -2.16912841796875, -2.0772705078125, -1.98541259765625, -1.8935546875, -1.80169677734375, -1.7098388671875, -1.61798095703125, -1.526123046875, -1.43426513671875, -1.3424072265625, -1.25054931640625, -1.15869140625, -1.06683349609375, -0.9749755859375, -0.88311767578125, -0.791259765625, -0.69940185546875, -0.6075439453125, -0.51568603515625, -0.423828125, -0.33197021484375, -0.2401123046875, -0.14825439453125, -0.056396484375, 0.03546142578125, 0.1273193359375, 0.21917724609375, 0.31103515625, 0.40289306640625, 0.4947509765625, 0.58660888671875, 0.678466796875, 0.77032470703125, 0.8621826171875, 0.95404052734375, 1.0458984375, 1.13775634765625, 1.2296142578125, 1.32147216796875, 1.413330078125, 1.50518798828125, 1.5970458984375, 1.68890380859375, 1.78076171875, 1.87261962890625, 1.9644775390625, 2.05633544921875, 2.148193359375, 2.24005126953125, 2.3319091796875, 2.42376708984375, 2.515625]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 2.0, 5.0, 9.0, 7.0, 10.0, 9.0, 13.0, 12.0, 23.0, 23.0, 33.0, 29.0, 30.0, 41.0, 52.0, 43.0, 50.0, 58.0, 47.0, 66.0, 67.0, 46.0, 48.0, 29.0, 40.0, 39.0, 27.0, 35.0, 21.0, 16.0, 18.0, 8.0, 9.0, 5.0, 3.0, 6.0, 2.0, 2.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.771923065185547, -26.920028686523438, -26.06813621520996, -25.21624183654785, -24.364349365234375, -23.512454986572266, -22.660560607910156, -21.80866813659668, -20.95677375793457, -20.10487937927246, -19.252986907958984, -18.401092529296875, -17.5492000579834, -16.69730567932129, -15.845412254333496, -14.993518829345703, -14.14162540435791, -13.289731979370117, -12.437838554382324, -11.585945129394531, -10.734050750732422, -9.882157325744629, -9.030263900756836, -8.178369522094727, -7.326476573944092, -6.474583148956299, -5.622689247131348, -4.770795822143555, -3.9189021587371826, -3.0670084953308105, -2.2151150703430176, -1.3632211685180664, -0.5113277435302734, 0.34056586027145386, 1.1924594640731812, 2.0443530082702637, 2.8962466716766357, 3.748140335083008, 4.600033760070801, 5.451927661895752, 6.303821086883545, 7.155714511871338, 8.007608413696289, 8.859501838684082, 9.711395263671875, 10.563289642333984, 11.415182113647461, 12.26707649230957, 13.118969917297363, 13.970863342285156, 14.82275676727295, 15.674650192260742, 16.52654457092285, 17.378437042236328, 18.230331420898438, 19.082225799560547, 19.934118270874023, 20.786012649536133, 21.63790512084961, 22.48979949951172, 23.341691970825195, 24.193586349487305, 25.04547882080078, 25.89737319946289, 26.749267578125]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 8.0, 14.0, 13.0, 10.0, 16.0, 15.0, 19.0, 21.0, 26.0, 20.0, 40.0, 24.0, 33.0, 40.0, 39.0, 39.0, 39.0, 44.0, 38.0, 42.0, 34.0, 41.0, 29.0, 34.0, 31.0, 41.0, 37.0, 23.0, 23.0, 28.0, 26.0, 17.0, 12.0, 17.0, 10.0, 8.0, 12.0, 12.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-17.176673889160156, -16.617765426635742, -16.058856964111328, -15.499948501586914, -14.941040992736816, -14.382132530212402, -13.823224067687988, -13.264315605163574, -12.705408096313477, -12.146499633789062, -11.587591171264648, -11.028682708740234, -10.469775199890137, -9.910866737365723, -9.351958274841309, -8.793049812316895, -8.23414134979248, -7.675232887268066, -7.1163249015808105, -6.5574164390563965, -5.998508453369141, -5.439599990844727, -4.8806915283203125, -4.321783065795898, -3.7628750801086426, -3.2039668560028076, -2.6450586318969727, -2.0861501693725586, -1.5272419452667236, -0.9683337211608887, -0.4094252586364746, 0.14948296546936035, 0.7083911895751953, 1.2672994136810303, 1.8262077569961548, 2.3851161003112793, 2.9440243244171143, 3.502932548522949, 4.061841011047363, 4.620749473571777, 5.179657459259033, 5.738565921783447, 6.297473907470703, 6.856382369995117, 7.415290832519531, 7.974198818206787, 8.53310775756836, 9.092015266418457, 9.650923728942871, 10.209832191467285, 10.7687406539917, 11.327648162841797, 11.886556625366211, 12.445465087890625, 13.004373550415039, 13.563282012939453, 14.122190475463867, 14.681098937988281, 15.240007400512695, 15.79891586303711, 16.357824325561523, 16.916732788085938, 17.47563934326172, 18.034547805786133, 18.593456268310547]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 3.0, 7.0, 10.0, 12.0, 7.0, 24.0, 35.0, 70.0, 87.0, 112.0, 186.0, 298.0, 421.0, 643.0, 909.0, 1384.0, 2307.0, 3504.0, 5569.0, 9011.0, 15083.0, 24990.0, 42396.0, 70714.0, 110640.0, 153094.0, 171329.0, 150873.0, 109606.0, 69854.0, 41583.0, 24764.0, 14577.0, 9020.0, 5501.0, 3477.0, 2264.0, 1383.0, 920.0, 635.0, 386.0, 338.0, 186.0, 136.0, 77.0, 49.0, 27.0, 29.0, 16.0, 8.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.546875, -15.036865234375, -14.52685546875, -14.016845703125, -13.5068359375, -12.996826171875, -12.48681640625, -11.976806640625, -11.466796875, -10.956787109375, -10.44677734375, -9.936767578125, -9.4267578125, -8.916748046875, -8.40673828125, -7.896728515625, -7.38671875, -6.876708984375, -6.36669921875, -5.856689453125, -5.3466796875, -4.836669921875, -4.32666015625, -3.816650390625, -3.306640625, -2.796630859375, -2.28662109375, -1.776611328125, -1.2666015625, -0.756591796875, -0.24658203125, 0.263427734375, 0.7734375, 1.283447265625, 1.79345703125, 2.303466796875, 2.8134765625, 3.323486328125, 3.83349609375, 4.343505859375, 4.853515625, 5.363525390625, 5.87353515625, 6.383544921875, 6.8935546875, 7.403564453125, 7.91357421875, 8.423583984375, 8.93359375, 9.443603515625, 9.95361328125, 10.463623046875, 10.9736328125, 11.483642578125, 11.99365234375, 12.503662109375, 13.013671875, 13.523681640625, 14.03369140625, 14.543701171875, 15.0537109375, 15.563720703125, 16.07373046875, 16.583740234375, 17.09375]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 4.0, 3.0, 12.0, 9.0, 12.0, 13.0, 23.0, 14.0, 19.0, 22.0, 25.0, 35.0, 32.0, 31.0, 39.0, 34.0, 48.0, 56.0, 37.0, 43.0, 41.0, 43.0, 45.0, 33.0, 46.0, 31.0, 29.0, 38.0, 29.0, 25.0, 29.0, 15.0, 12.0, 13.0, 14.0, 8.0, 14.0, 6.0, 3.0, 6.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.5, -18.86083984375, -18.2216796875, -17.58251953125, -16.943359375, -16.30419921875, -15.6650390625, -15.02587890625, -14.38671875, -13.74755859375, -13.1083984375, -12.46923828125, -11.830078125, -11.19091796875, -10.5517578125, -9.91259765625, -9.2734375, -8.63427734375, -7.9951171875, -7.35595703125, -6.716796875, -6.07763671875, -5.4384765625, -4.79931640625, -4.16015625, -3.52099609375, -2.8818359375, -2.24267578125, -1.603515625, -0.96435546875, -0.3251953125, 0.31396484375, 0.953125, 1.59228515625, 2.2314453125, 2.87060546875, 3.509765625, 4.14892578125, 4.7880859375, 5.42724609375, 6.06640625, 6.70556640625, 7.3447265625, 7.98388671875, 8.623046875, 9.26220703125, 9.9013671875, 10.54052734375, 11.1796875, 11.81884765625, 12.4580078125, 13.09716796875, 13.736328125, 14.37548828125, 15.0146484375, 15.65380859375, 16.29296875, 16.93212890625, 17.5712890625, 18.21044921875, 18.849609375, 19.48876953125, 20.1279296875, 20.76708984375, 21.40625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 3.0, 9.0, 7.0, 9.0, 15.0, 21.0, 32.0, 50.0, 67.0, 104.0, 154.0, 289.0, 402.0, 680.0, 1078.0, 1633.0, 2702.0, 4429.0, 7429.0, 12554.0, 21029.0, 36921.0, 65233.0, 112800.0, 173991.0, 203012.0, 162739.0, 101590.0, 58369.0, 33626.0, 19300.0, 11126.0, 6666.0, 3907.0, 2448.0, 1499.0, 901.0, 594.0, 414.0, 247.0, 168.0, 98.0, 78.0, 42.0, 31.0, 11.0, 14.0, 8.0, 8.0, 4.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-27.515625, -26.639404296875, -25.76318359375, -24.886962890625, -24.0107421875, -23.134521484375, -22.25830078125, -21.382080078125, -20.505859375, -19.629638671875, -18.75341796875, -17.877197265625, -17.0009765625, -16.124755859375, -15.24853515625, -14.372314453125, -13.49609375, -12.619873046875, -11.74365234375, -10.867431640625, -9.9912109375, -9.114990234375, -8.23876953125, -7.362548828125, -6.486328125, -5.610107421875, -4.73388671875, -3.857666015625, -2.9814453125, -2.105224609375, -1.22900390625, -0.352783203125, 0.5234375, 1.399658203125, 2.27587890625, 3.152099609375, 4.0283203125, 4.904541015625, 5.78076171875, 6.656982421875, 7.533203125, 8.409423828125, 9.28564453125, 10.161865234375, 11.0380859375, 11.914306640625, 12.79052734375, 13.666748046875, 14.54296875, 15.419189453125, 16.29541015625, 17.171630859375, 18.0478515625, 18.924072265625, 19.80029296875, 20.676513671875, 21.552734375, 22.428955078125, 23.30517578125, 24.181396484375, 25.0576171875, 25.933837890625, 26.81005859375, 27.686279296875, 28.5625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 7.0, 11.0, 8.0, 13.0, 11.0, 12.0, 12.0, 12.0, 23.0, 28.0, 28.0, 25.0, 31.0, 32.0, 36.0, 28.0, 38.0, 38.0, 48.0, 46.0, 58.0, 44.0, 35.0, 38.0, 36.0, 27.0, 35.0, 38.0, 34.0, 25.0, 28.0, 25.0, 19.0, 13.0, 9.0, 9.0, 17.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.53125, -13.11181640625, -12.6923828125, -12.27294921875, -11.853515625, -11.43408203125, -11.0146484375, -10.59521484375, -10.17578125, -9.75634765625, -9.3369140625, -8.91748046875, -8.498046875, -8.07861328125, -7.6591796875, -7.23974609375, -6.8203125, -6.40087890625, -5.9814453125, -5.56201171875, -5.142578125, -4.72314453125, -4.3037109375, -3.88427734375, -3.46484375, -3.04541015625, -2.6259765625, -2.20654296875, -1.787109375, -1.36767578125, -0.9482421875, -0.52880859375, -0.109375, 0.31005859375, 0.7294921875, 1.14892578125, 1.568359375, 1.98779296875, 2.4072265625, 2.82666015625, 3.24609375, 3.66552734375, 4.0849609375, 4.50439453125, 4.923828125, 5.34326171875, 5.7626953125, 6.18212890625, 6.6015625, 7.02099609375, 7.4404296875, 7.85986328125, 8.279296875, 8.69873046875, 9.1181640625, 9.53759765625, 9.95703125, 10.37646484375, 10.7958984375, 11.21533203125, 11.634765625, 12.05419921875, 12.4736328125, 12.89306640625, 13.3125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 5.0, 8.0, 15.0, 21.0, 42.0, 53.0, 78.0, 142.0, 184.0, 274.0, 496.0, 845.0, 1517.0, 2812.0, 5452.0, 12209.0, 28325.0, 66843.0, 149869.0, 260805.0, 257528.0, 145049.0, 65011.0, 27314.0, 11883.0, 5524.0, 2698.0, 1485.0, 777.0, 503.0, 272.0, 171.0, 107.0, 71.0, 56.0, 37.0, 24.0, 20.0, 12.0, 9.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-20.4375, -19.8695068359375, -19.301513671875, -18.7335205078125, -18.16552734375, -17.5975341796875, -17.029541015625, -16.4615478515625, -15.8935546875, -15.3255615234375, -14.757568359375, -14.1895751953125, -13.62158203125, -13.0535888671875, -12.485595703125, -11.9176025390625, -11.349609375, -10.7816162109375, -10.213623046875, -9.6456298828125, -9.07763671875, -8.5096435546875, -7.941650390625, -7.3736572265625, -6.8056640625, -6.2376708984375, -5.669677734375, -5.1016845703125, -4.53369140625, -3.9656982421875, -3.397705078125, -2.8297119140625, -2.26171875, -1.6937255859375, -1.125732421875, -0.5577392578125, 0.01025390625, 0.5782470703125, 1.146240234375, 1.7142333984375, 2.2822265625, 2.8502197265625, 3.418212890625, 3.9862060546875, 4.55419921875, 5.1221923828125, 5.690185546875, 6.2581787109375, 6.826171875, 7.3941650390625, 7.962158203125, 8.5301513671875, 9.09814453125, 9.6661376953125, 10.234130859375, 10.8021240234375, 11.3701171875, 11.9381103515625, 12.506103515625, 13.0740966796875, 13.64208984375, 14.2100830078125, 14.778076171875, 15.3460693359375, 15.9140625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 7.0, 12.0, 16.0, 23.0, 29.0, 32.0, 37.0, 31.0, 50.0, 43.0, 65.0, 62.0, 83.0, 72.0, 52.0, 62.0, 50.0, 48.0, 48.0, 35.0, 25.0, 19.0, 20.0, 19.0, 12.0, 13.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.001163482666015625, -0.0011239498853683472, -0.0010844171047210693, -0.0010448843240737915, -0.0010053515434265137, -0.0009658187627792358, -0.000926285982131958, -0.0008867532014846802, -0.0008472204208374023, -0.0008076876401901245, -0.0007681548595428467, -0.0007286220788955688, -0.000689089298248291, -0.0006495565176010132, -0.0006100237369537354, -0.0005704909563064575, -0.0005309581756591797, -0.0004914253950119019, -0.000451892614364624, -0.0004123598337173462, -0.00037282705307006836, -0.00033329427242279053, -0.0002937614917755127, -0.00025422871112823486, -0.00021469593048095703, -0.0001751631498336792, -0.00013563036918640137, -9.609758853912354e-05, -5.65648078918457e-05, -1.703202724456787e-05, 2.250075340270996e-05, 6.203353404998779e-05, 0.00010156631469726562, 0.00014109909534454346, 0.0001806318759918213, 0.00022016465663909912, 0.00025969743728637695, 0.0002992302179336548, 0.0003387629985809326, 0.00037829577922821045, 0.0004178285598754883, 0.0004573613405227661, 0.0004968941211700439, 0.0005364269018173218, 0.0005759596824645996, 0.0006154924631118774, 0.0006550252437591553, 0.0006945580244064331, 0.0007340908050537109, 0.0007736235857009888, 0.0008131563663482666, 0.0008526891469955444, 0.0008922219276428223, 0.0009317547082901001, 0.0009712874889373779, 0.0010108202695846558, 0.0010503530502319336, 0.0010898858308792114, 0.0011294186115264893, 0.001168951392173767, 0.001208484172821045, 0.0012480169534683228, 0.0012875497341156006, 0.0013270825147628784, 0.0013666152954101562]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 8.0, 9.0, 13.0, 9.0, 26.0, 32.0, 29.0, 54.0, 81.0, 89.0, 152.0, 242.0, 360.0, 521.0, 806.0, 1308.0, 2197.0, 3724.0, 6616.0, 12642.0, 24058.0, 47295.0, 89436.0, 154725.0, 211447.0, 200126.0, 134117.0, 74774.0, 39156.0, 20106.0, 10390.0, 5700.0, 3190.0, 1846.0, 1143.0, 705.0, 444.0, 296.0, 201.0, 139.0, 83.0, 78.0, 42.0, 41.0, 39.0, 16.0, 20.0, 10.0, 4.0, 2.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-13.0546875, -12.6448974609375, -12.235107421875, -11.8253173828125, -11.41552734375, -11.0057373046875, -10.595947265625, -10.1861572265625, -9.7763671875, -9.3665771484375, -8.956787109375, -8.5469970703125, -8.13720703125, -7.7274169921875, -7.317626953125, -6.9078369140625, -6.498046875, -6.0882568359375, -5.678466796875, -5.2686767578125, -4.85888671875, -4.4490966796875, -4.039306640625, -3.6295166015625, -3.2197265625, -2.8099365234375, -2.400146484375, -1.9903564453125, -1.58056640625, -1.1707763671875, -0.760986328125, -0.3511962890625, 0.05859375, 0.4683837890625, 0.878173828125, 1.2879638671875, 1.69775390625, 2.1075439453125, 2.517333984375, 2.9271240234375, 3.3369140625, 3.7467041015625, 4.156494140625, 4.5662841796875, 4.97607421875, 5.3858642578125, 5.795654296875, 6.2054443359375, 6.615234375, 7.0250244140625, 7.434814453125, 7.8446044921875, 8.25439453125, 8.6641845703125, 9.073974609375, 9.4837646484375, 9.8935546875, 10.3033447265625, 10.713134765625, 11.1229248046875, 11.53271484375, 11.9425048828125, 12.352294921875, 12.7620849609375, 13.171875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 1.0, 2.0, 6.0, 7.0, 12.0, 13.0, 17.0, 26.0, 16.0, 27.0, 36.0, 35.0, 34.0, 44.0, 70.0, 50.0, 48.0, 57.0, 69.0, 55.0, 57.0, 51.0, 35.0, 43.0, 36.0, 29.0, 17.0, 25.0, 13.0, 20.0, 12.0, 9.0, 6.0, 6.0, 8.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.203125, -3.09539794921875, -2.9876708984375, -2.87994384765625, -2.772216796875, -2.66448974609375, -2.5567626953125, -2.44903564453125, -2.34130859375, -2.23358154296875, -2.1258544921875, -2.01812744140625, -1.910400390625, -1.80267333984375, -1.6949462890625, -1.58721923828125, -1.4794921875, -1.37176513671875, -1.2640380859375, -1.15631103515625, -1.048583984375, -0.94085693359375, -0.8331298828125, -0.72540283203125, -0.61767578125, -0.50994873046875, -0.4022216796875, -0.29449462890625, -0.186767578125, -0.07904052734375, 0.0286865234375, 0.13641357421875, 0.244140625, 0.35186767578125, 0.4595947265625, 0.56732177734375, 0.675048828125, 0.78277587890625, 0.8905029296875, 0.99822998046875, 1.10595703125, 1.21368408203125, 1.3214111328125, 1.42913818359375, 1.536865234375, 1.64459228515625, 1.7523193359375, 1.86004638671875, 1.9677734375, 2.07550048828125, 2.1832275390625, 2.29095458984375, 2.398681640625, 2.50640869140625, 2.6141357421875, 2.72186279296875, 2.82958984375, 2.93731689453125, 3.0450439453125, 3.15277099609375, 3.260498046875, 3.36822509765625, 3.4759521484375, 3.58367919921875, 3.69140625]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 1.0, 4.0, 7.0, 8.0, 8.0, 13.0, 20.0, 14.0, 20.0, 20.0, 30.0, 27.0, 47.0, 40.0, 45.0, 61.0, 61.0, 60.0, 58.0, 61.0, 53.0, 51.0, 41.0, 46.0, 27.0, 29.0, 39.0, 26.0, 22.0, 13.0, 5.0, 11.0, 2.0, 6.0, 5.0, 0.0, 6.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.87222671508789, -30.914466857910156, -29.956707000732422, -28.998945236206055, -28.04118537902832, -27.083425521850586, -26.12566566467285, -25.167903900146484, -24.21014404296875, -23.252384185791016, -22.29462432861328, -21.336862564086914, -20.37910270690918, -19.421342849731445, -18.46358299255371, -17.505821228027344, -16.54806137084961, -15.590301513671875, -14.632540702819824, -13.67478084564209, -12.717020034790039, -11.759260177612305, -10.80150032043457, -9.84373950958252, -8.885980606079102, -7.928220272064209, -6.970459938049316, -6.012700080871582, -5.054939270019531, -4.097179412841797, -3.1394190788269043, -2.1816587448120117, -1.223897933959961, -0.26613765954971313, 0.6916226148605347, 1.6493828296661377, 2.6071431636810303, 3.5649032592773438, 4.522663593292236, 5.480423927307129, 6.4381842613220215, 7.395944595336914, 8.353704452514648, 9.3114652633667, 10.269225120544434, 11.226985931396484, 12.184745788574219, 13.142505645751953, 14.100266456604004, 15.058026313781738, 16.01578712463379, 16.973546981811523, 17.931306838989258, 18.889068603515625, 19.84682846069336, 20.804588317871094, 21.762348175048828, 22.720108032226562, 23.677867889404297, 24.635629653930664, 25.5933895111084, 26.551149368286133, 27.508909225463867, 28.466670989990234, 29.42443084716797]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 10.0, 7.0, 10.0, 12.0, 12.0, 24.0, 18.0, 23.0, 27.0, 42.0, 23.0, 36.0, 36.0, 41.0, 52.0, 46.0, 37.0, 39.0, 42.0, 46.0, 56.0, 50.0, 40.0, 37.0, 27.0, 36.0, 25.0, 22.0, 24.0, 27.0, 16.0, 14.0, 13.0, 12.0, 6.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-29.52432632446289, -28.70242691040039, -27.880525588989258, -27.058624267578125, -26.236724853515625, -25.414825439453125, -24.592924118041992, -23.77102279663086, -22.94912338256836, -22.12722396850586, -21.305322647094727, -20.483421325683594, -19.661521911621094, -18.839622497558594, -18.01772117614746, -17.195819854736328, -16.373920440673828, -15.552020072937012, -14.730119705200195, -13.908219337463379, -13.086318969726562, -12.264418601989746, -11.44251823425293, -10.620617866516113, -9.798717498779297, -8.97681713104248, -8.154916763305664, -7.333016395568848, -6.511116027832031, -5.689215660095215, -4.867315292358398, -4.045414924621582, -3.2235145568847656, -2.401614189147949, -1.5797138214111328, -0.7578134536743164, 0.0640869140625, 0.8859872817993164, 1.7078876495361328, 2.529788017272949, 3.3516883850097656, 4.173588752746582, 4.995489120483398, 5.817389488220215, 6.639289855957031, 7.461190223693848, 8.283090591430664, 9.10499095916748, 9.926891326904297, 10.748791694641113, 11.57069206237793, 12.392592430114746, 13.214492797851562, 14.036393165588379, 14.858293533325195, 15.680193901062012, 16.502094268798828, 17.323993682861328, 18.14589500427246, 18.967796325683594, 19.789695739746094, 20.611595153808594, 21.433496475219727, 22.25539779663086, 23.07729721069336]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 6.0, 6.0, 7.0, 14.0, 8.0, 5.0, 22.0, 19.0, 24.0, 39.0, 46.0, 64.0, 89.0, 123.0, 176.0, 275.0, 444.0, 837.0, 1605.0, 4089.0, 506287.0, 5432.0, 2087.0, 935.0, 572.0, 322.0, 201.0, 138.0, 95.0, 60.0, 50.0, 39.0, 28.0, 22.0, 10.0, 14.0, 17.0, 15.0, 6.0, 5.0, 8.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 5.0, 3.0, 1.0], "bins": [-618.67529296875, -600.8162841796875, -582.957275390625, -565.0983276367188, -547.2393188476562, -529.3803100585938, -511.52130126953125, -493.66229248046875, -475.8033142089844, -457.9443054199219, -440.0853271484375, -422.226318359375, -404.3673095703125, -386.5083312988281, -368.6493225097656, -350.79034423828125, -332.93133544921875, -315.07232666015625, -297.2133483886719, -279.3543395996094, -261.495361328125, -243.6363525390625, -225.77734375, -207.91835021972656, -190.05935668945312, -172.2003631591797, -154.34136962890625, -136.48236083984375, -118.62336730957031, -100.76437377929688, -82.9053726196289, -65.04637145996094, -47.18743896484375, -29.328441619873047, -11.469444274902344, 6.389553070068359, 24.248550415039062, 42.1075439453125, 59.96654510498047, 77.82554626464844, 95.68453979492188, 113.54353332519531, 131.40252685546875, 149.26153564453125, 167.1205291748047, 184.97952270507812, 202.83853149414062, 220.69752502441406, 238.5565185546875, 256.41552734375, 274.2745056152344, 292.1335144042969, 309.99249267578125, 327.85150146484375, 345.71051025390625, 363.56951904296875, 381.4284973144531, 399.2875061035156, 417.146484375, 435.0054931640625, 452.864501953125, 470.7234802246094, 488.5824890136719, 506.44146728515625, 524.3004760742188]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 3.0, 9.0, 6.0, 9.0, 12.0, 9.0, 21.0, 21.0, 22.0, 19.0, 39.0, 36.0, 31.0, 30.0, 39.0, 48.0, 40.0, 50.0, 35.0, 1067.0, 41.0, 52.0, 51.0, 45.0, 40.0, 30.0, 34.0, 29.0, 25.0, 23.0, 27.0, 20.0, 16.0, 13.0, 14.0, 8.0, 5.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-949.3104248046875, -923.1917724609375, -897.0731201171875, -870.9544677734375, -844.8358154296875, -818.7171630859375, -792.5985107421875, -766.4797973632812, -740.3611450195312, -714.2424926757812, -688.1238403320312, -662.0051879882812, -635.8865356445312, -609.767822265625, -583.649169921875, -557.530517578125, -531.411865234375, -505.293212890625, -479.174560546875, -453.055908203125, -426.9372253417969, -400.8185729980469, -374.6999206542969, -348.58123779296875, -322.462646484375, -296.343994140625, -270.225341796875, -244.10667419433594, -217.98800659179688, -191.86935424804688, -165.75070190429688, -139.6320343017578, -113.51336669921875, -87.39470672607422, -61.27605056762695, -35.15739440917969, -9.038734436035156, 17.079925537109375, 43.198577880859375, 69.31724548339844, 95.43589782714844, 121.55455780029297, 147.6732177734375, 173.7918701171875, 199.9105224609375, 226.02919006347656, 252.14784240722656, 278.2665100097656, 304.3851623535156, 330.5038146972656, 356.6224670410156, 382.74114990234375, 408.85980224609375, 434.97845458984375, 461.09710693359375, 487.21575927734375, 513.3344116210938, 539.4530639648438, 565.5717163085938, 591.6903686523438, 617.8090209960938, 643.927734375, 670.04638671875, 696.1650390625, 722.28369140625]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 7.0, 16.0, 11.0, 26.0, 34.0, 35.0, 62.0, 68.0, 69.0, 83.0, 134.0, 165.0, 178.0, 259.0, 315.0, 344.0, 426.0, 494.0, 608.0, 713.0, 904.0, 1259.0, 1812.0, 2353.0, 3734.0, 16856.0, 31192476.0, 13317.0, 5525.0, 3383.0, 3105.0, 2660.0, 1672.0, 672.0, 314.0, 163.0, 79.0, 53.0, 38.0, 24.0, 19.0, 12.0, 10.0, 9.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1011.7003784179688, -986.0008544921875, -960.3013305664062, -934.601806640625, -908.9022827148438, -883.2027587890625, -857.5032958984375, -831.8037109375, -806.104248046875, -780.4047241210938, -754.7052001953125, -729.0056762695312, -703.30615234375, -677.6066284179688, -651.9071044921875, -626.2076416015625, -600.508056640625, -574.8085327148438, -549.1090087890625, -523.4094848632812, -497.7099609375, -472.01043701171875, -446.3109436035156, -420.6114196777344, -394.9118957519531, -369.2123718261719, -343.5128479003906, -317.8133544921875, -292.11383056640625, -266.414306640625, -240.71478271484375, -215.0152587890625, -189.315673828125, -163.61614990234375, -137.9166259765625, -112.21711730957031, -86.51759338378906, -60.81806945800781, -35.118560791015625, -9.419036865234375, 16.280487060546875, 41.98000717163086, 67.67952728271484, 93.37904357910156, 119.07856750488281, 144.77809143066406, 170.47760009765625, 196.1771240234375, 221.87664794921875, 247.576171875, 273.27569580078125, 298.9752197265625, 324.67474365234375, 350.374267578125, 376.0737609863281, 401.7732849121094, 427.4728088378906, 453.1723327636719, 478.8718566894531, 504.57135009765625, 530.2708740234375, 555.9703979492188, 581.669921875, 607.3694458007812, 633.0689697265625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 5.0, 8.0, 15.0, 19.0, 33.0, 55.0, 93.0, 117.0, 179.0, 261.0, 507.0, 791.0, 1235.0, 2062.0, 3519.0, 6021.0, 10128.0, 17478.0, 31410.0, 57965.0, 108811.0, 213528.0, 449444.0, 1085266.0, 2149341.0, 1185804.0, 484018.0, 227976.0, 115907.0, 61278.0, 33579.0, 18518.0, 10496.0, 6203.0, 3607.0, 2156.0, 1297.0, 888.0, 507.0, 316.0, 225.0, 144.0, 76.0, 47.0, 44.0, 18.0, 19.0, 9.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-65.25, -63.181640625, -61.11328125, -59.044921875, -56.9765625, -54.908203125, -52.83984375, -50.771484375, -48.703125, -46.634765625, -44.56640625, -42.498046875, -40.4296875, -38.361328125, -36.29296875, -34.224609375, -32.15625, -30.087890625, -28.01953125, -25.951171875, -23.8828125, -21.814453125, -19.74609375, -17.677734375, -15.609375, -13.541015625, -11.47265625, -9.404296875, -7.3359375, -5.267578125, -3.19921875, -1.130859375, 0.9375, 3.005859375, 5.07421875, 7.142578125, 9.2109375, 11.279296875, 13.34765625, 15.416015625, 17.484375, 19.552734375, 21.62109375, 23.689453125, 25.7578125, 27.826171875, 29.89453125, 31.962890625, 34.03125, 36.099609375, 38.16796875, 40.236328125, 42.3046875, 44.373046875, 46.44140625, 48.509765625, 50.578125, 52.646484375, 54.71484375, 56.783203125, 58.8515625, 60.919921875, 62.98828125, 65.056640625, 67.125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 4.0, 2.0, 6.0, 3.0, 6.0, 7.0, 4.0, 6.0, 15.0, 10.0, 17.0, 29.0, 21.0, 30.0, 37.0, 56.0, 49.0, 92.0, 125.0, 141.0, 155.0, 191.0, 192.0, 190.0, 120.0, 103.0, 65.0, 75.0, 51.0, 41.0, 28.0, 27.0, 27.0, 17.0, 23.0, 12.0, 10.0, 11.0, 12.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-26.921875, -26.02587890625, -25.1298828125, -24.23388671875, -23.337890625, -22.44189453125, -21.5458984375, -20.64990234375, -19.75390625, -18.85791015625, -17.9619140625, -17.06591796875, -16.169921875, -15.27392578125, -14.3779296875, -13.48193359375, -12.5859375, -11.68994140625, -10.7939453125, -9.89794921875, -9.001953125, -8.10595703125, -7.2099609375, -6.31396484375, -5.41796875, -4.52197265625, -3.6259765625, -2.72998046875, -1.833984375, -0.93798828125, -0.0419921875, 0.85400390625, 1.75, 2.64599609375, 3.5419921875, 4.43798828125, 5.333984375, 6.22998046875, 7.1259765625, 8.02197265625, 8.91796875, 9.81396484375, 10.7099609375, 11.60595703125, 12.501953125, 13.39794921875, 14.2939453125, 15.18994140625, 16.0859375, 16.98193359375, 17.8779296875, 18.77392578125, 19.669921875, 20.56591796875, 21.4619140625, 22.35791015625, 23.25390625, 24.14990234375, 25.0458984375, 25.94189453125, 26.837890625, 27.73388671875, 28.6298828125, 29.52587890625, 30.421875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 7.0, 17.0, 18.0, 43.0, 70.0, 126.0, 187.0, 291.0, 510.0, 767.0, 1178.0, 1864.0, 2819.0, 4536.0, 7286.0, 11707.0, 18704.0, 30457.0, 49536.0, 79766.0, 128317.0, 214897.0, 377048.0, 785860.0, 1770570.0, 1421950.0, 602614.0, 309151.0, 181198.0, 110968.0, 68525.0, 41935.0, 25781.0, 16005.0, 10111.0, 6179.0, 3767.0, 2527.0, 1558.0, 1011.0, 599.0, 397.0, 208.0, 133.0, 77.0, 54.0, 35.0, 31.0, 18.0, 12.0, 9.0, 1.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.25, -28.301513671875, -27.35302734375, -26.404541015625, -25.4560546875, -24.507568359375, -23.55908203125, -22.610595703125, -21.662109375, -20.713623046875, -19.76513671875, -18.816650390625, -17.8681640625, -16.919677734375, -15.97119140625, -15.022705078125, -14.07421875, -13.125732421875, -12.17724609375, -11.228759765625, -10.2802734375, -9.331787109375, -8.38330078125, -7.434814453125, -6.486328125, -5.537841796875, -4.58935546875, -3.640869140625, -2.6923828125, -1.743896484375, -0.79541015625, 0.153076171875, 1.1015625, 2.050048828125, 2.99853515625, 3.947021484375, 4.8955078125, 5.843994140625, 6.79248046875, 7.740966796875, 8.689453125, 9.637939453125, 10.58642578125, 11.534912109375, 12.4833984375, 13.431884765625, 14.38037109375, 15.328857421875, 16.27734375, 17.225830078125, 18.17431640625, 19.122802734375, 20.0712890625, 21.019775390625, 21.96826171875, 22.916748046875, 23.865234375, 24.813720703125, 25.76220703125, 26.710693359375, 27.6591796875, 28.607666015625, 29.55615234375, 30.504638671875, 31.453125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 12.0, 7.0, 7.0, 10.0, 17.0, 11.0, 19.0, 18.0, 12.0, 27.0, 37.0, 41.0, 45.0, 54.0, 65.0, 119.0, 179.0, 191.0, 267.0, 193.0, 155.0, 115.0, 102.0, 55.0, 40.0, 33.0, 28.0, 26.0, 20.0, 18.0, 17.0, 18.0, 12.0, 11.0, 8.0, 7.0, 7.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.3125, -38.1015625, -36.890625, -35.6796875, -34.46875, -33.2578125, -32.046875, -30.8359375, -29.625, -28.4140625, -27.203125, -25.9921875, -24.78125, -23.5703125, -22.359375, -21.1484375, -19.9375, -18.7265625, -17.515625, -16.3046875, -15.09375, -13.8828125, -12.671875, -11.4609375, -10.25, -9.0390625, -7.828125, -6.6171875, -5.40625, -4.1953125, -2.984375, -1.7734375, -0.5625, 0.6484375, 1.859375, 3.0703125, 4.28125, 5.4921875, 6.703125, 7.9140625, 9.125, 10.3359375, 11.546875, 12.7578125, 13.96875, 15.1796875, 16.390625, 17.6015625, 18.8125, 20.0234375, 21.234375, 22.4453125, 23.65625, 24.8671875, 26.078125, 27.2890625, 28.5, 29.7109375, 30.921875, 32.1328125, 33.34375, 34.5546875, 35.765625, 36.9765625, 38.1875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 9.0, 1.0, 7.0, 3.0, 10.0, 7.0, 8.0, 16.0, 34.0, 44.0, 76.0, 93.0, 132.0, 217.0, 305.0, 444.0, 698.0, 1076.0, 1718.0, 2787.0, 4815.0, 8926.0, 16826.0, 34449.0, 78720.0, 334024.0, 5588492.0, 120772.0, 47326.0, 22306.0, 11699.0, 6159.0, 3337.0, 2180.0, 1319.0, 819.0, 490.0, 302.0, 228.0, 182.0, 121.0, 82.0, 57.0, 47.0, 21.0, 18.0, 16.0, 7.0, 6.0, 6.0, 4.0, 1.0, 3.0, 0.0, 3.0], "bins": [-123.5625, -120.052734375, -116.54296875, -113.033203125, -109.5234375, -106.013671875, -102.50390625, -98.994140625, -95.484375, -91.974609375, -88.46484375, -84.955078125, -81.4453125, -77.935546875, -74.42578125, -70.916015625, -67.40625, -63.896484375, -60.38671875, -56.876953125, -53.3671875, -49.857421875, -46.34765625, -42.837890625, -39.328125, -35.818359375, -32.30859375, -28.798828125, -25.2890625, -21.779296875, -18.26953125, -14.759765625, -11.25, -7.740234375, -4.23046875, -0.720703125, 2.7890625, 6.298828125, 9.80859375, 13.318359375, 16.828125, 20.337890625, 23.84765625, 27.357421875, 30.8671875, 34.376953125, 37.88671875, 41.396484375, 44.90625, 48.416015625, 51.92578125, 55.435546875, 58.9453125, 62.455078125, 65.96484375, 69.474609375, 72.984375, 76.494140625, 80.00390625, 83.513671875, 87.0234375, 90.533203125, 94.04296875, 97.552734375, 101.0625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 8.0, 4.0, 5.0, 9.0, 7.0, 8.0, 16.0, 13.0, 16.0, 26.0, 24.0, 26.0, 38.0, 42.0, 40.0, 59.0, 92.0, 162.0, 339.0, 419.0, 186.0, 100.0, 61.0, 42.0, 45.0, 45.0, 34.0, 22.0, 18.0, 27.0, 19.0, 15.0, 12.0, 7.0, 12.0, 8.0, 6.0, 4.0, 8.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.4375, -65.0439453125, -62.650390625, -60.2568359375, -57.86328125, -55.4697265625, -53.076171875, -50.6826171875, -48.2890625, -45.8955078125, -43.501953125, -41.1083984375, -38.71484375, -36.3212890625, -33.927734375, -31.5341796875, -29.140625, -26.7470703125, -24.353515625, -21.9599609375, -19.56640625, -17.1728515625, -14.779296875, -12.3857421875, -9.9921875, -7.5986328125, -5.205078125, -2.8115234375, -0.41796875, 1.9755859375, 4.369140625, 6.7626953125, 9.15625, 11.5498046875, 13.943359375, 16.3369140625, 18.73046875, 21.1240234375, 23.517578125, 25.9111328125, 28.3046875, 30.6982421875, 33.091796875, 35.4853515625, 37.87890625, 40.2724609375, 42.666015625, 45.0595703125, 47.453125, 49.8466796875, 52.240234375, 54.6337890625, 57.02734375, 59.4208984375, 61.814453125, 64.2080078125, 66.6015625, 68.9951171875, 71.388671875, 73.7822265625, 76.17578125, 78.5693359375, 80.962890625, 83.3564453125, 85.75]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 8.0, 3.0, 5.0, 3.0, 11.0, 18.0, 21.0, 14.0, 21.0, 29.0, 46.0, 85.0, 130.0, 236.0, 111.0, 64.0, 60.0, 30.0, 29.0, 25.0, 12.0, 22.0, 9.0, 3.0, 5.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3233.22998046875, -3155.23974609375, -3077.24951171875, -2999.25927734375, -2921.26904296875, -2843.27880859375, -2765.28857421875, -2687.29833984375, -2609.30810546875, -2531.31787109375, -2453.32763671875, -2375.33740234375, -2297.34716796875, -2219.35693359375, -2141.36669921875, -2063.37646484375, -1985.386474609375, -1907.396240234375, -1829.406005859375, -1751.415771484375, -1673.425537109375, -1595.435302734375, -1517.4451904296875, -1439.4549560546875, -1361.4647216796875, -1283.4744873046875, -1205.4842529296875, -1127.4940185546875, -1049.50390625, -971.5136108398438, -893.5234375, -815.533203125, -737.5428466796875, -659.5526123046875, -581.5623779296875, -503.57220458984375, -425.58197021484375, -347.59173583984375, -269.6015319824219, -191.611328125, -113.62109375, -35.63087463378906, 42.359344482421875, 120.34956359863281, 198.33978271484375, 276.33001708984375, 354.3202209472656, 432.3104248046875, 510.3006591796875, 588.2908935546875, 666.2811279296875, 744.2713012695312, 822.2615356445312, 900.2517700195312, 978.241943359375, 1056.232177734375, 1134.222412109375, 1212.212646484375, 1290.202880859375, 1368.193115234375, 1446.183349609375, 1524.173583984375, 1602.1636962890625, 1680.1539306640625, 1758.1441650390625]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 7.0, 8.0, 11.0, 7.0, 13.0, 13.0, 16.0, 11.0, 15.0, 18.0, 14.0, 24.0, 21.0, 24.0, 33.0, 45.0, 62.0, 126.0, 127.0, 78.0, 53.0, 35.0, 25.0, 13.0, 24.0, 18.0, 21.0, 22.0, 20.0, 12.0, 10.0, 14.0, 13.0, 7.0, 6.0, 7.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2016.4866943359375, -1949.412841796875, -1882.3389892578125, -1815.26513671875, -1748.1912841796875, -1681.117431640625, -1614.04345703125, -1546.9697265625, -1479.895751953125, -1412.8218994140625, -1345.748046875, -1278.6741943359375, -1211.600341796875, -1144.5264892578125, -1077.45263671875, -1010.3787231445312, -943.304931640625, -876.2310791015625, -809.1572265625, -742.0833740234375, -675.009521484375, -607.9356689453125, -540.8617553710938, -473.78790283203125, -406.71405029296875, -339.64019775390625, -272.56634521484375, -205.49246215820312, -138.41860961914062, -71.34475708007812, -4.2708740234375, 62.802978515625, 129.876708984375, 196.9505615234375, 264.0244140625, 331.0982971191406, 398.1721496582031, 465.2460021972656, 532.3198852539062, 599.3937377929688, 666.4675903320312, 733.5414428710938, 800.6152954101562, 867.689208984375, 934.7630615234375, 1001.8369140625, 1068.9107666015625, 1135.984619140625, 1203.0584716796875, 1270.13232421875, 1337.2061767578125, 1404.280029296875, 1471.3538818359375, 1538.427734375, 1605.501708984375, 1672.575439453125, 1739.6494140625, 1806.7232666015625, 1873.797119140625, 1940.8709716796875, 2007.94482421875, 2075.018798828125, 2142.092529296875, 2209.16650390625, 2276.240234375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 16.0, 22.0, 27.0, 30.0, 52.0, 69.0, 99.0, 152.0, 194.0, 328.0, 452.0, 650.0, 948.0, 1521.0, 2418.0, 3946.0, 6571.0, 11784.0, 24813.0, 66532.0, 313118.0, 3306225.0, 343523.0, 66571.0, 22076.0, 9760.0, 4925.0, 2857.0, 1711.0, 1023.0, 675.0, 407.0, 271.0, 175.0, 111.0, 69.0, 49.0, 31.0, 19.0, 14.0, 14.0, 11.0, 3.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-26.578125, -25.849853515625, -25.12158203125, -24.393310546875, -23.6650390625, -22.936767578125, -22.20849609375, -21.480224609375, -20.751953125, -20.023681640625, -19.29541015625, -18.567138671875, -17.8388671875, -17.110595703125, -16.38232421875, -15.654052734375, -14.92578125, -14.197509765625, -13.46923828125, -12.740966796875, -12.0126953125, -11.284423828125, -10.55615234375, -9.827880859375, -9.099609375, -8.371337890625, -7.64306640625, -6.914794921875, -6.1865234375, -5.458251953125, -4.72998046875, -4.001708984375, -3.2734375, -2.545166015625, -1.81689453125, -1.088623046875, -0.3603515625, 0.367919921875, 1.09619140625, 1.824462890625, 2.552734375, 3.281005859375, 4.00927734375, 4.737548828125, 5.4658203125, 6.194091796875, 6.92236328125, 7.650634765625, 8.37890625, 9.107177734375, 9.83544921875, 10.563720703125, 11.2919921875, 12.020263671875, 12.74853515625, 13.476806640625, 14.205078125, 14.933349609375, 15.66162109375, 16.389892578125, 17.1181640625, 17.846435546875, 18.57470703125, 19.302978515625, 20.03125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 3.0, 7.0, 14.0, 5.0, 18.0, 33.0, 50.0, 64.0, 97.0, 161.0, 194.0, 110.0, 78.0, 45.0, 36.0, 19.0, 13.0, 9.0, 6.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.646484375, -2.568511962890625, -2.49053955078125, -2.412567138671875, -2.3345947265625, -2.256622314453125, -2.17864990234375, -2.100677490234375, -2.022705078125, -1.944732666015625, -1.86676025390625, -1.788787841796875, -1.7108154296875, -1.632843017578125, -1.55487060546875, -1.476898193359375, -1.39892578125, -1.320953369140625, -1.24298095703125, -1.165008544921875, -1.0870361328125, -1.009063720703125, -0.93109130859375, -0.853118896484375, -0.775146484375, -0.697174072265625, -0.61920166015625, -0.541229248046875, -0.4632568359375, -0.385284423828125, -0.30731201171875, -0.229339599609375, -0.1513671875, -0.073394775390625, 0.00457763671875, 0.082550048828125, 0.1605224609375, 0.238494873046875, 0.31646728515625, 0.394439697265625, 0.472412109375, 0.550384521484375, 0.62835693359375, 0.706329345703125, 0.7843017578125, 0.862274169921875, 0.94024658203125, 1.018218994140625, 1.09619140625, 1.174163818359375, 1.25213623046875, 1.330108642578125, 1.4080810546875, 1.486053466796875, 1.56402587890625, 1.641998291015625, 1.719970703125, 1.797943115234375, 1.87591552734375, 1.953887939453125, 2.0318603515625, 2.109832763671875, 2.18780517578125, 2.265777587890625, 2.34375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 12.0, 18.0, 27.0, 33.0, 45.0, 56.0, 77.0, 135.0, 245.0, 361.0, 666.0, 1241.0, 2568.0, 6071.0, 17541.0, 65625.0, 354826.0, 2721496.0, 847103.0, 129662.0, 29757.0, 9388.0, 3598.0, 1608.0, 863.0, 504.0, 253.0, 159.0, 115.0, 63.0, 47.0, 41.0, 23.0, 13.0, 11.0, 8.0, 10.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.109375, -27.275390625, -26.44140625, -25.607421875, -24.7734375, -23.939453125, -23.10546875, -22.271484375, -21.4375, -20.603515625, -19.76953125, -18.935546875, -18.1015625, -17.267578125, -16.43359375, -15.599609375, -14.765625, -13.931640625, -13.09765625, -12.263671875, -11.4296875, -10.595703125, -9.76171875, -8.927734375, -8.09375, -7.259765625, -6.42578125, -5.591796875, -4.7578125, -3.923828125, -3.08984375, -2.255859375, -1.421875, -0.587890625, 0.24609375, 1.080078125, 1.9140625, 2.748046875, 3.58203125, 4.416015625, 5.25, 6.083984375, 6.91796875, 7.751953125, 8.5859375, 9.419921875, 10.25390625, 11.087890625, 11.921875, 12.755859375, 13.58984375, 14.423828125, 15.2578125, 16.091796875, 16.92578125, 17.759765625, 18.59375, 19.427734375, 20.26171875, 21.095703125, 21.9296875, 22.763671875, 23.59765625, 24.431640625, 25.265625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 6.0, 4.0, 16.0, 13.0, 13.0, 18.0, 27.0, 36.0, 62.0, 45.0, 86.0, 110.0, 134.0, 165.0, 293.0, 367.0, 740.0, 508.0, 354.0, 265.0, 171.0, 135.0, 116.0, 93.0, 71.0, 51.0, 44.0, 28.0, 29.0, 19.0, 11.0, 6.0, 9.0, 8.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.203125, -4.993408203125, -4.78369140625, -4.573974609375, -4.3642578125, -4.154541015625, -3.94482421875, -3.735107421875, -3.525390625, -3.315673828125, -3.10595703125, -2.896240234375, -2.6865234375, -2.476806640625, -2.26708984375, -2.057373046875, -1.84765625, -1.637939453125, -1.42822265625, -1.218505859375, -1.0087890625, -0.799072265625, -0.58935546875, -0.379638671875, -0.169921875, 0.039794921875, 0.24951171875, 0.459228515625, 0.6689453125, 0.878662109375, 1.08837890625, 1.298095703125, 1.5078125, 1.717529296875, 1.92724609375, 2.136962890625, 2.3466796875, 2.556396484375, 2.76611328125, 2.975830078125, 3.185546875, 3.395263671875, 3.60498046875, 3.814697265625, 4.0244140625, 4.234130859375, 4.44384765625, 4.653564453125, 4.86328125, 5.072998046875, 5.28271484375, 5.492431640625, 5.7021484375, 5.911865234375, 6.12158203125, 6.331298828125, 6.541015625, 6.750732421875, 6.96044921875, 7.170166015625, 7.3798828125, 7.589599609375, 7.79931640625, 8.009033203125, 8.21875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 5.0, 16.0, 25.0, 30.0, 53.0, 79.0, 124.0, 144.0, 141.0, 121.0, 88.0, 67.0, 34.0, 24.0, 16.0, 10.0, 6.0, 4.0, 1.0, 4.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-86.24186706542969, -83.62004089355469, -80.99822235107422, -78.37639617919922, -75.75457763671875, -73.13275146484375, -70.51092529296875, -67.88910675048828, -65.26728057861328, -62.64545822143555, -60.02363586425781, -57.40180969238281, -54.77998733520508, -52.158164978027344, -49.53634262084961, -46.914520263671875, -44.29269790649414, -41.670875549316406, -39.04905319213867, -36.42723083496094, -33.80540466308594, -31.183582305908203, -28.56175994873047, -25.9399356842041, -23.318113327026367, -20.696290969848633, -18.074466705322266, -15.452644348144531, -12.83082103729248, -10.20899772644043, -7.587175369262695, -4.965351104736328, -2.3435287475585938, 0.27829432487487793, 2.9001173973083496, 5.521940231323242, 8.143763542175293, 10.765586853027344, 13.387409210205078, 16.009233474731445, 18.63105583190918, 21.252878189086914, 23.87470245361328, 26.496524810791016, 29.11834716796875, 31.740171432495117, 34.36199188232422, 36.98381805419922, 39.60564041137695, 42.22746276855469, 44.84928512573242, 47.471107482910156, 50.092933654785156, 52.71475601196289, 55.336578369140625, 57.958404541015625, 60.580223083496094, 63.20204544067383, 65.82386779785156, 68.44569396972656, 71.06751251220703, 73.68933868408203, 76.3111572265625, 78.9329833984375, 81.5548095703125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 10.0, 10.0, 11.0, 15.0, 41.0, 24.0, 33.0, 32.0, 49.0, 62.0, 42.0, 57.0, 50.0, 55.0, 68.0, 52.0, 69.0, 62.0, 51.0, 32.0, 40.0, 32.0, 27.0, 27.0, 14.0, 10.0, 5.0, 7.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-76.68160247802734, -74.87442779541016, -73.06725311279297, -71.26007843017578, -69.4529037475586, -67.6457290649414, -65.83855438232422, -64.03138732910156, -62.22420883178711, -60.41703414916992, -58.609859466552734, -56.80268478393555, -54.995513916015625, -53.18833923339844, -51.38116455078125, -49.57398986816406, -47.766815185546875, -45.95964050292969, -44.1524658203125, -42.34529113769531, -40.538116455078125, -38.73094177246094, -36.923770904541016, -35.11659622192383, -33.30942153930664, -31.502246856689453, -29.695072174072266, -27.88789939880371, -26.080724716186523, -24.273550033569336, -22.46637725830078, -20.659202575683594, -18.852027893066406, -17.04485321044922, -15.237679481506348, -13.430505752563477, -11.623331069946289, -9.816156387329102, -8.00898265838623, -6.201808929443359, -4.394634246826172, -2.5874600410461426, -0.7802858352661133, 1.026888370513916, 2.8340625762939453, 4.641237258911133, 6.448410987854004, 8.255584716796875, 10.062759399414062, 11.86993408203125, 13.677107810974121, 15.484281539916992, 17.29145622253418, 19.098630905151367, 20.905803680419922, 22.71297836303711, 24.520153045654297, 26.327327728271484, 28.134502410888672, 29.941675186157227, 31.748849868774414, 33.55602264404297, 35.363197326660156, 37.170372009277344, 38.97754669189453]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 9.0, 8.0, 13.0, 10.0, 17.0, 26.0, 42.0, 48.0, 84.0, 143.0, 196.0, 284.0, 430.0, 614.0, 1077.0, 1764.0, 3091.0, 6382.0, 15220.0, 40714.0, 141256.0, 559740.0, 192602.0, 50691.0, 18029.0, 7482.0, 3560.0, 1900.0, 1088.0, 721.0, 439.0, 271.0, 175.0, 119.0, 87.0, 73.0, 48.0, 28.0, 20.0, 27.0, 13.0, 6.0, 5.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.203125, -15.7208251953125, -15.238525390625, -14.7562255859375, -14.27392578125, -13.7916259765625, -13.309326171875, -12.8270263671875, -12.3447265625, -11.8624267578125, -11.380126953125, -10.8978271484375, -10.41552734375, -9.9332275390625, -9.450927734375, -8.9686279296875, -8.486328125, -8.0040283203125, -7.521728515625, -7.0394287109375, -6.55712890625, -6.0748291015625, -5.592529296875, -5.1102294921875, -4.6279296875, -4.1456298828125, -3.663330078125, -3.1810302734375, -2.69873046875, -2.2164306640625, -1.734130859375, -1.2518310546875, -0.76953125, -0.2872314453125, 0.195068359375, 0.6773681640625, 1.15966796875, 1.6419677734375, 2.124267578125, 2.6065673828125, 3.0888671875, 3.5711669921875, 4.053466796875, 4.5357666015625, 5.01806640625, 5.5003662109375, 5.982666015625, 6.4649658203125, 6.947265625, 7.4295654296875, 7.911865234375, 8.3941650390625, 8.87646484375, 9.3587646484375, 9.841064453125, 10.3233642578125, 10.8056640625, 11.2879638671875, 11.770263671875, 12.2525634765625, 12.73486328125, 13.2171630859375, 13.699462890625, 14.1817626953125, 14.6640625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 7.0, 10.0, 16.0, 16.0, 26.0, 31.0, 40.0, 46.0, 56.0, 86.0, 91.0, 89.0, 91.0, 83.0, 73.0, 53.0, 51.0, 33.0, 29.0, 18.0, 16.0, 10.0, 9.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.287109375, -2.20416259765625, -2.1212158203125, -2.03826904296875, -1.955322265625, -1.87237548828125, -1.7894287109375, -1.70648193359375, -1.62353515625, -1.54058837890625, -1.4576416015625, -1.37469482421875, -1.291748046875, -1.20880126953125, -1.1258544921875, -1.04290771484375, -0.9599609375, -0.87701416015625, -0.7940673828125, -0.71112060546875, -0.628173828125, -0.54522705078125, -0.4622802734375, -0.37933349609375, -0.29638671875, -0.21343994140625, -0.1304931640625, -0.04754638671875, 0.035400390625, 0.11834716796875, 0.2012939453125, 0.28424072265625, 0.3671875, 0.45013427734375, 0.5330810546875, 0.61602783203125, 0.698974609375, 0.78192138671875, 0.8648681640625, 0.94781494140625, 1.03076171875, 1.11370849609375, 1.1966552734375, 1.27960205078125, 1.362548828125, 1.44549560546875, 1.5284423828125, 1.61138916015625, 1.6943359375, 1.77728271484375, 1.8602294921875, 1.94317626953125, 2.026123046875, 2.10906982421875, 2.1920166015625, 2.27496337890625, 2.35791015625, 2.44085693359375, 2.5238037109375, 2.60675048828125, 2.689697265625, 2.77264404296875, 2.8555908203125, 2.93853759765625, 3.021484375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 8.0, 8.0, 7.0, 17.0, 20.0, 25.0, 41.0, 56.0, 78.0, 112.0, 186.0, 242.0, 406.0, 636.0, 1081.0, 1674.0, 3289.0, 6143.0, 12354.0, 28694.0, 75426.0, 272453.0, 450254.0, 119193.0, 40872.0, 17284.0, 8038.0, 4154.0, 2277.0, 1310.0, 811.0, 496.0, 320.0, 200.0, 116.0, 94.0, 61.0, 39.0, 22.0, 24.0, 14.0, 11.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0], "bins": [-12.5078125, -12.14208984375, -11.7763671875, -11.41064453125, -11.044921875, -10.67919921875, -10.3134765625, -9.94775390625, -9.58203125, -9.21630859375, -8.8505859375, -8.48486328125, -8.119140625, -7.75341796875, -7.3876953125, -7.02197265625, -6.65625, -6.29052734375, -5.9248046875, -5.55908203125, -5.193359375, -4.82763671875, -4.4619140625, -4.09619140625, -3.73046875, -3.36474609375, -2.9990234375, -2.63330078125, -2.267578125, -1.90185546875, -1.5361328125, -1.17041015625, -0.8046875, -0.43896484375, -0.0732421875, 0.29248046875, 0.658203125, 1.02392578125, 1.3896484375, 1.75537109375, 2.12109375, 2.48681640625, 2.8525390625, 3.21826171875, 3.583984375, 3.94970703125, 4.3154296875, 4.68115234375, 5.046875, 5.41259765625, 5.7783203125, 6.14404296875, 6.509765625, 6.87548828125, 7.2412109375, 7.60693359375, 7.97265625, 8.33837890625, 8.7041015625, 9.06982421875, 9.435546875, 9.80126953125, 10.1669921875, 10.53271484375, 10.8984375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 10.0, 6.0, 7.0, 11.0, 11.0, 22.0, 26.0, 23.0, 32.0, 29.0, 26.0, 29.0, 38.0, 34.0, 31.0, 38.0, 40.0, 49.0, 52.0, 52.0, 53.0, 43.0, 33.0, 50.0, 31.0, 30.0, 29.0, 28.0, 23.0, 21.0, 19.0, 12.0, 14.0, 19.0, 6.0, 11.0, 6.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-12.5390625, -12.1859130859375, -11.832763671875, -11.4796142578125, -11.12646484375, -10.7733154296875, -10.420166015625, -10.0670166015625, -9.7138671875, -9.3607177734375, -9.007568359375, -8.6544189453125, -8.30126953125, -7.9481201171875, -7.594970703125, -7.2418212890625, -6.888671875, -6.5355224609375, -6.182373046875, -5.8292236328125, -5.47607421875, -5.1229248046875, -4.769775390625, -4.4166259765625, -4.0634765625, -3.7103271484375, -3.357177734375, -3.0040283203125, -2.65087890625, -2.2977294921875, -1.944580078125, -1.5914306640625, -1.23828125, -0.8851318359375, -0.531982421875, -0.1788330078125, 0.17431640625, 0.5274658203125, 0.880615234375, 1.2337646484375, 1.5869140625, 1.9400634765625, 2.293212890625, 2.6463623046875, 2.99951171875, 3.3526611328125, 3.705810546875, 4.0589599609375, 4.412109375, 4.7652587890625, 5.118408203125, 5.4715576171875, 5.82470703125, 6.1778564453125, 6.531005859375, 6.8841552734375, 7.2373046875, 7.5904541015625, 7.943603515625, 8.2967529296875, 8.64990234375, 9.0030517578125, 9.356201171875, 9.7093505859375, 10.0625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 3.0, 8.0, 11.0, 16.0, 36.0, 44.0, 101.0, 191.0, 423.0, 1140.0, 3612.0, 17816.0, 230767.0, 736416.0, 47968.0, 6956.0, 1821.0, 658.0, 251.0, 147.0, 54.0, 34.0, 21.0, 21.0, 13.0, 9.0, 4.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.109375, -13.626708984375, -13.14404296875, -12.661376953125, -12.1787109375, -11.696044921875, -11.21337890625, -10.730712890625, -10.248046875, -9.765380859375, -9.28271484375, -8.800048828125, -8.3173828125, -7.834716796875, -7.35205078125, -6.869384765625, -6.38671875, -5.904052734375, -5.42138671875, -4.938720703125, -4.4560546875, -3.973388671875, -3.49072265625, -3.008056640625, -2.525390625, -2.042724609375, -1.56005859375, -1.077392578125, -0.5947265625, -0.112060546875, 0.37060546875, 0.853271484375, 1.3359375, 1.818603515625, 2.30126953125, 2.783935546875, 3.2666015625, 3.749267578125, 4.23193359375, 4.714599609375, 5.197265625, 5.679931640625, 6.16259765625, 6.645263671875, 7.1279296875, 7.610595703125, 8.09326171875, 8.575927734375, 9.05859375, 9.541259765625, 10.02392578125, 10.506591796875, 10.9892578125, 11.471923828125, 11.95458984375, 12.437255859375, 12.919921875, 13.402587890625, 13.88525390625, 14.367919921875, 14.8505859375, 15.333251953125, 15.81591796875, 16.298583984375, 16.78125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 12.0, 26.0, 32.0, 43.0, 93.0, 89.0, 157.0, 126.0, 142.0, 89.0, 73.0, 35.0, 28.0, 17.0, 16.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006003379821777344, -0.0005805566906929016, -0.0005607753992080688, -0.0005409941077232361, -0.0005212128162384033, -0.0005014315247535706, -0.0004816502332687378, -0.00046186894178390503, -0.00044208765029907227, -0.0004223063588142395, -0.00040252506732940674, -0.000382743775844574, -0.0003629624843597412, -0.00034318119287490845, -0.0003233999013900757, -0.0003036186099052429, -0.00028383731842041016, -0.0002640560269355774, -0.00024427473545074463, -0.00022449344396591187, -0.0002047121524810791, -0.00018493086099624634, -0.00016514956951141357, -0.0001453682780265808, -0.00012558698654174805, -0.00010580569505691528, -8.602440357208252e-05, -6.624311208724976e-05, -4.646182060241699e-05, -2.668052911758423e-05, -6.899237632751465e-06, 1.2882053852081299e-05, 3.266334533691406e-05, 5.2444636821746826e-05, 7.222592830657959e-05, 9.200721979141235e-05, 0.00011178851127624512, 0.00013156980276107788, 0.00015135109424591064, 0.0001711323857307434, 0.00019091367721557617, 0.00021069496870040894, 0.0002304762601852417, 0.00025025755167007446, 0.0002700388431549072, 0.00028982013463974, 0.00030960142612457275, 0.0003293827176094055, 0.0003491640090942383, 0.00036894530057907104, 0.0003887265920639038, 0.00040850788354873657, 0.00042828917503356934, 0.0004480704665184021, 0.00046785175800323486, 0.0004876330494880676, 0.0005074143409729004, 0.0005271956324577332, 0.0005469769239425659, 0.0005667582154273987, 0.0005865395069122314, 0.0006063207983970642, 0.000626102089881897, 0.0006458833813667297, 0.0006656646728515625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 8.0, 11.0, 4.0, 13.0, 18.0, 25.0, 30.0, 45.0, 92.0, 137.0, 226.0, 433.0, 860.0, 2021.0, 5727.0, 20902.0, 124671.0, 672890.0, 182277.0, 26647.0, 6908.0, 2471.0, 959.0, 466.0, 232.0, 174.0, 124.0, 56.0, 32.0, 27.0, 16.0, 12.0, 9.0, 10.0, 6.0, 6.0, 2.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.46875, -10.12646484375, -9.7841796875, -9.44189453125, -9.099609375, -8.75732421875, -8.4150390625, -8.07275390625, -7.73046875, -7.38818359375, -7.0458984375, -6.70361328125, -6.361328125, -6.01904296875, -5.6767578125, -5.33447265625, -4.9921875, -4.64990234375, -4.3076171875, -3.96533203125, -3.623046875, -3.28076171875, -2.9384765625, -2.59619140625, -2.25390625, -1.91162109375, -1.5693359375, -1.22705078125, -0.884765625, -0.54248046875, -0.2001953125, 0.14208984375, 0.484375, 0.82666015625, 1.1689453125, 1.51123046875, 1.853515625, 2.19580078125, 2.5380859375, 2.88037109375, 3.22265625, 3.56494140625, 3.9072265625, 4.24951171875, 4.591796875, 4.93408203125, 5.2763671875, 5.61865234375, 5.9609375, 6.30322265625, 6.6455078125, 6.98779296875, 7.330078125, 7.67236328125, 8.0146484375, 8.35693359375, 8.69921875, 9.04150390625, 9.3837890625, 9.72607421875, 10.068359375, 10.41064453125, 10.7529296875, 11.09521484375, 11.4375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 15.0, 14.0, 26.0, 35.0, 44.0, 69.0, 75.0, 102.0, 95.0, 131.0, 118.0, 75.0, 55.0, 45.0, 29.0, 22.0, 19.0, 7.0, 10.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.265625, -7.0133056640625, -6.760986328125, -6.5086669921875, -6.25634765625, -6.0040283203125, -5.751708984375, -5.4993896484375, -5.2470703125, -4.9947509765625, -4.742431640625, -4.4901123046875, -4.23779296875, -3.9854736328125, -3.733154296875, -3.4808349609375, -3.228515625, -2.9761962890625, -2.723876953125, -2.4715576171875, -2.21923828125, -1.9669189453125, -1.714599609375, -1.4622802734375, -1.2099609375, -0.9576416015625, -0.705322265625, -0.4530029296875, -0.20068359375, 0.0516357421875, 0.303955078125, 0.5562744140625, 0.80859375, 1.0609130859375, 1.313232421875, 1.5655517578125, 1.81787109375, 2.0701904296875, 2.322509765625, 2.5748291015625, 2.8271484375, 3.0794677734375, 3.331787109375, 3.5841064453125, 3.83642578125, 4.0887451171875, 4.341064453125, 4.5933837890625, 4.845703125, 5.0980224609375, 5.350341796875, 5.6026611328125, 5.85498046875, 6.1072998046875, 6.359619140625, 6.6119384765625, 6.8642578125, 7.1165771484375, 7.368896484375, 7.6212158203125, 7.87353515625, 8.1258544921875, 8.378173828125, 8.6304931640625, 8.8828125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 3.0, 9.0, 7.0, 15.0, 22.0, 35.0, 51.0, 143.0, 269.0, 216.0, 103.0, 44.0, 25.0, 19.0, 9.0, 5.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.60899353027344, -132.98910522460938, -128.36923217773438, -123.74935150146484, -119.12947082519531, -114.50958251953125, -109.88970184326172, -105.26982116699219, -100.64994049072266, -96.03005981445312, -91.4101791381836, -86.79029846191406, -82.17041015625, -77.550537109375, -72.93064880371094, -68.3107681274414, -63.690887451171875, -59.071006774902344, -54.45112609863281, -49.831241607666016, -45.211360931396484, -40.59148025512695, -35.971595764160156, -31.351715087890625, -26.731834411621094, -22.111953735351562, -17.4920711517334, -12.87218952178955, -8.252307891845703, -3.632427215576172, 0.9874553680419922, 5.607337951660156, 10.22723388671875, 14.847115516662598, 19.466997146606445, 24.08687973022461, 28.70676040649414, 33.32664108276367, 37.94652557373047, 42.56640625, 47.18628692626953, 51.80616760253906, 56.426048278808594, 61.04593276977539, 65.66581726074219, 70.28569030761719, 74.90557861328125, 79.52545928955078, 84.14533996582031, 88.76522064208984, 93.38510131835938, 98.0049819946289, 102.62486267089844, 107.2447509765625, 111.86463165283203, 116.48451232910156, 121.1043930053711, 125.72427368164062, 130.3441619873047, 134.9640350341797, 139.58392333984375, 144.20379638671875, 148.8236846923828, 153.44357299804688, 158.06344604492188]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 3.0, 7.0, 11.0, 6.0, 18.0, 22.0, 50.0, 82.0, 105.0, 137.0, 145.0, 136.0, 96.0, 56.0, 27.0, 21.0, 16.0, 11.0, 7.0, 9.0, 4.0, 5.0, 5.0, 2.0, 4.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-210.1232147216797, -204.0203399658203, -197.91744995117188, -191.8145751953125, -185.71168518066406, -179.6088104248047, -173.50592041015625, -167.40304565429688, -161.3001708984375, -155.19729614257812, -149.0944061279297, -142.9915313720703, -136.88864135742188, -130.7857666015625, -124.6828842163086, -118.58000183105469, -112.47711181640625, -106.37422943115234, -100.27134704589844, -94.16847229003906, -88.06558227539062, -81.96270751953125, -75.85982513427734, -69.75694274902344, -63.65406036376953, -57.551177978515625, -51.44829559326172, -45.34541702270508, -39.24253463745117, -33.139652252197266, -27.036773681640625, -20.93389129638672, -14.831024169921875, -8.728142738342285, -2.6252613067626953, 3.477619171142578, 9.580501556396484, 15.68338394165039, 21.78626251220703, 27.889144897460938, 33.992027282714844, 40.09490966796875, 46.197792053222656, 52.3006706237793, 58.4035530090332, 64.50643920898438, 70.60931396484375, 76.71219635009766, 82.81507873535156, 88.91796112060547, 95.02084350585938, 101.12371826171875, 107.22660827636719, 113.32948303222656, 119.43236541748047, 125.53524780273438, 131.63812255859375, 137.74099731445312, 143.84388732910156, 149.94676208496094, 156.04965209960938, 162.15252685546875, 168.25540161132812, 174.35829162597656, 180.461181640625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 8.0, 4.0, 9.0, 9.0, 10.0, 19.0, 37.0, 52.0, 93.0, 176.0, 299.0, 582.0, 1175.0, 2738.0, 7303.0, 24075.0, 124118.0, 3645417.0, 327120.0, 41793.0, 11115.0, 4023.0, 1818.0, 903.0, 532.0, 279.0, 159.0, 126.0, 81.0, 52.0, 39.0, 27.0, 20.0, 23.0, 13.0, 16.0, 4.0, 10.0, 1.0, 6.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.6875, -35.2021484375, -33.716796875, -32.2314453125, -30.74609375, -29.2607421875, -27.775390625, -26.2900390625, -24.8046875, -23.3193359375, -21.833984375, -20.3486328125, -18.86328125, -17.3779296875, -15.892578125, -14.4072265625, -12.921875, -11.4365234375, -9.951171875, -8.4658203125, -6.98046875, -5.4951171875, -4.009765625, -2.5244140625, -1.0390625, 0.4462890625, 1.931640625, 3.4169921875, 4.90234375, 6.3876953125, 7.873046875, 9.3583984375, 10.84375, 12.3291015625, 13.814453125, 15.2998046875, 16.78515625, 18.2705078125, 19.755859375, 21.2412109375, 22.7265625, 24.2119140625, 25.697265625, 27.1826171875, 28.66796875, 30.1533203125, 31.638671875, 33.1240234375, 34.609375, 36.0947265625, 37.580078125, 39.0654296875, 40.55078125, 42.0361328125, 43.521484375, 45.0068359375, 46.4921875, 47.9775390625, 49.462890625, 50.9482421875, 52.43359375, 53.9189453125, 55.404296875, 56.8896484375, 58.375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 4.0, 9.0, 10.0, 6.0, 18.0, 14.0, 27.0, 44.0, 43.0, 55.0, 63.0, 93.0, 75.0, 88.0, 80.0, 78.0, 70.0, 54.0, 38.0, 25.0, 33.0, 13.0, 7.0, 8.0, 13.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.880859375, -1.79681396484375, -1.7127685546875, -1.62872314453125, -1.544677734375, -1.46063232421875, -1.3765869140625, -1.29254150390625, -1.20849609375, -1.12445068359375, -1.0404052734375, -0.95635986328125, -0.872314453125, -0.78826904296875, -0.7042236328125, -0.62017822265625, -0.5361328125, -0.45208740234375, -0.3680419921875, -0.28399658203125, -0.199951171875, -0.11590576171875, -0.0318603515625, 0.05218505859375, 0.13623046875, 0.22027587890625, 0.3043212890625, 0.38836669921875, 0.472412109375, 0.55645751953125, 0.6405029296875, 0.72454833984375, 0.80859375, 0.89263916015625, 0.9766845703125, 1.06072998046875, 1.144775390625, 1.22882080078125, 1.3128662109375, 1.39691162109375, 1.48095703125, 1.56500244140625, 1.6490478515625, 1.73309326171875, 1.817138671875, 1.90118408203125, 1.9852294921875, 2.06927490234375, 2.1533203125, 2.23736572265625, 2.3214111328125, 2.40545654296875, 2.489501953125, 2.57354736328125, 2.6575927734375, 2.74163818359375, 2.82568359375, 2.90972900390625, 2.9937744140625, 3.07781982421875, 3.161865234375, 3.24591064453125, 3.3299560546875, 3.41400146484375, 3.498046875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 7.0, 13.0, 6.0, 12.0, 13.0, 20.0, 24.0, 44.0, 86.0, 83.0, 132.0, 217.0, 330.0, 532.0, 917.0, 1527.0, 3015.0, 6192.0, 14269.0, 37039.0, 115990.0, 528724.0, 2986614.0, 356639.0, 88909.0, 29769.0, 11808.0, 5148.0, 2556.0, 1441.0, 851.0, 445.0, 335.0, 191.0, 111.0, 84.0, 51.0, 33.0, 27.0, 24.0, 17.0, 7.0, 11.0, 4.0, 5.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.4375, -26.53466796875, -25.6318359375, -24.72900390625, -23.826171875, -22.92333984375, -22.0205078125, -21.11767578125, -20.21484375, -19.31201171875, -18.4091796875, -17.50634765625, -16.603515625, -15.70068359375, -14.7978515625, -13.89501953125, -12.9921875, -12.08935546875, -11.1865234375, -10.28369140625, -9.380859375, -8.47802734375, -7.5751953125, -6.67236328125, -5.76953125, -4.86669921875, -3.9638671875, -3.06103515625, -2.158203125, -1.25537109375, -0.3525390625, 0.55029296875, 1.453125, 2.35595703125, 3.2587890625, 4.16162109375, 5.064453125, 5.96728515625, 6.8701171875, 7.77294921875, 8.67578125, 9.57861328125, 10.4814453125, 11.38427734375, 12.287109375, 13.18994140625, 14.0927734375, 14.99560546875, 15.8984375, 16.80126953125, 17.7041015625, 18.60693359375, 19.509765625, 20.41259765625, 21.3154296875, 22.21826171875, 23.12109375, 24.02392578125, 24.9267578125, 25.82958984375, 26.732421875, 27.63525390625, 28.5380859375, 29.44091796875, 30.34375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 13.0, 16.0, 15.0, 37.0, 27.0, 64.0, 107.0, 191.0, 338.0, 809.0, 1535.0, 336.0, 205.0, 101.0, 116.0, 46.0, 40.0, 12.0, 17.0, 14.0, 6.0, 8.0, 5.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7578125, -6.54052734375, -6.3232421875, -6.10595703125, -5.888671875, -5.67138671875, -5.4541015625, -5.23681640625, -5.01953125, -4.80224609375, -4.5849609375, -4.36767578125, -4.150390625, -3.93310546875, -3.7158203125, -3.49853515625, -3.28125, -3.06396484375, -2.8466796875, -2.62939453125, -2.412109375, -2.19482421875, -1.9775390625, -1.76025390625, -1.54296875, -1.32568359375, -1.1083984375, -0.89111328125, -0.673828125, -0.45654296875, -0.2392578125, -0.02197265625, 0.1953125, 0.41259765625, 0.6298828125, 0.84716796875, 1.064453125, 1.28173828125, 1.4990234375, 1.71630859375, 1.93359375, 2.15087890625, 2.3681640625, 2.58544921875, 2.802734375, 3.02001953125, 3.2373046875, 3.45458984375, 3.671875, 3.88916015625, 4.1064453125, 4.32373046875, 4.541015625, 4.75830078125, 4.9755859375, 5.19287109375, 5.41015625, 5.62744140625, 5.8447265625, 6.06201171875, 6.279296875, 6.49658203125, 6.7138671875, 6.93115234375, 7.1484375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 0.0, 11.0, 16.0, 25.0, 44.0, 71.0, 132.0, 181.0, 164.0, 132.0, 102.0, 55.0, 31.0, 15.0, 8.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-52.51515579223633, -50.81681442260742, -49.11847686767578, -47.420135498046875, -45.721797943115234, -44.02345657348633, -42.32511901855469, -40.62677764892578, -38.928436279296875, -37.23009490966797, -35.53175735473633, -33.83341598510742, -32.13507843017578, -30.436737060546875, -28.7383975982666, -27.040058135986328, -25.341718673706055, -23.64337921142578, -21.945039749145508, -20.246700286865234, -18.548358917236328, -16.850019454956055, -15.151679992675781, -13.453339576721191, -11.755000114440918, -10.056660652160645, -8.358320236206055, -6.659980773925781, -4.96164083480835, -3.263300895690918, -1.5649614334106445, 0.1333789825439453, 1.8317184448242188, 3.5300583839416504, 5.228398323059082, 6.9267377853393555, 8.625078201293945, 10.323417663574219, 12.021757125854492, 13.720097541809082, 15.418437004089355, 17.116777420043945, 18.81511688232422, 20.513456344604492, 22.211795806884766, 23.910137176513672, 25.608474731445312, 27.30681610107422, 29.005155563354492, 30.703495025634766, 32.40183639526367, 34.10017395019531, 35.79851531982422, 37.496856689453125, 39.195194244384766, 40.89353561401367, 42.59187316894531, 44.29021453857422, 45.98855209350586, 47.686893463134766, 49.385231018066406, 51.08357238769531, 52.78191375732422, 54.48025131225586, 56.178592681884766]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 10.0, 8.0, 8.0, 10.0, 15.0, 13.0, 17.0, 21.0, 29.0, 27.0, 42.0, 47.0, 56.0, 69.0, 90.0, 47.0, 69.0, 55.0, 61.0, 55.0, 46.0, 40.0, 36.0, 22.0, 25.0, 23.0, 15.0, 9.0, 10.0, 7.0, 10.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.689048767089844, -21.85130500793457, -21.013561248779297, -20.175819396972656, -19.338075637817383, -18.50033187866211, -17.66259002685547, -16.824846267700195, -15.987102508544922, -15.149358749389648, -14.311615943908691, -13.473873138427734, -12.636129379272461, -11.798385620117188, -10.96064281463623, -10.122900009155273, -9.28515625, -8.447412490844727, -7.6096696853637695, -6.771926403045654, -5.934183120727539, -5.096439838409424, -4.258696556091309, -3.4209532737731934, -2.583209991455078, -1.745466709136963, -0.9077234268188477, -0.06998014450073242, 0.7677631378173828, 1.605506420135498, 2.4432497024536133, 3.2809929847717285, 4.118736267089844, 4.956479549407959, 5.794222831726074, 6.6319661140441895, 7.469709396362305, 8.307453155517578, 9.145195960998535, 9.982938766479492, 10.820682525634766, 11.658426284790039, 12.496169090270996, 13.333911895751953, 14.171655654907227, 15.0093994140625, 15.847142219543457, 16.684885025024414, 17.522628784179688, 18.36037254333496, 19.198116302490234, 20.035858154296875, 20.87360191345215, 21.711345672607422, 22.549087524414062, 23.386831283569336, 24.22457504272461, 25.062318801879883, 25.900062561035156, 26.737804412841797, 27.57554817199707, 28.413291931152344, 29.251033782958984, 30.088777542114258, 30.92652130126953]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 7.0, 2.0, 3.0, 4.0, 4.0, 7.0, 7.0, 12.0, 32.0, 41.0, 60.0, 102.0, 156.0, 291.0, 580.0, 973.0, 1994.0, 4499.0, 10806.0, 31788.0, 120404.0, 537246.0, 254247.0, 55803.0, 17091.0, 6581.0, 2801.0, 1383.0, 711.0, 369.0, 216.0, 125.0, 83.0, 43.0, 34.0, 15.0, 10.0, 9.0, 6.0, 7.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.484375, -26.66943359375, -25.8544921875, -25.03955078125, -24.224609375, -23.40966796875, -22.5947265625, -21.77978515625, -20.96484375, -20.14990234375, -19.3349609375, -18.52001953125, -17.705078125, -16.89013671875, -16.0751953125, -15.26025390625, -14.4453125, -13.63037109375, -12.8154296875, -12.00048828125, -11.185546875, -10.37060546875, -9.5556640625, -8.74072265625, -7.92578125, -7.11083984375, -6.2958984375, -5.48095703125, -4.666015625, -3.85107421875, -3.0361328125, -2.22119140625, -1.40625, -0.59130859375, 0.2236328125, 1.03857421875, 1.853515625, 2.66845703125, 3.4833984375, 4.29833984375, 5.11328125, 5.92822265625, 6.7431640625, 7.55810546875, 8.373046875, 9.18798828125, 10.0029296875, 10.81787109375, 11.6328125, 12.44775390625, 13.2626953125, 14.07763671875, 14.892578125, 15.70751953125, 16.5224609375, 17.33740234375, 18.15234375, 18.96728515625, 19.7822265625, 20.59716796875, 21.412109375, 22.22705078125, 23.0419921875, 23.85693359375, 24.671875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 6.0, 8.0, 8.0, 5.0, 13.0, 15.0, 26.0, 27.0, 26.0, 39.0, 52.0, 55.0, 58.0, 68.0, 54.0, 60.0, 79.0, 71.0, 56.0, 52.0, 42.0, 34.0, 33.0, 25.0, 26.0, 19.0, 12.0, 10.0, 6.0, 7.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1875, -2.1134033203125, -2.039306640625, -1.9652099609375, -1.89111328125, -1.8170166015625, -1.742919921875, -1.6688232421875, -1.5947265625, -1.5206298828125, -1.446533203125, -1.3724365234375, -1.29833984375, -1.2242431640625, -1.150146484375, -1.0760498046875, -1.001953125, -0.9278564453125, -0.853759765625, -0.7796630859375, -0.70556640625, -0.6314697265625, -0.557373046875, -0.4832763671875, -0.4091796875, -0.3350830078125, -0.260986328125, -0.1868896484375, -0.11279296875, -0.0386962890625, 0.035400390625, 0.1094970703125, 0.18359375, 0.2576904296875, 0.331787109375, 0.4058837890625, 0.47998046875, 0.5540771484375, 0.628173828125, 0.7022705078125, 0.7763671875, 0.8504638671875, 0.924560546875, 0.9986572265625, 1.07275390625, 1.1468505859375, 1.220947265625, 1.2950439453125, 1.369140625, 1.4432373046875, 1.517333984375, 1.5914306640625, 1.66552734375, 1.7396240234375, 1.813720703125, 1.8878173828125, 1.9619140625, 2.0360107421875, 2.110107421875, 2.1842041015625, 2.25830078125, 2.3323974609375, 2.406494140625, 2.4805908203125, 2.5546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 4.0, 25.0, 28.0, 45.0, 49.0, 85.0, 99.0, 159.0, 257.0, 451.0, 646.0, 1096.0, 1795.0, 3093.0, 5644.0, 11431.0, 25399.0, 67262.0, 220980.0, 439017.0, 174086.0, 54710.0, 21041.0, 9482.0, 4790.0, 2750.0, 1579.0, 927.0, 576.0, 358.0, 213.0, 163.0, 90.0, 71.0, 45.0, 26.0, 25.0, 15.0, 18.0, 6.0, 8.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-14.3828125, -13.93896484375, -13.4951171875, -13.05126953125, -12.607421875, -12.16357421875, -11.7197265625, -11.27587890625, -10.83203125, -10.38818359375, -9.9443359375, -9.50048828125, -9.056640625, -8.61279296875, -8.1689453125, -7.72509765625, -7.28125, -6.83740234375, -6.3935546875, -5.94970703125, -5.505859375, -5.06201171875, -4.6181640625, -4.17431640625, -3.73046875, -3.28662109375, -2.8427734375, -2.39892578125, -1.955078125, -1.51123046875, -1.0673828125, -0.62353515625, -0.1796875, 0.26416015625, 0.7080078125, 1.15185546875, 1.595703125, 2.03955078125, 2.4833984375, 2.92724609375, 3.37109375, 3.81494140625, 4.2587890625, 4.70263671875, 5.146484375, 5.59033203125, 6.0341796875, 6.47802734375, 6.921875, 7.36572265625, 7.8095703125, 8.25341796875, 8.697265625, 9.14111328125, 9.5849609375, 10.02880859375, 10.47265625, 10.91650390625, 11.3603515625, 11.80419921875, 12.248046875, 12.69189453125, 13.1357421875, 13.57958984375, 14.0234375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 8.0, 10.0, 12.0, 16.0, 19.0, 17.0, 21.0, 22.0, 31.0, 39.0, 40.0, 39.0, 41.0, 58.0, 62.0, 69.0, 42.0, 55.0, 50.0, 42.0, 55.0, 30.0, 43.0, 41.0, 32.0, 22.0, 12.0, 17.0, 11.0, 15.0, 6.0, 2.0, 7.0, 5.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.15625, -9.849853515625, -9.54345703125, -9.237060546875, -8.9306640625, -8.624267578125, -8.31787109375, -8.011474609375, -7.705078125, -7.398681640625, -7.09228515625, -6.785888671875, -6.4794921875, -6.173095703125, -5.86669921875, -5.560302734375, -5.25390625, -4.947509765625, -4.64111328125, -4.334716796875, -4.0283203125, -3.721923828125, -3.41552734375, -3.109130859375, -2.802734375, -2.496337890625, -2.18994140625, -1.883544921875, -1.5771484375, -1.270751953125, -0.96435546875, -0.657958984375, -0.3515625, -0.045166015625, 0.26123046875, 0.567626953125, 0.8740234375, 1.180419921875, 1.48681640625, 1.793212890625, 2.099609375, 2.406005859375, 2.71240234375, 3.018798828125, 3.3251953125, 3.631591796875, 3.93798828125, 4.244384765625, 4.55078125, 4.857177734375, 5.16357421875, 5.469970703125, 5.7763671875, 6.082763671875, 6.38916015625, 6.695556640625, 7.001953125, 7.308349609375, 7.61474609375, 7.921142578125, 8.2275390625, 8.533935546875, 8.84033203125, 9.146728515625, 9.453125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 3.0, 18.0, 14.0, 16.0, 36.0, 46.0, 100.0, 145.0, 283.0, 485.0, 986.0, 2185.0, 5365.0, 14407.0, 45120.0, 163934.0, 421548.0, 276846.0, 79425.0, 23527.0, 8024.0, 3197.0, 1414.0, 619.0, 336.0, 183.0, 109.0, 72.0, 32.0, 24.0, 14.0, 11.0, 9.0, 11.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.359375, -10.9771728515625, -10.594970703125, -10.2127685546875, -9.83056640625, -9.4483642578125, -9.066162109375, -8.6839599609375, -8.3017578125, -7.9195556640625, -7.537353515625, -7.1551513671875, -6.77294921875, -6.3907470703125, -6.008544921875, -5.6263427734375, -5.244140625, -4.8619384765625, -4.479736328125, -4.0975341796875, -3.71533203125, -3.3331298828125, -2.950927734375, -2.5687255859375, -2.1865234375, -1.8043212890625, -1.422119140625, -1.0399169921875, -0.65771484375, -0.2755126953125, 0.106689453125, 0.4888916015625, 0.87109375, 1.2532958984375, 1.635498046875, 2.0177001953125, 2.39990234375, 2.7821044921875, 3.164306640625, 3.5465087890625, 3.9287109375, 4.3109130859375, 4.693115234375, 5.0753173828125, 5.45751953125, 5.8397216796875, 6.221923828125, 6.6041259765625, 6.986328125, 7.3685302734375, 7.750732421875, 8.1329345703125, 8.51513671875, 8.8973388671875, 9.279541015625, 9.6617431640625, 10.0439453125, 10.4261474609375, 10.808349609375, 11.1905517578125, 11.57275390625, 11.9549560546875, 12.337158203125, 12.7193603515625, 13.1015625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 15.0, 34.0, 67.0, 179.0, 284.0, 199.0, 106.0, 42.0, 25.0, 10.0, 7.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015134811401367188, -0.001452133059501648, -0.0013907849788665771, -0.0013294368982315063, -0.0012680888175964355, -0.0012067407369613647, -0.001145392656326294, -0.0010840445756912231, -0.0010226964950561523, -0.0009613484144210815, -0.0009000003337860107, -0.0008386522531509399, -0.0007773041725158691, -0.0007159560918807983, -0.0006546080112457275, -0.0005932599306106567, -0.0005319118499755859, -0.00047056376934051514, -0.00040921568870544434, -0.00034786760807037354, -0.00028651952743530273, -0.00022517144680023193, -0.00016382336616516113, -0.00010247528553009033, -4.112720489501953e-05, 2.022087574005127e-05, 8.156895637512207e-05, 0.00014291703701019287, 0.00020426511764526367, 0.00026561319828033447, 0.0003269612789154053, 0.0003883093595504761, 0.0004496574401855469, 0.0005110055208206177, 0.0005723536014556885, 0.0006337016820907593, 0.0006950497627258301, 0.0007563978433609009, 0.0008177459239959717, 0.0008790940046310425, 0.0009404420852661133, 0.001001790165901184, 0.0010631382465362549, 0.0011244863271713257, 0.0011858344078063965, 0.0012471824884414673, 0.001308530569076538, 0.0013698786497116089, 0.0014312267303466797, 0.0014925748109817505, 0.0015539228916168213, 0.001615270972251892, 0.0016766190528869629, 0.0017379671335220337, 0.0017993152141571045, 0.0018606632947921753, 0.001922011375427246, 0.001983359456062317, 0.0020447075366973877, 0.0021060556173324585, 0.0021674036979675293, 0.0022287517786026, 0.002290099859237671, 0.0023514479398727417, 0.0024127960205078125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 5.0, 9.0, 10.0, 27.0, 45.0, 32.0, 66.0, 126.0, 199.0, 355.0, 593.0, 1073.0, 1964.0, 3501.0, 6765.0, 13617.0, 28553.0, 63608.0, 137257.0, 247745.0, 259705.0, 151186.0, 69627.0, 31577.0, 15014.0, 7306.0, 3803.0, 2039.0, 1136.0, 655.0, 404.0, 209.0, 117.0, 89.0, 54.0, 30.0, 26.0, 8.0, 12.0, 6.0, 7.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.72265625, -7.4818115234375, -7.240966796875, -7.0001220703125, -6.75927734375, -6.5184326171875, -6.277587890625, -6.0367431640625, -5.7958984375, -5.5550537109375, -5.314208984375, -5.0733642578125, -4.83251953125, -4.5916748046875, -4.350830078125, -4.1099853515625, -3.869140625, -3.6282958984375, -3.387451171875, -3.1466064453125, -2.90576171875, -2.6649169921875, -2.424072265625, -2.1832275390625, -1.9423828125, -1.7015380859375, -1.460693359375, -1.2198486328125, -0.97900390625, -0.7381591796875, -0.497314453125, -0.2564697265625, -0.015625, 0.2252197265625, 0.466064453125, 0.7069091796875, 0.94775390625, 1.1885986328125, 1.429443359375, 1.6702880859375, 1.9111328125, 2.1519775390625, 2.392822265625, 2.6336669921875, 2.87451171875, 3.1153564453125, 3.356201171875, 3.5970458984375, 3.837890625, 4.0787353515625, 4.319580078125, 4.5604248046875, 4.80126953125, 5.0421142578125, 5.282958984375, 5.5238037109375, 5.7646484375, 6.0054931640625, 6.246337890625, 6.4871826171875, 6.72802734375, 6.9688720703125, 7.209716796875, 7.4505615234375, 7.69140625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 2.0, 7.0, 9.0, 8.0, 25.0, 17.0, 19.0, 22.0, 26.0, 37.0, 61.0, 48.0, 76.0, 59.0, 71.0, 53.0, 64.0, 54.0, 72.0, 46.0, 44.0, 33.0, 29.0, 27.0, 17.0, 17.0, 12.0, 11.0, 7.0, 7.0, 6.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6796875, -6.491455078125, -6.30322265625, -6.114990234375, -5.9267578125, -5.738525390625, -5.55029296875, -5.362060546875, -5.173828125, -4.985595703125, -4.79736328125, -4.609130859375, -4.4208984375, -4.232666015625, -4.04443359375, -3.856201171875, -3.66796875, -3.479736328125, -3.29150390625, -3.103271484375, -2.9150390625, -2.726806640625, -2.53857421875, -2.350341796875, -2.162109375, -1.973876953125, -1.78564453125, -1.597412109375, -1.4091796875, -1.220947265625, -1.03271484375, -0.844482421875, -0.65625, -0.468017578125, -0.27978515625, -0.091552734375, 0.0966796875, 0.284912109375, 0.47314453125, 0.661376953125, 0.849609375, 1.037841796875, 1.22607421875, 1.414306640625, 1.6025390625, 1.790771484375, 1.97900390625, 2.167236328125, 2.35546875, 2.543701171875, 2.73193359375, 2.920166015625, 3.1083984375, 3.296630859375, 3.48486328125, 3.673095703125, 3.861328125, 4.049560546875, 4.23779296875, 4.426025390625, 4.6142578125, 4.802490234375, 4.99072265625, 5.178955078125, 5.3671875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 16.0, 24.0, 56.0, 99.0, 154.0, 203.0, 167.0, 114.0, 72.0, 46.0, 20.0, 8.0, 6.0, 6.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.61648559570312, -73.21717071533203, -68.81785583496094, -64.41854858398438, -60.01923370361328, -55.61991882324219, -51.22060775756836, -46.82129669189453, -42.42198181152344, -38.022666931152344, -33.623355865478516, -29.224042892456055, -24.824729919433594, -20.425416946411133, -16.026103973388672, -11.626791000366211, -7.22747802734375, -2.828165054321289, 1.5711479187011719, 5.970460891723633, 10.369773864746094, 14.769086837768555, 19.168399810791016, 23.567712783813477, 27.967025756835938, 32.36634063720703, 36.76565170288086, 41.16496276855469, 45.56427764892578, 49.963592529296875, 54.3629035949707, 58.76221466064453, 63.16154479980469, 67.56085968017578, 71.96017456054688, 76.35948181152344, 80.75879669189453, 85.15811157226562, 89.55741882324219, 93.95673370361328, 98.35604858398438, 102.75536346435547, 107.15467834472656, 111.55398559570312, 115.95330047607422, 120.35261535644531, 124.75192260742188, 129.1512451171875, 133.55055236816406, 137.94985961914062, 142.34918212890625, 146.7484893798828, 151.14779663085938, 155.547119140625, 159.94642639160156, 164.3457489013672, 168.74505615234375, 173.1443634033203, 177.54368591308594, 181.9429931640625, 186.34231567382812, 190.7416229248047, 195.14093017578125, 199.54025268554688, 203.93955993652344]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 8.0, 14.0, 5.0, 16.0, 13.0, 25.0, 41.0, 40.0, 43.0, 50.0, 58.0, 67.0, 85.0, 79.0, 76.0, 77.0, 73.0, 50.0, 48.0, 43.0, 21.0, 23.0, 10.0, 8.0, 11.0, 5.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.6422119140625, -83.86802673339844, -81.09383392333984, -78.31964874267578, -75.54545593261719, -72.77127075195312, -69.99708557128906, -67.22289276123047, -64.44869995117188, -61.67451095581055, -58.90032196044922, -56.126136779785156, -53.35194396972656, -50.5777587890625, -47.80356979370117, -45.029380798339844, -42.25519561767578, -39.48100662231445, -36.706817626953125, -33.93263244628906, -31.1584415435791, -28.384252548217773, -25.610065460205078, -22.83587646484375, -20.061687469482422, -17.287498474121094, -14.513310432434082, -11.73912239074707, -8.964933395385742, -6.190744400024414, -3.4165573120117188, -0.6423683166503906, 2.1318130493164062, 4.906001567840576, 7.680190086364746, 10.454378128051758, 13.228567123413086, 16.002756118774414, 18.77694320678711, 21.551132202148438, 24.325321197509766, 27.099510192871094, 29.873699188232422, 32.64788818359375, 35.42207336425781, 38.196266174316406, 40.97045135498047, 43.7446403503418, 46.518829345703125, 49.29301834106445, 52.06720733642578, 54.841392517089844, 57.61558532714844, 60.3897705078125, 63.16395950317383, 65.93814849853516, 68.71234130859375, 71.48652648925781, 74.2607192993164, 77.03490447998047, 79.80909729003906, 82.58328247070312, 85.35746765136719, 88.13166046142578, 90.90584564208984]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 4.0, 6.0, 12.0, 17.0, 26.0, 40.0, 56.0, 92.0, 118.0, 174.0, 268.0, 392.0, 653.0, 1024.0, 1724.0, 2871.0, 4886.0, 8887.0, 16985.0, 36851.0, 101079.0, 596391.0, 3155171.0, 166823.0, 52073.0, 22255.0, 11055.0, 5760.0, 3353.0, 1957.0, 1217.0, 714.0, 453.0, 315.0, 176.0, 120.0, 89.0, 43.0, 47.0, 26.0, 29.0, 15.0, 8.0, 14.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-35.3125, -34.1025390625, -32.892578125, -31.6826171875, -30.47265625, -29.2626953125, -28.052734375, -26.8427734375, -25.6328125, -24.4228515625, -23.212890625, -22.0029296875, -20.79296875, -19.5830078125, -18.373046875, -17.1630859375, -15.953125, -14.7431640625, -13.533203125, -12.3232421875, -11.11328125, -9.9033203125, -8.693359375, -7.4833984375, -6.2734375, -5.0634765625, -3.853515625, -2.6435546875, -1.43359375, -0.2236328125, 0.986328125, 2.1962890625, 3.40625, 4.6162109375, 5.826171875, 7.0361328125, 8.24609375, 9.4560546875, 10.666015625, 11.8759765625, 13.0859375, 14.2958984375, 15.505859375, 16.7158203125, 17.92578125, 19.1357421875, 20.345703125, 21.5556640625, 22.765625, 23.9755859375, 25.185546875, 26.3955078125, 27.60546875, 28.8154296875, 30.025390625, 31.2353515625, 32.4453125, 33.6552734375, 34.865234375, 36.0751953125, 37.28515625, 38.4951171875, 39.705078125, 40.9150390625, 42.125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 6.0, 7.0, 4.0, 8.0, 9.0, 20.0, 15.0, 16.0, 19.0, 21.0, 33.0, 33.0, 25.0, 26.0, 35.0, 38.0, 48.0, 59.0, 56.0, 63.0, 43.0, 53.0, 40.0, 43.0, 37.0, 40.0, 31.0, 21.0, 34.0, 23.0, 15.0, 8.0, 13.0, 16.0, 12.0, 8.0, 3.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.787109375, -1.729949951171875, -1.67279052734375, -1.615631103515625, -1.5584716796875, -1.501312255859375, -1.44415283203125, -1.386993408203125, -1.329833984375, -1.272674560546875, -1.21551513671875, -1.158355712890625, -1.1011962890625, -1.044036865234375, -0.98687744140625, -0.929718017578125, -0.87255859375, -0.815399169921875, -0.75823974609375, -0.701080322265625, -0.6439208984375, -0.586761474609375, -0.52960205078125, -0.472442626953125, -0.415283203125, -0.358123779296875, -0.30096435546875, -0.243804931640625, -0.1866455078125, -0.129486083984375, -0.07232666015625, -0.015167236328125, 0.0419921875, 0.099151611328125, 0.15631103515625, 0.213470458984375, 0.2706298828125, 0.327789306640625, 0.38494873046875, 0.442108154296875, 0.499267578125, 0.556427001953125, 0.61358642578125, 0.670745849609375, 0.7279052734375, 0.785064697265625, 0.84222412109375, 0.899383544921875, 0.95654296875, 1.013702392578125, 1.07086181640625, 1.128021240234375, 1.1851806640625, 1.242340087890625, 1.29949951171875, 1.356658935546875, 1.413818359375, 1.470977783203125, 1.52813720703125, 1.585296630859375, 1.6424560546875, 1.699615478515625, 1.75677490234375, 1.813934326171875, 1.87109375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 11.0, 16.0, 19.0, 36.0, 60.0, 82.0, 196.0, 284.0, 854.0, 4983.0, 97144.0, 3972283.0, 111388.0, 5386.0, 813.0, 300.0, 148.0, 89.0, 63.0, 42.0, 18.0, 19.0, 14.0, 9.0, 2.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-148.875, -144.296875, -139.71875, -135.140625, -130.5625, -125.984375, -121.40625, -116.828125, -112.25, -107.671875, -103.09375, -98.515625, -93.9375, -89.359375, -84.78125, -80.203125, -75.625, -71.046875, -66.46875, -61.890625, -57.3125, -52.734375, -48.15625, -43.578125, -39.0, -34.421875, -29.84375, -25.265625, -20.6875, -16.109375, -11.53125, -6.953125, -2.375, 2.203125, 6.78125, 11.359375, 15.9375, 20.515625, 25.09375, 29.671875, 34.25, 38.828125, 43.40625, 47.984375, 52.5625, 57.140625, 61.71875, 66.296875, 70.875, 75.453125, 80.03125, 84.609375, 89.1875, 93.765625, 98.34375, 102.921875, 107.5, 112.078125, 116.65625, 121.234375, 125.8125, 130.390625, 134.96875, 139.546875, 144.125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 7.0, 5.0, 4.0, 13.0, 11.0, 13.0, 22.0, 34.0, 29.0, 45.0, 60.0, 92.0, 182.0, 281.0, 655.0, 1577.0, 430.0, 215.0, 113.0, 85.0, 64.0, 50.0, 33.0, 17.0, 13.0, 3.0, 7.0, 10.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1953125, -7.948486328125, -7.70166015625, -7.454833984375, -7.2080078125, -6.961181640625, -6.71435546875, -6.467529296875, -6.220703125, -5.973876953125, -5.72705078125, -5.480224609375, -5.2333984375, -4.986572265625, -4.73974609375, -4.492919921875, -4.24609375, -3.999267578125, -3.75244140625, -3.505615234375, -3.2587890625, -3.011962890625, -2.76513671875, -2.518310546875, -2.271484375, -2.024658203125, -1.77783203125, -1.531005859375, -1.2841796875, -1.037353515625, -0.79052734375, -0.543701171875, -0.296875, -0.050048828125, 0.19677734375, 0.443603515625, 0.6904296875, 0.937255859375, 1.18408203125, 1.430908203125, 1.677734375, 1.924560546875, 2.17138671875, 2.418212890625, 2.6650390625, 2.911865234375, 3.15869140625, 3.405517578125, 3.65234375, 3.899169921875, 4.14599609375, 4.392822265625, 4.6396484375, 4.886474609375, 5.13330078125, 5.380126953125, 5.626953125, 5.873779296875, 6.12060546875, 6.367431640625, 6.6142578125, 6.861083984375, 7.10791015625, 7.354736328125, 7.6015625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 4.0, 9.0, 11.0, 18.0, 30.0, 31.0, 34.0, 73.0, 94.0, 81.0, 112.0, 123.0, 103.0, 72.0, 63.0, 39.0, 42.0, 21.0, 14.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.46728515625, -58.737606048583984, -57.007930755615234, -55.27825164794922, -53.5485725402832, -51.81889343261719, -50.08921813964844, -48.35953903198242, -46.629859924316406, -44.90018081665039, -43.17050552368164, -41.440826416015625, -39.71114730834961, -37.981468200683594, -36.251792907714844, -34.52211380004883, -32.79243850708008, -31.062761306762695, -29.33308219909668, -27.603404998779297, -25.87372589111328, -24.1440486907959, -22.414371490478516, -20.6846923828125, -18.955015182495117, -17.225337982177734, -15.495658874511719, -13.765981674194336, -12.036303520202637, -10.306625366210938, -8.576948165893555, -6.8472700119018555, -5.117591857910156, -3.387913942337036, -1.658236026763916, 0.071441650390625, 1.8011198043823242, 3.5307979583740234, 5.260475158691406, 6.9901533126831055, 8.719831466674805, 10.449509620666504, 12.179187774658203, 13.908864974975586, 15.638543128967285, 17.368221282958984, 19.097898483276367, 20.82757568359375, 22.557254791259766, 24.28693199157715, 26.016611099243164, 27.746288299560547, 29.475967407226562, 31.205644607543945, 32.93532180786133, 34.665000915527344, 36.394676208496094, 38.12435531616211, 39.85403060913086, 41.583709716796875, 43.31338882446289, 45.043067932128906, 46.772743225097656, 48.50242233276367, 50.23210144042969]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 2.0, 3.0, 7.0, 6.0, 4.0, 14.0, 12.0, 12.0, 15.0, 21.0, 20.0, 35.0, 33.0, 34.0, 34.0, 45.0, 42.0, 44.0, 43.0, 45.0, 44.0, 53.0, 42.0, 64.0, 47.0, 39.0, 38.0, 35.0, 28.0, 35.0, 15.0, 19.0, 11.0, 22.0, 13.0, 5.0, 9.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-37.74311828613281, -36.74064254760742, -35.73816680908203, -34.735694885253906, -33.733219146728516, -32.730743408203125, -31.728269577026367, -30.72579574584961, -29.72332000732422, -28.720844268798828, -27.71837043762207, -26.715896606445312, -25.713420867919922, -24.71094512939453, -23.708471298217773, -22.705997467041016, -21.703521728515625, -20.701045989990234, -19.698572158813477, -18.69609832763672, -17.693622589111328, -16.691146850585938, -15.68867301940918, -14.686198234558105, -13.683723449707031, -12.681248664855957, -11.678773880004883, -10.676299095153809, -9.673824310302734, -8.67134952545166, -7.668874740600586, -6.666399955749512, -5.663928985595703, -4.661454200744629, -3.6589794158935547, -2.6565046310424805, -1.6540298461914062, -0.651555061340332, 0.3509197235107422, 1.3533945083618164, 2.3558692932128906, 3.358344078063965, 4.360818862915039, 5.363293647766113, 6.3657684326171875, 7.368243217468262, 8.370718002319336, 9.37319278717041, 10.375667572021484, 11.378142356872559, 12.380617141723633, 13.383091926574707, 14.385566711425781, 15.388041496276855, 16.39051628112793, 17.392990112304688, 18.395465850830078, 19.39794158935547, 20.400415420532227, 21.402889251708984, 22.405364990234375, 23.407840728759766, 24.410314559936523, 25.41278839111328, 26.415264129638672]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 9.0, 10.0, 16.0, 18.0, 39.0, 56.0, 66.0, 116.0, 116.0, 241.0, 316.0, 502.0, 690.0, 1103.0, 1670.0, 2628.0, 3822.0, 6118.0, 9319.0, 15378.0, 23997.0, 37458.0, 58637.0, 90336.0, 127972.0, 161209.0, 155587.0, 119964.0, 82488.0, 53889.0, 34565.0, 21601.0, 13559.0, 8912.0, 5556.0, 3642.0, 2373.0, 1516.0, 1035.0, 705.0, 439.0, 297.0, 201.0, 129.0, 83.0, 62.0, 35.0, 29.0, 16.0, 14.0, 5.0, 8.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-12.0390625, -11.6494140625, -11.259765625, -10.8701171875, -10.48046875, -10.0908203125, -9.701171875, -9.3115234375, -8.921875, -8.5322265625, -8.142578125, -7.7529296875, -7.36328125, -6.9736328125, -6.583984375, -6.1943359375, -5.8046875, -5.4150390625, -5.025390625, -4.6357421875, -4.24609375, -3.8564453125, -3.466796875, -3.0771484375, -2.6875, -2.2978515625, -1.908203125, -1.5185546875, -1.12890625, -0.7392578125, -0.349609375, 0.0400390625, 0.4296875, 0.8193359375, 1.208984375, 1.5986328125, 1.98828125, 2.3779296875, 2.767578125, 3.1572265625, 3.546875, 3.9365234375, 4.326171875, 4.7158203125, 5.10546875, 5.4951171875, 5.884765625, 6.2744140625, 6.6640625, 7.0537109375, 7.443359375, 7.8330078125, 8.22265625, 8.6123046875, 9.001953125, 9.3916015625, 9.78125, 10.1708984375, 10.560546875, 10.9501953125, 11.33984375, 11.7294921875, 12.119140625, 12.5087890625, 12.8984375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 4.0, 9.0, 3.0, 7.0, 12.0, 7.0, 10.0, 16.0, 18.0, 17.0, 14.0, 27.0, 21.0, 40.0, 25.0, 28.0, 25.0, 34.0, 37.0, 34.0, 46.0, 40.0, 36.0, 46.0, 46.0, 40.0, 46.0, 54.0, 32.0, 32.0, 26.0, 27.0, 24.0, 15.0, 21.0, 17.0, 11.0, 9.0, 7.0, 9.0, 8.0, 5.0, 5.0, 1.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.654296875, -1.5994720458984375, -1.544647216796875, -1.4898223876953125, -1.43499755859375, -1.3801727294921875, -1.325347900390625, -1.2705230712890625, -1.2156982421875, -1.1608734130859375, -1.106048583984375, -1.0512237548828125, -0.99639892578125, -0.9415740966796875, -0.886749267578125, -0.8319244384765625, -0.777099609375, -0.7222747802734375, -0.667449951171875, -0.6126251220703125, -0.55780029296875, -0.5029754638671875, -0.448150634765625, -0.3933258056640625, -0.3385009765625, -0.2836761474609375, -0.228851318359375, -0.1740264892578125, -0.11920166015625, -0.0643768310546875, -0.009552001953125, 0.0452728271484375, 0.10009765625, 0.1549224853515625, 0.209747314453125, 0.2645721435546875, 0.31939697265625, 0.3742218017578125, 0.429046630859375, 0.4838714599609375, 0.5386962890625, 0.5935211181640625, 0.648345947265625, 0.7031707763671875, 0.75799560546875, 0.8128204345703125, 0.867645263671875, 0.9224700927734375, 0.977294921875, 1.0321197509765625, 1.086944580078125, 1.1417694091796875, 1.19659423828125, 1.2514190673828125, 1.306243896484375, 1.3610687255859375, 1.4158935546875, 1.4707183837890625, 1.525543212890625, 1.5803680419921875, 1.63519287109375, 1.6900177001953125, 1.744842529296875, 1.7996673583984375, 1.8544921875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 7.0, 8.0, 12.0, 17.0, 33.0, 78.0, 117.0, 217.0, 474.0, 921.0, 2161.0, 5920.0, 19335.0, 78743.0, 295138.0, 436053.0, 154275.0, 38271.0, 10418.0, 3493.0, 1456.0, 676.0, 355.0, 169.0, 75.0, 52.0, 24.0, 23.0, 11.0, 10.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.8125, -38.451171875, -37.08984375, -35.728515625, -34.3671875, -33.005859375, -31.64453125, -30.283203125, -28.921875, -27.560546875, -26.19921875, -24.837890625, -23.4765625, -22.115234375, -20.75390625, -19.392578125, -18.03125, -16.669921875, -15.30859375, -13.947265625, -12.5859375, -11.224609375, -9.86328125, -8.501953125, -7.140625, -5.779296875, -4.41796875, -3.056640625, -1.6953125, -0.333984375, 1.02734375, 2.388671875, 3.75, 5.111328125, 6.47265625, 7.833984375, 9.1953125, 10.556640625, 11.91796875, 13.279296875, 14.640625, 16.001953125, 17.36328125, 18.724609375, 20.0859375, 21.447265625, 22.80859375, 24.169921875, 25.53125, 26.892578125, 28.25390625, 29.615234375, 30.9765625, 32.337890625, 33.69921875, 35.060546875, 36.421875, 37.783203125, 39.14453125, 40.505859375, 41.8671875, 43.228515625, 44.58984375, 45.951171875, 47.3125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 10.0, 5.0, 4.0, 8.0, 14.0, 10.0, 14.0, 16.0, 15.0, 28.0, 23.0, 35.0, 29.0, 44.0, 40.0, 28.0, 44.0, 45.0, 47.0, 47.0, 53.0, 44.0, 42.0, 32.0, 48.0, 37.0, 29.0, 26.0, 44.0, 22.0, 19.0, 19.0, 13.0, 12.0, 10.0, 12.0, 7.0, 6.0, 7.0, 9.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-13.8984375, -13.4517822265625, -13.005126953125, -12.5584716796875, -12.11181640625, -11.6651611328125, -11.218505859375, -10.7718505859375, -10.3251953125, -9.8785400390625, -9.431884765625, -8.9852294921875, -8.53857421875, -8.0919189453125, -7.645263671875, -7.1986083984375, -6.751953125, -6.3052978515625, -5.858642578125, -5.4119873046875, -4.96533203125, -4.5186767578125, -4.072021484375, -3.6253662109375, -3.1787109375, -2.7320556640625, -2.285400390625, -1.8387451171875, -1.39208984375, -0.9454345703125, -0.498779296875, -0.0521240234375, 0.39453125, 0.8411865234375, 1.287841796875, 1.7344970703125, 2.18115234375, 2.6278076171875, 3.074462890625, 3.5211181640625, 3.9677734375, 4.4144287109375, 4.861083984375, 5.3077392578125, 5.75439453125, 6.2010498046875, 6.647705078125, 7.0943603515625, 7.541015625, 7.9876708984375, 8.434326171875, 8.8809814453125, 9.32763671875, 9.7742919921875, 10.220947265625, 10.6676025390625, 11.1142578125, 11.5609130859375, 12.007568359375, 12.4542236328125, 12.90087890625, 13.3475341796875, 13.794189453125, 14.2408447265625, 14.6875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 4.0, 3.0, 4.0, 7.0, 13.0, 16.0, 15.0, 22.0, 35.0, 63.0, 111.0, 136.0, 192.0, 285.0, 480.0, 852.0, 1476.0, 2860.0, 5851.0, 14101.0, 43576.0, 213277.0, 548535.0, 159010.0, 34637.0, 11927.0, 5161.0, 2532.0, 1331.0, 796.0, 431.0, 295.0, 171.0, 129.0, 60.0, 53.0, 30.0, 21.0, 21.0, 11.0, 15.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-35.21875, -34.09765625, -32.9765625, -31.85546875, -30.734375, -29.61328125, -28.4921875, -27.37109375, -26.25, -25.12890625, -24.0078125, -22.88671875, -21.765625, -20.64453125, -19.5234375, -18.40234375, -17.28125, -16.16015625, -15.0390625, -13.91796875, -12.796875, -11.67578125, -10.5546875, -9.43359375, -8.3125, -7.19140625, -6.0703125, -4.94921875, -3.828125, -2.70703125, -1.5859375, -0.46484375, 0.65625, 1.77734375, 2.8984375, 4.01953125, 5.140625, 6.26171875, 7.3828125, 8.50390625, 9.625, 10.74609375, 11.8671875, 12.98828125, 14.109375, 15.23046875, 16.3515625, 17.47265625, 18.59375, 19.71484375, 20.8359375, 21.95703125, 23.078125, 24.19921875, 25.3203125, 26.44140625, 27.5625, 28.68359375, 29.8046875, 30.92578125, 32.046875, 33.16796875, 34.2890625, 35.41015625, 36.53125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 7.0, 4.0, 12.0, 12.0, 18.0, 25.0, 20.0, 41.0, 24.0, 48.0, 57.0, 101.0, 104.0, 95.0, 104.0, 83.0, 54.0, 49.0, 36.0, 26.0, 22.0, 11.0, 12.0, 11.0, 5.0, 4.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003467559814453125, -0.0033602118492126465, -0.003252863883972168, -0.0031455159187316895, -0.003038167953491211, -0.0029308199882507324, -0.002823472023010254, -0.0027161240577697754, -0.002608776092529297, -0.0025014281272888184, -0.00239408016204834, -0.0022867321968078613, -0.002179384231567383, -0.0020720362663269043, -0.0019646883010864258, -0.0018573403358459473, -0.0017499923706054688, -0.0016426444053649902, -0.0015352964401245117, -0.0014279484748840332, -0.0013206005096435547, -0.0012132525444030762, -0.0011059045791625977, -0.0009985566139221191, -0.0008912086486816406, -0.0007838606834411621, -0.0006765127182006836, -0.0005691647529602051, -0.00046181678771972656, -0.00035446882247924805, -0.00024712085723876953, -0.00013977289199829102, -3.24249267578125e-05, 7.492303848266602e-05, 0.00018227100372314453, 0.00028961896896362305, 0.00039696693420410156, 0.0005043148994445801, 0.0006116628646850586, 0.0007190108299255371, 0.0008263587951660156, 0.0009337067604064941, 0.0010410547256469727, 0.0011484026908874512, 0.0012557506561279297, 0.0013630986213684082, 0.0014704465866088867, 0.0015777945518493652, 0.0016851425170898438, 0.0017924904823303223, 0.0018998384475708008, 0.0020071864128112793, 0.002114534378051758, 0.0022218823432922363, 0.002329230308532715, 0.0024365782737731934, 0.002543926239013672, 0.0026512742042541504, 0.002758622169494629, 0.0028659701347351074, 0.002973318099975586, 0.0030806660652160645, 0.003188014030456543, 0.0032953619956970215, 0.0034027099609375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 11.0, 12.0, 17.0, 14.0, 21.0, 39.0, 43.0, 75.0, 107.0, 167.0, 229.0, 337.0, 519.0, 784.0, 1233.0, 1957.0, 3273.0, 5628.0, 10962.0, 24009.0, 65414.0, 225534.0, 424839.0, 185259.0, 54398.0, 20570.0, 9696.0, 5193.0, 2972.0, 1837.0, 1150.0, 723.0, 481.0, 297.0, 229.0, 135.0, 128.0, 67.0, 44.0, 32.0, 39.0, 20.0, 14.0, 5.0, 5.0, 9.0, 6.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0], "bins": [-24.875, -24.130615234375, -23.38623046875, -22.641845703125, -21.8974609375, -21.153076171875, -20.40869140625, -19.664306640625, -18.919921875, -18.175537109375, -17.43115234375, -16.686767578125, -15.9423828125, -15.197998046875, -14.45361328125, -13.709228515625, -12.96484375, -12.220458984375, -11.47607421875, -10.731689453125, -9.9873046875, -9.242919921875, -8.49853515625, -7.754150390625, -7.009765625, -6.265380859375, -5.52099609375, -4.776611328125, -4.0322265625, -3.287841796875, -2.54345703125, -1.799072265625, -1.0546875, -0.310302734375, 0.43408203125, 1.178466796875, 1.9228515625, 2.667236328125, 3.41162109375, 4.156005859375, 4.900390625, 5.644775390625, 6.38916015625, 7.133544921875, 7.8779296875, 8.622314453125, 9.36669921875, 10.111083984375, 10.85546875, 11.599853515625, 12.34423828125, 13.088623046875, 13.8330078125, 14.577392578125, 15.32177734375, 16.066162109375, 16.810546875, 17.554931640625, 18.29931640625, 19.043701171875, 19.7880859375, 20.532470703125, 21.27685546875, 22.021240234375, 22.765625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 5.0, 0.0, 3.0, 4.0, 5.0, 10.0, 7.0, 5.0, 21.0, 14.0, 22.0, 44.0, 41.0, 50.0, 68.0, 78.0, 101.0, 99.0, 96.0, 81.0, 47.0, 48.0, 26.0, 26.0, 20.0, 18.0, 7.0, 14.0, 7.0, 6.0, 2.0, 5.0, 4.0, 7.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.40625, -15.894287109375, -15.38232421875, -14.870361328125, -14.3583984375, -13.846435546875, -13.33447265625, -12.822509765625, -12.310546875, -11.798583984375, -11.28662109375, -10.774658203125, -10.2626953125, -9.750732421875, -9.23876953125, -8.726806640625, -8.21484375, -7.702880859375, -7.19091796875, -6.678955078125, -6.1669921875, -5.655029296875, -5.14306640625, -4.631103515625, -4.119140625, -3.607177734375, -3.09521484375, -2.583251953125, -2.0712890625, -1.559326171875, -1.04736328125, -0.535400390625, -0.0234375, 0.488525390625, 1.00048828125, 1.512451171875, 2.0244140625, 2.536376953125, 3.04833984375, 3.560302734375, 4.072265625, 4.584228515625, 5.09619140625, 5.608154296875, 6.1201171875, 6.632080078125, 7.14404296875, 7.656005859375, 8.16796875, 8.679931640625, 9.19189453125, 9.703857421875, 10.2158203125, 10.727783203125, 11.23974609375, 11.751708984375, 12.263671875, 12.775634765625, 13.28759765625, 13.799560546875, 14.3115234375, 14.823486328125, 15.33544921875, 15.847412109375, 16.359375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 7.0, 12.0, 18.0, 31.0, 87.0, 113.0, 168.0, 199.0, 177.0, 87.0, 53.0, 23.0, 11.0, 8.0, 4.0, 1.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-189.0165252685547, -177.53866577148438, -166.06082153320312, -154.5829620361328, -143.10511779785156, -131.62725830078125, -120.14940643310547, -108.67155456542969, -97.1937026977539, -85.71585083007812, -74.23799896240234, -62.7601432800293, -51.282291412353516, -39.804439544677734, -28.326583862304688, -16.848731994628906, -5.370880126953125, 6.106972694396973, 17.58482551574707, 29.062679290771484, 40.540531158447266, 52.01838302612305, 63.496238708496094, 74.97409057617188, 86.45194244384766, 97.92979431152344, 109.40764617919922, 120.885498046875, 132.3633575439453, 143.84120178222656, 155.31906127929688, 166.79690551757812, 178.27474975585938, 189.7526092529297, 201.23045349121094, 212.70831298828125, 224.1861572265625, 235.6640167236328, 247.14187622070312, 258.6197204589844, 270.0975646972656, 281.5754089355469, 293.05328369140625, 304.5311279296875, 316.00897216796875, 327.48681640625, 338.9646911621094, 350.4425354003906, 361.92041015625, 373.39825439453125, 384.8761291503906, 396.3539733886719, 407.8318176269531, 419.3096618652344, 430.78753662109375, 442.265380859375, 453.74322509765625, 465.2210693359375, 476.6989440917969, 488.1767883300781, 499.6546325683594, 511.1324768066406, 522.6103515625, 534.0881958007812, 545.5660400390625]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 6.0, 13.0, 17.0, 19.0, 28.0, 38.0, 38.0, 47.0, 41.0, 65.0, 78.0, 71.0, 88.0, 65.0, 68.0, 64.0, 57.0, 43.0, 43.0, 29.0, 20.0, 16.0, 14.0, 9.0, 14.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-179.1793975830078, -173.3857421875, -167.59210205078125, -161.79844665527344, -156.0048065185547, -150.21115112304688, -144.41751098632812, -138.6238555908203, -132.8302001953125, -127.03655242919922, -121.24290466308594, -115.44924926757812, -109.65560913085938, -103.86195373535156, -98.06830596923828, -92.274658203125, -86.48101806640625, -80.68737030029297, -74.89372253417969, -69.10006713867188, -63.30642318725586, -57.51277542114258, -51.71912384033203, -45.92547607421875, -40.13182830810547, -34.33818054199219, -28.544530868530273, -22.75088119506836, -16.957233428955078, -11.163585662841797, -5.36993408203125, 0.42371368408203125, 6.21734619140625, 12.010994911193848, 17.804643630981445, 23.59829330444336, 29.39194107055664, 35.18558883666992, 40.97924041748047, 46.77288818359375, 52.56653594970703, 58.36018371582031, 64.1538314819336, 69.94747924804688, 75.74113464355469, 81.53477478027344, 87.32843017578125, 93.12207794189453, 98.91572570800781, 104.7093734741211, 110.50302124023438, 116.29667663574219, 122.09031677246094, 127.88397216796875, 133.6776123046875, 139.4712677001953, 145.26492309570312, 151.05857849121094, 156.8522186279297, 162.6458740234375, 168.43951416015625, 174.23316955566406, 180.02682495117188, 185.82046508789062, 191.61410522460938]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 4.0, 10.0, 17.0, 17.0, 33.0, 67.0, 88.0, 194.0, 597.0, 2413.0, 18610.0, 538328.0, 3598158.0, 31366.0, 3367.0, 572.0, 191.0, 89.0, 60.0, 40.0, 24.0, 17.0, 10.0, 8.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-156.125, -150.14453125, -144.1640625, -138.18359375, -132.203125, -126.22265625, -120.2421875, -114.26171875, -108.28125, -102.30078125, -96.3203125, -90.33984375, -84.359375, -78.37890625, -72.3984375, -66.41796875, -60.4375, -54.45703125, -48.4765625, -42.49609375, -36.515625, -30.53515625, -24.5546875, -18.57421875, -12.59375, -6.61328125, -0.6328125, 5.34765625, 11.328125, 17.30859375, 23.2890625, 29.26953125, 35.25, 41.23046875, 47.2109375, 53.19140625, 59.171875, 65.15234375, 71.1328125, 77.11328125, 83.09375, 89.07421875, 95.0546875, 101.03515625, 107.015625, 112.99609375, 118.9765625, 124.95703125, 130.9375, 136.91796875, 142.8984375, 148.87890625, 154.859375, 160.83984375, 166.8203125, 172.80078125, 178.78125, 184.76171875, 190.7421875, 196.72265625, 202.703125, 208.68359375, 214.6640625, 220.64453125, 226.625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 13.0, 16.0, 19.0, 25.0, 34.0, 55.0, 71.0, 65.0, 70.0, 107.0, 91.0, 82.0, 88.0, 64.0, 54.0, 37.0, 31.0, 27.0, 19.0, 9.0, 11.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09765625, -4.92889404296875, -4.7601318359375, -4.59136962890625, -4.422607421875, -4.25384521484375, -4.0850830078125, -3.91632080078125, -3.74755859375, -3.57879638671875, -3.4100341796875, -3.24127197265625, -3.072509765625, -2.90374755859375, -2.7349853515625, -2.56622314453125, -2.3974609375, -2.22869873046875, -2.0599365234375, -1.89117431640625, -1.722412109375, -1.55364990234375, -1.3848876953125, -1.21612548828125, -1.04736328125, -0.87860107421875, -0.7098388671875, -0.54107666015625, -0.372314453125, -0.20355224609375, -0.0347900390625, 0.13397216796875, 0.302734375, 0.47149658203125, 0.6402587890625, 0.80902099609375, 0.977783203125, 1.14654541015625, 1.3153076171875, 1.48406982421875, 1.65283203125, 1.82159423828125, 1.9903564453125, 2.15911865234375, 2.327880859375, 2.49664306640625, 2.6654052734375, 2.83416748046875, 3.0029296875, 3.17169189453125, 3.3404541015625, 3.50921630859375, 3.677978515625, 3.84674072265625, 4.0155029296875, 4.18426513671875, 4.35302734375, 4.52178955078125, 4.6905517578125, 4.85931396484375, 5.028076171875, 5.19683837890625, 5.3656005859375, 5.53436279296875, 5.703125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 2.0, 5.0, 7.0, 10.0, 10.0, 18.0, 11.0, 23.0, 24.0, 34.0, 37.0, 46.0, 69.0, 118.0, 435.0, 2520.0, 23020.0, 514919.0, 3570769.0, 75198.0, 5810.0, 768.0, 175.0, 44.0, 35.0, 37.0, 17.0, 23.0, 17.0, 20.0, 21.0, 10.0, 12.0, 6.0, 6.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-182.5, -177.724609375, -172.94921875, -168.173828125, -163.3984375, -158.623046875, -153.84765625, -149.072265625, -144.296875, -139.521484375, -134.74609375, -129.970703125, -125.1953125, -120.419921875, -115.64453125, -110.869140625, -106.09375, -101.318359375, -96.54296875, -91.767578125, -86.9921875, -82.216796875, -77.44140625, -72.666015625, -67.890625, -63.115234375, -58.33984375, -53.564453125, -48.7890625, -44.013671875, -39.23828125, -34.462890625, -29.6875, -24.912109375, -20.13671875, -15.361328125, -10.5859375, -5.810546875, -1.03515625, 3.740234375, 8.515625, 13.291015625, 18.06640625, 22.841796875, 27.6171875, 32.392578125, 37.16796875, 41.943359375, 46.71875, 51.494140625, 56.26953125, 61.044921875, 65.8203125, 70.595703125, 75.37109375, 80.146484375, 84.921875, 89.697265625, 94.47265625, 99.248046875, 104.0234375, 108.798828125, 113.57421875, 118.349609375, 123.125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 5.0, 12.0, 25.0, 40.0, 59.0, 111.0, 190.0, 383.0, 1774.0, 823.0, 309.0, 169.0, 72.0, 43.0, 36.0, 13.0, 11.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-35.21875, -34.5260009765625, -33.833251953125, -33.1405029296875, -32.44775390625, -31.7550048828125, -31.062255859375, -30.3695068359375, -29.6767578125, -28.9840087890625, -28.291259765625, -27.5985107421875, -26.90576171875, -26.2130126953125, -25.520263671875, -24.8275146484375, -24.134765625, -23.4420166015625, -22.749267578125, -22.0565185546875, -21.36376953125, -20.6710205078125, -19.978271484375, -19.2855224609375, -18.5927734375, -17.9000244140625, -17.207275390625, -16.5145263671875, -15.82177734375, -15.1290283203125, -14.436279296875, -13.7435302734375, -13.05078125, -12.3580322265625, -11.665283203125, -10.9725341796875, -10.27978515625, -9.5870361328125, -8.894287109375, -8.2015380859375, -7.5087890625, -6.8160400390625, -6.123291015625, -5.4305419921875, -4.73779296875, -4.0450439453125, -3.352294921875, -2.6595458984375, -1.966796875, -1.2740478515625, -0.581298828125, 0.1114501953125, 0.80419921875, 1.4969482421875, 2.189697265625, 2.8824462890625, 3.5751953125, 4.2679443359375, 4.960693359375, 5.6534423828125, 6.34619140625, 7.0389404296875, 7.731689453125, 8.4244384765625, 9.1171875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 11.0, 8.0, 22.0, 27.0, 58.0, 99.0, 129.0, 171.0, 157.0, 131.0, 84.0, 42.0, 27.0, 16.0, 6.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.67965698242188, -86.5381088256836, -82.39656829833984, -78.25502014160156, -74.11347961425781, -69.97193145751953, -65.83038330078125, -61.6888427734375, -57.547298431396484, -53.40575408935547, -49.26420974731445, -45.12266540527344, -40.981117248535156, -36.839576721191406, -32.698028564453125, -28.55648422241211, -24.414939880371094, -20.273395538330078, -16.131851196289062, -11.990304946899414, -7.848760604858398, -3.707216262817383, 0.4343299865722656, 4.575874328613281, 8.717418670654297, 12.858963012695312, 17.000507354736328, 21.142053604125977, 25.283597946166992, 29.425142288208008, 33.566688537597656, 37.70823287963867, 41.84977722167969, 45.9913215637207, 50.13286590576172, 54.2744140625, 58.41595458984375, 62.55750274658203, 66.69905090332031, 70.84059143066406, 74.98213195800781, 79.1236801147461, 83.26522064208984, 87.40676879882812, 91.54830932617188, 95.68985748291016, 99.83140563964844, 103.97294616699219, 108.11449432373047, 112.25604248046875, 116.3975830078125, 120.53913116455078, 124.68067169189453, 128.8222198486328, 132.96376037597656, 137.10531616210938, 141.24685668945312, 145.38839721679688, 149.5299530029297, 153.67149353027344, 157.8130340576172, 161.95457458496094, 166.09613037109375, 170.2376708984375, 174.37921142578125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0, 7.0, 3.0, 8.0, 8.0, 12.0, 17.0, 13.0, 17.0, 17.0, 17.0, 21.0, 22.0, 33.0, 31.0, 32.0, 42.0, 41.0, 45.0, 56.0, 31.0, 37.0, 47.0, 59.0, 35.0, 39.0, 34.0, 29.0, 31.0, 27.0, 32.0, 23.0, 14.0, 20.0, 17.0, 11.0, 10.0, 11.0, 9.0, 9.0, 7.0, 6.0, 7.0, 4.0, 1.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-54.44488525390625, -52.906551361083984, -51.368221282958984, -49.82988739013672, -48.29155349731445, -46.75321960449219, -45.21488952636719, -43.67655563354492, -42.138221740722656, -40.59988784790039, -39.06155776977539, -37.523223876953125, -35.98488998413086, -34.446556091308594, -32.908226013183594, -31.369892120361328, -29.831560134887695, -28.293228149414062, -26.754894256591797, -25.216562271118164, -23.6782283782959, -22.139896392822266, -20.6015625, -19.063230514526367, -17.524898529052734, -15.986565589904785, -14.448232650756836, -12.909900665283203, -11.371566772460938, -9.833234786987305, -8.294901847839355, -6.756568908691406, -5.218235015869141, -3.6799020767211914, -2.1415693759918213, -0.6032366752624512, 0.935096263885498, 2.4734292030334473, 4.011761665344238, 5.5500946044921875, 7.088427543640137, 8.626760482788086, 10.165093421936035, 11.703426361083984, 13.241758346557617, 14.780092239379883, 16.318424224853516, 17.85675811767578, 19.395090103149414, 20.933422088623047, 22.471755981445312, 24.010087966918945, 25.54842185974121, 27.086753845214844, 28.62508773803711, 30.163419723510742, 31.701751708984375, 33.24008560180664, 34.77841567993164, 36.316749572753906, 37.85508346557617, 39.39341735839844, 40.93174743652344, 42.4700813293457, 44.00841522216797]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 4.0, 10.0, 12.0, 13.0, 24.0, 30.0, 39.0, 58.0, 89.0, 92.0, 139.0, 236.0, 350.0, 548.0, 976.0, 1898.0, 4173.0, 10338.0, 29336.0, 82643.0, 211275.0, 350419.0, 219420.0, 86185.0, 30455.0, 10877.0, 4211.0, 1929.0, 1027.0, 607.0, 334.0, 246.0, 167.0, 111.0, 72.0, 63.0, 43.0, 30.0, 20.0, 20.0, 12.0, 3.0, 7.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-35.125, -34.044921875, -32.96484375, -31.884765625, -30.8046875, -29.724609375, -28.64453125, -27.564453125, -26.484375, -25.404296875, -24.32421875, -23.244140625, -22.1640625, -21.083984375, -20.00390625, -18.923828125, -17.84375, -16.763671875, -15.68359375, -14.603515625, -13.5234375, -12.443359375, -11.36328125, -10.283203125, -9.203125, -8.123046875, -7.04296875, -5.962890625, -4.8828125, -3.802734375, -2.72265625, -1.642578125, -0.5625, 0.517578125, 1.59765625, 2.677734375, 3.7578125, 4.837890625, 5.91796875, 6.998046875, 8.078125, 9.158203125, 10.23828125, 11.318359375, 12.3984375, 13.478515625, 14.55859375, 15.638671875, 16.71875, 17.798828125, 18.87890625, 19.958984375, 21.0390625, 22.119140625, 23.19921875, 24.279296875, 25.359375, 26.439453125, 27.51953125, 28.599609375, 29.6796875, 30.759765625, 31.83984375, 32.919921875, 34.0]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 7.0, 6.0, 8.0, 9.0, 20.0, 38.0, 40.0, 54.0, 54.0, 87.0, 71.0, 89.0, 79.0, 87.0, 62.0, 64.0, 52.0, 39.0, 36.0, 27.0, 25.0, 24.0, 10.0, 6.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.3359375, -5.16021728515625, -4.9844970703125, -4.80877685546875, -4.633056640625, -4.45733642578125, -4.2816162109375, -4.10589599609375, -3.93017578125, -3.75445556640625, -3.5787353515625, -3.40301513671875, -3.227294921875, -3.05157470703125, -2.8758544921875, -2.70013427734375, -2.5244140625, -2.34869384765625, -2.1729736328125, -1.99725341796875, -1.821533203125, -1.64581298828125, -1.4700927734375, -1.29437255859375, -1.11865234375, -0.94293212890625, -0.7672119140625, -0.59149169921875, -0.415771484375, -0.24005126953125, -0.0643310546875, 0.11138916015625, 0.287109375, 0.46282958984375, 0.6385498046875, 0.81427001953125, 0.989990234375, 1.16571044921875, 1.3414306640625, 1.51715087890625, 1.69287109375, 1.86859130859375, 2.0443115234375, 2.22003173828125, 2.395751953125, 2.57147216796875, 2.7471923828125, 2.92291259765625, 3.0986328125, 3.27435302734375, 3.4500732421875, 3.62579345703125, 3.801513671875, 3.97723388671875, 4.1529541015625, 4.32867431640625, 4.50439453125, 4.68011474609375, 4.8558349609375, 5.03155517578125, 5.207275390625, 5.38299560546875, 5.5587158203125, 5.73443603515625, 5.91015625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 6.0, 10.0, 18.0, 26.0, 31.0, 66.0, 75.0, 139.0, 242.0, 419.0, 760.0, 1377.0, 3141.0, 8163.0, 25922.0, 91283.0, 296564.0, 405585.0, 150516.0, 42715.0, 12577.0, 4550.0, 1998.0, 1029.0, 509.0, 313.0, 209.0, 117.0, 78.0, 40.0, 25.0, 12.0, 14.0, 9.0, 6.0, 6.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.0625, -40.71435546875, -39.3662109375, -38.01806640625, -36.669921875, -35.32177734375, -33.9736328125, -32.62548828125, -31.27734375, -29.92919921875, -28.5810546875, -27.23291015625, -25.884765625, -24.53662109375, -23.1884765625, -21.84033203125, -20.4921875, -19.14404296875, -17.7958984375, -16.44775390625, -15.099609375, -13.75146484375, -12.4033203125, -11.05517578125, -9.70703125, -8.35888671875, -7.0107421875, -5.66259765625, -4.314453125, -2.96630859375, -1.6181640625, -0.27001953125, 1.078125, 2.42626953125, 3.7744140625, 5.12255859375, 6.470703125, 7.81884765625, 9.1669921875, 10.51513671875, 11.86328125, 13.21142578125, 14.5595703125, 15.90771484375, 17.255859375, 18.60400390625, 19.9521484375, 21.30029296875, 22.6484375, 23.99658203125, 25.3447265625, 26.69287109375, 28.041015625, 29.38916015625, 30.7373046875, 32.08544921875, 33.43359375, 34.78173828125, 36.1298828125, 37.47802734375, 38.826171875, 40.17431640625, 41.5224609375, 42.87060546875, 44.21875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 7.0, 7.0, 4.0, 8.0, 7.0, 12.0, 19.0, 24.0, 20.0, 26.0, 34.0, 39.0, 42.0, 52.0, 50.0, 55.0, 54.0, 52.0, 47.0, 51.0, 48.0, 55.0, 40.0, 41.0, 37.0, 25.0, 34.0, 28.0, 15.0, 15.0, 9.0, 7.0, 7.0, 8.0, 7.0, 7.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.84375, -20.114501953125, -19.38525390625, -18.656005859375, -17.9267578125, -17.197509765625, -16.46826171875, -15.739013671875, -15.009765625, -14.280517578125, -13.55126953125, -12.822021484375, -12.0927734375, -11.363525390625, -10.63427734375, -9.905029296875, -9.17578125, -8.446533203125, -7.71728515625, -6.988037109375, -6.2587890625, -5.529541015625, -4.80029296875, -4.071044921875, -3.341796875, -2.612548828125, -1.88330078125, -1.154052734375, -0.4248046875, 0.304443359375, 1.03369140625, 1.762939453125, 2.4921875, 3.221435546875, 3.95068359375, 4.679931640625, 5.4091796875, 6.138427734375, 6.86767578125, 7.596923828125, 8.326171875, 9.055419921875, 9.78466796875, 10.513916015625, 11.2431640625, 11.972412109375, 12.70166015625, 13.430908203125, 14.16015625, 14.889404296875, 15.61865234375, 16.347900390625, 17.0771484375, 17.806396484375, 18.53564453125, 19.264892578125, 19.994140625, 20.723388671875, 21.45263671875, 22.181884765625, 22.9111328125, 23.640380859375, 24.36962890625, 25.098876953125, 25.828125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 11.0, 8.0, 4.0, 13.0, 14.0, 14.0, 29.0, 37.0, 63.0, 119.0, 181.0, 318.0, 522.0, 1147.0, 2438.0, 6281.0, 19911.0, 81039.0, 329669.0, 432661.0, 129229.0, 29805.0, 8774.0, 3298.0, 1437.0, 637.0, 336.0, 207.0, 127.0, 76.0, 35.0, 35.0, 34.0, 15.0, 7.0, 9.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.15625, -21.445068359375, -20.73388671875, -20.022705078125, -19.3115234375, -18.600341796875, -17.88916015625, -17.177978515625, -16.466796875, -15.755615234375, -15.04443359375, -14.333251953125, -13.6220703125, -12.910888671875, -12.19970703125, -11.488525390625, -10.77734375, -10.066162109375, -9.35498046875, -8.643798828125, -7.9326171875, -7.221435546875, -6.51025390625, -5.799072265625, -5.087890625, -4.376708984375, -3.66552734375, -2.954345703125, -2.2431640625, -1.531982421875, -0.82080078125, -0.109619140625, 0.6015625, 1.312744140625, 2.02392578125, 2.735107421875, 3.4462890625, 4.157470703125, 4.86865234375, 5.579833984375, 6.291015625, 7.002197265625, 7.71337890625, 8.424560546875, 9.1357421875, 9.846923828125, 10.55810546875, 11.269287109375, 11.98046875, 12.691650390625, 13.40283203125, 14.114013671875, 14.8251953125, 15.536376953125, 16.24755859375, 16.958740234375, 17.669921875, 18.381103515625, 19.09228515625, 19.803466796875, 20.5146484375, 21.225830078125, 21.93701171875, 22.648193359375, 23.359375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 4.0, 11.0, 9.0, 14.0, 15.0, 16.0, 26.0, 30.0, 38.0, 50.0, 68.0, 81.0, 76.0, 102.0, 79.0, 82.0, 73.0, 61.0, 31.0, 36.0, 21.0, 15.0, 11.0, 10.0, 7.0, 5.0, 8.0, 4.0, 0.0, 9.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0030155181884765625, -0.00293537974357605, -0.002855241298675537, -0.0027751028537750244, -0.0026949644088745117, -0.002614825963973999, -0.0025346875190734863, -0.0024545490741729736, -0.002374410629272461, -0.0022942721843719482, -0.0022141337394714355, -0.002133995294570923, -0.00205385684967041, -0.0019737184047698975, -0.0018935799598693848, -0.001813441514968872, -0.0017333030700683594, -0.0016531646251678467, -0.001573026180267334, -0.0014928877353668213, -0.0014127492904663086, -0.001332610845565796, -0.0012524724006652832, -0.0011723339557647705, -0.0010921955108642578, -0.0010120570659637451, -0.0009319186210632324, -0.0008517801761627197, -0.000771641731262207, -0.0006915032863616943, -0.0006113648414611816, -0.0005312263965606689, -0.00045108795166015625, -0.00037094950675964355, -0.00029081106185913086, -0.00021067261695861816, -0.00013053417205810547, -5.0395727157592773e-05, 2.9742717742919922e-05, 0.00010988116264343262, 0.0001900196075439453, 0.000270158052444458, 0.0003502964973449707, 0.0004304349422454834, 0.0005105733871459961, 0.0005907118320465088, 0.0006708502769470215, 0.0007509887218475342, 0.0008311271667480469, 0.0009112656116485596, 0.0009914040565490723, 0.001071542501449585, 0.0011516809463500977, 0.0012318193912506104, 0.001311957836151123, 0.0013920962810516357, 0.0014722347259521484, 0.0015523731708526611, 0.0016325116157531738, 0.0017126500606536865, 0.0017927885055541992, 0.001872926950454712, 0.0019530653953552246, 0.0020332038402557373, 0.00211334228515625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 9.0, 15.0, 18.0, 23.0, 57.0, 65.0, 105.0, 192.0, 325.0, 673.0, 1548.0, 4115.0, 11891.0, 49518.0, 262732.0, 529896.0, 144874.0, 29223.0, 8018.0, 2760.0, 1158.0, 588.0, 282.0, 175.0, 102.0, 59.0, 43.0, 22.0, 18.0, 19.0, 10.0, 12.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-32.15625, -31.317138671875, -30.47802734375, -29.638916015625, -28.7998046875, -27.960693359375, -27.12158203125, -26.282470703125, -25.443359375, -24.604248046875, -23.76513671875, -22.926025390625, -22.0869140625, -21.247802734375, -20.40869140625, -19.569580078125, -18.73046875, -17.891357421875, -17.05224609375, -16.213134765625, -15.3740234375, -14.534912109375, -13.69580078125, -12.856689453125, -12.017578125, -11.178466796875, -10.33935546875, -9.500244140625, -8.6611328125, -7.822021484375, -6.98291015625, -6.143798828125, -5.3046875, -4.465576171875, -3.62646484375, -2.787353515625, -1.9482421875, -1.109130859375, -0.27001953125, 0.569091796875, 1.408203125, 2.247314453125, 3.08642578125, 3.925537109375, 4.7646484375, 5.603759765625, 6.44287109375, 7.281982421875, 8.12109375, 8.960205078125, 9.79931640625, 10.638427734375, 11.4775390625, 12.316650390625, 13.15576171875, 13.994873046875, 14.833984375, 15.673095703125, 16.51220703125, 17.351318359375, 18.1904296875, 19.029541015625, 19.86865234375, 20.707763671875, 21.546875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 7.0, 11.0, 17.0, 36.0, 35.0, 34.0, 55.0, 68.0, 69.0, 77.0, 92.0, 88.0, 90.0, 83.0, 54.0, 50.0, 37.0, 30.0, 15.0, 7.0, 16.0, 8.0, 7.0, 5.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7109375, -10.2769775390625, -9.843017578125, -9.4090576171875, -8.97509765625, -8.5411376953125, -8.107177734375, -7.6732177734375, -7.2392578125, -6.8052978515625, -6.371337890625, -5.9373779296875, -5.50341796875, -5.0694580078125, -4.635498046875, -4.2015380859375, -3.767578125, -3.3336181640625, -2.899658203125, -2.4656982421875, -2.03173828125, -1.5977783203125, -1.163818359375, -0.7298583984375, -0.2958984375, 0.1380615234375, 0.572021484375, 1.0059814453125, 1.43994140625, 1.8739013671875, 2.307861328125, 2.7418212890625, 3.17578125, 3.6097412109375, 4.043701171875, 4.4776611328125, 4.91162109375, 5.3455810546875, 5.779541015625, 6.2135009765625, 6.6474609375, 7.0814208984375, 7.515380859375, 7.9493408203125, 8.38330078125, 8.8172607421875, 9.251220703125, 9.6851806640625, 10.119140625, 10.5531005859375, 10.987060546875, 11.4210205078125, 11.85498046875, 12.2889404296875, 12.722900390625, 13.1568603515625, 13.5908203125, 14.0247802734375, 14.458740234375, 14.8927001953125, 15.32666015625, 15.7606201171875, 16.194580078125, 16.6285400390625, 17.0625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 8.0, 15.0, 19.0, 27.0, 46.0, 66.0, 93.0, 125.0, 146.0, 116.0, 101.0, 75.0, 51.0, 30.0, 20.0, 20.0, 20.0, 4.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-236.0174102783203, -228.56361389160156, -221.1098175048828, -213.65602111816406, -206.2022247314453, -198.74842834472656, -191.29461669921875, -183.8408203125, -176.38702392578125, -168.9332275390625, -161.47943115234375, -154.025634765625, -146.57183837890625, -139.1180419921875, -131.66424560546875, -124.21044158935547, -116.75665283203125, -109.3028564453125, -101.84906005859375, -94.395263671875, -86.94146728515625, -79.4876708984375, -72.03386688232422, -64.58007049560547, -57.12627410888672, -49.67247772216797, -42.21868133544922, -34.7648811340332, -27.311084747314453, -19.857288360595703, -12.403488159179688, -4.9496917724609375, 2.5041046142578125, 9.957901954650879, 17.411699295043945, 24.865497589111328, 32.31929397583008, 39.77309036254883, 47.226890563964844, 54.680686950683594, 62.134483337402344, 69.5882797241211, 77.04207611083984, 84.49588012695312, 91.94967651367188, 99.40347290039062, 106.85726928710938, 114.31106567382812, 121.76486206054688, 129.21865844726562, 136.67245483398438, 144.12625122070312, 151.58004760742188, 159.03384399414062, 166.48764038085938, 173.94143676757812, 181.39523315429688, 188.84902954101562, 196.30282592773438, 203.75662231445312, 211.21041870117188, 218.66421508789062, 226.11801147460938, 233.57180786132812, 241.02561950683594]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 0.0, 5.0, 8.0, 7.0, 12.0, 25.0, 17.0, 22.0, 22.0, 41.0, 47.0, 43.0, 46.0, 50.0, 65.0, 58.0, 62.0, 68.0, 63.0, 66.0, 44.0, 55.0, 48.0, 31.0, 20.0, 18.0, 15.0, 14.0, 8.0, 10.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-195.95518493652344, -189.98155212402344, -184.00791931152344, -178.03427124023438, -172.06063842773438, -166.08700561523438, -160.11337280273438, -154.13973999023438, -148.16610717773438, -142.19247436523438, -136.21884155273438, -130.24520874023438, -124.27156066894531, -118.29792785644531, -112.32429504394531, -106.35066223144531, -100.37701416015625, -94.40338134765625, -88.42974090576172, -82.45610809326172, -76.48246765136719, -70.50883483886719, -64.53520202636719, -58.56156539916992, -52.587928771972656, -46.61429214477539, -40.640655517578125, -34.667022705078125, -28.69338607788086, -22.719749450683594, -16.746116638183594, -10.772480010986328, -4.798828125, 1.1748075485229492, 7.148443222045898, 13.122077941894531, 19.095714569091797, 25.069351196289062, 31.042984008789062, 37.01662063598633, 42.990257263183594, 48.96389389038086, 54.937530517578125, 60.911163330078125, 66.88479614257812, 72.85843658447266, 78.83206939697266, 84.80570983886719, 90.77934265136719, 96.75297546386719, 102.72661590576172, 108.70024871826172, 114.67388916015625, 120.64752197265625, 126.62115478515625, 132.59478759765625, 138.56842041015625, 144.54205322265625, 150.51568603515625, 156.48931884765625, 162.4629669189453, 168.4365997314453, 174.4102325439453, 180.3838653564453, 186.35751342773438]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 9.0, 21.0, 20.0, 44.0, 71.0, 210.0, 625.0, 3059.0, 31976.0, 4023299.0, 127020.0, 6318.0, 988.0, 295.0, 148.0, 80.0, 41.0, 29.0, 13.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.0, -185.744140625, -179.48828125, -173.232421875, -166.9765625, -160.720703125, -154.46484375, -148.208984375, -141.953125, -135.697265625, -129.44140625, -123.185546875, -116.9296875, -110.673828125, -104.41796875, -98.162109375, -91.90625, -85.650390625, -79.39453125, -73.138671875, -66.8828125, -60.626953125, -54.37109375, -48.115234375, -41.859375, -35.603515625, -29.34765625, -23.091796875, -16.8359375, -10.580078125, -4.32421875, 1.931640625, 8.1875, 14.443359375, 20.69921875, 26.955078125, 33.2109375, 39.466796875, 45.72265625, 51.978515625, 58.234375, 64.490234375, 70.74609375, 77.001953125, 83.2578125, 89.513671875, 95.76953125, 102.025390625, 108.28125, 114.537109375, 120.79296875, 127.048828125, 133.3046875, 139.560546875, 145.81640625, 152.072265625, 158.328125, 164.583984375, 170.83984375, 177.095703125, 183.3515625, 189.607421875, 195.86328125, 202.119140625, 208.375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 9.0, 10.0, 18.0, 28.0, 45.0, 60.0, 79.0, 99.0, 111.0, 114.0, 113.0, 85.0, 79.0, 54.0, 36.0, 30.0, 16.0, 10.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.875, -8.58251953125, -8.2900390625, -7.99755859375, -7.705078125, -7.41259765625, -7.1201171875, -6.82763671875, -6.53515625, -6.24267578125, -5.9501953125, -5.65771484375, -5.365234375, -5.07275390625, -4.7802734375, -4.48779296875, -4.1953125, -3.90283203125, -3.6103515625, -3.31787109375, -3.025390625, -2.73291015625, -2.4404296875, -2.14794921875, -1.85546875, -1.56298828125, -1.2705078125, -0.97802734375, -0.685546875, -0.39306640625, -0.1005859375, 0.19189453125, 0.484375, 0.77685546875, 1.0693359375, 1.36181640625, 1.654296875, 1.94677734375, 2.2392578125, 2.53173828125, 2.82421875, 3.11669921875, 3.4091796875, 3.70166015625, 3.994140625, 4.28662109375, 4.5791015625, 4.87158203125, 5.1640625, 5.45654296875, 5.7490234375, 6.04150390625, 6.333984375, 6.62646484375, 6.9189453125, 7.21142578125, 7.50390625, 7.79638671875, 8.0888671875, 8.38134765625, 8.673828125, 8.96630859375, 9.2587890625, 9.55126953125, 9.84375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 7.0, 10.0, 6.0, 15.0, 20.0, 30.0, 52.0, 79.0, 108.0, 182.0, 245.0, 397.0, 689.0, 1191.0, 2125.0, 3907.0, 7731.0, 17531.0, 43438.0, 128958.0, 611340.0, 2940878.0, 298710.0, 81984.0, 29459.0, 12331.0, 5629.0, 3019.0, 1599.0, 990.0, 563.0, 352.0, 228.0, 138.0, 116.0, 68.0, 47.0, 35.0, 23.0, 18.0, 11.0, 5.0, 4.0, 7.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0], "bins": [-41.25, -39.97314453125, -38.6962890625, -37.41943359375, -36.142578125, -34.86572265625, -33.5888671875, -32.31201171875, -31.03515625, -29.75830078125, -28.4814453125, -27.20458984375, -25.927734375, -24.65087890625, -23.3740234375, -22.09716796875, -20.8203125, -19.54345703125, -18.2666015625, -16.98974609375, -15.712890625, -14.43603515625, -13.1591796875, -11.88232421875, -10.60546875, -9.32861328125, -8.0517578125, -6.77490234375, -5.498046875, -4.22119140625, -2.9443359375, -1.66748046875, -0.390625, 0.88623046875, 2.1630859375, 3.43994140625, 4.716796875, 5.99365234375, 7.2705078125, 8.54736328125, 9.82421875, 11.10107421875, 12.3779296875, 13.65478515625, 14.931640625, 16.20849609375, 17.4853515625, 18.76220703125, 20.0390625, 21.31591796875, 22.5927734375, 23.86962890625, 25.146484375, 26.42333984375, 27.7001953125, 28.97705078125, 30.25390625, 31.53076171875, 32.8076171875, 34.08447265625, 35.361328125, 36.63818359375, 37.9150390625, 39.19189453125, 40.46875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 5.0, 4.0, 8.0, 8.0, 16.0, 10.0, 25.0, 39.0, 43.0, 60.0, 83.0, 135.0, 251.0, 435.0, 1569.0, 580.0, 291.0, 162.0, 104.0, 74.0, 44.0, 29.0, 20.0, 17.0, 11.0, 5.0, 12.0, 4.0, 6.0, 4.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.15625, -10.767333984375, -10.37841796875, -9.989501953125, -9.6005859375, -9.211669921875, -8.82275390625, -8.433837890625, -8.044921875, -7.656005859375, -7.26708984375, -6.878173828125, -6.4892578125, -6.100341796875, -5.71142578125, -5.322509765625, -4.93359375, -4.544677734375, -4.15576171875, -3.766845703125, -3.3779296875, -2.989013671875, -2.60009765625, -2.211181640625, -1.822265625, -1.433349609375, -1.04443359375, -0.655517578125, -0.2666015625, 0.122314453125, 0.51123046875, 0.900146484375, 1.2890625, 1.677978515625, 2.06689453125, 2.455810546875, 2.8447265625, 3.233642578125, 3.62255859375, 4.011474609375, 4.400390625, 4.789306640625, 5.17822265625, 5.567138671875, 5.9560546875, 6.344970703125, 6.73388671875, 7.122802734375, 7.51171875, 7.900634765625, 8.28955078125, 8.678466796875, 9.0673828125, 9.456298828125, 9.84521484375, 10.234130859375, 10.623046875, 11.011962890625, 11.40087890625, 11.789794921875, 12.1787109375, 12.567626953125, 12.95654296875, 13.345458984375, 13.734375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 8.0, 9.0, 18.0, 20.0, 56.0, 99.0, 111.0, 143.0, 158.0, 141.0, 94.0, 66.0, 27.0, 13.0, 15.0, 6.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-103.37364196777344, -100.0563735961914, -96.73910522460938, -93.42183685302734, -90.10456848144531, -86.78730010986328, -83.47003173828125, -80.15276336669922, -76.83549499511719, -73.51822662353516, -70.20095825195312, -66.8836898803711, -63.56642150878906, -60.24915313720703, -56.931884765625, -53.61461639404297, -50.29734802246094, -46.980079650878906, -43.662811279296875, -40.345542907714844, -37.02827453613281, -33.71100616455078, -30.39373779296875, -27.07646942138672, -23.759201049804688, -20.441932678222656, -17.124664306640625, -13.807395935058594, -10.490127563476562, -7.172859191894531, -3.8555908203125, -0.5383224487304688, 2.7789459228515625, 6.096214294433594, 9.413482666015625, 12.730751037597656, 16.048019409179688, 19.36528778076172, 22.68255615234375, 25.99982452392578, 29.317092895507812, 32.634361267089844, 35.951629638671875, 39.268898010253906, 42.58616638183594, 45.90343475341797, 49.220703125, 52.53797149658203, 55.85523986816406, 59.172508239746094, 62.489776611328125, 65.80704498291016, 69.12431335449219, 72.44158172607422, 75.75885009765625, 79.07611846923828, 82.39338684082031, 85.71065521240234, 89.02792358398438, 92.3451919555664, 95.66246032714844, 98.97972869873047, 102.2969970703125, 105.61426544189453, 108.93153381347656]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 8.0, 8.0, 7.0, 22.0, 17.0, 29.0, 44.0, 45.0, 56.0, 55.0, 69.0, 76.0, 73.0, 80.0, 75.0, 56.0, 52.0, 61.0, 36.0, 39.0, 27.0, 20.0, 17.0, 11.0, 10.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.8619384765625, -69.64143371582031, -67.4209213256836, -65.2004165649414, -62.97990417480469, -60.7593994140625, -58.53889083862305, -56.318382263183594, -54.09787368774414, -51.87736511230469, -49.656856536865234, -47.43634796142578, -45.215843200683594, -42.995330810546875, -40.77482604980469, -38.554317474365234, -36.33380889892578, -34.11330032348633, -31.892791748046875, -29.672285079956055, -27.4517765045166, -25.23126792907715, -23.010761260986328, -20.790252685546875, -18.569744110107422, -16.34923553466797, -14.128727912902832, -11.908220291137695, -9.687711715698242, -7.467203140258789, -5.246695518493652, -3.0261878967285156, -0.8056716918945312, 1.4148364067077637, 3.6353445053100586, 5.8558526039123535, 8.076360702514648, 10.296869277954102, 12.517376899719238, 14.737884521484375, 16.958393096923828, 19.17890167236328, 21.399410247802734, 23.619916915893555, 25.840425491333008, 28.06093406677246, 30.28144073486328, 32.501949310302734, 34.72245788574219, 36.94296646118164, 39.163475036621094, 41.38398361206055, 43.6044921875, 45.82499694824219, 48.04550552368164, 50.266014099121094, 52.48652267456055, 54.70703125, 56.92753982543945, 59.148048400878906, 61.368553161621094, 63.58906555175781, 65.8095703125, 68.03007507324219, 70.2505874633789]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 5.0, 3.0, 11.0, 8.0, 14.0, 14.0, 27.0, 29.0, 45.0, 65.0, 93.0, 104.0, 148.0, 208.0, 295.0, 492.0, 760.0, 1259.0, 2359.0, 4772.0, 11018.0, 27549.0, 73853.0, 187845.0, 346620.0, 232535.0, 95748.0, 35971.0, 13954.0, 5791.0, 2806.0, 1495.0, 880.0, 555.0, 332.0, 225.0, 178.0, 114.0, 91.0, 61.0, 61.0, 41.0, 35.0, 22.0, 12.0, 19.0, 6.0, 7.0, 10.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-30.203125, -29.277587890625, -28.35205078125, -27.426513671875, -26.5009765625, -25.575439453125, -24.64990234375, -23.724365234375, -22.798828125, -21.873291015625, -20.94775390625, -20.022216796875, -19.0966796875, -18.171142578125, -17.24560546875, -16.320068359375, -15.39453125, -14.468994140625, -13.54345703125, -12.617919921875, -11.6923828125, -10.766845703125, -9.84130859375, -8.915771484375, -7.990234375, -7.064697265625, -6.13916015625, -5.213623046875, -4.2880859375, -3.362548828125, -2.43701171875, -1.511474609375, -0.5859375, 0.339599609375, 1.26513671875, 2.190673828125, 3.1162109375, 4.041748046875, 4.96728515625, 5.892822265625, 6.818359375, 7.743896484375, 8.66943359375, 9.594970703125, 10.5205078125, 11.446044921875, 12.37158203125, 13.297119140625, 14.22265625, 15.148193359375, 16.07373046875, 16.999267578125, 17.9248046875, 18.850341796875, 19.77587890625, 20.701416015625, 21.626953125, 22.552490234375, 23.47802734375, 24.403564453125, 25.3291015625, 26.254638671875, 27.18017578125, 28.105712890625, 29.03125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 3.0, 1.0, 4.0, 4.0, 8.0, 13.0, 26.0, 23.0, 42.0, 65.0, 70.0, 92.0, 95.0, 123.0, 108.0, 90.0, 77.0, 56.0, 37.0, 21.0, 19.0, 12.0, 9.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.1796875, -8.8953857421875, -8.611083984375, -8.3267822265625, -8.04248046875, -7.7581787109375, -7.473876953125, -7.1895751953125, -6.9052734375, -6.6209716796875, -6.336669921875, -6.0523681640625, -5.76806640625, -5.4837646484375, -5.199462890625, -4.9151611328125, -4.630859375, -4.3465576171875, -4.062255859375, -3.7779541015625, -3.49365234375, -3.2093505859375, -2.925048828125, -2.6407470703125, -2.3564453125, -2.0721435546875, -1.787841796875, -1.5035400390625, -1.21923828125, -0.9349365234375, -0.650634765625, -0.3663330078125, -0.08203125, 0.2022705078125, 0.486572265625, 0.7708740234375, 1.05517578125, 1.3394775390625, 1.623779296875, 1.9080810546875, 2.1923828125, 2.4766845703125, 2.760986328125, 3.0452880859375, 3.32958984375, 3.6138916015625, 3.898193359375, 4.1824951171875, 4.466796875, 4.7510986328125, 5.035400390625, 5.3197021484375, 5.60400390625, 5.8883056640625, 6.172607421875, 6.4569091796875, 6.7412109375, 7.0255126953125, 7.309814453125, 7.5941162109375, 7.87841796875, 8.1627197265625, 8.447021484375, 8.7313232421875, 9.015625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 9.0, 15.0, 13.0, 26.0, 38.0, 41.0, 64.0, 94.0, 153.0, 227.0, 323.0, 506.0, 787.0, 1282.0, 2132.0, 4017.0, 7553.0, 14868.0, 31739.0, 68965.0, 142422.0, 247907.0, 249001.0, 142870.0, 69079.0, 31918.0, 15283.0, 7623.0, 3934.0, 2177.0, 1278.0, 727.0, 495.0, 302.0, 212.0, 143.0, 98.0, 61.0, 54.0, 33.0, 33.0, 14.0, 13.0, 10.0, 7.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-22.015625, -21.3681640625, -20.720703125, -20.0732421875, -19.42578125, -18.7783203125, -18.130859375, -17.4833984375, -16.8359375, -16.1884765625, -15.541015625, -14.8935546875, -14.24609375, -13.5986328125, -12.951171875, -12.3037109375, -11.65625, -11.0087890625, -10.361328125, -9.7138671875, -9.06640625, -8.4189453125, -7.771484375, -7.1240234375, -6.4765625, -5.8291015625, -5.181640625, -4.5341796875, -3.88671875, -3.2392578125, -2.591796875, -1.9443359375, -1.296875, -0.6494140625, -0.001953125, 0.6455078125, 1.29296875, 1.9404296875, 2.587890625, 3.2353515625, 3.8828125, 4.5302734375, 5.177734375, 5.8251953125, 6.47265625, 7.1201171875, 7.767578125, 8.4150390625, 9.0625, 9.7099609375, 10.357421875, 11.0048828125, 11.65234375, 12.2998046875, 12.947265625, 13.5947265625, 14.2421875, 14.8896484375, 15.537109375, 16.1845703125, 16.83203125, 17.4794921875, 18.126953125, 18.7744140625, 19.421875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 7.0, 7.0, 7.0, 4.0, 7.0, 11.0, 12.0, 19.0, 16.0, 20.0, 16.0, 24.0, 23.0, 42.0, 27.0, 29.0, 32.0, 32.0, 32.0, 42.0, 55.0, 45.0, 34.0, 41.0, 34.0, 45.0, 37.0, 41.0, 35.0, 28.0, 25.0, 34.0, 30.0, 21.0, 16.0, 10.0, 13.0, 4.0, 8.0, 7.0, 8.0, 6.0, 2.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.1875, -20.575439453125, -19.96337890625, -19.351318359375, -18.7392578125, -18.127197265625, -17.51513671875, -16.903076171875, -16.291015625, -15.678955078125, -15.06689453125, -14.454833984375, -13.8427734375, -13.230712890625, -12.61865234375, -12.006591796875, -11.39453125, -10.782470703125, -10.17041015625, -9.558349609375, -8.9462890625, -8.334228515625, -7.72216796875, -7.110107421875, -6.498046875, -5.885986328125, -5.27392578125, -4.661865234375, -4.0498046875, -3.437744140625, -2.82568359375, -2.213623046875, -1.6015625, -0.989501953125, -0.37744140625, 0.234619140625, 0.8466796875, 1.458740234375, 2.07080078125, 2.682861328125, 3.294921875, 3.906982421875, 4.51904296875, 5.131103515625, 5.7431640625, 6.355224609375, 6.96728515625, 7.579345703125, 8.19140625, 8.803466796875, 9.41552734375, 10.027587890625, 10.6396484375, 11.251708984375, 11.86376953125, 12.475830078125, 13.087890625, 13.699951171875, 14.31201171875, 14.924072265625, 15.5361328125, 16.148193359375, 16.76025390625, 17.372314453125, 17.984375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 7.0, 11.0, 5.0, 8.0, 18.0, 19.0, 28.0, 40.0, 44.0, 100.0, 119.0, 200.0, 341.0, 629.0, 1196.0, 2520.0, 5773.0, 14580.0, 42132.0, 136179.0, 366015.0, 316327.0, 107584.0, 33481.0, 11721.0, 4781.0, 2200.0, 1087.0, 555.0, 338.0, 172.0, 106.0, 68.0, 55.0, 33.0, 31.0, 13.0, 11.0, 10.0, 14.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.890625, -11.5291748046875, -11.167724609375, -10.8062744140625, -10.44482421875, -10.0833740234375, -9.721923828125, -9.3604736328125, -8.9990234375, -8.6375732421875, -8.276123046875, -7.9146728515625, -7.55322265625, -7.1917724609375, -6.830322265625, -6.4688720703125, -6.107421875, -5.7459716796875, -5.384521484375, -5.0230712890625, -4.66162109375, -4.3001708984375, -3.938720703125, -3.5772705078125, -3.2158203125, -2.8543701171875, -2.492919921875, -2.1314697265625, -1.77001953125, -1.4085693359375, -1.047119140625, -0.6856689453125, -0.32421875, 0.0372314453125, 0.398681640625, 0.7601318359375, 1.12158203125, 1.4830322265625, 1.844482421875, 2.2059326171875, 2.5673828125, 2.9288330078125, 3.290283203125, 3.6517333984375, 4.01318359375, 4.3746337890625, 4.736083984375, 5.0975341796875, 5.458984375, 5.8204345703125, 6.181884765625, 6.5433349609375, 6.90478515625, 7.2662353515625, 7.627685546875, 7.9891357421875, 8.3505859375, 8.7120361328125, 9.073486328125, 9.4349365234375, 9.79638671875, 10.1578369140625, 10.519287109375, 10.8807373046875, 11.2421875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 4.0, 3.0, 3.0, 7.0, 7.0, 11.0, 14.0, 12.0, 23.0, 23.0, 25.0, 39.0, 30.0, 35.0, 42.0, 41.0, 72.0, 75.0, 69.0, 76.0, 58.0, 69.0, 40.0, 36.0, 34.0, 33.0, 19.0, 11.0, 15.0, 10.0, 13.0, 5.0, 9.0, 3.0, 7.0, 3.0, 7.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.00146484375, -0.0014165490865707397, -0.0013682544231414795, -0.0013199597597122192, -0.001271665096282959, -0.0012233704328536987, -0.0011750757694244385, -0.0011267811059951782, -0.001078486442565918, -0.0010301917791366577, -0.0009818971157073975, -0.0009336024522781372, -0.000885307788848877, -0.0008370131254196167, -0.0007887184619903564, -0.0007404237985610962, -0.0006921291351318359, -0.0006438344717025757, -0.0005955398082733154, -0.0005472451448440552, -0.0004989504814147949, -0.00045065581798553467, -0.0004023611545562744, -0.00035406649112701416, -0.0003057718276977539, -0.00025747716426849365, -0.0002091825008392334, -0.00016088783740997314, -0.00011259317398071289, -6.429851055145264e-05, -1.6003847122192383e-05, 3.229081630706787e-05, 8.058547973632812e-05, 0.00012888014316558838, 0.00017717480659484863, 0.0002254694700241089, 0.00027376413345336914, 0.0003220587968826294, 0.00037035346031188965, 0.0004186481237411499, 0.00046694278717041016, 0.0005152374505996704, 0.0005635321140289307, 0.0006118267774581909, 0.0006601214408874512, 0.0007084161043167114, 0.0007567107677459717, 0.0008050054311752319, 0.0008533000946044922, 0.0009015947580337524, 0.0009498894214630127, 0.000998184084892273, 0.0010464787483215332, 0.0010947734117507935, 0.0011430680751800537, 0.001191362738609314, 0.0012396574020385742, 0.0012879520654678345, 0.0013362467288970947, 0.001384541392326355, 0.0014328360557556152, 0.0014811307191848755, 0.0015294253826141357, 0.001577720046043396, 0.0016260147094726562]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 17.0, 9.0, 25.0, 23.0, 46.0, 75.0, 119.0, 242.0, 379.0, 693.0, 1545.0, 3244.0, 8295.0, 23705.0, 80879.0, 314874.0, 430954.0, 128281.0, 35050.0, 11667.0, 4438.0, 2002.0, 895.0, 428.0, 244.0, 151.0, 95.0, 59.0, 32.0, 24.0, 17.0, 19.0, 10.0, 8.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.828125, -15.3905029296875, -14.952880859375, -14.5152587890625, -14.07763671875, -13.6400146484375, -13.202392578125, -12.7647705078125, -12.3271484375, -11.8895263671875, -11.451904296875, -11.0142822265625, -10.57666015625, -10.1390380859375, -9.701416015625, -9.2637939453125, -8.826171875, -8.3885498046875, -7.950927734375, -7.5133056640625, -7.07568359375, -6.6380615234375, -6.200439453125, -5.7628173828125, -5.3251953125, -4.8875732421875, -4.449951171875, -4.0123291015625, -3.57470703125, -3.1370849609375, -2.699462890625, -2.2618408203125, -1.82421875, -1.3865966796875, -0.948974609375, -0.5113525390625, -0.07373046875, 0.3638916015625, 0.801513671875, 1.2391357421875, 1.6767578125, 2.1143798828125, 2.552001953125, 2.9896240234375, 3.42724609375, 3.8648681640625, 4.302490234375, 4.7401123046875, 5.177734375, 5.6153564453125, 6.052978515625, 6.4906005859375, 6.92822265625, 7.3658447265625, 7.803466796875, 8.2410888671875, 8.6787109375, 9.1163330078125, 9.553955078125, 9.9915771484375, 10.42919921875, 10.8668212890625, 11.304443359375, 11.7420654296875, 12.1796875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 6.0, 12.0, 6.0, 15.0, 18.0, 13.0, 27.0, 36.0, 40.0, 65.0, 68.0, 73.0, 95.0, 109.0, 84.0, 66.0, 61.0, 47.0, 38.0, 32.0, 17.0, 19.0, 12.0, 7.0, 6.0, 12.0, 7.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.65625, -6.3541259765625, -6.052001953125, -5.7498779296875, -5.44775390625, -5.1456298828125, -4.843505859375, -4.5413818359375, -4.2392578125, -3.9371337890625, -3.635009765625, -3.3328857421875, -3.03076171875, -2.7286376953125, -2.426513671875, -2.1243896484375, -1.822265625, -1.5201416015625, -1.218017578125, -0.9158935546875, -0.61376953125, -0.3116455078125, -0.009521484375, 0.2926025390625, 0.5947265625, 0.8968505859375, 1.198974609375, 1.5010986328125, 1.80322265625, 2.1053466796875, 2.407470703125, 2.7095947265625, 3.01171875, 3.3138427734375, 3.615966796875, 3.9180908203125, 4.22021484375, 4.5223388671875, 4.824462890625, 5.1265869140625, 5.4287109375, 5.7308349609375, 6.032958984375, 6.3350830078125, 6.63720703125, 6.9393310546875, 7.241455078125, 7.5435791015625, 7.845703125, 8.1478271484375, 8.449951171875, 8.7520751953125, 9.05419921875, 9.3563232421875, 9.658447265625, 9.9605712890625, 10.2626953125, 10.5648193359375, 10.866943359375, 11.1690673828125, 11.47119140625, 11.7733154296875, 12.075439453125, 12.3775634765625, 12.6796875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 3.0, 7.0, 11.0, 24.0, 40.0, 46.0, 90.0, 124.0, 138.0, 135.0, 127.0, 98.0, 66.0, 28.0, 32.0, 15.0, 9.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-211.49996948242188, -204.92770385742188, -198.35545349121094, -191.78318786621094, -185.21092224121094, -178.638671875, -172.06640625, -165.494140625, -158.921875, -152.349609375, -145.77735900878906, -139.20509338378906, -132.63282775878906, -126.0605697631836, -119.48831176757812, -112.91604614257812, -106.34378814697266, -99.77153015136719, -93.19926452636719, -86.62700653076172, -80.05474090576172, -73.48248291015625, -66.91021728515625, -60.33795928955078, -53.76569747924805, -47.19343566894531, -40.62117385864258, -34.048912048339844, -27.476652145385742, -20.90439224243164, -14.332130432128906, -7.759868621826172, -1.1876068115234375, 5.384654521942139, 11.956915855407715, 18.529176712036133, 25.101438522338867, 31.67369842529297, 38.2459602355957, 44.81822204589844, 51.39048385620117, 57.962745666503906, 64.53500366210938, 71.10726928710938, 77.67952728271484, 84.25178527832031, 90.82405090332031, 97.39631652832031, 103.96857452392578, 110.54083251953125, 117.11309814453125, 123.68535614013672, 130.2576141357422, 136.8298797607422, 143.4021453857422, 149.97439575195312, 156.54666137695312, 163.11892700195312, 169.69117736816406, 176.26344299316406, 182.83570861816406, 189.407958984375, 195.980224609375, 202.552490234375, 209.124755859375]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 4.0, 6.0, 8.0, 5.0, 8.0, 10.0, 22.0, 15.0, 19.0, 22.0, 28.0, 27.0, 41.0, 45.0, 45.0, 39.0, 58.0, 37.0, 43.0, 47.0, 48.0, 66.0, 41.0, 38.0, 36.0, 47.0, 31.0, 24.0, 27.0, 23.0, 13.0, 17.0, 13.0, 11.0, 11.0, 3.0, 4.0, 5.0, 6.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-120.724609375, -116.72987365722656, -112.73514556884766, -108.74040985107422, -104.74567413330078, -100.75094604492188, -96.75621032714844, -92.761474609375, -88.76673889160156, -84.77200317382812, -80.77727508544922, -76.78253936767578, -72.78780364990234, -68.79307556152344, -64.79833984375, -60.80360412597656, -56.808876037597656, -52.814144134521484, -48.81940841674805, -44.824676513671875, -40.82994079589844, -36.835208892822266, -32.840476989746094, -28.84574317932129, -24.851009368896484, -20.85627555847168, -16.861541748046875, -12.866809844970703, -8.872076034545898, -4.877342224121094, -0.8826103210449219, 3.112123489379883, 7.1068572998046875, 11.101591110229492, 15.09632396697998, 19.09105682373047, 23.085790634155273, 27.080524444580078, 31.07525634765625, 35.06999206542969, 39.06472396850586, 43.05945587158203, 47.05419158935547, 51.04892349243164, 55.04365539550781, 59.03839111328125, 63.03312301635742, 67.0278549194336, 71.02259063720703, 75.01732635498047, 79.01205444335938, 83.00679016113281, 87.00152587890625, 90.99626159667969, 94.9909896850586, 98.98572540283203, 102.98045349121094, 106.97518920898438, 110.96991729736328, 114.96465301513672, 118.95938873291016, 122.95411682128906, 126.9488525390625, 130.94358825683594, 134.93832397460938]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 8.0, 9.0, 7.0, 21.0, 38.0, 34.0, 55.0, 58.0, 98.0, 180.0, 287.0, 493.0, 844.0, 1588.0, 3339.0, 7836.0, 22828.0, 102599.0, 3652070.0, 336811.0, 43053.0, 12459.0, 4885.0, 2190.0, 1008.0, 571.0, 320.0, 190.0, 110.0, 75.0, 48.0, 35.0, 27.0, 16.0, 11.0, 16.0, 18.0, 13.0, 5.0, 9.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.625, -46.0234375, -44.421875, -42.8203125, -41.21875, -39.6171875, -38.015625, -36.4140625, -34.8125, -33.2109375, -31.609375, -30.0078125, -28.40625, -26.8046875, -25.203125, -23.6015625, -22.0, -20.3984375, -18.796875, -17.1953125, -15.59375, -13.9921875, -12.390625, -10.7890625, -9.1875, -7.5859375, -5.984375, -4.3828125, -2.78125, -1.1796875, 0.421875, 2.0234375, 3.625, 5.2265625, 6.828125, 8.4296875, 10.03125, 11.6328125, 13.234375, 14.8359375, 16.4375, 18.0390625, 19.640625, 21.2421875, 22.84375, 24.4453125, 26.046875, 27.6484375, 29.25, 30.8515625, 32.453125, 34.0546875, 35.65625, 37.2578125, 38.859375, 40.4609375, 42.0625, 43.6640625, 45.265625, 46.8671875, 48.46875, 50.0703125, 51.671875, 53.2734375, 54.875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 7.0, 5.0, 8.0, 19.0, 15.0, 24.0, 43.0, 53.0, 65.0, 75.0, 69.0, 98.0, 100.0, 84.0, 77.0, 79.0, 58.0, 40.0, 26.0, 22.0, 9.0, 14.0, 6.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.87890625, -7.62493896484375, -7.3709716796875, -7.11700439453125, -6.863037109375, -6.60906982421875, -6.3551025390625, -6.10113525390625, -5.84716796875, -5.59320068359375, -5.3392333984375, -5.08526611328125, -4.831298828125, -4.57733154296875, -4.3233642578125, -4.06939697265625, -3.8154296875, -3.56146240234375, -3.3074951171875, -3.05352783203125, -2.799560546875, -2.54559326171875, -2.2916259765625, -2.03765869140625, -1.78369140625, -1.52972412109375, -1.2757568359375, -1.02178955078125, -0.767822265625, -0.51385498046875, -0.2598876953125, -0.00592041015625, 0.248046875, 0.50201416015625, 0.7559814453125, 1.00994873046875, 1.263916015625, 1.51788330078125, 1.7718505859375, 2.02581787109375, 2.27978515625, 2.53375244140625, 2.7877197265625, 3.04168701171875, 3.295654296875, 3.54962158203125, 3.8035888671875, 4.05755615234375, 4.3115234375, 4.56549072265625, 4.8194580078125, 5.07342529296875, 5.327392578125, 5.58135986328125, 5.8353271484375, 6.08929443359375, 6.34326171875, 6.59722900390625, 6.8511962890625, 7.10516357421875, 7.359130859375, 7.61309814453125, 7.8670654296875, 8.12103271484375, 8.375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 1.0, 5.0, 5.0, 8.0, 12.0, 12.0, 21.0, 27.0, 26.0, 36.0, 57.0, 69.0, 104.0, 166.0, 200.0, 307.0, 526.0, 922.0, 1665.0, 3151.0, 6965.0, 16274.0, 43733.0, 146577.0, 1279774.0, 2448249.0, 164017.0, 48090.0, 17865.0, 7693.0, 3468.0, 1797.0, 913.0, 546.0, 336.0, 188.0, 139.0, 95.0, 81.0, 41.0, 23.0, 25.0, 20.0, 8.0, 16.0, 7.0, 6.0, 7.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-33.03125, -32.031494140625, -31.03173828125, -30.031982421875, -29.0322265625, -28.032470703125, -27.03271484375, -26.032958984375, -25.033203125, -24.033447265625, -23.03369140625, -22.033935546875, -21.0341796875, -20.034423828125, -19.03466796875, -18.034912109375, -17.03515625, -16.035400390625, -15.03564453125, -14.035888671875, -13.0361328125, -12.036376953125, -11.03662109375, -10.036865234375, -9.037109375, -8.037353515625, -7.03759765625, -6.037841796875, -5.0380859375, -4.038330078125, -3.03857421875, -2.038818359375, -1.0390625, -0.039306640625, 0.96044921875, 1.960205078125, 2.9599609375, 3.959716796875, 4.95947265625, 5.959228515625, 6.958984375, 7.958740234375, 8.95849609375, 9.958251953125, 10.9580078125, 11.957763671875, 12.95751953125, 13.957275390625, 14.95703125, 15.956787109375, 16.95654296875, 17.956298828125, 18.9560546875, 19.955810546875, 20.95556640625, 21.955322265625, 22.955078125, 23.954833984375, 24.95458984375, 25.954345703125, 26.9541015625, 27.953857421875, 28.95361328125, 29.953369140625, 30.953125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 5.0, 6.0, 10.0, 18.0, 23.0, 32.0, 66.0, 101.0, 229.0, 555.0, 2145.0, 452.0, 155.0, 107.0, 58.0, 35.0, 29.0, 20.0, 13.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.359375, -16.8953857421875, -16.431396484375, -15.9674072265625, -15.50341796875, -15.0394287109375, -14.575439453125, -14.1114501953125, -13.6474609375, -13.1834716796875, -12.719482421875, -12.2554931640625, -11.79150390625, -11.3275146484375, -10.863525390625, -10.3995361328125, -9.935546875, -9.4715576171875, -9.007568359375, -8.5435791015625, -8.07958984375, -7.6156005859375, -7.151611328125, -6.6876220703125, -6.2236328125, -5.7596435546875, -5.295654296875, -4.8316650390625, -4.36767578125, -3.9036865234375, -3.439697265625, -2.9757080078125, -2.51171875, -2.0477294921875, -1.583740234375, -1.1197509765625, -0.65576171875, -0.1917724609375, 0.272216796875, 0.7362060546875, 1.2001953125, 1.6641845703125, 2.128173828125, 2.5921630859375, 3.05615234375, 3.5201416015625, 3.984130859375, 4.4481201171875, 4.912109375, 5.3760986328125, 5.840087890625, 6.3040771484375, 6.76806640625, 7.2320556640625, 7.696044921875, 8.1600341796875, 8.6240234375, 9.0880126953125, 9.552001953125, 10.0159912109375, 10.47998046875, 10.9439697265625, 11.407958984375, 11.8719482421875, 12.3359375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 9.0, 17.0, 27.0, 53.0, 109.0, 153.0, 180.0, 155.0, 125.0, 82.0, 50.0, 18.0, 15.0, 4.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.70103454589844, -126.7995376586914, -123.89804077148438, -120.99653625488281, -118.09503936767578, -115.19354248046875, -112.29204559326172, -109.39054870605469, -106.48904418945312, -103.5875473022461, -100.68605041503906, -97.7845458984375, -94.88304901123047, -91.98155212402344, -89.0800552368164, -86.17855834960938, -83.27706146240234, -80.37556457519531, -77.47406768798828, -74.57257080078125, -71.67106628417969, -68.76956939697266, -65.86807250976562, -62.966575622558594, -60.0650749206543, -57.163578033447266, -54.26207733154297, -51.36058044433594, -48.459083557128906, -45.55758285522461, -42.65608596801758, -39.75458526611328, -36.85308074951172, -33.95158386230469, -31.05008316040039, -28.14858627319336, -25.247087478637695, -22.34558868408203, -19.444091796875, -16.542593002319336, -13.641094207763672, -10.739595413208008, -7.83809757232666, -4.9365997314453125, -2.0351009368896484, 0.8663978576660156, 3.767894744873047, 6.669393539428711, 9.570892333984375, 12.472391128540039, 15.373888969421387, 18.275386810302734, 21.1768856048584, 24.078384399414062, 26.979881286621094, 29.881380081176758, 32.78287887573242, 35.68437576293945, 38.58587646484375, 41.48737335205078, 44.38887023925781, 47.29037094116211, 50.19186782836914, 53.09336853027344, 55.99486541748047]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 5.0, 6.0, 13.0, 16.0, 22.0, 28.0, 17.0, 24.0, 22.0, 25.0, 29.0, 46.0, 33.0, 52.0, 52.0, 56.0, 53.0, 59.0, 37.0, 51.0, 39.0, 41.0, 38.0, 37.0, 38.0, 32.0, 27.0, 23.0, 14.0, 13.0, 16.0, 12.0, 8.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.12269973754883, -40.94355010986328, -39.764404296875, -38.58525466918945, -37.40610885620117, -36.226959228515625, -35.047813415527344, -33.8686637878418, -32.68951416015625, -31.510366439819336, -30.331218719482422, -29.152070999145508, -27.972923278808594, -26.793773651123047, -25.614625930786133, -24.43547821044922, -23.256332397460938, -22.077184677124023, -20.89803695678711, -19.718889236450195, -18.53974151611328, -17.360591888427734, -16.18144416809082, -15.002296447753906, -13.823148727416992, -12.644001007080078, -11.464853286743164, -10.285704612731934, -9.10655689239502, -7.9274091720581055, -6.748260974884033, -5.569112777709961, -4.3899688720703125, -3.2108209133148193, -2.031672954559326, -0.852524995803833, 0.32662296295166016, 1.5057706832885742, 2.6849188804626465, 3.8640670776367188, 5.043214797973633, 6.222362518310547, 7.401510715484619, 8.580658912658691, 9.759806632995605, 10.93895435333252, 12.11810302734375, 13.297250747680664, 14.476398468017578, 15.655546188354492, 16.834693908691406, 18.01384162902832, 19.192989349365234, 20.37213897705078, 21.551286697387695, 22.73043441772461, 23.909582138061523, 25.088729858398438, 26.26787757873535, 27.447025299072266, 28.626174926757812, 29.805320739746094, 30.98447036743164, 32.16361999511719, 33.34276580810547]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 8.0, 13.0, 12.0, 11.0, 22.0, 30.0, 42.0, 76.0, 109.0, 115.0, 193.0, 241.0, 374.0, 644.0, 1127.0, 2273.0, 5123.0, 13063.0, 37406.0, 111186.0, 299889.0, 355985.0, 143196.0, 48151.0, 16811.0, 6356.0, 2707.0, 1329.0, 727.0, 448.0, 239.0, 199.0, 136.0, 94.0, 62.0, 36.0, 33.0, 19.0, 19.0, 8.0, 10.0, 12.0, 7.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.875, -30.882568359375, -29.89013671875, -28.897705078125, -27.9052734375, -26.912841796875, -25.92041015625, -24.927978515625, -23.935546875, -22.943115234375, -21.95068359375, -20.958251953125, -19.9658203125, -18.973388671875, -17.98095703125, -16.988525390625, -15.99609375, -15.003662109375, -14.01123046875, -13.018798828125, -12.0263671875, -11.033935546875, -10.04150390625, -9.049072265625, -8.056640625, -7.064208984375, -6.07177734375, -5.079345703125, -4.0869140625, -3.094482421875, -2.10205078125, -1.109619140625, -0.1171875, 0.875244140625, 1.86767578125, 2.860107421875, 3.8525390625, 4.844970703125, 5.83740234375, 6.829833984375, 7.822265625, 8.814697265625, 9.80712890625, 10.799560546875, 11.7919921875, 12.784423828125, 13.77685546875, 14.769287109375, 15.76171875, 16.754150390625, 17.74658203125, 18.739013671875, 19.7314453125, 20.723876953125, 21.71630859375, 22.708740234375, 23.701171875, 24.693603515625, 25.68603515625, 26.678466796875, 27.6708984375, 28.663330078125, 29.65576171875, 30.648193359375, 31.640625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 0.0, 6.0, 10.0, 7.0, 22.0, 28.0, 35.0, 47.0, 56.0, 75.0, 90.0, 102.0, 121.0, 88.0, 76.0, 76.0, 61.0, 38.0, 17.0, 22.0, 10.0, 7.0, 9.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.34375, -8.0657958984375, -7.787841796875, -7.5098876953125, -7.23193359375, -6.9539794921875, -6.676025390625, -6.3980712890625, -6.1201171875, -5.8421630859375, -5.564208984375, -5.2862548828125, -5.00830078125, -4.7303466796875, -4.452392578125, -4.1744384765625, -3.896484375, -3.6185302734375, -3.340576171875, -3.0626220703125, -2.78466796875, -2.5067138671875, -2.228759765625, -1.9508056640625, -1.6728515625, -1.3948974609375, -1.116943359375, -0.8389892578125, -0.56103515625, -0.2830810546875, -0.005126953125, 0.2728271484375, 0.55078125, 0.8287353515625, 1.106689453125, 1.3846435546875, 1.66259765625, 1.9405517578125, 2.218505859375, 2.4964599609375, 2.7744140625, 3.0523681640625, 3.330322265625, 3.6082763671875, 3.88623046875, 4.1641845703125, 4.442138671875, 4.7200927734375, 4.998046875, 5.2760009765625, 5.553955078125, 5.8319091796875, 6.10986328125, 6.3878173828125, 6.665771484375, 6.9437255859375, 7.2216796875, 7.4996337890625, 7.777587890625, 8.0555419921875, 8.33349609375, 8.6114501953125, 8.889404296875, 9.1673583984375, 9.4453125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 8.0, 8.0, 18.0, 26.0, 30.0, 40.0, 68.0, 114.0, 155.0, 254.0, 395.0, 683.0, 1058.0, 1795.0, 3520.0, 6893.0, 15314.0, 36679.0, 87755.0, 193174.0, 316057.0, 211300.0, 98146.0, 41208.0, 17380.0, 7675.0, 3787.0, 1910.0, 1126.0, 720.0, 436.0, 279.0, 196.0, 111.0, 72.0, 61.0, 35.0, 19.0, 14.0, 14.0, 5.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-20.71875, -20.08251953125, -19.4462890625, -18.81005859375, -18.173828125, -17.53759765625, -16.9013671875, -16.26513671875, -15.62890625, -14.99267578125, -14.3564453125, -13.72021484375, -13.083984375, -12.44775390625, -11.8115234375, -11.17529296875, -10.5390625, -9.90283203125, -9.2666015625, -8.63037109375, -7.994140625, -7.35791015625, -6.7216796875, -6.08544921875, -5.44921875, -4.81298828125, -4.1767578125, -3.54052734375, -2.904296875, -2.26806640625, -1.6318359375, -0.99560546875, -0.359375, 0.27685546875, 0.9130859375, 1.54931640625, 2.185546875, 2.82177734375, 3.4580078125, 4.09423828125, 4.73046875, 5.36669921875, 6.0029296875, 6.63916015625, 7.275390625, 7.91162109375, 8.5478515625, 9.18408203125, 9.8203125, 10.45654296875, 11.0927734375, 11.72900390625, 12.365234375, 13.00146484375, 13.6376953125, 14.27392578125, 14.91015625, 15.54638671875, 16.1826171875, 16.81884765625, 17.455078125, 18.09130859375, 18.7275390625, 19.36376953125, 20.0]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 6.0, 9.0, 18.0, 23.0, 19.0, 18.0, 24.0, 39.0, 41.0, 41.0, 45.0, 49.0, 48.0, 44.0, 79.0, 55.0, 54.0, 45.0, 46.0, 44.0, 41.0, 26.0, 36.0, 28.0, 19.0, 13.0, 17.0, 15.0, 15.0, 11.0, 4.0, 4.0, 4.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.96875, -18.28076171875, -17.5927734375, -16.90478515625, -16.216796875, -15.52880859375, -14.8408203125, -14.15283203125, -13.46484375, -12.77685546875, -12.0888671875, -11.40087890625, -10.712890625, -10.02490234375, -9.3369140625, -8.64892578125, -7.9609375, -7.27294921875, -6.5849609375, -5.89697265625, -5.208984375, -4.52099609375, -3.8330078125, -3.14501953125, -2.45703125, -1.76904296875, -1.0810546875, -0.39306640625, 0.294921875, 0.98291015625, 1.6708984375, 2.35888671875, 3.046875, 3.73486328125, 4.4228515625, 5.11083984375, 5.798828125, 6.48681640625, 7.1748046875, 7.86279296875, 8.55078125, 9.23876953125, 9.9267578125, 10.61474609375, 11.302734375, 11.99072265625, 12.6787109375, 13.36669921875, 14.0546875, 14.74267578125, 15.4306640625, 16.11865234375, 16.806640625, 17.49462890625, 18.1826171875, 18.87060546875, 19.55859375, 20.24658203125, 20.9345703125, 21.62255859375, 22.310546875, 22.99853515625, 23.6865234375, 24.37451171875, 25.0625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 4.0, 2.0, 8.0, 11.0, 14.0, 32.0, 25.0, 54.0, 98.0, 181.0, 321.0, 690.0, 1609.0, 4611.0, 15995.0, 67960.0, 338909.0, 470499.0, 113143.0, 23813.0, 6600.0, 2194.0, 871.0, 385.0, 200.0, 109.0, 73.0, 39.0, 32.0, 15.0, 15.0, 11.0, 12.0, 9.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-15.6015625, -15.1309814453125, -14.660400390625, -14.1898193359375, -13.71923828125, -13.2486572265625, -12.778076171875, -12.3074951171875, -11.8369140625, -11.3663330078125, -10.895751953125, -10.4251708984375, -9.95458984375, -9.4840087890625, -9.013427734375, -8.5428466796875, -8.072265625, -7.6016845703125, -7.131103515625, -6.6605224609375, -6.18994140625, -5.7193603515625, -5.248779296875, -4.7781982421875, -4.3076171875, -3.8370361328125, -3.366455078125, -2.8958740234375, -2.42529296875, -1.9547119140625, -1.484130859375, -1.0135498046875, -0.54296875, -0.0723876953125, 0.398193359375, 0.8687744140625, 1.33935546875, 1.8099365234375, 2.280517578125, 2.7510986328125, 3.2216796875, 3.6922607421875, 4.162841796875, 4.6334228515625, 5.10400390625, 5.5745849609375, 6.045166015625, 6.5157470703125, 6.986328125, 7.4569091796875, 7.927490234375, 8.3980712890625, 8.86865234375, 9.3392333984375, 9.809814453125, 10.2803955078125, 10.7509765625, 11.2215576171875, 11.692138671875, 12.1627197265625, 12.63330078125, 13.1038818359375, 13.574462890625, 14.0450439453125, 14.515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 5.0, 6.0, 7.0, 11.0, 11.0, 17.0, 23.0, 41.0, 44.0, 54.0, 102.0, 120.0, 137.0, 118.0, 90.0, 55.0, 46.0, 31.0, 20.0, 18.0, 15.0, 11.0, 4.0, 3.0, 8.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00229644775390625, -0.0022152066230773926, -0.002133965492248535, -0.0020527243614196777, -0.0019714832305908203, -0.0018902420997619629, -0.0018090009689331055, -0.001727759838104248, -0.0016465187072753906, -0.0015652775764465332, -0.0014840364456176758, -0.0014027953147888184, -0.001321554183959961, -0.0012403130531311035, -0.001159071922302246, -0.0010778307914733887, -0.0009965896606445312, -0.0009153485298156738, -0.0008341073989868164, -0.000752866268157959, -0.0006716251373291016, -0.0005903840065002441, -0.0005091428756713867, -0.0004279017448425293, -0.0003466606140136719, -0.00026541948318481445, -0.00018417835235595703, -0.00010293722152709961, -2.1696090698242188e-05, 5.9545040130615234e-05, 0.00014078617095947266, 0.00022202730178833008, 0.0003032684326171875, 0.0003845095634460449, 0.00046575069427490234, 0.0005469918251037598, 0.0006282329559326172, 0.0007094740867614746, 0.000790715217590332, 0.0008719563484191895, 0.0009531974792480469, 0.0010344386100769043, 0.0011156797409057617, 0.0011969208717346191, 0.0012781620025634766, 0.001359403133392334, 0.0014406442642211914, 0.0015218853950500488, 0.0016031265258789062, 0.0016843676567077637, 0.001765608787536621, 0.0018468499183654785, 0.001928091049194336, 0.0020093321800231934, 0.0020905733108520508, 0.002171814441680908, 0.0022530555725097656, 0.002334296703338623, 0.0024155378341674805, 0.002496778964996338, 0.0025780200958251953, 0.0026592612266540527, 0.00274050235748291, 0.0028217434883117676, 0.002902984619140625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 5.0, 9.0, 10.0, 15.0, 20.0, 16.0, 29.0, 51.0, 88.0, 129.0, 193.0, 374.0, 660.0, 1385.0, 2882.0, 8303.0, 30649.0, 161063.0, 591567.0, 199003.0, 36291.0, 9456.0, 3253.0, 1396.0, 710.0, 406.0, 210.0, 119.0, 89.0, 52.0, 28.0, 26.0, 21.0, 12.0, 12.0, 1.0, 7.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.390625, -16.8564453125, -16.322265625, -15.7880859375, -15.25390625, -14.7197265625, -14.185546875, -13.6513671875, -13.1171875, -12.5830078125, -12.048828125, -11.5146484375, -10.98046875, -10.4462890625, -9.912109375, -9.3779296875, -8.84375, -8.3095703125, -7.775390625, -7.2412109375, -6.70703125, -6.1728515625, -5.638671875, -5.1044921875, -4.5703125, -4.0361328125, -3.501953125, -2.9677734375, -2.43359375, -1.8994140625, -1.365234375, -0.8310546875, -0.296875, 0.2373046875, 0.771484375, 1.3056640625, 1.83984375, 2.3740234375, 2.908203125, 3.4423828125, 3.9765625, 4.5107421875, 5.044921875, 5.5791015625, 6.11328125, 6.6474609375, 7.181640625, 7.7158203125, 8.25, 8.7841796875, 9.318359375, 9.8525390625, 10.38671875, 10.9208984375, 11.455078125, 11.9892578125, 12.5234375, 13.0576171875, 13.591796875, 14.1259765625, 14.66015625, 15.1943359375, 15.728515625, 16.2626953125, 16.796875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 7.0, 7.0, 8.0, 7.0, 8.0, 9.0, 14.0, 17.0, 28.0, 35.0, 43.0, 48.0, 62.0, 73.0, 67.0, 83.0, 80.0, 64.0, 80.0, 47.0, 57.0, 39.0, 25.0, 20.0, 16.0, 15.0, 12.0, 6.0, 6.0, 3.0, 7.0, 7.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1875, -6.92919921875, -6.6708984375, -6.41259765625, -6.154296875, -5.89599609375, -5.6376953125, -5.37939453125, -5.12109375, -4.86279296875, -4.6044921875, -4.34619140625, -4.087890625, -3.82958984375, -3.5712890625, -3.31298828125, -3.0546875, -2.79638671875, -2.5380859375, -2.27978515625, -2.021484375, -1.76318359375, -1.5048828125, -1.24658203125, -0.98828125, -0.72998046875, -0.4716796875, -0.21337890625, 0.044921875, 0.30322265625, 0.5615234375, 0.81982421875, 1.078125, 1.33642578125, 1.5947265625, 1.85302734375, 2.111328125, 2.36962890625, 2.6279296875, 2.88623046875, 3.14453125, 3.40283203125, 3.6611328125, 3.91943359375, 4.177734375, 4.43603515625, 4.6943359375, 4.95263671875, 5.2109375, 5.46923828125, 5.7275390625, 5.98583984375, 6.244140625, 6.50244140625, 6.7607421875, 7.01904296875, 7.27734375, 7.53564453125, 7.7939453125, 8.05224609375, 8.310546875, 8.56884765625, 8.8271484375, 9.08544921875, 9.34375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 6.0, 6.0, 10.0, 11.0, 17.0, 26.0, 41.0, 51.0, 56.0, 64.0, 104.0, 106.0, 98.0, 94.0, 71.0, 84.0, 49.0, 42.0, 21.0, 17.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.43487548828125, -136.9160919189453, -132.39732360839844, -127.8785400390625, -123.3597640991211, -118.84098815917969, -114.32220458984375, -109.80342864990234, -105.28465270996094, -100.76587677001953, -96.2470932006836, -91.72831726074219, -87.20954132080078, -82.69076538085938, -78.17198181152344, -73.65320587158203, -69.1344223022461, -64.61564636230469, -60.096866607666016, -55.578086853027344, -51.05931091308594, -46.540531158447266, -42.021751403808594, -37.50297546386719, -32.984195709228516, -28.465417861938477, -23.946640014648438, -19.427860260009766, -14.909082412719727, -10.390304565429688, -5.871524810791016, -1.3527469635009766, 3.1660308837890625, 7.68480920791626, 12.203587532043457, 16.722366333007812, 21.24114418029785, 25.75992202758789, 30.278701782226562, 34.79747772216797, 39.31625747680664, 43.83503723144531, 48.35381317138672, 52.87259292602539, 57.39137268066406, 61.91014862060547, 66.42892456054688, 70.94770812988281, 75.46648406982422, 79.98526000976562, 84.50404357910156, 89.02281951904297, 93.54159545898438, 98.06037902832031, 102.57915496826172, 107.09793090820312, 111.61671447753906, 116.13549041748047, 120.6542739868164, 125.17304992675781, 129.69183349609375, 134.21060180664062, 138.72938537597656, 143.2481689453125, 147.76693725585938]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 6.0, 4.0, 6.0, 7.0, 2.0, 8.0, 10.0, 9.0, 26.0, 14.0, 27.0, 23.0, 26.0, 31.0, 39.0, 37.0, 38.0, 45.0, 40.0, 34.0, 56.0, 33.0, 41.0, 34.0, 47.0, 55.0, 40.0, 34.0, 35.0, 34.0, 26.0, 23.0, 13.0, 20.0, 14.0, 16.0, 12.0, 10.0, 9.0, 4.0, 3.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.88111877441406, -95.6190185546875, -92.35691833496094, -89.09481811523438, -85.83271026611328, -82.57061004638672, -79.30850982666016, -76.0464096069336, -72.7843017578125, -69.52220153808594, -66.26010131835938, -62.99799728393555, -59.73589324951172, -56.473793029785156, -53.211692810058594, -49.94959259033203, -46.68749237060547, -43.425392150878906, -40.16328811645508, -36.901187896728516, -33.63908386230469, -30.376983642578125, -27.114883422851562, -23.852781295776367, -20.590679168701172, -17.328577041625977, -14.066475868225098, -10.804374694824219, -7.542272567749023, -4.280170440673828, -1.0180702209472656, 2.2440319061279297, 5.506134033203125, 8.76823616027832, 12.0303373336792, 15.292438507080078, 18.554540634155273, 21.81664276123047, 25.07874298095703, 28.340845108032227, 31.602947235107422, 34.865047454833984, 38.12715148925781, 41.389251708984375, 44.65135192871094, 47.913455963134766, 51.17555618286133, 54.437660217285156, 57.69976043701172, 60.96186065673828, 64.22396087646484, 67.48606872558594, 70.7481689453125, 74.01026916503906, 77.27236938476562, 80.53446960449219, 83.79656982421875, 87.05867004394531, 90.32077026367188, 93.58287048339844, 96.84497833251953, 100.1070785522461, 103.36917877197266, 106.63127899169922, 109.89338684082031]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 5.0, 11.0, 16.0, 21.0, 14.0, 30.0, 43.0, 57.0, 112.0, 164.0, 267.0, 478.0, 904.0, 1771.0, 3656.0, 8923.0, 26100.0, 107766.0, 2593141.0, 1314425.0, 97563.0, 23821.0, 8198.0, 3402.0, 1500.0, 750.0, 427.0, 225.0, 135.0, 92.0, 70.0, 37.0, 37.0, 27.0, 17.0, 13.0, 13.0, 11.0, 10.0, 8.0, 6.0, 2.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-41.6875, -40.29638671875, -38.9052734375, -37.51416015625, -36.123046875, -34.73193359375, -33.3408203125, -31.94970703125, -30.55859375, -29.16748046875, -27.7763671875, -26.38525390625, -24.994140625, -23.60302734375, -22.2119140625, -20.82080078125, -19.4296875, -18.03857421875, -16.6474609375, -15.25634765625, -13.865234375, -12.47412109375, -11.0830078125, -9.69189453125, -8.30078125, -6.90966796875, -5.5185546875, -4.12744140625, -2.736328125, -1.34521484375, 0.0458984375, 1.43701171875, 2.828125, 4.21923828125, 5.6103515625, 7.00146484375, 8.392578125, 9.78369140625, 11.1748046875, 12.56591796875, 13.95703125, 15.34814453125, 16.7392578125, 18.13037109375, 19.521484375, 20.91259765625, 22.3037109375, 23.69482421875, 25.0859375, 26.47705078125, 27.8681640625, 29.25927734375, 30.650390625, 32.04150390625, 33.4326171875, 34.82373046875, 36.21484375, 37.60595703125, 38.9970703125, 40.38818359375, 41.779296875, 43.17041015625, 44.5615234375, 45.95263671875, 47.34375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 7.0, 3.0, 11.0, 18.0, 30.0, 29.0, 46.0, 66.0, 68.0, 93.0, 89.0, 109.0, 98.0, 72.0, 79.0, 71.0, 37.0, 36.0, 20.0, 11.0, 4.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8671875, -8.591552734375, -8.31591796875, -8.040283203125, -7.7646484375, -7.489013671875, -7.21337890625, -6.937744140625, -6.662109375, -6.386474609375, -6.11083984375, -5.835205078125, -5.5595703125, -5.283935546875, -5.00830078125, -4.732666015625, -4.45703125, -4.181396484375, -3.90576171875, -3.630126953125, -3.3544921875, -3.078857421875, -2.80322265625, -2.527587890625, -2.251953125, -1.976318359375, -1.70068359375, -1.425048828125, -1.1494140625, -0.873779296875, -0.59814453125, -0.322509765625, -0.046875, 0.228759765625, 0.50439453125, 0.780029296875, 1.0556640625, 1.331298828125, 1.60693359375, 1.882568359375, 2.158203125, 2.433837890625, 2.70947265625, 2.985107421875, 3.2607421875, 3.536376953125, 3.81201171875, 4.087646484375, 4.36328125, 4.638916015625, 4.91455078125, 5.190185546875, 5.4658203125, 5.741455078125, 6.01708984375, 6.292724609375, 6.568359375, 6.843994140625, 7.11962890625, 7.395263671875, 7.6708984375, 7.946533203125, 8.22216796875, 8.497802734375, 8.7734375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 11.0, 15.0, 26.0, 46.0, 69.0, 103.0, 155.0, 264.0, 493.0, 983.0, 2519.0, 8486.0, 44795.0, 708405.0, 3302595.0, 103714.0, 14623.0, 3831.0, 1508.0, 703.0, 375.0, 219.0, 106.0, 94.0, 50.0, 29.0, 24.0, 11.0, 13.0, 2.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-63.21875, -61.369140625, -59.51953125, -57.669921875, -55.8203125, -53.970703125, -52.12109375, -50.271484375, -48.421875, -46.572265625, -44.72265625, -42.873046875, -41.0234375, -39.173828125, -37.32421875, -35.474609375, -33.625, -31.775390625, -29.92578125, -28.076171875, -26.2265625, -24.376953125, -22.52734375, -20.677734375, -18.828125, -16.978515625, -15.12890625, -13.279296875, -11.4296875, -9.580078125, -7.73046875, -5.880859375, -4.03125, -2.181640625, -0.33203125, 1.517578125, 3.3671875, 5.216796875, 7.06640625, 8.916015625, 10.765625, 12.615234375, 14.46484375, 16.314453125, 18.1640625, 20.013671875, 21.86328125, 23.712890625, 25.5625, 27.412109375, 29.26171875, 31.111328125, 32.9609375, 34.810546875, 36.66015625, 38.509765625, 40.359375, 42.208984375, 44.05859375, 45.908203125, 47.7578125, 49.607421875, 51.45703125, 53.306640625, 55.15625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 6.0, 14.0, 14.0, 32.0, 83.0, 133.0, 341.0, 1258.0, 1475.0, 376.0, 158.0, 82.0, 33.0, 27.0, 14.0, 11.0, 4.0, 5.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.53125, -19.742431640625, -18.95361328125, -18.164794921875, -17.3759765625, -16.587158203125, -15.79833984375, -15.009521484375, -14.220703125, -13.431884765625, -12.64306640625, -11.854248046875, -11.0654296875, -10.276611328125, -9.48779296875, -8.698974609375, -7.91015625, -7.121337890625, -6.33251953125, -5.543701171875, -4.7548828125, -3.966064453125, -3.17724609375, -2.388427734375, -1.599609375, -0.810791015625, -0.02197265625, 0.766845703125, 1.5556640625, 2.344482421875, 3.13330078125, 3.922119140625, 4.7109375, 5.499755859375, 6.28857421875, 7.077392578125, 7.8662109375, 8.655029296875, 9.44384765625, 10.232666015625, 11.021484375, 11.810302734375, 12.59912109375, 13.387939453125, 14.1767578125, 14.965576171875, 15.75439453125, 16.543212890625, 17.33203125, 18.120849609375, 18.90966796875, 19.698486328125, 20.4873046875, 21.276123046875, 22.06494140625, 22.853759765625, 23.642578125, 24.431396484375, 25.22021484375, 26.009033203125, 26.7978515625, 27.586669921875, 28.37548828125, 29.164306640625, 29.953125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 9.0, 19.0, 29.0, 52.0, 81.0, 112.0, 134.0, 138.0, 126.0, 99.0, 81.0, 44.0, 28.0, 21.0, 12.0, 7.0, 3.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-127.51722717285156, -123.79232788085938, -120.06743621826172, -116.34253692626953, -112.61764526367188, -108.89274597167969, -105.1678466796875, -101.44294738769531, -97.71805572509766, -93.99315643310547, -90.26826477050781, -86.54336547851562, -82.81846618652344, -79.09357452392578, -75.3686752319336, -71.64378356933594, -67.91888427734375, -64.19398498535156, -60.469093322753906, -56.74419403076172, -53.0192985534668, -49.294403076171875, -45.56950378417969, -41.844608306884766, -38.119712829589844, -34.39481735229492, -30.669919967651367, -26.945022583007812, -23.22012710571289, -19.49523162841797, -15.770334243774414, -12.04543685913086, -8.320549011230469, -4.5956525802612305, -0.8707561492919922, 2.854140281677246, 6.579036712646484, 10.303932189941406, 14.028829574584961, 17.753726959228516, 21.478622436523438, 25.20351791381836, 28.928415298461914, 32.65331268310547, 36.37820816040039, 40.10310363769531, 43.8280029296875, 47.55289840698242, 51.277793884277344, 55.002689361572266, 58.72758483886719, 62.452484130859375, 66.17738342285156, 69.90227508544922, 73.6271743774414, 77.35206604003906, 81.07696533203125, 84.80186462402344, 88.5267562866211, 92.25165557861328, 95.97654724121094, 99.70144653320312, 103.42634582519531, 107.1512451171875, 110.87613677978516]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 6.0, 7.0, 5.0, 13.0, 23.0, 24.0, 30.0, 54.0, 58.0, 63.0, 62.0, 68.0, 85.0, 96.0, 88.0, 61.0, 64.0, 48.0, 34.0, 35.0, 21.0, 17.0, 20.0, 13.0, 3.0, 1.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.40766143798828, -96.59231567382812, -93.77696228027344, -90.96161651611328, -88.14627075195312, -85.33092498779297, -82.51557922363281, -79.70022583007812, -76.88488006591797, -74.06953430175781, -71.25418090820312, -68.43883514404297, -65.62348937988281, -62.808143615722656, -59.992794036865234, -57.17744445800781, -54.362098693847656, -51.5467529296875, -48.73140335083008, -45.916053771972656, -43.1007080078125, -40.285362243652344, -37.47001266479492, -34.6546630859375, -31.839317321777344, -29.023969650268555, -26.208621978759766, -23.393274307250977, -20.577926635742188, -17.7625789642334, -14.94723129272461, -12.13188362121582, -9.3165283203125, -6.501180648803711, -3.685832977294922, -0.8704853057861328, 1.9448623657226562, 4.760210037231445, 7.575557708740234, 10.390905380249023, 13.206253051757812, 16.0216007232666, 18.83694839477539, 21.65229606628418, 24.46764373779297, 27.282991409301758, 30.098339080810547, 32.91368865966797, 35.729034423828125, 38.54438018798828, 41.3597297668457, 44.175079345703125, 46.99042510986328, 49.80577087402344, 52.62112045288086, 55.43647003173828, 58.25181579589844, 61.067161560058594, 63.882511138916016, 66.69786071777344, 69.5132064819336, 72.32855224609375, 75.14390563964844, 77.9592514038086, 80.77459716796875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 7.0, 10.0, 15.0, 24.0, 50.0, 85.0, 106.0, 238.0, 374.0, 715.0, 1457.0, 3838.0, 16806.0, 112253.0, 629587.0, 239385.0, 33373.0, 6194.0, 1991.0, 934.0, 471.0, 267.0, 146.0, 90.0, 56.0, 31.0, 16.0, 7.0, 8.0, 2.0, 4.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0], "bins": [-82.1875, -80.11669921875, -78.0458984375, -75.97509765625, -73.904296875, -71.83349609375, -69.7626953125, -67.69189453125, -65.62109375, -63.55029296875, -61.4794921875, -59.40869140625, -57.337890625, -55.26708984375, -53.1962890625, -51.12548828125, -49.0546875, -46.98388671875, -44.9130859375, -42.84228515625, -40.771484375, -38.70068359375, -36.6298828125, -34.55908203125, -32.48828125, -30.41748046875, -28.3466796875, -26.27587890625, -24.205078125, -22.13427734375, -20.0634765625, -17.99267578125, -15.921875, -13.85107421875, -11.7802734375, -9.70947265625, -7.638671875, -5.56787109375, -3.4970703125, -1.42626953125, 0.64453125, 2.71533203125, 4.7861328125, 6.85693359375, 8.927734375, 10.99853515625, 13.0693359375, 15.14013671875, 17.2109375, 19.28173828125, 21.3525390625, 23.42333984375, 25.494140625, 27.56494140625, 29.6357421875, 31.70654296875, 33.77734375, 35.84814453125, 37.9189453125, 39.98974609375, 42.060546875, 44.13134765625, 46.2021484375, 48.27294921875, 50.34375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 11.0, 18.0, 17.0, 32.0, 54.0, 61.0, 93.0, 96.0, 113.0, 107.0, 94.0, 89.0, 69.0, 56.0, 32.0, 24.0, 19.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.3939208984375, -8.092529296875, -7.7911376953125, -7.48974609375, -7.1883544921875, -6.886962890625, -6.5855712890625, -6.2841796875, -5.9827880859375, -5.681396484375, -5.3800048828125, -5.07861328125, -4.7772216796875, -4.475830078125, -4.1744384765625, -3.873046875, -3.5716552734375, -3.270263671875, -2.9688720703125, -2.66748046875, -2.3660888671875, -2.064697265625, -1.7633056640625, -1.4619140625, -1.1605224609375, -0.859130859375, -0.5577392578125, -0.25634765625, 0.0450439453125, 0.346435546875, 0.6478271484375, 0.94921875, 1.2506103515625, 1.552001953125, 1.8533935546875, 2.15478515625, 2.4561767578125, 2.757568359375, 3.0589599609375, 3.3603515625, 3.6617431640625, 3.963134765625, 4.2645263671875, 4.56591796875, 4.8673095703125, 5.168701171875, 5.4700927734375, 5.771484375, 6.0728759765625, 6.374267578125, 6.6756591796875, 6.97705078125, 7.2784423828125, 7.579833984375, 7.8812255859375, 8.1826171875, 8.4840087890625, 8.785400390625, 9.0867919921875, 9.38818359375, 9.6895751953125, 9.990966796875, 10.2923583984375, 10.59375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 7.0, 8.0, 17.0, 17.0, 25.0, 53.0, 75.0, 135.0, 212.0, 336.0, 600.0, 1182.0, 2286.0, 4775.0, 11130.0, 26591.0, 64900.0, 156769.0, 342762.0, 254668.0, 106116.0, 43504.0, 17756.0, 7613.0, 3351.0, 1585.0, 868.0, 490.0, 274.0, 137.0, 111.0, 69.0, 43.0, 32.0, 23.0, 17.0, 9.0, 5.0, 3.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.328125, -17.691162109375, -17.05419921875, -16.417236328125, -15.7802734375, -15.143310546875, -14.50634765625, -13.869384765625, -13.232421875, -12.595458984375, -11.95849609375, -11.321533203125, -10.6845703125, -10.047607421875, -9.41064453125, -8.773681640625, -8.13671875, -7.499755859375, -6.86279296875, -6.225830078125, -5.5888671875, -4.951904296875, -4.31494140625, -3.677978515625, -3.041015625, -2.404052734375, -1.76708984375, -1.130126953125, -0.4931640625, 0.143798828125, 0.78076171875, 1.417724609375, 2.0546875, 2.691650390625, 3.32861328125, 3.965576171875, 4.6025390625, 5.239501953125, 5.87646484375, 6.513427734375, 7.150390625, 7.787353515625, 8.42431640625, 9.061279296875, 9.6982421875, 10.335205078125, 10.97216796875, 11.609130859375, 12.24609375, 12.883056640625, 13.52001953125, 14.156982421875, 14.7939453125, 15.430908203125, 16.06787109375, 16.704833984375, 17.341796875, 17.978759765625, 18.61572265625, 19.252685546875, 19.8896484375, 20.526611328125, 21.16357421875, 21.800537109375, 22.4375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 8.0, 13.0, 6.0, 15.0, 19.0, 21.0, 27.0, 12.0, 24.0, 15.0, 24.0, 33.0, 29.0, 29.0, 27.0, 35.0, 29.0, 48.0, 42.0, 35.0, 34.0, 43.0, 37.0, 28.0, 37.0, 35.0, 33.0, 33.0, 23.0, 21.0, 25.0, 11.0, 23.0, 22.0, 16.0, 8.0, 12.0, 14.0, 10.0, 2.0, 10.0, 6.0, 4.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.359375, -13.9122314453125, -13.465087890625, -13.0179443359375, -12.57080078125, -12.1236572265625, -11.676513671875, -11.2293701171875, -10.7822265625, -10.3350830078125, -9.887939453125, -9.4407958984375, -8.99365234375, -8.5465087890625, -8.099365234375, -7.6522216796875, -7.205078125, -6.7579345703125, -6.310791015625, -5.8636474609375, -5.41650390625, -4.9693603515625, -4.522216796875, -4.0750732421875, -3.6279296875, -3.1807861328125, -2.733642578125, -2.2864990234375, -1.83935546875, -1.3922119140625, -0.945068359375, -0.4979248046875, -0.05078125, 0.3963623046875, 0.843505859375, 1.2906494140625, 1.73779296875, 2.1849365234375, 2.632080078125, 3.0792236328125, 3.5263671875, 3.9735107421875, 4.420654296875, 4.8677978515625, 5.31494140625, 5.7620849609375, 6.209228515625, 6.6563720703125, 7.103515625, 7.5506591796875, 7.997802734375, 8.4449462890625, 8.89208984375, 9.3392333984375, 9.786376953125, 10.2335205078125, 10.6806640625, 11.1278076171875, 11.574951171875, 12.0220947265625, 12.46923828125, 12.9163818359375, 13.363525390625, 13.8106689453125, 14.2578125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 6.0, 11.0, 4.0, 8.0, 15.0, 25.0, 31.0, 80.0, 110.0, 199.0, 406.0, 804.0, 1911.0, 5373.0, 19338.0, 98804.0, 519117.0, 331120.0, 52741.0, 12033.0, 3717.0, 1374.0, 624.0, 313.0, 152.0, 116.0, 58.0, 18.0, 21.0, 9.0, 8.0, 6.0, 5.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.46875, -17.888427734375, -17.30810546875, -16.727783203125, -16.1474609375, -15.567138671875, -14.98681640625, -14.406494140625, -13.826171875, -13.245849609375, -12.66552734375, -12.085205078125, -11.5048828125, -10.924560546875, -10.34423828125, -9.763916015625, -9.18359375, -8.603271484375, -8.02294921875, -7.442626953125, -6.8623046875, -6.281982421875, -5.70166015625, -5.121337890625, -4.541015625, -3.960693359375, -3.38037109375, -2.800048828125, -2.2197265625, -1.639404296875, -1.05908203125, -0.478759765625, 0.1015625, 0.681884765625, 1.26220703125, 1.842529296875, 2.4228515625, 3.003173828125, 3.58349609375, 4.163818359375, 4.744140625, 5.324462890625, 5.90478515625, 6.485107421875, 7.0654296875, 7.645751953125, 8.22607421875, 8.806396484375, 9.38671875, 9.967041015625, 10.54736328125, 11.127685546875, 11.7080078125, 12.288330078125, 12.86865234375, 13.448974609375, 14.029296875, 14.609619140625, 15.18994140625, 15.770263671875, 16.3505859375, 16.930908203125, 17.51123046875, 18.091552734375, 18.671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 5.0, 2.0, 5.0, 8.0, 3.0, 8.0, 15.0, 17.0, 15.0, 22.0, 29.0, 35.0, 62.0, 52.0, 89.0, 113.0, 117.0, 96.0, 56.0, 47.0, 46.0, 31.0, 17.0, 21.0, 16.0, 20.0, 13.0, 6.0, 8.0, 5.0, 3.0, 4.0, 2.0, 4.0, 4.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.002231597900390625, -0.0021696239709854126, -0.0021076500415802, -0.002045676112174988, -0.0019837021827697754, -0.001921728253364563, -0.0018597543239593506, -0.0017977803945541382, -0.0017358064651489258, -0.0016738325357437134, -0.001611858606338501, -0.0015498846769332886, -0.0014879107475280762, -0.0014259368181228638, -0.0013639628887176514, -0.001301988959312439, -0.0012400150299072266, -0.0011780411005020142, -0.0011160671710968018, -0.0010540932416915894, -0.000992119312286377, -0.0009301453828811646, -0.0008681714534759521, -0.0008061975240707397, -0.0007442235946655273, -0.0006822496652603149, -0.0006202757358551025, -0.0005583018064498901, -0.0004963278770446777, -0.00043435394763946533, -0.00037238001823425293, -0.00031040608882904053, -0.0002484321594238281, -0.00018645823001861572, -0.00012448430061340332, -6.251037120819092e-05, -5.364418029785156e-07, 6.143748760223389e-05, 0.0001234114170074463, 0.0001853853464126587, 0.0002473592758178711, 0.0003093332052230835, 0.0003713071346282959, 0.0004332810640335083, 0.0004952549934387207, 0.0005572289228439331, 0.0006192028522491455, 0.0006811767816543579, 0.0007431507110595703, 0.0008051246404647827, 0.0008670985698699951, 0.0009290724992752075, 0.00099104642868042, 0.0010530203580856323, 0.0011149942874908447, 0.0011769682168960571, 0.0012389421463012695, 0.001300916075706482, 0.0013628900051116943, 0.0014248639345169067, 0.0014868378639221191, 0.0015488117933273315, 0.001610785722732544, 0.0016727596521377563, 0.0017347335815429688]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 10.0, 11.0, 13.0, 23.0, 29.0, 51.0, 81.0, 146.0, 247.0, 455.0, 783.0, 1626.0, 3616.0, 9609.0, 31163.0, 131027.0, 484661.0, 292777.0, 63755.0, 17267.0, 6078.0, 2467.0, 1208.0, 574.0, 336.0, 203.0, 110.0, 73.0, 61.0, 27.0, 21.0, 18.0, 8.0, 5.0, 6.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0], "bins": [-15.6328125, -15.1697998046875, -14.706787109375, -14.2437744140625, -13.78076171875, -13.3177490234375, -12.854736328125, -12.3917236328125, -11.9287109375, -11.4656982421875, -11.002685546875, -10.5396728515625, -10.07666015625, -9.6136474609375, -9.150634765625, -8.6876220703125, -8.224609375, -7.7615966796875, -7.298583984375, -6.8355712890625, -6.37255859375, -5.9095458984375, -5.446533203125, -4.9835205078125, -4.5205078125, -4.0574951171875, -3.594482421875, -3.1314697265625, -2.66845703125, -2.2054443359375, -1.742431640625, -1.2794189453125, -0.81640625, -0.3533935546875, 0.109619140625, 0.5726318359375, 1.03564453125, 1.4986572265625, 1.961669921875, 2.4246826171875, 2.8876953125, 3.3507080078125, 3.813720703125, 4.2767333984375, 4.73974609375, 5.2027587890625, 5.665771484375, 6.1287841796875, 6.591796875, 7.0548095703125, 7.517822265625, 7.9808349609375, 8.44384765625, 8.9068603515625, 9.369873046875, 9.8328857421875, 10.2958984375, 10.7589111328125, 11.221923828125, 11.6849365234375, 12.14794921875, 12.6109619140625, 13.073974609375, 13.5369873046875, 14.0]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 6.0, 8.0, 6.0, 15.0, 9.0, 15.0, 25.0, 33.0, 30.0, 41.0, 77.0, 65.0, 86.0, 74.0, 100.0, 60.0, 70.0, 50.0, 42.0, 28.0, 35.0, 15.0, 23.0, 23.0, 10.0, 10.0, 13.0, 10.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.01171875, -6.74200439453125, -6.4722900390625, -6.20257568359375, -5.932861328125, -5.66314697265625, -5.3934326171875, -5.12371826171875, -4.85400390625, -4.58428955078125, -4.3145751953125, -4.04486083984375, -3.775146484375, -3.50543212890625, -3.2357177734375, -2.96600341796875, -2.6962890625, -2.42657470703125, -2.1568603515625, -1.88714599609375, -1.617431640625, -1.34771728515625, -1.0780029296875, -0.80828857421875, -0.53857421875, -0.26885986328125, 0.0008544921875, 0.27056884765625, 0.540283203125, 0.80999755859375, 1.0797119140625, 1.34942626953125, 1.619140625, 1.88885498046875, 2.1585693359375, 2.42828369140625, 2.697998046875, 2.96771240234375, 3.2374267578125, 3.50714111328125, 3.77685546875, 4.04656982421875, 4.3162841796875, 4.58599853515625, 4.855712890625, 5.12542724609375, 5.3951416015625, 5.66485595703125, 5.9345703125, 6.20428466796875, 6.4739990234375, 6.74371337890625, 7.013427734375, 7.28314208984375, 7.5528564453125, 7.82257080078125, 8.09228515625, 8.36199951171875, 8.6317138671875, 8.90142822265625, 9.171142578125, 9.44085693359375, 9.7105712890625, 9.98028564453125, 10.25]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 6.0, 5.0, 5.0, 9.0, 5.0, 17.0, 20.0, 25.0, 26.0, 45.0, 42.0, 51.0, 72.0, 63.0, 78.0, 90.0, 91.0, 70.0, 65.0, 50.0, 38.0, 36.0, 27.0, 16.0, 9.0, 13.0, 7.0, 4.0, 3.0, 3.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-125.41755676269531, -121.87175750732422, -118.3259506225586, -114.7801513671875, -111.2343521118164, -107.68855285644531, -104.14274597167969, -100.5969467163086, -97.0511474609375, -93.5053482055664, -89.95954132080078, -86.41374206542969, -82.8679428100586, -79.3221435546875, -75.77633666992188, -72.23053741455078, -68.68473815917969, -65.1389389038086, -61.593135833740234, -58.047332763671875, -54.50153350830078, -50.95573043823242, -47.40992736816406, -43.86412811279297, -40.318321228027344, -36.772518157958984, -33.22671890258789, -29.68091583251953, -26.135116577148438, -22.589313507080078, -19.04351234436035, -15.497711181640625, -11.951911926269531, -8.406110763549805, -4.86030912399292, -1.3145074844360352, 2.2312936782836914, 5.777095794677734, 9.322896957397461, 12.868698120117188, 16.414499282836914, 19.96030044555664, 23.506101608276367, 27.051902770996094, 30.597705841064453, 34.14350891113281, 37.689308166503906, 41.235107421875, 44.78091049194336, 48.32671356201172, 51.87251281738281, 55.41831588745117, 58.964115142822266, 62.509918212890625, 66.05571746826172, 69.60151672363281, 73.14732360839844, 76.69312286376953, 80.23892974853516, 83.78472900390625, 87.33052825927734, 90.87632751464844, 94.42213439941406, 97.96793365478516, 101.51373291015625]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 6.0, 17.0, 15.0, 17.0, 26.0, 29.0, 29.0, 29.0, 54.0, 39.0, 54.0, 69.0, 53.0, 59.0, 66.0, 57.0, 56.0, 36.0, 35.0, 34.0, 33.0, 30.0, 30.0, 20.0, 22.0, 25.0, 12.0, 12.0, 13.0, 5.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.90045166015625, -116.26812744140625, -112.63581085205078, -109.00348663330078, -105.37116241455078, -101.73884582519531, -98.10652160644531, -94.47419738769531, -90.84187316894531, -87.20954895019531, -83.57723236083984, -79.94490814208984, -76.31258392333984, -72.68026733398438, -69.04794311523438, -65.41561889648438, -61.78329849243164, -58.150978088378906, -54.518653869628906, -50.88633346557617, -47.25400924682617, -43.62168884277344, -39.98936462402344, -36.3570442199707, -32.72472381591797, -29.0924015045166, -25.460079193115234, -21.8277587890625, -18.1954345703125, -14.563114166259766, -10.930791854858398, -7.298469543457031, -3.6661453247070312, -0.033823251724243164, 3.598498821258545, 7.230820655822754, 10.863142967224121, 14.495464324951172, 18.12778663635254, 21.760108947753906, 25.392431259155273, 29.02475357055664, 32.657073974609375, 36.289398193359375, 39.92171859741211, 43.554039001464844, 47.186363220214844, 50.818687438964844, 54.45100784301758, 58.08332824707031, 61.71565246582031, 65.34797668457031, 68.98029327392578, 72.61261749267578, 76.24494171142578, 79.87725830078125, 83.50958251953125, 87.14190673828125, 90.77422332763672, 94.40654754638672, 98.03887176513672, 101.67118835449219, 105.30351257324219, 108.93583679199219, 112.56816101074219]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 5.0, 6.0, 6.0, 14.0, 18.0, 29.0, 48.0, 78.0, 135.0, 296.0, 572.0, 1656.0, 5785.0, 46577.0, 3968622.0, 156142.0, 10570.0, 2219.0, 761.0, 341.0, 174.0, 82.0, 46.0, 29.0, 16.0, 15.0, 11.0, 8.0, 6.0, 2.0, 1.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.5625, -62.5380859375, -59.513671875, -56.4892578125, -53.46484375, -50.4404296875, -47.416015625, -44.3916015625, -41.3671875, -38.3427734375, -35.318359375, -32.2939453125, -29.26953125, -26.2451171875, -23.220703125, -20.1962890625, -17.171875, -14.1474609375, -11.123046875, -8.0986328125, -5.07421875, -2.0498046875, 0.974609375, 3.9990234375, 7.0234375, 10.0478515625, 13.072265625, 16.0966796875, 19.12109375, 22.1455078125, 25.169921875, 28.1943359375, 31.21875, 34.2431640625, 37.267578125, 40.2919921875, 43.31640625, 46.3408203125, 49.365234375, 52.3896484375, 55.4140625, 58.4384765625, 61.462890625, 64.4873046875, 67.51171875, 70.5361328125, 73.560546875, 76.5849609375, 79.609375, 82.6337890625, 85.658203125, 88.6826171875, 91.70703125, 94.7314453125, 97.755859375, 100.7802734375, 103.8046875, 106.8291015625, 109.853515625, 112.8779296875, 115.90234375, 118.9267578125, 121.951171875, 124.9755859375, 128.0]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 4.0, 3.0, 2.0, 4.0, 7.0, 22.0, 14.0, 21.0, 44.0, 52.0, 72.0, 71.0, 109.0, 109.0, 103.0, 87.0, 87.0, 48.0, 47.0, 46.0, 24.0, 11.0, 6.0, 7.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8046875, -8.5072021484375, -8.209716796875, -7.9122314453125, -7.61474609375, -7.3172607421875, -7.019775390625, -6.7222900390625, -6.4248046875, -6.1273193359375, -5.829833984375, -5.5323486328125, -5.23486328125, -4.9373779296875, -4.639892578125, -4.3424072265625, -4.044921875, -3.7474365234375, -3.449951171875, -3.1524658203125, -2.85498046875, -2.5574951171875, -2.260009765625, -1.9625244140625, -1.6650390625, -1.3675537109375, -1.070068359375, -0.7725830078125, -0.47509765625, -0.1776123046875, 0.119873046875, 0.4173583984375, 0.71484375, 1.0123291015625, 1.309814453125, 1.6072998046875, 1.90478515625, 2.2022705078125, 2.499755859375, 2.7972412109375, 3.0947265625, 3.3922119140625, 3.689697265625, 3.9871826171875, 4.28466796875, 4.5821533203125, 4.879638671875, 5.1771240234375, 5.474609375, 5.7720947265625, 6.069580078125, 6.3670654296875, 6.66455078125, 6.9620361328125, 7.259521484375, 7.5570068359375, 7.8544921875, 8.1519775390625, 8.449462890625, 8.7469482421875, 9.04443359375, 9.3419189453125, 9.639404296875, 9.9368896484375, 10.234375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 5.0, 5.0, 11.0, 10.0, 10.0, 15.0, 13.0, 19.0, 23.0, 28.0, 45.0, 93.0, 190.0, 383.0, 788.0, 1839.0, 4816.0, 14791.0, 57840.0, 363705.0, 3392602.0, 286309.0, 49689.0, 13083.0, 4485.0, 1735.0, 811.0, 384.0, 197.0, 111.0, 68.0, 56.0, 30.0, 23.0, 22.0, 17.0, 6.0, 3.0, 2.0, 10.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-37.0625, -35.986572265625, -34.91064453125, -33.834716796875, -32.7587890625, -31.682861328125, -30.60693359375, -29.531005859375, -28.455078125, -27.379150390625, -26.30322265625, -25.227294921875, -24.1513671875, -23.075439453125, -21.99951171875, -20.923583984375, -19.84765625, -18.771728515625, -17.69580078125, -16.619873046875, -15.5439453125, -14.468017578125, -13.39208984375, -12.316162109375, -11.240234375, -10.164306640625, -9.08837890625, -8.012451171875, -6.9365234375, -5.860595703125, -4.78466796875, -3.708740234375, -2.6328125, -1.556884765625, -0.48095703125, 0.594970703125, 1.6708984375, 2.746826171875, 3.82275390625, 4.898681640625, 5.974609375, 7.050537109375, 8.12646484375, 9.202392578125, 10.2783203125, 11.354248046875, 12.43017578125, 13.506103515625, 14.58203125, 15.657958984375, 16.73388671875, 17.809814453125, 18.8857421875, 19.961669921875, 21.03759765625, 22.113525390625, 23.189453125, 24.265380859375, 25.34130859375, 26.417236328125, 27.4931640625, 28.569091796875, 29.64501953125, 30.720947265625, 31.796875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 9.0, 10.0, 21.0, 29.0, 44.0, 59.0, 69.0, 127.0, 210.0, 414.0, 1583.0, 703.0, 293.0, 171.0, 101.0, 62.0, 55.0, 35.0, 16.0, 12.0, 13.0, 7.0, 4.0, 4.0, 3.0, 1.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.6875, -10.3399658203125, -9.992431640625, -9.6448974609375, -9.29736328125, -8.9498291015625, -8.602294921875, -8.2547607421875, -7.9072265625, -7.5596923828125, -7.212158203125, -6.8646240234375, -6.51708984375, -6.1695556640625, -5.822021484375, -5.4744873046875, -5.126953125, -4.7794189453125, -4.431884765625, -4.0843505859375, -3.73681640625, -3.3892822265625, -3.041748046875, -2.6942138671875, -2.3466796875, -1.9991455078125, -1.651611328125, -1.3040771484375, -0.95654296875, -0.6090087890625, -0.261474609375, 0.0860595703125, 0.43359375, 0.7811279296875, 1.128662109375, 1.4761962890625, 1.82373046875, 2.1712646484375, 2.518798828125, 2.8663330078125, 3.2138671875, 3.5614013671875, 3.908935546875, 4.2564697265625, 4.60400390625, 4.9515380859375, 5.299072265625, 5.6466064453125, 5.994140625, 6.3416748046875, 6.689208984375, 7.0367431640625, 7.38427734375, 7.7318115234375, 8.079345703125, 8.4268798828125, 8.7744140625, 9.1219482421875, 9.469482421875, 9.8170166015625, 10.16455078125, 10.5120849609375, 10.859619140625, 11.2071533203125, 11.5546875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 9.0, 13.0, 15.0, 23.0, 45.0, 47.0, 71.0, 72.0, 88.0, 83.0, 110.0, 111.0, 72.0, 56.0, 41.0, 26.0, 35.0, 28.0, 12.0, 8.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.73387145996094, -69.87832641601562, -68.02277374267578, -66.16722869873047, -64.31168365478516, -62.45613098144531, -60.6005859375, -58.74503707885742, -56.889488220214844, -55.033939361572266, -53.17839431762695, -51.322845458984375, -49.4672966003418, -47.61174774169922, -45.756202697753906, -43.90065383911133, -42.04510498046875, -40.18955612182617, -38.33401107788086, -36.47846221923828, -34.6229133605957, -32.767364501953125, -30.911819458007812, -29.056270599365234, -27.200725555419922, -25.345178604125977, -23.4896297454834, -21.634082794189453, -19.778533935546875, -17.92298698425293, -16.067440032958984, -14.211891174316406, -12.356342315673828, -10.500794410705566, -8.645246505737305, -6.789699077606201, -4.9341511726379395, -3.078603744506836, -1.2230558395385742, 0.6324920654296875, 2.488039970397949, 4.343587875366211, 6.199135780334473, 8.054683685302734, 9.91023063659668, 11.765778541564941, 13.621326446533203, 15.476874351501465, 17.332422256469727, 19.187969207763672, 21.04351806640625, 22.899065017700195, 24.754613876342773, 26.61016082763672, 28.465709686279297, 30.321256637573242, 32.17680358886719, 34.032352447509766, 35.88789749145508, 37.743446350097656, 39.598995208740234, 41.45454406738281, 43.310089111328125, 45.1656379699707, 47.02118682861328]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 13.0, 12.0, 6.0, 13.0, 18.0, 22.0, 30.0, 31.0, 29.0, 39.0, 44.0, 47.0, 45.0, 44.0, 59.0, 44.0, 44.0, 63.0, 57.0, 43.0, 41.0, 36.0, 30.0, 46.0, 25.0, 23.0, 14.0, 17.0, 20.0, 9.0, 10.0, 8.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.77099609375, -45.430599212646484, -44.09020233154297, -42.74980545043945, -41.40940856933594, -40.069007873535156, -38.728614807128906, -37.388214111328125, -36.04781723022461, -34.707420349121094, -33.36702346801758, -32.02662658691406, -30.686227798461914, -29.3458309173584, -28.005434036254883, -26.665035247802734, -25.32464027404785, -23.984243392944336, -22.64384651184082, -21.303447723388672, -19.963050842285156, -18.62265396118164, -17.282257080078125, -15.941859245300293, -14.601462364196777, -13.261065483093262, -11.92066764831543, -10.580270767211914, -9.239873886108398, -7.899476051330566, -6.559079170227051, -5.218681335449219, -3.878284454345703, -2.5378870964050293, -1.1974899768829346, 0.14290714263916016, 1.483304500579834, 2.823701858520508, 4.164098739624023, 5.5044965744018555, 6.844893455505371, 8.185290336608887, 9.525688171386719, 10.866085052490234, 12.20648193359375, 13.546879768371582, 14.887276649475098, 16.22767448425293, 17.568071365356445, 18.90846824645996, 20.248865127563477, 21.589263916015625, 22.92966079711914, 24.270057678222656, 25.610454559326172, 26.950851440429688, 28.291248321533203, 29.63164520263672, 30.972042083740234, 32.31243896484375, 33.652835845947266, 34.99323272705078, 36.33363342285156, 37.67403030395508, 39.014427185058594]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 3.0, 5.0, 9.0, 15.0, 25.0, 26.0, 28.0, 44.0, 76.0, 123.0, 169.0, 278.0, 425.0, 720.0, 1303.0, 2895.0, 7398.0, 24327.0, 93599.0, 355478.0, 406300.0, 111195.0, 28773.0, 8646.0, 3161.0, 1444.0, 800.0, 469.0, 260.0, 176.0, 111.0, 78.0, 55.0, 35.0, 30.0, 27.0, 19.0, 10.0, 2.0, 5.0, 3.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-47.21875, -45.8720703125, -44.525390625, -43.1787109375, -41.83203125, -40.4853515625, -39.138671875, -37.7919921875, -36.4453125, -35.0986328125, -33.751953125, -32.4052734375, -31.05859375, -29.7119140625, -28.365234375, -27.0185546875, -25.671875, -24.3251953125, -22.978515625, -21.6318359375, -20.28515625, -18.9384765625, -17.591796875, -16.2451171875, -14.8984375, -13.5517578125, -12.205078125, -10.8583984375, -9.51171875, -8.1650390625, -6.818359375, -5.4716796875, -4.125, -2.7783203125, -1.431640625, -0.0849609375, 1.26171875, 2.6083984375, 3.955078125, 5.3017578125, 6.6484375, 7.9951171875, 9.341796875, 10.6884765625, 12.03515625, 13.3818359375, 14.728515625, 16.0751953125, 17.421875, 18.7685546875, 20.115234375, 21.4619140625, 22.80859375, 24.1552734375, 25.501953125, 26.8486328125, 28.1953125, 29.5419921875, 30.888671875, 32.2353515625, 33.58203125, 34.9287109375, 36.275390625, 37.6220703125, 38.96875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 5.0, 11.0, 19.0, 27.0, 30.0, 58.0, 56.0, 60.0, 90.0, 101.0, 103.0, 97.0, 89.0, 64.0, 51.0, 42.0, 37.0, 21.0, 13.0, 10.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5390625, -8.2462158203125, -7.953369140625, -7.6605224609375, -7.36767578125, -7.0748291015625, -6.781982421875, -6.4891357421875, -6.1962890625, -5.9034423828125, -5.610595703125, -5.3177490234375, -5.02490234375, -4.7320556640625, -4.439208984375, -4.1463623046875, -3.853515625, -3.5606689453125, -3.267822265625, -2.9749755859375, -2.68212890625, -2.3892822265625, -2.096435546875, -1.8035888671875, -1.5107421875, -1.2178955078125, -0.925048828125, -0.6322021484375, -0.33935546875, -0.0465087890625, 0.246337890625, 0.5391845703125, 0.83203125, 1.1248779296875, 1.417724609375, 1.7105712890625, 2.00341796875, 2.2962646484375, 2.589111328125, 2.8819580078125, 3.1748046875, 3.4676513671875, 3.760498046875, 4.0533447265625, 4.34619140625, 4.6390380859375, 4.931884765625, 5.2247314453125, 5.517578125, 5.8104248046875, 6.103271484375, 6.3961181640625, 6.68896484375, 6.9818115234375, 7.274658203125, 7.5675048828125, 7.8603515625, 8.1531982421875, 8.446044921875, 8.7388916015625, 9.03173828125, 9.3245849609375, 9.617431640625, 9.9102783203125, 10.203125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 7.0, 5.0, 5.0, 11.0, 12.0, 18.0, 25.0, 34.0, 53.0, 87.0, 113.0, 167.0, 300.0, 499.0, 805.0, 1496.0, 3393.0, 8820.0, 25753.0, 78945.0, 239478.0, 417237.0, 180677.0, 58892.0, 19119.0, 6725.0, 2698.0, 1305.0, 666.0, 409.0, 250.0, 175.0, 110.0, 78.0, 51.0, 47.0, 19.0, 18.0, 17.0, 13.0, 7.0, 6.0, 3.0, 4.0, 2.0, 2.0, 5.0, 2.0, 2.0], "bins": [-26.984375, -26.242431640625, -25.50048828125, -24.758544921875, -24.0166015625, -23.274658203125, -22.53271484375, -21.790771484375, -21.048828125, -20.306884765625, -19.56494140625, -18.822998046875, -18.0810546875, -17.339111328125, -16.59716796875, -15.855224609375, -15.11328125, -14.371337890625, -13.62939453125, -12.887451171875, -12.1455078125, -11.403564453125, -10.66162109375, -9.919677734375, -9.177734375, -8.435791015625, -7.69384765625, -6.951904296875, -6.2099609375, -5.468017578125, -4.72607421875, -3.984130859375, -3.2421875, -2.500244140625, -1.75830078125, -1.016357421875, -0.2744140625, 0.467529296875, 1.20947265625, 1.951416015625, 2.693359375, 3.435302734375, 4.17724609375, 4.919189453125, 5.6611328125, 6.403076171875, 7.14501953125, 7.886962890625, 8.62890625, 9.370849609375, 10.11279296875, 10.854736328125, 11.5966796875, 12.338623046875, 13.08056640625, 13.822509765625, 14.564453125, 15.306396484375, 16.04833984375, 16.790283203125, 17.5322265625, 18.274169921875, 19.01611328125, 19.758056640625, 20.5]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 9.0, 7.0, 5.0, 8.0, 13.0, 22.0, 15.0, 26.0, 26.0, 28.0, 24.0, 33.0, 47.0, 56.0, 51.0, 48.0, 39.0, 52.0, 56.0, 53.0, 71.0, 60.0, 41.0, 31.0, 42.0, 32.0, 27.0, 15.0, 18.0, 12.0, 16.0, 8.0, 6.0, 4.0, 0.0, 3.0, 2.0, 1.0, 3.0], "bins": [-29.546875, -28.8427734375, -28.138671875, -27.4345703125, -26.73046875, -26.0263671875, -25.322265625, -24.6181640625, -23.9140625, -23.2099609375, -22.505859375, -21.8017578125, -21.09765625, -20.3935546875, -19.689453125, -18.9853515625, -18.28125, -17.5771484375, -16.873046875, -16.1689453125, -15.46484375, -14.7607421875, -14.056640625, -13.3525390625, -12.6484375, -11.9443359375, -11.240234375, -10.5361328125, -9.83203125, -9.1279296875, -8.423828125, -7.7197265625, -7.015625, -6.3115234375, -5.607421875, -4.9033203125, -4.19921875, -3.4951171875, -2.791015625, -2.0869140625, -1.3828125, -0.6787109375, 0.025390625, 0.7294921875, 1.43359375, 2.1376953125, 2.841796875, 3.5458984375, 4.25, 4.9541015625, 5.658203125, 6.3623046875, 7.06640625, 7.7705078125, 8.474609375, 9.1787109375, 9.8828125, 10.5869140625, 11.291015625, 11.9951171875, 12.69921875, 13.4033203125, 14.107421875, 14.8115234375, 15.515625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 5.0, 3.0, 7.0, 9.0, 17.0, 12.0, 15.0, 34.0, 48.0, 86.0, 142.0, 242.0, 428.0, 790.0, 1482.0, 2993.0, 6450.0, 15348.0, 39694.0, 115507.0, 311611.0, 342234.0, 134087.0, 45586.0, 17540.0, 7444.0, 3211.0, 1611.0, 816.0, 460.0, 235.0, 147.0, 92.0, 62.0, 31.0, 33.0, 17.0, 11.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.2734375, -9.9627685546875, -9.652099609375, -9.3414306640625, -9.03076171875, -8.7200927734375, -8.409423828125, -8.0987548828125, -7.7880859375, -7.4774169921875, -7.166748046875, -6.8560791015625, -6.54541015625, -6.2347412109375, -5.924072265625, -5.6134033203125, -5.302734375, -4.9920654296875, -4.681396484375, -4.3707275390625, -4.06005859375, -3.7493896484375, -3.438720703125, -3.1280517578125, -2.8173828125, -2.5067138671875, -2.196044921875, -1.8853759765625, -1.57470703125, -1.2640380859375, -0.953369140625, -0.6427001953125, -0.33203125, -0.0213623046875, 0.289306640625, 0.5999755859375, 0.91064453125, 1.2213134765625, 1.531982421875, 1.8426513671875, 2.1533203125, 2.4639892578125, 2.774658203125, 3.0853271484375, 3.39599609375, 3.7066650390625, 4.017333984375, 4.3280029296875, 4.638671875, 4.9493408203125, 5.260009765625, 5.5706787109375, 5.88134765625, 6.1920166015625, 6.502685546875, 6.8133544921875, 7.1240234375, 7.4346923828125, 7.745361328125, 8.0560302734375, 8.36669921875, 8.6773681640625, 8.988037109375, 9.2987060546875, 9.609375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 6.0, 7.0, 5.0, 2.0, 15.0, 19.0, 16.0, 32.0, 34.0, 60.0, 60.0, 98.0, 144.0, 126.0, 86.0, 61.0, 57.0, 39.0, 30.0, 24.0, 22.0, 17.0, 9.0, 8.0, 9.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00200653076171875, -0.0019353926181793213, -0.0018642544746398926, -0.0017931163311004639, -0.0017219781875610352, -0.0016508400440216064, -0.0015797019004821777, -0.001508563756942749, -0.0014374256134033203, -0.0013662874698638916, -0.0012951493263244629, -0.0012240111827850342, -0.0011528730392456055, -0.0010817348957061768, -0.001010596752166748, -0.0009394586086273193, -0.0008683204650878906, -0.0007971823215484619, -0.0007260441780090332, -0.0006549060344696045, -0.0005837678909301758, -0.0005126297473907471, -0.00044149160385131836, -0.00037035346031188965, -0.00029921531677246094, -0.00022807717323303223, -0.00015693902969360352, -8.58008861541748e-05, -1.4662742614746094e-05, 5.647540092468262e-05, 0.00012761354446411133, 0.00019875168800354004, 0.00026988983154296875, 0.00034102797508239746, 0.00041216611862182617, 0.0004833042621612549, 0.0005544424057006836, 0.0006255805492401123, 0.000696718692779541, 0.0007678568363189697, 0.0008389949798583984, 0.0009101331233978271, 0.0009812712669372559, 0.0010524094104766846, 0.0011235475540161133, 0.001194685697555542, 0.0012658238410949707, 0.0013369619846343994, 0.0014081001281738281, 0.0014792382717132568, 0.0015503764152526855, 0.0016215145587921143, 0.001692652702331543, 0.0017637908458709717, 0.0018349289894104004, 0.001906067132949829, 0.001977205276489258, 0.0020483434200286865, 0.0021194815635681152, 0.002190619707107544, 0.0022617578506469727, 0.0023328959941864014, 0.00240403413772583, 0.002475172281265259, 0.0025463104248046875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 4.0, 5.0, 3.0, 13.0, 19.0, 29.0, 49.0, 75.0, 114.0, 186.0, 304.0, 525.0, 1016.0, 2023.0, 4722.0, 12580.0, 39430.0, 156911.0, 477326.0, 260012.0, 62935.0, 18077.0, 6471.0, 2760.0, 1305.0, 685.0, 384.0, 215.0, 139.0, 75.0, 62.0, 31.0, 25.0, 14.0, 12.0, 5.0, 4.0, 6.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-15.484375, -15.0941162109375, -14.703857421875, -14.3135986328125, -13.92333984375, -13.5330810546875, -13.142822265625, -12.7525634765625, -12.3623046875, -11.9720458984375, -11.581787109375, -11.1915283203125, -10.80126953125, -10.4110107421875, -10.020751953125, -9.6304931640625, -9.240234375, -8.8499755859375, -8.459716796875, -8.0694580078125, -7.67919921875, -7.2889404296875, -6.898681640625, -6.5084228515625, -6.1181640625, -5.7279052734375, -5.337646484375, -4.9473876953125, -4.55712890625, -4.1668701171875, -3.776611328125, -3.3863525390625, -2.99609375, -2.6058349609375, -2.215576171875, -1.8253173828125, -1.43505859375, -1.0447998046875, -0.654541015625, -0.2642822265625, 0.1259765625, 0.5162353515625, 0.906494140625, 1.2967529296875, 1.68701171875, 2.0772705078125, 2.467529296875, 2.8577880859375, 3.248046875, 3.6383056640625, 4.028564453125, 4.4188232421875, 4.80908203125, 5.1993408203125, 5.589599609375, 5.9798583984375, 6.3701171875, 6.7603759765625, 7.150634765625, 7.5408935546875, 7.93115234375, 8.3214111328125, 8.711669921875, 9.1019287109375, 9.4921875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 2.0, 10.0, 6.0, 9.0, 18.0, 17.0, 24.0, 34.0, 31.0, 64.0, 62.0, 61.0, 95.0, 85.0, 78.0, 80.0, 80.0, 62.0, 38.0, 29.0, 20.0, 24.0, 16.0, 10.0, 7.0, 12.0, 8.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.3046875, -8.01611328125, -7.7275390625, -7.43896484375, -7.150390625, -6.86181640625, -6.5732421875, -6.28466796875, -5.99609375, -5.70751953125, -5.4189453125, -5.13037109375, -4.841796875, -4.55322265625, -4.2646484375, -3.97607421875, -3.6875, -3.39892578125, -3.1103515625, -2.82177734375, -2.533203125, -2.24462890625, -1.9560546875, -1.66748046875, -1.37890625, -1.09033203125, -0.8017578125, -0.51318359375, -0.224609375, 0.06396484375, 0.3525390625, 0.64111328125, 0.9296875, 1.21826171875, 1.5068359375, 1.79541015625, 2.083984375, 2.37255859375, 2.6611328125, 2.94970703125, 3.23828125, 3.52685546875, 3.8154296875, 4.10400390625, 4.392578125, 4.68115234375, 4.9697265625, 5.25830078125, 5.546875, 5.83544921875, 6.1240234375, 6.41259765625, 6.701171875, 6.98974609375, 7.2783203125, 7.56689453125, 7.85546875, 8.14404296875, 8.4326171875, 8.72119140625, 9.009765625, 9.29833984375, 9.5869140625, 9.87548828125, 10.1640625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 5.0, 6.0, 9.0, 8.0, 11.0, 14.0, 23.0, 36.0, 60.0, 76.0, 73.0, 93.0, 92.0, 96.0, 108.0, 82.0, 60.0, 42.0, 36.0, 19.0, 16.0, 14.0, 11.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-156.5966339111328, -152.22000122070312, -147.84336853027344, -143.46673583984375, -139.09010314941406, -134.71347045898438, -130.3368377685547, -125.960205078125, -121.58357238769531, -117.20693969726562, -112.83030700683594, -108.45367431640625, -104.07704162597656, -99.70040893554688, -95.32377624511719, -90.9471435546875, -86.57051849365234, -82.19388580322266, -77.81725311279297, -73.44062042236328, -69.0639877319336, -64.6873550415039, -60.310726165771484, -55.9340934753418, -51.55746078491211, -47.18082809448242, -42.804195404052734, -38.42756652832031, -34.050933837890625, -29.674299240112305, -25.29766845703125, -20.921035766601562, -16.544403076171875, -12.167770385742188, -7.791138648986816, -3.4145069122314453, 0.9621257781982422, 5.33875846862793, 9.715389251708984, 14.092021942138672, 18.46865463256836, 22.845287322998047, 27.221920013427734, 31.59855079650879, 35.975181579589844, 40.35181427001953, 44.72844696044922, 49.105079650878906, 53.481712341308594, 57.85834503173828, 62.23497772216797, 66.61161041259766, 70.98824310302734, 75.36487579345703, 79.74150085449219, 84.11813354492188, 88.49476623535156, 92.87139892578125, 97.24803161621094, 101.62466430664062, 106.00129699707031, 110.3779296875, 114.75456237792969, 119.13119506835938, 123.50782775878906]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 6.0, 10.0, 14.0, 10.0, 8.0, 16.0, 11.0, 21.0, 14.0, 21.0, 17.0, 24.0, 25.0, 31.0, 24.0, 47.0, 48.0, 33.0, 41.0, 35.0, 45.0, 40.0, 39.0, 35.0, 46.0, 43.0, 39.0, 27.0, 18.0, 39.0, 30.0, 15.0, 19.0, 11.0, 13.0, 14.0, 10.0, 9.0, 10.0, 7.0, 7.0, 8.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-85.59815979003906, -82.72219848632812, -79.84624481201172, -76.97028350830078, -74.09432220458984, -71.21836853027344, -68.3424072265625, -65.46644592285156, -62.590492248535156, -59.714534759521484, -56.83857345581055, -53.962615966796875, -51.0866584777832, -48.21070098876953, -45.334739685058594, -42.45878219604492, -39.582820892333984, -36.70686340332031, -33.830902099609375, -30.954944610595703, -28.07898712158203, -25.203027725219727, -22.327068328857422, -19.45111083984375, -16.575151443481445, -13.699193000793457, -10.823234558105469, -7.947275161743164, -5.071316719055176, -2.1953582763671875, 0.6806011199951172, 3.556558609008789, 6.432518005371094, 9.308476448059082, 12.18443489074707, 15.060394287109375, 17.936351776123047, 20.81231117248535, 23.688270568847656, 26.564228057861328, 29.440187454223633, 32.31614685058594, 35.19210433959961, 38.06806182861328, 40.94402313232422, 43.81998062133789, 46.69593811035156, 49.5718994140625, 52.44785690307617, 55.323814392089844, 58.19977569580078, 61.07573318481445, 63.951690673828125, 66.82765197753906, 69.70361328125, 72.5795669555664, 75.45552825927734, 78.33148956298828, 81.20744323730469, 84.08340454101562, 86.95936584472656, 89.83531951904297, 92.7112808227539, 95.58723449707031, 98.46319580078125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 5.0, 5.0, 8.0, 4.0, 8.0, 14.0, 16.0, 16.0, 25.0, 37.0, 44.0, 64.0, 98.0, 143.0, 223.0, 327.0, 535.0, 957.0, 1731.0, 3550.0, 8124.0, 21890.0, 79635.0, 665378.0, 3222135.0, 137535.0, 31867.0, 10620.0, 4370.0, 2143.0, 1080.0, 554.0, 346.0, 227.0, 151.0, 110.0, 65.0, 50.0, 35.0, 24.0, 23.0, 26.0, 14.0, 16.0, 18.0, 11.0, 6.0, 12.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-33.28125, -32.00927734375, -30.7373046875, -29.46533203125, -28.193359375, -26.92138671875, -25.6494140625, -24.37744140625, -23.10546875, -21.83349609375, -20.5615234375, -19.28955078125, -18.017578125, -16.74560546875, -15.4736328125, -14.20166015625, -12.9296875, -11.65771484375, -10.3857421875, -9.11376953125, -7.841796875, -6.56982421875, -5.2978515625, -4.02587890625, -2.75390625, -1.48193359375, -0.2099609375, 1.06201171875, 2.333984375, 3.60595703125, 4.8779296875, 6.14990234375, 7.421875, 8.69384765625, 9.9658203125, 11.23779296875, 12.509765625, 13.78173828125, 15.0537109375, 16.32568359375, 17.59765625, 18.86962890625, 20.1416015625, 21.41357421875, 22.685546875, 23.95751953125, 25.2294921875, 26.50146484375, 27.7734375, 29.04541015625, 30.3173828125, 31.58935546875, 32.861328125, 34.13330078125, 35.4052734375, 36.67724609375, 37.94921875, 39.22119140625, 40.4931640625, 41.76513671875, 43.037109375, 44.30908203125, 45.5810546875, 46.85302734375, 48.125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 7.0, 13.0, 21.0, 28.0, 44.0, 36.0, 65.0, 70.0, 79.0, 94.0, 86.0, 79.0, 67.0, 75.0, 58.0, 44.0, 48.0, 28.0, 12.0, 11.0, 5.0, 9.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.109375, -7.8416748046875, -7.573974609375, -7.3062744140625, -7.03857421875, -6.7708740234375, -6.503173828125, -6.2354736328125, -5.9677734375, -5.7000732421875, -5.432373046875, -5.1646728515625, -4.89697265625, -4.6292724609375, -4.361572265625, -4.0938720703125, -3.826171875, -3.5584716796875, -3.290771484375, -3.0230712890625, -2.75537109375, -2.4876708984375, -2.219970703125, -1.9522705078125, -1.6845703125, -1.4168701171875, -1.149169921875, -0.8814697265625, -0.61376953125, -0.3460693359375, -0.078369140625, 0.1893310546875, 0.45703125, 0.7247314453125, 0.992431640625, 1.2601318359375, 1.52783203125, 1.7955322265625, 2.063232421875, 2.3309326171875, 2.5986328125, 2.8663330078125, 3.134033203125, 3.4017333984375, 3.66943359375, 3.9371337890625, 4.204833984375, 4.4725341796875, 4.740234375, 5.0079345703125, 5.275634765625, 5.5433349609375, 5.81103515625, 6.0787353515625, 6.346435546875, 6.6141357421875, 6.8818359375, 7.1495361328125, 7.417236328125, 7.6849365234375, 7.95263671875, 8.2203369140625, 8.488037109375, 8.7557373046875, 9.0234375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 10.0, 16.0, 12.0, 19.0, 32.0, 32.0, 37.0, 72.0, 122.0, 199.0, 439.0, 1012.0, 3718.0, 24234.0, 417907.0, 3630769.0, 102526.0, 9873.0, 1911.0, 604.0, 268.0, 159.0, 88.0, 55.0, 46.0, 36.0, 30.0, 16.0, 9.0, 9.0, 4.0, 7.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0], "bins": [-71.25, -69.3388671875, -67.427734375, -65.5166015625, -63.60546875, -61.6943359375, -59.783203125, -57.8720703125, -55.9609375, -54.0498046875, -52.138671875, -50.2275390625, -48.31640625, -46.4052734375, -44.494140625, -42.5830078125, -40.671875, -38.7607421875, -36.849609375, -34.9384765625, -33.02734375, -31.1162109375, -29.205078125, -27.2939453125, -25.3828125, -23.4716796875, -21.560546875, -19.6494140625, -17.73828125, -15.8271484375, -13.916015625, -12.0048828125, -10.09375, -8.1826171875, -6.271484375, -4.3603515625, -2.44921875, -0.5380859375, 1.373046875, 3.2841796875, 5.1953125, 7.1064453125, 9.017578125, 10.9287109375, 12.83984375, 14.7509765625, 16.662109375, 18.5732421875, 20.484375, 22.3955078125, 24.306640625, 26.2177734375, 28.12890625, 30.0400390625, 31.951171875, 33.8623046875, 35.7734375, 37.6845703125, 39.595703125, 41.5068359375, 43.41796875, 45.3291015625, 47.240234375, 49.1513671875, 51.0625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 3.0, 20.0, 25.0, 75.0, 207.0, 557.0, 2189.0, 632.0, 213.0, 81.0, 36.0, 17.0, 12.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.984375, -20.053955078125, -19.12353515625, -18.193115234375, -17.2626953125, -16.332275390625, -15.40185546875, -14.471435546875, -13.541015625, -12.610595703125, -11.68017578125, -10.749755859375, -9.8193359375, -8.888916015625, -7.95849609375, -7.028076171875, -6.09765625, -5.167236328125, -4.23681640625, -3.306396484375, -2.3759765625, -1.445556640625, -0.51513671875, 0.415283203125, 1.345703125, 2.276123046875, 3.20654296875, 4.136962890625, 5.0673828125, 5.997802734375, 6.92822265625, 7.858642578125, 8.7890625, 9.719482421875, 10.64990234375, 11.580322265625, 12.5107421875, 13.441162109375, 14.37158203125, 15.302001953125, 16.232421875, 17.162841796875, 18.09326171875, 19.023681640625, 19.9541015625, 20.884521484375, 21.81494140625, 22.745361328125, 23.67578125, 24.606201171875, 25.53662109375, 26.467041015625, 27.3974609375, 28.327880859375, 29.25830078125, 30.188720703125, 31.119140625, 32.049560546875, 32.97998046875, 33.910400390625, 34.8408203125, 35.771240234375, 36.70166015625, 37.632080078125, 38.5625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 7.0, 13.0, 13.0, 27.0, 37.0, 80.0, 81.0, 98.0, 109.0, 94.0, 106.0, 92.0, 88.0, 40.0, 32.0, 29.0, 16.0, 9.0, 6.0, 6.0, 1.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-86.02826690673828, -83.38094329833984, -80.73361206054688, -78.08628845214844, -75.43896484375, -72.79164123535156, -70.14431762695312, -67.49698638916016, -64.84966278076172, -62.20233917236328, -59.55501174926758, -56.907684326171875, -54.26036071777344, -51.613037109375, -48.9657096862793, -46.318382263183594, -43.671058654785156, -41.02373504638672, -38.376407623291016, -35.72908020019531, -33.081756591796875, -30.434431076049805, -27.787105560302734, -25.139780044555664, -22.492454528808594, -19.845129013061523, -17.197803497314453, -14.550477981567383, -11.903152465820312, -9.255826950073242, -6.608501434326172, -3.9611759185791016, -1.3138427734375, 1.3334827423095703, 3.9808082580566406, 6.628133773803711, 9.275459289550781, 11.922784805297852, 14.570110321044922, 17.217435836791992, 19.864761352539062, 22.512086868286133, 25.159412384033203, 27.806737899780273, 30.454063415527344, 33.10138702392578, 35.748714447021484, 38.39604187011719, 41.043365478515625, 43.69068908691406, 46.338016510009766, 48.98534393310547, 51.632667541503906, 54.279991149902344, 56.92731857299805, 59.57464599609375, 62.22196960449219, 64.86929321289062, 67.51661682128906, 70.16394805908203, 72.81127166748047, 75.4585952758789, 78.10592651367188, 80.75325012207031, 83.40057373046875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 10.0, 3.0, 4.0, 7.0, 11.0, 6.0, 17.0, 27.0, 25.0, 24.0, 32.0, 35.0, 42.0, 47.0, 51.0, 60.0, 69.0, 55.0, 44.0, 66.0, 60.0, 36.0, 40.0, 46.0, 43.0, 27.0, 26.0, 22.0, 15.0, 16.0, 13.0, 10.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-68.8824234008789, -67.05390167236328, -65.22537994384766, -63.39685821533203, -61.568336486816406, -59.73981475830078, -57.91129684448242, -56.0827751159668, -54.25425338745117, -52.42573165893555, -50.59720993041992, -48.7686882019043, -46.94017028808594, -45.11164855957031, -43.28312683105469, -41.45460510253906, -39.62608337402344, -37.79756164550781, -35.96903991699219, -34.14051818847656, -32.31199645996094, -30.483476638793945, -28.654956817626953, -26.826435089111328, -24.997913360595703, -23.169391632080078, -21.340869903564453, -19.51235008239746, -17.683828353881836, -15.855306625366211, -14.026785850524902, -12.198265075683594, -10.369743347167969, -8.541221618652344, -6.712700843811035, -4.884179592132568, -3.0556583404541016, -1.2271366119384766, 0.601384162902832, 2.4299049377441406, 4.258426666259766, 6.086947917938232, 7.915469169616699, 9.743989944458008, 11.572511672973633, 13.401033401489258, 15.229554176330566, 17.058074951171875, 18.8865966796875, 20.715118408203125, 22.54364013671875, 24.372159957885742, 26.200681686401367, 28.029203414916992, 29.857723236083984, 31.68624496459961, 33.514766693115234, 35.34328842163086, 37.171810150146484, 39.00033187866211, 40.82884979248047, 42.657371520996094, 44.48589324951172, 46.314414978027344, 48.14293670654297]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 3.0, 9.0, 21.0, 8.0, 13.0, 30.0, 45.0, 67.0, 90.0, 152.0, 280.0, 482.0, 973.0, 2125.0, 5638.0, 18178.0, 86124.0, 594388.0, 277085.0, 44899.0, 11167.0, 3626.0, 1495.0, 677.0, 384.0, 204.0, 111.0, 86.0, 63.0, 30.0, 31.0, 19.0, 6.0, 14.0, 8.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-47.90625, -46.298828125, -44.69140625, -43.083984375, -41.4765625, -39.869140625, -38.26171875, -36.654296875, -35.046875, -33.439453125, -31.83203125, -30.224609375, -28.6171875, -27.009765625, -25.40234375, -23.794921875, -22.1875, -20.580078125, -18.97265625, -17.365234375, -15.7578125, -14.150390625, -12.54296875, -10.935546875, -9.328125, -7.720703125, -6.11328125, -4.505859375, -2.8984375, -1.291015625, 0.31640625, 1.923828125, 3.53125, 5.138671875, 6.74609375, 8.353515625, 9.9609375, 11.568359375, 13.17578125, 14.783203125, 16.390625, 17.998046875, 19.60546875, 21.212890625, 22.8203125, 24.427734375, 26.03515625, 27.642578125, 29.25, 30.857421875, 32.46484375, 34.072265625, 35.6796875, 37.287109375, 38.89453125, 40.501953125, 42.109375, 43.716796875, 45.32421875, 46.931640625, 48.5390625, 50.146484375, 51.75390625, 53.361328125, 54.96875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 10.0, 16.0, 32.0, 34.0, 53.0, 45.0, 98.0, 102.0, 103.0, 88.0, 76.0, 85.0, 68.0, 60.0, 38.0, 30.0, 18.0, 8.0, 8.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.40625, -9.1021728515625, -8.798095703125, -8.4940185546875, -8.18994140625, -7.8858642578125, -7.581787109375, -7.2777099609375, -6.9736328125, -6.6695556640625, -6.365478515625, -6.0614013671875, -5.75732421875, -5.4532470703125, -5.149169921875, -4.8450927734375, -4.541015625, -4.2369384765625, -3.932861328125, -3.6287841796875, -3.32470703125, -3.0206298828125, -2.716552734375, -2.4124755859375, -2.1083984375, -1.8043212890625, -1.500244140625, -1.1961669921875, -0.89208984375, -0.5880126953125, -0.283935546875, 0.0201416015625, 0.32421875, 0.6282958984375, 0.932373046875, 1.2364501953125, 1.54052734375, 1.8446044921875, 2.148681640625, 2.4527587890625, 2.7568359375, 3.0609130859375, 3.364990234375, 3.6690673828125, 3.97314453125, 4.2772216796875, 4.581298828125, 4.8853759765625, 5.189453125, 5.4935302734375, 5.797607421875, 6.1016845703125, 6.40576171875, 6.7098388671875, 7.013916015625, 7.3179931640625, 7.6220703125, 7.9261474609375, 8.230224609375, 8.5343017578125, 8.83837890625, 9.1424560546875, 9.446533203125, 9.7506103515625, 10.0546875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 13.0, 13.0, 16.0, 17.0, 18.0, 42.0, 48.0, 84.0, 126.0, 146.0, 264.0, 395.0, 615.0, 1152.0, 2411.0, 5648.0, 15564.0, 47542.0, 159908.0, 506126.0, 214542.0, 61121.0, 19361.0, 7126.0, 2872.0, 1407.0, 666.0, 408.0, 262.0, 176.0, 154.0, 99.0, 42.0, 50.0, 27.0, 36.0, 27.0, 10.0, 5.0, 9.0, 3.0, 2.0, 4.0, 4.0], "bins": [-30.921875, -30.14111328125, -29.3603515625, -28.57958984375, -27.798828125, -27.01806640625, -26.2373046875, -25.45654296875, -24.67578125, -23.89501953125, -23.1142578125, -22.33349609375, -21.552734375, -20.77197265625, -19.9912109375, -19.21044921875, -18.4296875, -17.64892578125, -16.8681640625, -16.08740234375, -15.306640625, -14.52587890625, -13.7451171875, -12.96435546875, -12.18359375, -11.40283203125, -10.6220703125, -9.84130859375, -9.060546875, -8.27978515625, -7.4990234375, -6.71826171875, -5.9375, -5.15673828125, -4.3759765625, -3.59521484375, -2.814453125, -2.03369140625, -1.2529296875, -0.47216796875, 0.30859375, 1.08935546875, 1.8701171875, 2.65087890625, 3.431640625, 4.21240234375, 4.9931640625, 5.77392578125, 6.5546875, 7.33544921875, 8.1162109375, 8.89697265625, 9.677734375, 10.45849609375, 11.2392578125, 12.02001953125, 12.80078125, 13.58154296875, 14.3623046875, 15.14306640625, 15.923828125, 16.70458984375, 17.4853515625, 18.26611328125, 19.046875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 8.0, 10.0, 8.0, 10.0, 19.0, 11.0, 22.0, 21.0, 13.0, 32.0, 22.0, 31.0, 42.0, 37.0, 45.0, 53.0, 41.0, 35.0, 44.0, 46.0, 46.0, 44.0, 38.0, 38.0, 40.0, 31.0, 25.0, 27.0, 22.0, 28.0, 21.0, 12.0, 7.0, 12.0, 12.0, 12.0, 6.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0], "bins": [-20.53125, -19.943359375, -19.35546875, -18.767578125, -18.1796875, -17.591796875, -17.00390625, -16.416015625, -15.828125, -15.240234375, -14.65234375, -14.064453125, -13.4765625, -12.888671875, -12.30078125, -11.712890625, -11.125, -10.537109375, -9.94921875, -9.361328125, -8.7734375, -8.185546875, -7.59765625, -7.009765625, -6.421875, -5.833984375, -5.24609375, -4.658203125, -4.0703125, -3.482421875, -2.89453125, -2.306640625, -1.71875, -1.130859375, -0.54296875, 0.044921875, 0.6328125, 1.220703125, 1.80859375, 2.396484375, 2.984375, 3.572265625, 4.16015625, 4.748046875, 5.3359375, 5.923828125, 6.51171875, 7.099609375, 7.6875, 8.275390625, 8.86328125, 9.451171875, 10.0390625, 10.626953125, 11.21484375, 11.802734375, 12.390625, 12.978515625, 13.56640625, 14.154296875, 14.7421875, 15.330078125, 15.91796875, 16.505859375, 17.09375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 4.0, 4.0, 13.0, 19.0, 23.0, 41.0, 78.0, 174.0, 296.0, 667.0, 1737.0, 5365.0, 20974.0, 124121.0, 667856.0, 188768.0, 27814.0, 6913.0, 2198.0, 754.0, 344.0, 186.0, 84.0, 46.0, 24.0, 20.0, 16.0, 8.0, 1.0, 7.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.421875, -13.91748046875, -13.4130859375, -12.90869140625, -12.404296875, -11.89990234375, -11.3955078125, -10.89111328125, -10.38671875, -9.88232421875, -9.3779296875, -8.87353515625, -8.369140625, -7.86474609375, -7.3603515625, -6.85595703125, -6.3515625, -5.84716796875, -5.3427734375, -4.83837890625, -4.333984375, -3.82958984375, -3.3251953125, -2.82080078125, -2.31640625, -1.81201171875, -1.3076171875, -0.80322265625, -0.298828125, 0.20556640625, 0.7099609375, 1.21435546875, 1.71875, 2.22314453125, 2.7275390625, 3.23193359375, 3.736328125, 4.24072265625, 4.7451171875, 5.24951171875, 5.75390625, 6.25830078125, 6.7626953125, 7.26708984375, 7.771484375, 8.27587890625, 8.7802734375, 9.28466796875, 9.7890625, 10.29345703125, 10.7978515625, 11.30224609375, 11.806640625, 12.31103515625, 12.8154296875, 13.31982421875, 13.82421875, 14.32861328125, 14.8330078125, 15.33740234375, 15.841796875, 16.34619140625, 16.8505859375, 17.35498046875, 17.859375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 3.0, 4.0, 9.0, 7.0, 16.0, 10.0, 12.0, 19.0, 12.0, 17.0, 23.0, 34.0, 62.0, 98.0, 121.0, 149.0, 127.0, 74.0, 35.0, 31.0, 24.0, 19.0, 9.0, 12.0, 7.0, 9.0, 5.0, 11.0, 6.0, 5.0, 3.0, 9.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0021076202392578125, -0.0020460784435272217, -0.001984536647796631, -0.00192299485206604, -0.0018614530563354492, -0.0017999112606048584, -0.0017383694648742676, -0.0016768276691436768, -0.001615285873413086, -0.0015537440776824951, -0.0014922022819519043, -0.0014306604862213135, -0.0013691186904907227, -0.0013075768947601318, -0.001246035099029541, -0.0011844933032989502, -0.0011229515075683594, -0.0010614097118377686, -0.0009998679161071777, -0.0009383261203765869, -0.0008767843246459961, -0.0008152425289154053, -0.0007537007331848145, -0.0006921589374542236, -0.0006306171417236328, -0.000569075345993042, -0.0005075335502624512, -0.00044599175453186035, -0.00038444995880126953, -0.0003229081630706787, -0.0002613663673400879, -0.00019982457160949707, -0.00013828277587890625, -7.674098014831543e-05, -1.519918441772461e-05, 4.634261131286621e-05, 0.00010788440704345703, 0.00016942620277404785, 0.00023096799850463867, 0.0002925097942352295, 0.0003540515899658203, 0.00041559338569641113, 0.00047713518142700195, 0.0005386769771575928, 0.0006002187728881836, 0.0006617605686187744, 0.0007233023643493652, 0.0007848441600799561, 0.0008463859558105469, 0.0009079277515411377, 0.0009694695472717285, 0.0010310113430023193, 0.0010925531387329102, 0.001154094934463501, 0.0012156367301940918, 0.0012771785259246826, 0.0013387203216552734, 0.0014002621173858643, 0.001461803913116455, 0.001523345708847046, 0.0015848875045776367, 0.0016464293003082275, 0.0017079710960388184, 0.0017695128917694092, 0.0018310546875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 9.0, 9.0, 20.0, 23.0, 26.0, 43.0, 74.0, 103.0, 188.0, 308.0, 526.0, 1256.0, 2833.0, 7497.0, 23110.0, 87234.0, 490591.0, 345013.0, 61801.0, 17429.0, 5939.0, 2270.0, 1032.0, 525.0, 285.0, 149.0, 90.0, 72.0, 35.0, 24.0, 14.0, 11.0, 4.0, 6.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4453125, -12.0780029296875, -11.710693359375, -11.3433837890625, -10.97607421875, -10.6087646484375, -10.241455078125, -9.8741455078125, -9.5068359375, -9.1395263671875, -8.772216796875, -8.4049072265625, -8.03759765625, -7.6702880859375, -7.302978515625, -6.9356689453125, -6.568359375, -6.2010498046875, -5.833740234375, -5.4664306640625, -5.09912109375, -4.7318115234375, -4.364501953125, -3.9971923828125, -3.6298828125, -3.2625732421875, -2.895263671875, -2.5279541015625, -2.16064453125, -1.7933349609375, -1.426025390625, -1.0587158203125, -0.69140625, -0.3240966796875, 0.043212890625, 0.4105224609375, 0.77783203125, 1.1451416015625, 1.512451171875, 1.8797607421875, 2.2470703125, 2.6143798828125, 2.981689453125, 3.3489990234375, 3.71630859375, 4.0836181640625, 4.450927734375, 4.8182373046875, 5.185546875, 5.5528564453125, 5.920166015625, 6.2874755859375, 6.65478515625, 7.0220947265625, 7.389404296875, 7.7567138671875, 8.1240234375, 8.4913330078125, 8.858642578125, 9.2259521484375, 9.59326171875, 9.9605712890625, 10.327880859375, 10.6951904296875, 11.0625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 6.0, 4.0, 4.0, 4.0, 7.0, 4.0, 8.0, 9.0, 6.0, 13.0, 16.0, 16.0, 16.0, 28.0, 30.0, 44.0, 42.0, 48.0, 70.0, 78.0, 58.0, 73.0, 81.0, 54.0, 50.0, 36.0, 40.0, 41.0, 19.0, 23.0, 9.0, 11.0, 14.0, 6.0, 8.0, 8.0, 4.0, 1.0, 6.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-6.30859375, -6.1268310546875, -5.945068359375, -5.7633056640625, -5.58154296875, -5.3997802734375, -5.218017578125, -5.0362548828125, -4.8544921875, -4.6727294921875, -4.490966796875, -4.3092041015625, -4.12744140625, -3.9456787109375, -3.763916015625, -3.5821533203125, -3.400390625, -3.2186279296875, -3.036865234375, -2.8551025390625, -2.67333984375, -2.4915771484375, -2.309814453125, -2.1280517578125, -1.9462890625, -1.7645263671875, -1.582763671875, -1.4010009765625, -1.21923828125, -1.0374755859375, -0.855712890625, -0.6739501953125, -0.4921875, -0.3104248046875, -0.128662109375, 0.0531005859375, 0.23486328125, 0.4166259765625, 0.598388671875, 0.7801513671875, 0.9619140625, 1.1436767578125, 1.325439453125, 1.5072021484375, 1.68896484375, 1.8707275390625, 2.052490234375, 2.2342529296875, 2.416015625, 2.5977783203125, 2.779541015625, 2.9613037109375, 3.14306640625, 3.3248291015625, 3.506591796875, 3.6883544921875, 3.8701171875, 4.0518798828125, 4.233642578125, 4.4154052734375, 4.59716796875, 4.7789306640625, 4.960693359375, 5.1424560546875, 5.32421875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 6.0, 9.0, 23.0, 24.0, 55.0, 72.0, 119.0, 180.0, 150.0, 151.0, 87.0, 49.0, 33.0, 25.0, 9.0, 6.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.94160461425781, -120.88534545898438, -113.8290786743164, -106.77281188964844, -99.716552734375, -92.66029357910156, -85.6040267944336, -78.54776000976562, -71.49150085449219, -64.43524169921875, -57.37897491455078, -50.32271194458008, -43.266448974609375, -36.21018600463867, -29.15392303466797, -22.097660064697266, -15.041397094726562, -7.985134124755859, -0.9288711547851562, 6.127391815185547, 13.18365478515625, 20.239917755126953, 27.296180725097656, 34.35244369506836, 41.40870666503906, 48.464969635009766, 55.52123260498047, 62.57749557495117, 69.63375854492188, 76.69001770019531, 83.74628448486328, 90.80255126953125, 97.85879516601562, 104.91505432128906, 111.97132110595703, 119.027587890625, 126.08384704589844, 133.14010620117188, 140.19638061523438, 147.2526397705078, 154.30889892578125, 161.3651580810547, 168.42141723632812, 175.47769165039062, 182.53395080566406, 189.5902099609375, 196.646484375, 203.70274353027344, 210.75900268554688, 217.8152618408203, 224.87152099609375, 231.92779541015625, 238.9840545654297, 246.04031372070312, 253.09658813476562, 260.15283203125, 267.2091064453125, 274.265380859375, 281.3216247558594, 288.3778991699219, 295.43414306640625, 302.49041748046875, 309.54669189453125, 316.6029357910156, 323.6592102050781]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 0.0, 3.0, 5.0, 12.0, 13.0, 13.0, 8.0, 17.0, 23.0, 19.0, 21.0, 21.0, 23.0, 29.0, 29.0, 37.0, 31.0, 45.0, 31.0, 37.0, 30.0, 42.0, 44.0, 36.0, 56.0, 46.0, 32.0, 25.0, 26.0, 35.0, 30.0, 28.0, 21.0, 20.0, 20.0, 12.0, 25.0, 15.0, 12.0, 5.0, 3.0, 6.0, 5.0, 2.0, 2.0, 0.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-89.68400573730469, -86.8517837524414, -84.01956176757812, -81.18733978271484, -78.35511779785156, -75.52288818359375, -72.690673828125, -69.85844421386719, -67.0262222290039, -64.19400024414062, -61.361778259277344, -58.52955627441406, -55.697330474853516, -52.865108489990234, -50.03288650512695, -47.200660705566406, -44.36844253540039, -41.53622055053711, -38.70399856567383, -35.87177276611328, -33.03955078125, -30.20732879638672, -27.375106811523438, -24.542882919311523, -21.710660934448242, -18.87843894958496, -16.046215057373047, -13.213993072509766, -10.381770133972168, -7.54954719543457, -4.717325210571289, -1.885101318359375, 0.9471206665039062, 3.779343366622925, 6.611566066741943, 9.443788528442383, 12.27601146697998, 15.108234405517578, 17.94045639038086, 20.772680282592773, 23.604902267456055, 26.437124252319336, 29.26934814453125, 32.10157012939453, 34.93379211425781, 37.766014099121094, 40.598236083984375, 43.43046188354492, 46.2626838684082, 49.094905853271484, 51.927127838134766, 54.75935363769531, 57.591575622558594, 60.423797607421875, 63.256019592285156, 66.08824157714844, 68.92046356201172, 71.752685546875, 74.58490753173828, 77.41712951660156, 80.24935150146484, 83.08157348632812, 85.91380310058594, 88.74602508544922, 91.5782470703125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 6.0, 5.0, 8.0, 10.0, 12.0, 22.0, 25.0, 31.0, 53.0, 66.0, 80.0, 122.0, 194.0, 321.0, 494.0, 979.0, 1712.0, 3741.0, 9044.0, 26926.0, 120348.0, 3460724.0, 483472.0, 58187.0, 16135.0, 5936.0, 2666.0, 1165.0, 645.0, 402.0, 196.0, 164.0, 78.0, 57.0, 47.0, 41.0, 39.0, 29.0, 23.0, 12.0, 11.0, 14.0, 8.0, 10.0, 7.0, 5.0, 5.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-39.6875, -38.20556640625, -36.7236328125, -35.24169921875, -33.759765625, -32.27783203125, -30.7958984375, -29.31396484375, -27.83203125, -26.35009765625, -24.8681640625, -23.38623046875, -21.904296875, -20.42236328125, -18.9404296875, -17.45849609375, -15.9765625, -14.49462890625, -13.0126953125, -11.53076171875, -10.048828125, -8.56689453125, -7.0849609375, -5.60302734375, -4.12109375, -2.63916015625, -1.1572265625, 0.32470703125, 1.806640625, 3.28857421875, 4.7705078125, 6.25244140625, 7.734375, 9.21630859375, 10.6982421875, 12.18017578125, 13.662109375, 15.14404296875, 16.6259765625, 18.10791015625, 19.58984375, 21.07177734375, 22.5537109375, 24.03564453125, 25.517578125, 26.99951171875, 28.4814453125, 29.96337890625, 31.4453125, 32.92724609375, 34.4091796875, 35.89111328125, 37.373046875, 38.85498046875, 40.3369140625, 41.81884765625, 43.30078125, 44.78271484375, 46.2646484375, 47.74658203125, 49.228515625, 50.71044921875, 52.1923828125, 53.67431640625, 55.15625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 5.0, 7.0, 12.0, 22.0, 24.0, 39.0, 50.0, 52.0, 78.0, 77.0, 112.0, 95.0, 88.0, 80.0, 55.0, 55.0, 39.0, 40.0, 21.0, 18.0, 9.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.03125, -8.7315673828125, -8.431884765625, -8.1322021484375, -7.83251953125, -7.5328369140625, -7.233154296875, -6.9334716796875, -6.6337890625, -6.3341064453125, -6.034423828125, -5.7347412109375, -5.43505859375, -5.1353759765625, -4.835693359375, -4.5360107421875, -4.236328125, -3.9366455078125, -3.636962890625, -3.3372802734375, -3.03759765625, -2.7379150390625, -2.438232421875, -2.1385498046875, -1.8388671875, -1.5391845703125, -1.239501953125, -0.9398193359375, -0.64013671875, -0.3404541015625, -0.040771484375, 0.2589111328125, 0.55859375, 0.8582763671875, 1.157958984375, 1.4576416015625, 1.75732421875, 2.0570068359375, 2.356689453125, 2.6563720703125, 2.9560546875, 3.2557373046875, 3.555419921875, 3.8551025390625, 4.15478515625, 4.4544677734375, 4.754150390625, 5.0538330078125, 5.353515625, 5.6531982421875, 5.952880859375, 6.2525634765625, 6.55224609375, 6.8519287109375, 7.151611328125, 7.4512939453125, 7.7509765625, 8.0506591796875, 8.350341796875, 8.6500244140625, 8.94970703125, 9.2493896484375, 9.549072265625, 9.8487548828125, 10.1484375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 10.0, 8.0, 16.0, 29.0, 35.0, 51.0, 57.0, 106.0, 159.0, 214.0, 316.0, 545.0, 856.0, 1348.0, 2615.0, 4986.0, 11256.0, 29239.0, 89735.0, 421608.0, 3144900.0, 356061.0, 80996.0, 27285.0, 10784.0, 4909.0, 2534.0, 1338.0, 815.0, 468.0, 312.0, 225.0, 134.0, 86.0, 74.0, 48.0, 42.0, 18.0, 17.0, 11.0, 7.0, 6.0, 4.0, 4.0, 4.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.859375, -24.043212890625, -23.22705078125, -22.410888671875, -21.5947265625, -20.778564453125, -19.96240234375, -19.146240234375, -18.330078125, -17.513916015625, -16.69775390625, -15.881591796875, -15.0654296875, -14.249267578125, -13.43310546875, -12.616943359375, -11.80078125, -10.984619140625, -10.16845703125, -9.352294921875, -8.5361328125, -7.719970703125, -6.90380859375, -6.087646484375, -5.271484375, -4.455322265625, -3.63916015625, -2.822998046875, -2.0068359375, -1.190673828125, -0.37451171875, 0.441650390625, 1.2578125, 2.073974609375, 2.89013671875, 3.706298828125, 4.5224609375, 5.338623046875, 6.15478515625, 6.970947265625, 7.787109375, 8.603271484375, 9.41943359375, 10.235595703125, 11.0517578125, 11.867919921875, 12.68408203125, 13.500244140625, 14.31640625, 15.132568359375, 15.94873046875, 16.764892578125, 17.5810546875, 18.397216796875, 19.21337890625, 20.029541015625, 20.845703125, 21.661865234375, 22.47802734375, 23.294189453125, 24.1103515625, 24.926513671875, 25.74267578125, 26.558837890625, 27.375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 9.0, 9.0, 15.0, 22.0, 33.0, 49.0, 75.0, 124.0, 199.0, 447.0, 1476.0, 874.0, 281.0, 159.0, 89.0, 56.0, 48.0, 31.0, 17.0, 17.0, 8.0, 7.0, 4.0, 6.0, 2.0, 4.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-15.6640625, -15.2503662109375, -14.836669921875, -14.4229736328125, -14.00927734375, -13.5955810546875, -13.181884765625, -12.7681884765625, -12.3544921875, -11.9407958984375, -11.527099609375, -11.1134033203125, -10.69970703125, -10.2860107421875, -9.872314453125, -9.4586181640625, -9.044921875, -8.6312255859375, -8.217529296875, -7.8038330078125, -7.39013671875, -6.9764404296875, -6.562744140625, -6.1490478515625, -5.7353515625, -5.3216552734375, -4.907958984375, -4.4942626953125, -4.08056640625, -3.6668701171875, -3.253173828125, -2.8394775390625, -2.42578125, -2.0120849609375, -1.598388671875, -1.1846923828125, -0.77099609375, -0.3572998046875, 0.056396484375, 0.4700927734375, 0.8837890625, 1.2974853515625, 1.711181640625, 2.1248779296875, 2.53857421875, 2.9522705078125, 3.365966796875, 3.7796630859375, 4.193359375, 4.6070556640625, 5.020751953125, 5.4344482421875, 5.84814453125, 6.2618408203125, 6.675537109375, 7.0892333984375, 7.5029296875, 7.9166259765625, 8.330322265625, 8.7440185546875, 9.15771484375, 9.5714111328125, 9.985107421875, 10.3988037109375, 10.8125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 9.0, 19.0, 45.0, 69.0, 88.0, 107.0, 124.0, 144.0, 133.0, 86.0, 60.0, 55.0, 32.0, 13.0, 11.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-116.95199584960938, -114.00220489501953, -111.05241394042969, -108.10262298583984, -105.15283203125, -102.20304107666016, -99.25325012207031, -96.303466796875, -93.35366821289062, -90.40387725830078, -87.45408630371094, -84.5042953491211, -81.55450439453125, -78.6047134399414, -75.65492248535156, -72.70513916015625, -69.7553482055664, -66.80555725097656, -63.85576629638672, -60.905975341796875, -57.95618438720703, -55.00639343261719, -52.05660629272461, -49.106815338134766, -46.15702438354492, -43.20723342895508, -40.257442474365234, -37.307655334472656, -34.35786437988281, -31.408071517944336, -28.458282470703125, -25.50849151611328, -22.558692932128906, -19.608901977539062, -16.65911102294922, -13.709321975708008, -10.759531021118164, -7.80974006652832, -4.859951019287109, -1.9101600646972656, 1.0396308898925781, 3.9894213676452637, 6.939211845397949, 9.889001846313477, 12.83879280090332, 15.788583755493164, 18.738372802734375, 21.68816375732422, 24.637954711914062, 27.587745666503906, 30.53753662109375, 33.487327575683594, 36.43711853027344, 39.38690948486328, 42.33669662475586, 45.2864875793457, 48.23627853393555, 51.18606948852539, 54.135860443115234, 57.08564758300781, 60.035438537597656, 62.9852294921875, 65.93502044677734, 68.88481140136719, 71.83460235595703]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 7.0, 4.0, 6.0, 11.0, 11.0, 12.0, 31.0, 24.0, 26.0, 33.0, 32.0, 31.0, 30.0, 39.0, 34.0, 40.0, 56.0, 51.0, 59.0, 66.0, 40.0, 36.0, 44.0, 40.0, 35.0, 32.0, 26.0, 27.0, 27.0, 16.0, 9.0, 16.0, 12.0, 12.0, 11.0, 5.0, 1.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-48.68795394897461, -47.32981872558594, -45.971683502197266, -44.613548278808594, -43.255409240722656, -41.897274017333984, -40.53913879394531, -39.18100357055664, -37.82286834716797, -36.4647331237793, -35.106597900390625, -33.74846267700195, -32.39032745361328, -31.032190322875977, -29.674053192138672, -28.31591796875, -26.957782745361328, -25.599647521972656, -24.241512298583984, -22.88337516784668, -21.525239944458008, -20.167104721069336, -18.80896759033203, -17.45083236694336, -16.092697143554688, -14.734561920166016, -13.376425743103027, -12.018289566040039, -10.660154342651367, -9.302019119262695, -7.943882942199707, -6.585746765136719, -5.2276153564453125, -3.8694796562194824, -2.5113439559936523, -1.1532082557678223, 0.2049274444580078, 1.563063144683838, 2.921198844909668, 4.279335021972656, 5.637470245361328, 6.995605945587158, 8.353741645812988, 9.711877822875977, 11.070013046264648, 12.42814826965332, 13.786284446716309, 15.144420623779297, 16.50255584716797, 17.86069107055664, 19.218826293945312, 20.576963424682617, 21.93509864807129, 23.29323387145996, 24.651371002197266, 26.009506225585938, 27.36764144897461, 28.72577667236328, 30.083911895751953, 31.442049026489258, 32.80018615722656, 34.158321380615234, 35.516456604003906, 36.87459182739258, 38.23272705078125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 10.0, 11.0, 7.0, 15.0, 16.0, 26.0, 59.0, 87.0, 205.0, 362.0, 899.0, 2617.0, 12639.0, 90632.0, 775945.0, 141516.0, 18174.0, 3385.0, 1002.0, 442.0, 216.0, 129.0, 70.0, 43.0, 21.0, 10.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.75, -54.6162109375, -52.482421875, -50.3486328125, -48.21484375, -46.0810546875, -43.947265625, -41.8134765625, -39.6796875, -37.5458984375, -35.412109375, -33.2783203125, -31.14453125, -29.0107421875, -26.876953125, -24.7431640625, -22.609375, -20.4755859375, -18.341796875, -16.2080078125, -14.07421875, -11.9404296875, -9.806640625, -7.6728515625, -5.5390625, -3.4052734375, -1.271484375, 0.8623046875, 2.99609375, 5.1298828125, 7.263671875, 9.3974609375, 11.53125, 13.6650390625, 15.798828125, 17.9326171875, 20.06640625, 22.2001953125, 24.333984375, 26.4677734375, 28.6015625, 30.7353515625, 32.869140625, 35.0029296875, 37.13671875, 39.2705078125, 41.404296875, 43.5380859375, 45.671875, 47.8056640625, 49.939453125, 52.0732421875, 54.20703125, 56.3408203125, 58.474609375, 60.6083984375, 62.7421875, 64.8759765625, 67.009765625, 69.1435546875, 71.27734375, 73.4111328125, 75.544921875, 77.6787109375, 79.8125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 12.0, 12.0, 22.0, 28.0, 40.0, 47.0, 51.0, 76.0, 86.0, 100.0, 76.0, 94.0, 71.0, 58.0, 57.0, 39.0, 42.0, 29.0, 25.0, 7.0, 11.0, 3.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0234375, -8.724853515625, -8.42626953125, -8.127685546875, -7.8291015625, -7.530517578125, -7.23193359375, -6.933349609375, -6.634765625, -6.336181640625, -6.03759765625, -5.739013671875, -5.4404296875, -5.141845703125, -4.84326171875, -4.544677734375, -4.24609375, -3.947509765625, -3.64892578125, -3.350341796875, -3.0517578125, -2.753173828125, -2.45458984375, -2.156005859375, -1.857421875, -1.558837890625, -1.26025390625, -0.961669921875, -0.6630859375, -0.364501953125, -0.06591796875, 0.232666015625, 0.53125, 0.829833984375, 1.12841796875, 1.427001953125, 1.7255859375, 2.024169921875, 2.32275390625, 2.621337890625, 2.919921875, 3.218505859375, 3.51708984375, 3.815673828125, 4.1142578125, 4.412841796875, 4.71142578125, 5.010009765625, 5.30859375, 5.607177734375, 5.90576171875, 6.204345703125, 6.5029296875, 6.801513671875, 7.10009765625, 7.398681640625, 7.697265625, 7.995849609375, 8.29443359375, 8.593017578125, 8.8916015625, 9.190185546875, 9.48876953125, 9.787353515625, 10.0859375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 6.0, 9.0, 9.0, 19.0, 15.0, 37.0, 35.0, 52.0, 106.0, 156.0, 271.0, 511.0, 1000.0, 2241.0, 5576.0, 14518.0, 40184.0, 145566.0, 588157.0, 177380.0, 45304.0, 16314.0, 6149.0, 2483.0, 1098.0, 552.0, 311.0, 172.0, 105.0, 66.0, 54.0, 35.0, 17.0, 10.0, 8.0, 10.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.796875, -22.933349609375, -22.06982421875, -21.206298828125, -20.3427734375, -19.479248046875, -18.61572265625, -17.752197265625, -16.888671875, -16.025146484375, -15.16162109375, -14.298095703125, -13.4345703125, -12.571044921875, -11.70751953125, -10.843994140625, -9.98046875, -9.116943359375, -8.25341796875, -7.389892578125, -6.5263671875, -5.662841796875, -4.79931640625, -3.935791015625, -3.072265625, -2.208740234375, -1.34521484375, -0.481689453125, 0.3818359375, 1.245361328125, 2.10888671875, 2.972412109375, 3.8359375, 4.699462890625, 5.56298828125, 6.426513671875, 7.2900390625, 8.153564453125, 9.01708984375, 9.880615234375, 10.744140625, 11.607666015625, 12.47119140625, 13.334716796875, 14.1982421875, 15.061767578125, 15.92529296875, 16.788818359375, 17.65234375, 18.515869140625, 19.37939453125, 20.242919921875, 21.1064453125, 21.969970703125, 22.83349609375, 23.697021484375, 24.560546875, 25.424072265625, 26.28759765625, 27.151123046875, 28.0146484375, 28.878173828125, 29.74169921875, 30.605224609375, 31.46875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 8.0, 8.0, 8.0, 13.0, 15.0, 15.0, 14.0, 35.0, 37.0, 28.0, 42.0, 44.0, 36.0, 52.0, 61.0, 55.0, 55.0, 52.0, 50.0, 65.0, 39.0, 47.0, 32.0, 32.0, 27.0, 23.0, 18.0, 18.0, 14.0, 12.0, 7.0, 11.0, 8.0, 4.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.65625, -27.8466796875, -27.037109375, -26.2275390625, -25.41796875, -24.6083984375, -23.798828125, -22.9892578125, -22.1796875, -21.3701171875, -20.560546875, -19.7509765625, -18.94140625, -18.1318359375, -17.322265625, -16.5126953125, -15.703125, -14.8935546875, -14.083984375, -13.2744140625, -12.46484375, -11.6552734375, -10.845703125, -10.0361328125, -9.2265625, -8.4169921875, -7.607421875, -6.7978515625, -5.98828125, -5.1787109375, -4.369140625, -3.5595703125, -2.75, -1.9404296875, -1.130859375, -0.3212890625, 0.48828125, 1.2978515625, 2.107421875, 2.9169921875, 3.7265625, 4.5361328125, 5.345703125, 6.1552734375, 6.96484375, 7.7744140625, 8.583984375, 9.3935546875, 10.203125, 11.0126953125, 11.822265625, 12.6318359375, 13.44140625, 14.2509765625, 15.060546875, 15.8701171875, 16.6796875, 17.4892578125, 18.298828125, 19.1083984375, 19.91796875, 20.7275390625, 21.537109375, 22.3466796875, 23.15625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 2.0, 5.0, 3.0, 6.0, 2.0, 5.0, 23.0, 10.0, 11.0, 18.0, 28.0, 37.0, 46.0, 69.0, 116.0, 232.0, 455.0, 992.0, 2346.0, 5643.0, 17021.0, 69443.0, 530978.0, 351053.0, 48587.0, 13022.0, 4706.0, 1956.0, 830.0, 354.0, 184.0, 109.0, 60.0, 41.0, 39.0, 25.0, 16.0, 12.0, 15.0, 13.0, 7.0, 8.0, 7.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.3046875, -12.900146484375, -12.49560546875, -12.091064453125, -11.6865234375, -11.281982421875, -10.87744140625, -10.472900390625, -10.068359375, -9.663818359375, -9.25927734375, -8.854736328125, -8.4501953125, -8.045654296875, -7.64111328125, -7.236572265625, -6.83203125, -6.427490234375, -6.02294921875, -5.618408203125, -5.2138671875, -4.809326171875, -4.40478515625, -4.000244140625, -3.595703125, -3.191162109375, -2.78662109375, -2.382080078125, -1.9775390625, -1.572998046875, -1.16845703125, -0.763916015625, -0.359375, 0.045166015625, 0.44970703125, 0.854248046875, 1.2587890625, 1.663330078125, 2.06787109375, 2.472412109375, 2.876953125, 3.281494140625, 3.68603515625, 4.090576171875, 4.4951171875, 4.899658203125, 5.30419921875, 5.708740234375, 6.11328125, 6.517822265625, 6.92236328125, 7.326904296875, 7.7314453125, 8.135986328125, 8.54052734375, 8.945068359375, 9.349609375, 9.754150390625, 10.15869140625, 10.563232421875, 10.9677734375, 11.372314453125, 11.77685546875, 12.181396484375, 12.5859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 6.0, 3.0, 13.0, 13.0, 15.0, 24.0, 34.0, 60.0, 112.0, 270.0, 220.0, 86.0, 44.0, 22.0, 24.0, 4.0, 17.0, 12.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0026397705078125, -0.0025512278079986572, -0.0024626851081848145, -0.0023741424083709717, -0.002285599708557129, -0.002197057008743286, -0.0021085143089294434, -0.0020199716091156006, -0.0019314289093017578, -0.001842886209487915, -0.0017543435096740723, -0.0016658008098602295, -0.0015772581100463867, -0.001488715410232544, -0.0014001727104187012, -0.0013116300106048584, -0.0012230873107910156, -0.0011345446109771729, -0.00104600191116333, -0.0009574592113494873, -0.0008689165115356445, -0.0007803738117218018, -0.000691831111907959, -0.0006032884120941162, -0.0005147457122802734, -0.00042620301246643066, -0.0003376603126525879, -0.0002491176128387451, -0.00016057491302490234, -7.203221321105957e-05, 1.6510486602783203e-05, 0.00010505318641662598, 0.00019359588623046875, 0.0002821385860443115, 0.0003706812858581543, 0.00045922398567199707, 0.0005477666854858398, 0.0006363093852996826, 0.0007248520851135254, 0.0008133947849273682, 0.0009019374847412109, 0.0009904801845550537, 0.0010790228843688965, 0.0011675655841827393, 0.001256108283996582, 0.0013446509838104248, 0.0014331936836242676, 0.0015217363834381104, 0.0016102790832519531, 0.001698821783065796, 0.0017873644828796387, 0.0018759071826934814, 0.0019644498825073242, 0.002052992582321167, 0.0021415352821350098, 0.0022300779819488525, 0.0023186206817626953, 0.002407163381576538, 0.002495706081390381, 0.0025842487812042236, 0.0026727914810180664, 0.002761334180831909, 0.002849876880645752, 0.0029384195804595947, 0.0030269622802734375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 8.0, 8.0, 10.0, 14.0, 14.0, 13.0, 20.0, 39.0, 43.0, 46.0, 72.0, 112.0, 213.0, 397.0, 796.0, 1730.0, 4344.0, 12930.0, 45471.0, 302210.0, 575828.0, 74439.0, 19134.0, 6040.0, 2370.0, 1073.0, 478.0, 230.0, 135.0, 78.0, 67.0, 34.0, 23.0, 26.0, 22.0, 20.0, 14.0, 7.0, 3.0, 7.0, 7.0, 9.0, 6.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.8828125, -11.4888916015625, -11.094970703125, -10.7010498046875, -10.30712890625, -9.9132080078125, -9.519287109375, -9.1253662109375, -8.7314453125, -8.3375244140625, -7.943603515625, -7.5496826171875, -7.15576171875, -6.7618408203125, -6.367919921875, -5.9739990234375, -5.580078125, -5.1861572265625, -4.792236328125, -4.3983154296875, -4.00439453125, -3.6104736328125, -3.216552734375, -2.8226318359375, -2.4287109375, -2.0347900390625, -1.640869140625, -1.2469482421875, -0.85302734375, -0.4591064453125, -0.065185546875, 0.3287353515625, 0.72265625, 1.1165771484375, 1.510498046875, 1.9044189453125, 2.29833984375, 2.6922607421875, 3.086181640625, 3.4801025390625, 3.8740234375, 4.2679443359375, 4.661865234375, 5.0557861328125, 5.44970703125, 5.8436279296875, 6.237548828125, 6.6314697265625, 7.025390625, 7.4193115234375, 7.813232421875, 8.2071533203125, 8.60107421875, 8.9949951171875, 9.388916015625, 9.7828369140625, 10.1767578125, 10.5706787109375, 10.964599609375, 11.3585205078125, 11.75244140625, 12.1463623046875, 12.540283203125, 12.9342041015625, 13.328125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 0.0, 3.0, 5.0, 9.0, 8.0, 13.0, 21.0, 31.0, 28.0, 67.0, 93.0, 120.0, 119.0, 136.0, 102.0, 85.0, 40.0, 27.0, 27.0, 14.0, 11.0, 11.0, 8.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-10.6640625, -10.356201171875, -10.04833984375, -9.740478515625, -9.4326171875, -9.124755859375, -8.81689453125, -8.509033203125, -8.201171875, -7.893310546875, -7.58544921875, -7.277587890625, -6.9697265625, -6.661865234375, -6.35400390625, -6.046142578125, -5.73828125, -5.430419921875, -5.12255859375, -4.814697265625, -4.5068359375, -4.198974609375, -3.89111328125, -3.583251953125, -3.275390625, -2.967529296875, -2.65966796875, -2.351806640625, -2.0439453125, -1.736083984375, -1.42822265625, -1.120361328125, -0.8125, -0.504638671875, -0.19677734375, 0.111083984375, 0.4189453125, 0.726806640625, 1.03466796875, 1.342529296875, 1.650390625, 1.958251953125, 2.26611328125, 2.573974609375, 2.8818359375, 3.189697265625, 3.49755859375, 3.805419921875, 4.11328125, 4.421142578125, 4.72900390625, 5.036865234375, 5.3447265625, 5.652587890625, 5.96044921875, 6.268310546875, 6.576171875, 6.884033203125, 7.19189453125, 7.499755859375, 7.8076171875, 8.115478515625, 8.42333984375, 8.731201171875, 9.0390625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 8.0, 6.0, 5.0, 17.0, 26.0, 33.0, 48.0, 63.0, 72.0, 92.0, 103.0, 105.0, 94.0, 85.0, 67.0, 57.0, 43.0, 28.0, 17.0, 13.0, 13.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.11668395996094, -98.92745971679688, -94.73824310302734, -90.54901885986328, -86.35980224609375, -82.17057800292969, -77.98135375976562, -73.79212951660156, -69.60291290283203, -65.41368865966797, -61.22447204589844, -57.035247802734375, -52.84602737426758, -48.65680694580078, -44.46758270263672, -40.27836227416992, -36.089141845703125, -31.899921417236328, -27.7106990814209, -23.52147674560547, -19.332256317138672, -15.143035888671875, -10.953813552856445, -6.764591217041016, -2.5753707885742188, 1.6138505935668945, 5.803071975708008, 9.992293357849121, 14.181514739990234, 18.37073516845703, 22.55995750427246, 26.74917984008789, 30.93841552734375, 35.12763595581055, 39.316856384277344, 43.506080627441406, 47.6953010559082, 51.884521484375, 56.07374572753906, 60.26296615600586, 64.45218658447266, 68.64141082763672, 72.83062744140625, 77.01985168457031, 81.20907592773438, 85.3982925415039, 89.58751678466797, 93.7767333984375, 97.96595764160156, 102.15518188476562, 106.34439849853516, 110.53362274169922, 114.72283935546875, 118.91206359863281, 123.10128784179688, 127.29051208496094, 131.479736328125, 135.66896057128906, 139.85818481445312, 144.04739379882812, 148.2366180419922, 152.42584228515625, 156.6150665283203, 160.80429077148438, 164.99349975585938]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 3.0, 5.0, 6.0, 7.0, 10.0, 21.0, 7.0, 20.0, 22.0, 25.0, 26.0, 39.0, 35.0, 42.0, 47.0, 41.0, 48.0, 42.0, 49.0, 51.0, 49.0, 51.0, 42.0, 44.0, 42.0, 41.0, 37.0, 32.0, 31.0, 20.0, 12.0, 15.0, 12.0, 13.0, 6.0, 6.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-130.07212829589844, -126.45592498779297, -122.8397216796875, -119.22351837158203, -115.60731506347656, -111.9911117553711, -108.37490844726562, -104.75871276855469, -101.14250183105469, -97.52629852294922, -93.91009521484375, -90.29389190673828, -86.67768859863281, -83.06148529052734, -79.44528198242188, -75.82908630371094, -72.21288299560547, -68.5966796875, -64.98047637939453, -61.36427307128906, -57.748069763183594, -54.131866455078125, -50.51566696166992, -46.89946365356445, -43.283260345458984, -39.667057037353516, -36.05085372924805, -32.434654235839844, -28.818449020385742, -25.202245712280273, -21.586044311523438, -17.96984100341797, -14.3536376953125, -10.737434387207031, -7.121232032775879, -3.5050296783447266, 0.11117362976074219, 3.727376937866211, 7.343578338623047, 10.959781646728516, 14.575984954833984, 18.192188262939453, 21.808391571044922, 25.424592971801758, 29.040796279907227, 32.65699768066406, 36.27320098876953, 39.889404296875, 43.50560760498047, 47.12181091308594, 50.738014221191406, 54.354217529296875, 57.970420837402344, 61.58662414550781, 65.20281982421875, 68.81903076171875, 72.43522644042969, 76.05142974853516, 79.66763305664062, 83.2838363647461, 86.90003967285156, 90.51624298095703, 94.1324462890625, 97.74864196777344, 101.36485290527344]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 7.0, 16.0, 14.0, 17.0, 16.0, 35.0, 54.0, 68.0, 118.0, 201.0, 316.0, 504.0, 967.0, 1782.0, 4095.0, 10683.0, 35673.0, 191447.0, 3658232.0, 229882.0, 40058.0, 11787.0, 4291.0, 1806.0, 881.0, 465.0, 268.0, 178.0, 116.0, 81.0, 56.0, 39.0, 36.0, 15.0, 15.0, 18.0, 8.0, 9.0, 7.0, 4.0, 2.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-48.21875, -46.40185546875, -44.5849609375, -42.76806640625, -40.951171875, -39.13427734375, -37.3173828125, -35.50048828125, -33.68359375, -31.86669921875, -30.0498046875, -28.23291015625, -26.416015625, -24.59912109375, -22.7822265625, -20.96533203125, -19.1484375, -17.33154296875, -15.5146484375, -13.69775390625, -11.880859375, -10.06396484375, -8.2470703125, -6.43017578125, -4.61328125, -2.79638671875, -0.9794921875, 0.83740234375, 2.654296875, 4.47119140625, 6.2880859375, 8.10498046875, 9.921875, 11.73876953125, 13.5556640625, 15.37255859375, 17.189453125, 19.00634765625, 20.8232421875, 22.64013671875, 24.45703125, 26.27392578125, 28.0908203125, 29.90771484375, 31.724609375, 33.54150390625, 35.3583984375, 37.17529296875, 38.9921875, 40.80908203125, 42.6259765625, 44.44287109375, 46.259765625, 48.07666015625, 49.8935546875, 51.71044921875, 53.52734375, 55.34423828125, 57.1611328125, 58.97802734375, 60.794921875, 62.61181640625, 64.4287109375, 66.24560546875, 68.0625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 5.0, 3.0, 4.0, 9.0, 14.0, 19.0, 13.0, 36.0, 48.0, 66.0, 57.0, 67.0, 97.0, 94.0, 76.0, 75.0, 61.0, 62.0, 47.0, 41.0, 32.0, 31.0, 15.0, 9.0, 6.0, 7.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.859375, -8.5616455078125, -8.263916015625, -7.9661865234375, -7.66845703125, -7.3707275390625, -7.072998046875, -6.7752685546875, -6.4775390625, -6.1798095703125, -5.882080078125, -5.5843505859375, -5.28662109375, -4.9888916015625, -4.691162109375, -4.3934326171875, -4.095703125, -3.7979736328125, -3.500244140625, -3.2025146484375, -2.90478515625, -2.6070556640625, -2.309326171875, -2.0115966796875, -1.7138671875, -1.4161376953125, -1.118408203125, -0.8206787109375, -0.52294921875, -0.2252197265625, 0.072509765625, 0.3702392578125, 0.66796875, 0.9656982421875, 1.263427734375, 1.5611572265625, 1.85888671875, 2.1566162109375, 2.454345703125, 2.7520751953125, 3.0498046875, 3.3475341796875, 3.645263671875, 3.9429931640625, 4.24072265625, 4.5384521484375, 4.836181640625, 5.1339111328125, 5.431640625, 5.7293701171875, 6.027099609375, 6.3248291015625, 6.62255859375, 6.9202880859375, 7.218017578125, 7.5157470703125, 7.8134765625, 8.1112060546875, 8.408935546875, 8.7066650390625, 9.00439453125, 9.3021240234375, 9.599853515625, 9.8975830078125, 10.1953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 8.0, 11.0, 10.0, 12.0, 11.0, 22.0, 24.0, 28.0, 49.0, 83.0, 113.0, 152.0, 256.0, 394.0, 709.0, 1246.0, 2579.0, 5635.0, 14125.0, 40219.0, 147741.0, 1880327.0, 1886183.0, 148099.0, 40433.0, 14105.0, 5833.0, 2636.0, 1315.0, 724.0, 417.0, 225.0, 163.0, 92.0, 83.0, 40.0, 55.0, 36.0, 24.0, 19.0, 10.0, 12.0, 14.0, 1.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-33.375, -32.33203125, -31.2890625, -30.24609375, -29.203125, -28.16015625, -27.1171875, -26.07421875, -25.03125, -23.98828125, -22.9453125, -21.90234375, -20.859375, -19.81640625, -18.7734375, -17.73046875, -16.6875, -15.64453125, -14.6015625, -13.55859375, -12.515625, -11.47265625, -10.4296875, -9.38671875, -8.34375, -7.30078125, -6.2578125, -5.21484375, -4.171875, -3.12890625, -2.0859375, -1.04296875, 0.0, 1.04296875, 2.0859375, 3.12890625, 4.171875, 5.21484375, 6.2578125, 7.30078125, 8.34375, 9.38671875, 10.4296875, 11.47265625, 12.515625, 13.55859375, 14.6015625, 15.64453125, 16.6875, 17.73046875, 18.7734375, 19.81640625, 20.859375, 21.90234375, 22.9453125, 23.98828125, 25.03125, 26.07421875, 27.1171875, 28.16015625, 29.203125, 30.24609375, 31.2890625, 32.33203125, 33.375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 12.0, 4.0, 10.0, 28.0, 53.0, 78.0, 161.0, 382.0, 1948.0, 842.0, 272.0, 116.0, 71.0, 31.0, 18.0, 12.0, 12.0, 10.0, 5.0, 6.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.75, -23.048095703125, -22.34619140625, -21.644287109375, -20.9423828125, -20.240478515625, -19.53857421875, -18.836669921875, -18.134765625, -17.432861328125, -16.73095703125, -16.029052734375, -15.3271484375, -14.625244140625, -13.92333984375, -13.221435546875, -12.51953125, -11.817626953125, -11.11572265625, -10.413818359375, -9.7119140625, -9.010009765625, -8.30810546875, -7.606201171875, -6.904296875, -6.202392578125, -5.50048828125, -4.798583984375, -4.0966796875, -3.394775390625, -2.69287109375, -1.990966796875, -1.2890625, -0.587158203125, 0.11474609375, 0.816650390625, 1.5185546875, 2.220458984375, 2.92236328125, 3.624267578125, 4.326171875, 5.028076171875, 5.72998046875, 6.431884765625, 7.1337890625, 7.835693359375, 8.53759765625, 9.239501953125, 9.94140625, 10.643310546875, 11.34521484375, 12.047119140625, 12.7490234375, 13.450927734375, 14.15283203125, 14.854736328125, 15.556640625, 16.258544921875, 16.96044921875, 17.662353515625, 18.3642578125, 19.066162109375, 19.76806640625, 20.469970703125, 21.171875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 14.0, 18.0, 52.0, 74.0, 133.0, 140.0, 173.0, 146.0, 127.0, 46.0, 33.0, 19.0, 9.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-133.68490600585938, -130.12982177734375, -126.57474517822266, -123.01966094970703, -119.4645767211914, -115.90950012207031, -112.35441589355469, -108.79933166503906, -105.24425506591797, -101.68917083740234, -98.13409423828125, -94.57901000976562, -91.02392578125, -87.4688491821289, -83.91376495361328, -80.35868835449219, -76.80360412597656, -73.24851989746094, -69.69344329833984, -66.13835906982422, -62.58327865600586, -59.0281982421875, -55.473114013671875, -51.918033599853516, -48.362945556640625, -44.807865142822266, -41.25278091430664, -37.69770050048828, -34.14262008666992, -30.58753776550293, -27.032455444335938, -23.477375030517578, -19.92229461669922, -16.367212295532227, -12.812131881713867, -9.257049560546875, -5.701968193054199, -2.1468868255615234, 1.4081954956054688, 4.963275909423828, 8.51835823059082, 12.073439598083496, 15.628520965576172, 19.183603286743164, 22.738685607910156, 26.293766021728516, 29.848848342895508, 33.4039306640625, 36.95901107788086, 40.51409149169922, 44.069175720214844, 47.6242561340332, 51.17933654785156, 54.73442077636719, 58.28950119018555, 61.844581604003906, 65.39966583251953, 68.95475006103516, 72.50982666015625, 76.06491088867188, 79.6199951171875, 83.1750717163086, 86.73015594482422, 90.28523254394531, 93.84031677246094]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 12.0, 12.0, 11.0, 13.0, 9.0, 14.0, 15.0, 19.0, 25.0, 20.0, 30.0, 22.0, 37.0, 45.0, 39.0, 44.0, 31.0, 45.0, 44.0, 33.0, 37.0, 31.0, 41.0, 37.0, 22.0, 50.0, 28.0, 28.0, 26.0, 22.0, 22.0, 20.0, 25.0, 12.0, 14.0, 9.0, 9.0, 5.0, 7.0, 3.0, 10.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.03485107421875, -39.71956253051758, -38.404273986816406, -37.08898162841797, -35.7736930847168, -34.458404541015625, -33.14311218261719, -31.827823638916016, -30.512535095214844, -29.197246551513672, -27.881956100463867, -26.566665649414062, -25.25137710571289, -23.93608856201172, -22.620798110961914, -21.30550765991211, -19.990219116210938, -18.674930572509766, -17.35964012145996, -16.044349670410156, -14.729061126708984, -13.413771629333496, -12.098482131958008, -10.78319263458252, -9.467903137207031, -8.152613639831543, -6.837324142456055, -5.522034645080566, -4.206745147705078, -2.89145565032959, -1.5761661529541016, -0.2608766555786133, 1.054412841796875, 2.3697023391723633, 3.6849918365478516, 5.00028133392334, 6.315570831298828, 7.630860328674316, 8.946149826049805, 10.261439323425293, 11.576728820800781, 12.89201831817627, 14.207307815551758, 15.522597312927246, 16.837886810302734, 18.153175354003906, 19.46846580505371, 20.783756256103516, 22.099044799804688, 23.41433334350586, 24.729623794555664, 26.04491424560547, 27.36020278930664, 28.675491333007812, 29.990781784057617, 31.306072235107422, 32.621360778808594, 33.936649322509766, 35.25193786621094, 36.567230224609375, 37.88251876831055, 39.19780731201172, 40.513099670410156, 41.82838821411133, 43.1436767578125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 10.0, 15.0, 28.0, 40.0, 72.0, 120.0, 211.0, 427.0, 935.0, 2487.0, 8846.0, 43809.0, 255632.0, 601362.0, 107369.0, 19781.0, 4585.0, 1484.0, 645.0, 310.0, 148.0, 85.0, 57.0, 34.0, 26.0, 5.0, 11.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-61.3125, -59.7099609375, -58.107421875, -56.5048828125, -54.90234375, -53.2998046875, -51.697265625, -50.0947265625, -48.4921875, -46.8896484375, -45.287109375, -43.6845703125, -42.08203125, -40.4794921875, -38.876953125, -37.2744140625, -35.671875, -34.0693359375, -32.466796875, -30.8642578125, -29.26171875, -27.6591796875, -26.056640625, -24.4541015625, -22.8515625, -21.2490234375, -19.646484375, -18.0439453125, -16.44140625, -14.8388671875, -13.236328125, -11.6337890625, -10.03125, -8.4287109375, -6.826171875, -5.2236328125, -3.62109375, -2.0185546875, -0.416015625, 1.1865234375, 2.7890625, 4.3916015625, 5.994140625, 7.5966796875, 9.19921875, 10.8017578125, 12.404296875, 14.0068359375, 15.609375, 17.2119140625, 18.814453125, 20.4169921875, 22.01953125, 23.6220703125, 25.224609375, 26.8271484375, 28.4296875, 30.0322265625, 31.634765625, 33.2373046875, 34.83984375, 36.4423828125, 38.044921875, 39.6474609375, 41.25]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 1.0, 3.0, 9.0, 10.0, 18.0, 20.0, 24.0, 33.0, 34.0, 49.0, 57.0, 70.0, 91.0, 76.0, 87.0, 79.0, 65.0, 56.0, 47.0, 46.0, 36.0, 27.0, 18.0, 13.0, 14.0, 9.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.875, -8.5684814453125, -8.261962890625, -7.9554443359375, -7.64892578125, -7.3424072265625, -7.035888671875, -6.7293701171875, -6.4228515625, -6.1163330078125, -5.809814453125, -5.5032958984375, -5.19677734375, -4.8902587890625, -4.583740234375, -4.2772216796875, -3.970703125, -3.6641845703125, -3.357666015625, -3.0511474609375, -2.74462890625, -2.4381103515625, -2.131591796875, -1.8250732421875, -1.5185546875, -1.2120361328125, -0.905517578125, -0.5989990234375, -0.29248046875, 0.0140380859375, 0.320556640625, 0.6270751953125, 0.93359375, 1.2401123046875, 1.546630859375, 1.8531494140625, 2.15966796875, 2.4661865234375, 2.772705078125, 3.0792236328125, 3.3857421875, 3.6922607421875, 3.998779296875, 4.3052978515625, 4.61181640625, 4.9183349609375, 5.224853515625, 5.5313720703125, 5.837890625, 6.1444091796875, 6.450927734375, 6.7574462890625, 7.06396484375, 7.3704833984375, 7.677001953125, 7.9835205078125, 8.2900390625, 8.5965576171875, 8.903076171875, 9.2095947265625, 9.51611328125, 9.8226318359375, 10.129150390625, 10.4356689453125, 10.7421875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 6.0, 8.0, 18.0, 34.0, 31.0, 55.0, 97.0, 171.0, 227.0, 471.0, 719.0, 1618.0, 4875.0, 20270.0, 100310.0, 545024.0, 301977.0, 55220.0, 11668.0, 3112.0, 1193.0, 573.0, 347.0, 211.0, 131.0, 70.0, 49.0, 22.0, 18.0, 11.0, 7.0, 8.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.125, -25.072265625, -24.01953125, -22.966796875, -21.9140625, -20.861328125, -19.80859375, -18.755859375, -17.703125, -16.650390625, -15.59765625, -14.544921875, -13.4921875, -12.439453125, -11.38671875, -10.333984375, -9.28125, -8.228515625, -7.17578125, -6.123046875, -5.0703125, -4.017578125, -2.96484375, -1.912109375, -0.859375, 0.193359375, 1.24609375, 2.298828125, 3.3515625, 4.404296875, 5.45703125, 6.509765625, 7.5625, 8.615234375, 9.66796875, 10.720703125, 11.7734375, 12.826171875, 13.87890625, 14.931640625, 15.984375, 17.037109375, 18.08984375, 19.142578125, 20.1953125, 21.248046875, 22.30078125, 23.353515625, 24.40625, 25.458984375, 26.51171875, 27.564453125, 28.6171875, 29.669921875, 30.72265625, 31.775390625, 32.828125, 33.880859375, 34.93359375, 35.986328125, 37.0390625, 38.091796875, 39.14453125, 40.197265625, 41.25]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 8.0, 2.0, 2.0, 5.0, 6.0, 9.0, 16.0, 19.0, 17.0, 13.0, 23.0, 35.0, 29.0, 34.0, 34.0, 34.0, 40.0, 40.0, 53.0, 60.0, 55.0, 52.0, 51.0, 41.0, 43.0, 37.0, 49.0, 38.0, 21.0, 29.0, 25.0, 21.0, 7.0, 14.0, 13.0, 10.0, 10.0, 2.0, 7.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.609375, -26.7568359375, -25.904296875, -25.0517578125, -24.19921875, -23.3466796875, -22.494140625, -21.6416015625, -20.7890625, -19.9365234375, -19.083984375, -18.2314453125, -17.37890625, -16.5263671875, -15.673828125, -14.8212890625, -13.96875, -13.1162109375, -12.263671875, -11.4111328125, -10.55859375, -9.7060546875, -8.853515625, -8.0009765625, -7.1484375, -6.2958984375, -5.443359375, -4.5908203125, -3.73828125, -2.8857421875, -2.033203125, -1.1806640625, -0.328125, 0.5244140625, 1.376953125, 2.2294921875, 3.08203125, 3.9345703125, 4.787109375, 5.6396484375, 6.4921875, 7.3447265625, 8.197265625, 9.0498046875, 9.90234375, 10.7548828125, 11.607421875, 12.4599609375, 13.3125, 14.1650390625, 15.017578125, 15.8701171875, 16.72265625, 17.5751953125, 18.427734375, 19.2802734375, 20.1328125, 20.9853515625, 21.837890625, 22.6904296875, 23.54296875, 24.3955078125, 25.248046875, 26.1005859375, 26.953125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 7.0, 14.0, 17.0, 26.0, 45.0, 89.0, 135.0, 339.0, 781.0, 2145.0, 6073.0, 20639.0, 79764.0, 390713.0, 427740.0, 87528.0, 22209.0, 6541.0, 2131.0, 858.0, 376.0, 167.0, 78.0, 51.0, 38.0, 13.0, 9.0, 12.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.375, -11.9761962890625, -11.577392578125, -11.1785888671875, -10.77978515625, -10.3809814453125, -9.982177734375, -9.5833740234375, -9.1845703125, -8.7857666015625, -8.386962890625, -7.9881591796875, -7.58935546875, -7.1905517578125, -6.791748046875, -6.3929443359375, -5.994140625, -5.5953369140625, -5.196533203125, -4.7977294921875, -4.39892578125, -4.0001220703125, -3.601318359375, -3.2025146484375, -2.8037109375, -2.4049072265625, -2.006103515625, -1.6072998046875, -1.20849609375, -0.8096923828125, -0.410888671875, -0.0120849609375, 0.38671875, 0.7855224609375, 1.184326171875, 1.5831298828125, 1.98193359375, 2.3807373046875, 2.779541015625, 3.1783447265625, 3.5771484375, 3.9759521484375, 4.374755859375, 4.7735595703125, 5.17236328125, 5.5711669921875, 5.969970703125, 6.3687744140625, 6.767578125, 7.1663818359375, 7.565185546875, 7.9639892578125, 8.36279296875, 8.7615966796875, 9.160400390625, 9.5592041015625, 9.9580078125, 10.3568115234375, 10.755615234375, 11.1544189453125, 11.55322265625, 11.9520263671875, 12.350830078125, 12.7496337890625, 13.1484375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 5.0, 6.0, 14.0, 10.0, 25.0, 23.0, 23.0, 22.0, 27.0, 57.0, 72.0, 92.0, 117.0, 132.0, 89.0, 60.0, 43.0, 41.0, 28.0, 17.0, 17.0, 15.0, 15.0, 7.0, 2.0, 3.0, 6.0, 4.0, 9.0, 4.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015287399291992188, -0.0014649778604507446, -0.0014012157917022705, -0.0013374537229537964, -0.0012736916542053223, -0.0012099295854568481, -0.001146167516708374, -0.0010824054479599, -0.0010186433792114258, -0.0009548813104629517, -0.0008911192417144775, -0.0008273571729660034, -0.0007635951042175293, -0.0006998330354690552, -0.0006360709667205811, -0.0005723088979721069, -0.0005085468292236328, -0.0004447847604751587, -0.00038102269172668457, -0.00031726062297821045, -0.00025349855422973633, -0.0001897364854812622, -0.00012597441673278809, -6.221234798431396e-05, 1.5497207641601562e-06, 6.531178951263428e-05, 0.0001290738582611084, 0.00019283592700958252, 0.00025659799575805664, 0.00032036006450653076, 0.0003841221332550049, 0.000447884202003479, 0.0005116462707519531, 0.0005754083395004272, 0.0006391704082489014, 0.0007029324769973755, 0.0007666945457458496, 0.0008304566144943237, 0.0008942186832427979, 0.000957980751991272, 0.001021742820739746, 0.0010855048894882202, 0.0011492669582366943, 0.0012130290269851685, 0.0012767910957336426, 0.0013405531644821167, 0.0014043152332305908, 0.001468077301979065, 0.001531839370727539, 0.0015956014394760132, 0.0016593635082244873, 0.0017231255769729614, 0.0017868876457214355, 0.0018506497144699097, 0.0019144117832183838, 0.001978173851966858, 0.002041935920715332, 0.002105697989463806, 0.0021694600582122803, 0.0022332221269607544, 0.0022969841957092285, 0.0023607462644577026, 0.0024245083332061768, 0.002488270401954651, 0.002552032470703125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 3.0, 9.0, 12.0, 34.0, 44.0, 63.0, 101.0, 208.0, 409.0, 862.0, 2255.0, 8471.0, 44792.0, 311958.0, 564835.0, 92587.0, 15821.0, 3727.0, 1217.0, 523.0, 231.0, 167.0, 79.0, 45.0, 35.0, 32.0, 14.0, 3.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.78125, -17.24560546875, -16.7099609375, -16.17431640625, -15.638671875, -15.10302734375, -14.5673828125, -14.03173828125, -13.49609375, -12.96044921875, -12.4248046875, -11.88916015625, -11.353515625, -10.81787109375, -10.2822265625, -9.74658203125, -9.2109375, -8.67529296875, -8.1396484375, -7.60400390625, -7.068359375, -6.53271484375, -5.9970703125, -5.46142578125, -4.92578125, -4.39013671875, -3.8544921875, -3.31884765625, -2.783203125, -2.24755859375, -1.7119140625, -1.17626953125, -0.640625, -0.10498046875, 0.4306640625, 0.96630859375, 1.501953125, 2.03759765625, 2.5732421875, 3.10888671875, 3.64453125, 4.18017578125, 4.7158203125, 5.25146484375, 5.787109375, 6.32275390625, 6.8583984375, 7.39404296875, 7.9296875, 8.46533203125, 9.0009765625, 9.53662109375, 10.072265625, 10.60791015625, 11.1435546875, 11.67919921875, 12.21484375, 12.75048828125, 13.2861328125, 13.82177734375, 14.357421875, 14.89306640625, 15.4287109375, 15.96435546875, 16.5]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 19.0, 21.0, 27.0, 49.0, 73.0, 97.0, 105.0, 132.0, 139.0, 116.0, 80.0, 44.0, 37.0, 30.0, 18.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.484375, -24.927490234375, -24.37060546875, -23.813720703125, -23.2568359375, -22.699951171875, -22.14306640625, -21.586181640625, -21.029296875, -20.472412109375, -19.91552734375, -19.358642578125, -18.8017578125, -18.244873046875, -17.68798828125, -17.131103515625, -16.57421875, -16.017333984375, -15.46044921875, -14.903564453125, -14.3466796875, -13.789794921875, -13.23291015625, -12.676025390625, -12.119140625, -11.562255859375, -11.00537109375, -10.448486328125, -9.8916015625, -9.334716796875, -8.77783203125, -8.220947265625, -7.6640625, -7.107177734375, -6.55029296875, -5.993408203125, -5.4365234375, -4.879638671875, -4.32275390625, -3.765869140625, -3.208984375, -2.652099609375, -2.09521484375, -1.538330078125, -0.9814453125, -0.424560546875, 0.13232421875, 0.689208984375, 1.24609375, 1.802978515625, 2.35986328125, 2.916748046875, 3.4736328125, 4.030517578125, 4.58740234375, 5.144287109375, 5.701171875, 6.258056640625, 6.81494140625, 7.371826171875, 7.9287109375, 8.485595703125, 9.04248046875, 9.599365234375, 10.15625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 12.0, 18.0, 30.0, 40.0, 72.0, 96.0, 116.0, 153.0, 147.0, 86.0, 79.0, 58.0, 35.0, 23.0, 13.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-294.32867431640625, -288.0148010253906, -281.700927734375, -275.3870544433594, -269.07318115234375, -262.7593078613281, -256.4454345703125, -250.1315460205078, -243.8176727294922, -237.50379943847656, -231.18992614746094, -224.8760528564453, -218.5621795654297, -212.248291015625, -205.93441772460938, -199.62054443359375, -193.30667114257812, -186.9927978515625, -180.67892456054688, -174.36505126953125, -168.05117797851562, -161.7373046875, -155.42343139648438, -149.1095428466797, -142.79568481445312, -136.4818115234375, -130.16793823242188, -123.85406494140625, -117.5401840209961, -111.22631072998047, -104.91243743896484, -98.59855651855469, -92.28468322753906, -85.97080993652344, -79.65693664550781, -73.34306335449219, -67.02918243408203, -60.715309143066406, -54.40143585205078, -48.08755874633789, -41.773685455322266, -35.45981216430664, -29.14593505859375, -22.832061767578125, -16.518186569213867, -10.20431137084961, -3.8904380798339844, 2.4234390258789062, 8.737312316894531, 15.051187515258789, 21.365062713623047, 27.678936004638672, 33.99281311035156, 40.30668640136719, 46.62055969238281, 52.9344367980957, 59.24831008911133, 65.56218719482422, 71.87606048583984, 78.18993377685547, 84.5038070678711, 90.81768798828125, 97.13156127929688, 103.4454345703125, 109.75930786132812]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 0.0, 2.0, 1.0, 4.0, 3.0, 9.0, 5.0, 8.0, 10.0, 9.0, 24.0, 18.0, 18.0, 22.0, 28.0, 31.0, 34.0, 49.0, 39.0, 34.0, 44.0, 32.0, 55.0, 42.0, 53.0, 40.0, 47.0, 47.0, 39.0, 40.0, 35.0, 28.0, 21.0, 21.0, 16.0, 16.0, 10.0, 17.0, 13.0, 9.0, 6.0, 8.0, 4.0, 5.0, 5.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-133.0745849609375, -128.9332275390625, -124.79186248779297, -120.65050506591797, -116.50914001464844, -112.36778259277344, -108.22642517089844, -104.08506774902344, -99.9437026977539, -95.8023452758789, -91.66098022460938, -87.51962280273438, -83.37826538085938, -79.23690032958984, -75.09554290771484, -70.95417785644531, -66.81282043457031, -62.67145919799805, -58.53009796142578, -54.38874053955078, -50.247379302978516, -46.10601806640625, -41.96466064453125, -37.823299407958984, -33.68193817138672, -29.540576934814453, -25.39921760559082, -21.257858276367188, -17.116497039794922, -12.975135803222656, -8.833776473999023, -4.692417144775391, -0.551055908203125, 3.590304374694824, 7.731664657592773, 11.873024940490723, 16.014385223388672, 20.155746459960938, 24.29710578918457, 28.438465118408203, 32.57982635498047, 36.721187591552734, 40.862548828125, 45.00390625, 49.145267486572266, 53.28662872314453, 57.42798614501953, 61.5693473815918, 65.71070861816406, 69.85206604003906, 73.9934310913086, 78.1347885131836, 82.27615356445312, 86.41751098632812, 90.55886840820312, 94.70022583007812, 98.84159088134766, 102.98294830322266, 107.12431335449219, 111.26567077636719, 115.40702819824219, 119.54839324951172, 123.68975067138672, 127.83111572265625, 131.97247314453125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 10.0, 3.0, 14.0, 19.0, 42.0, 52.0, 68.0, 107.0, 156.0, 215.0, 377.0, 597.0, 1003.0, 1843.0, 3618.0, 8034.0, 20951.0, 65184.0, 288100.0, 3277238.0, 402636.0, 81518.0, 24644.0, 9131.0, 3936.0, 1935.0, 1016.0, 569.0, 375.0, 249.0, 173.0, 113.0, 77.0, 76.0, 45.0, 41.0, 27.0, 22.0, 28.0, 18.0, 9.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-36.3125, -34.99609375, -33.6796875, -32.36328125, -31.046875, -29.73046875, -28.4140625, -27.09765625, -25.78125, -24.46484375, -23.1484375, -21.83203125, -20.515625, -19.19921875, -17.8828125, -16.56640625, -15.25, -13.93359375, -12.6171875, -11.30078125, -9.984375, -8.66796875, -7.3515625, -6.03515625, -4.71875, -3.40234375, -2.0859375, -0.76953125, 0.546875, 1.86328125, 3.1796875, 4.49609375, 5.8125, 7.12890625, 8.4453125, 9.76171875, 11.078125, 12.39453125, 13.7109375, 15.02734375, 16.34375, 17.66015625, 18.9765625, 20.29296875, 21.609375, 22.92578125, 24.2421875, 25.55859375, 26.875, 28.19140625, 29.5078125, 30.82421875, 32.140625, 33.45703125, 34.7734375, 36.08984375, 37.40625, 38.72265625, 40.0390625, 41.35546875, 42.671875, 43.98828125, 45.3046875, 46.62109375, 47.9375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 2.0, 3.0, 1.0, 10.0, 6.0, 16.0, 20.0, 29.0, 19.0, 39.0, 52.0, 76.0, 62.0, 73.0, 78.0, 65.0, 86.0, 81.0, 54.0, 42.0, 56.0, 35.0, 26.0, 15.0, 19.0, 14.0, 6.0, 8.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.386474609375, -8.07763671875, -7.768798828125, -7.4599609375, -7.151123046875, -6.84228515625, -6.533447265625, -6.224609375, -5.915771484375, -5.60693359375, -5.298095703125, -4.9892578125, -4.680419921875, -4.37158203125, -4.062744140625, -3.75390625, -3.445068359375, -3.13623046875, -2.827392578125, -2.5185546875, -2.209716796875, -1.90087890625, -1.592041015625, -1.283203125, -0.974365234375, -0.66552734375, -0.356689453125, -0.0478515625, 0.260986328125, 0.56982421875, 0.878662109375, 1.1875, 1.496337890625, 1.80517578125, 2.114013671875, 2.4228515625, 2.731689453125, 3.04052734375, 3.349365234375, 3.658203125, 3.967041015625, 4.27587890625, 4.584716796875, 4.8935546875, 5.202392578125, 5.51123046875, 5.820068359375, 6.12890625, 6.437744140625, 6.74658203125, 7.055419921875, 7.3642578125, 7.673095703125, 7.98193359375, 8.290771484375, 8.599609375, 8.908447265625, 9.21728515625, 9.526123046875, 9.8349609375, 10.143798828125, 10.45263671875, 10.761474609375, 11.0703125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 4.0, 7.0, 8.0, 15.0, 15.0, 25.0, 36.0, 51.0, 49.0, 65.0, 92.0, 129.0, 197.0, 322.0, 533.0, 1119.0, 3519.0, 16001.0, 113731.0, 2854035.0, 1110489.0, 76723.0, 11887.0, 2822.0, 973.0, 480.0, 257.0, 200.0, 134.0, 98.0, 62.0, 56.0, 47.0, 23.0, 16.0, 13.0, 11.0, 13.0, 11.0, 7.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-54.5625, -52.99951171875, -51.4365234375, -49.87353515625, -48.310546875, -46.74755859375, -45.1845703125, -43.62158203125, -42.05859375, -40.49560546875, -38.9326171875, -37.36962890625, -35.806640625, -34.24365234375, -32.6806640625, -31.11767578125, -29.5546875, -27.99169921875, -26.4287109375, -24.86572265625, -23.302734375, -21.73974609375, -20.1767578125, -18.61376953125, -17.05078125, -15.48779296875, -13.9248046875, -12.36181640625, -10.798828125, -9.23583984375, -7.6728515625, -6.10986328125, -4.546875, -2.98388671875, -1.4208984375, 0.14208984375, 1.705078125, 3.26806640625, 4.8310546875, 6.39404296875, 7.95703125, 9.52001953125, 11.0830078125, 12.64599609375, 14.208984375, 15.77197265625, 17.3349609375, 18.89794921875, 20.4609375, 22.02392578125, 23.5869140625, 25.14990234375, 26.712890625, 28.27587890625, 29.8388671875, 31.40185546875, 32.96484375, 34.52783203125, 36.0908203125, 37.65380859375, 39.216796875, 40.77978515625, 42.3427734375, 43.90576171875, 45.46875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 4.0, 12.0, 27.0, 54.0, 166.0, 563.0, 2286.0, 618.0, 219.0, 75.0, 31.0, 11.0, 10.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.1875, -37.90283203125, -36.6181640625, -35.33349609375, -34.048828125, -32.76416015625, -31.4794921875, -30.19482421875, -28.91015625, -27.62548828125, -26.3408203125, -25.05615234375, -23.771484375, -22.48681640625, -21.2021484375, -19.91748046875, -18.6328125, -17.34814453125, -16.0634765625, -14.77880859375, -13.494140625, -12.20947265625, -10.9248046875, -9.64013671875, -8.35546875, -7.07080078125, -5.7861328125, -4.50146484375, -3.216796875, -1.93212890625, -0.6474609375, 0.63720703125, 1.921875, 3.20654296875, 4.4912109375, 5.77587890625, 7.060546875, 8.34521484375, 9.6298828125, 10.91455078125, 12.19921875, 13.48388671875, 14.7685546875, 16.05322265625, 17.337890625, 18.62255859375, 19.9072265625, 21.19189453125, 22.4765625, 23.76123046875, 25.0458984375, 26.33056640625, 27.615234375, 28.89990234375, 30.1845703125, 31.46923828125, 32.75390625, 34.03857421875, 35.3232421875, 36.60791015625, 37.892578125, 39.17724609375, 40.4619140625, 41.74658203125, 43.03125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 9.0, 22.0, 100.0, 194.0, 230.0, 216.0, 122.0, 55.0, 36.0, 13.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-268.0732727050781, -260.47442626953125, -252.87559509277344, -245.27674865722656, -237.6779022216797, -230.07907104492188, -222.480224609375, -214.88137817382812, -207.28253173828125, -199.68368530273438, -192.08485412597656, -184.4860076904297, -176.8871612548828, -169.288330078125, -161.68948364257812, -154.09063720703125, -146.49180603027344, -138.89295959472656, -131.29412841796875, -123.69528198242188, -116.096435546875, -108.49759674072266, -100.89875793457031, -93.29991149902344, -85.7010726928711, -78.10223388671875, -70.50338745117188, -62.90454864501953, -55.30570602416992, -47.70686340332031, -40.10802459716797, -32.50918197631836, -24.910354614257812, -17.311511993408203, -9.712671279907227, -2.11383056640625, 5.485012054443359, 13.083854675292969, 20.682693481445312, 28.281536102294922, 35.88037872314453, 43.47922134399414, 51.07806396484375, 58.676902770996094, 66.27574157714844, 73.87458801269531, 81.47342681884766, 89.072265625, 96.67111206054688, 104.26995086669922, 111.8687973022461, 119.46763610839844, 127.06648254394531, 134.66531372070312, 142.26416015625, 149.86300659179688, 157.46185302734375, 165.06069946289062, 172.65953063964844, 180.2583770751953, 187.8572235107422, 195.4560546875, 203.05490112304688, 210.65374755859375, 218.25257873535156]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 7.0, 5.0, 18.0, 16.0, 16.0, 26.0, 30.0, 31.0, 32.0, 58.0, 53.0, 45.0, 69.0, 59.0, 62.0, 59.0, 57.0, 49.0, 54.0, 45.0, 37.0, 28.0, 33.0, 26.0, 17.0, 16.0, 17.0, 8.0, 7.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.58464050292969, -78.99730682373047, -76.40998077392578, -73.82264709472656, -71.23532104492188, -68.64798736572266, -66.06065368652344, -63.47332763671875, -60.88599395751953, -58.29866409301758, -55.711334228515625, -53.124000549316406, -50.53667068481445, -47.9493408203125, -45.36201095581055, -42.774681091308594, -40.18735122680664, -37.60002136230469, -35.012691497802734, -32.42536163330078, -29.838027954101562, -27.25069808959961, -24.663368225097656, -22.07603645324707, -19.488706588745117, -16.901376724243164, -14.314044952392578, -11.726715087890625, -9.139384269714355, -6.552053451538086, -3.964723587036133, -1.3773918151855469, 1.2099380493164062, 3.7972686290740967, 6.384599208831787, 8.971929550170898, 11.559260368347168, 14.146591186523438, 16.73392105102539, 19.321252822875977, 21.90858268737793, 24.495912551879883, 27.08324432373047, 29.670574188232422, 32.257904052734375, 34.845237731933594, 37.43256378173828, 40.0198974609375, 42.60722732543945, 45.194557189941406, 47.78188705444336, 50.36921691894531, 52.95655059814453, 55.543880462646484, 58.13121032714844, 60.718544006347656, 63.305870056152344, 65.89320373535156, 68.48052978515625, 71.06786346435547, 73.65518951416016, 76.24252319335938, 78.82984924316406, 81.41718292236328, 84.0045166015625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 2.0, 9.0, 8.0, 7.0, 12.0, 29.0, 30.0, 53.0, 91.0, 119.0, 237.0, 391.0, 747.0, 1712.0, 4204.0, 13426.0, 55198.0, 269865.0, 514934.0, 143085.0, 30768.0, 8171.0, 2808.0, 1260.0, 610.0, 300.0, 175.0, 115.0, 61.0, 37.0, 40.0, 14.0, 11.0, 9.0, 7.0, 2.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.53125, -36.205078125, -34.87890625, -33.552734375, -32.2265625, -30.900390625, -29.57421875, -28.248046875, -26.921875, -25.595703125, -24.26953125, -22.943359375, -21.6171875, -20.291015625, -18.96484375, -17.638671875, -16.3125, -14.986328125, -13.66015625, -12.333984375, -11.0078125, -9.681640625, -8.35546875, -7.029296875, -5.703125, -4.376953125, -3.05078125, -1.724609375, -0.3984375, 0.927734375, 2.25390625, 3.580078125, 4.90625, 6.232421875, 7.55859375, 8.884765625, 10.2109375, 11.537109375, 12.86328125, 14.189453125, 15.515625, 16.841796875, 18.16796875, 19.494140625, 20.8203125, 22.146484375, 23.47265625, 24.798828125, 26.125, 27.451171875, 28.77734375, 30.103515625, 31.4296875, 32.755859375, 34.08203125, 35.408203125, 36.734375, 38.060546875, 39.38671875, 40.712890625, 42.0390625, 43.365234375, 44.69140625, 46.017578125, 47.34375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 3.0, 4.0, 8.0, 20.0, 21.0, 31.0, 37.0, 32.0, 54.0, 57.0, 60.0, 74.0, 70.0, 86.0, 79.0, 67.0, 62.0, 42.0, 45.0, 27.0, 30.0, 24.0, 18.0, 12.0, 9.0, 9.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9921875, -8.6712646484375, -8.350341796875, -8.0294189453125, -7.70849609375, -7.3875732421875, -7.066650390625, -6.7457275390625, -6.4248046875, -6.1038818359375, -5.782958984375, -5.4620361328125, -5.14111328125, -4.8201904296875, -4.499267578125, -4.1783447265625, -3.857421875, -3.5364990234375, -3.215576171875, -2.8946533203125, -2.57373046875, -2.2528076171875, -1.931884765625, -1.6109619140625, -1.2900390625, -0.9691162109375, -0.648193359375, -0.3272705078125, -0.00634765625, 0.3145751953125, 0.635498046875, 0.9564208984375, 1.27734375, 1.5982666015625, 1.919189453125, 2.2401123046875, 2.56103515625, 2.8819580078125, 3.202880859375, 3.5238037109375, 3.8447265625, 4.1656494140625, 4.486572265625, 4.8074951171875, 5.12841796875, 5.4493408203125, 5.770263671875, 6.0911865234375, 6.412109375, 6.7330322265625, 7.053955078125, 7.3748779296875, 7.69580078125, 8.0167236328125, 8.337646484375, 8.6585693359375, 8.9794921875, 9.3004150390625, 9.621337890625, 9.9422607421875, 10.26318359375, 10.5841064453125, 10.905029296875, 11.2259521484375, 11.546875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 6.0, 6.0, 18.0, 11.0, 26.0, 34.0, 63.0, 86.0, 148.0, 197.0, 321.0, 489.0, 923.0, 1886.0, 4660.0, 15092.0, 58549.0, 280797.0, 511765.0, 129135.0, 29636.0, 8566.0, 3003.0, 1394.0, 649.0, 375.0, 250.0, 163.0, 103.0, 61.0, 39.0, 30.0, 26.0, 13.0, 8.0, 8.0, 5.0, 3.0, 0.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-33.28125, -32.309814453125, -31.33837890625, -30.366943359375, -29.3955078125, -28.424072265625, -27.45263671875, -26.481201171875, -25.509765625, -24.538330078125, -23.56689453125, -22.595458984375, -21.6240234375, -20.652587890625, -19.68115234375, -18.709716796875, -17.73828125, -16.766845703125, -15.79541015625, -14.823974609375, -13.8525390625, -12.881103515625, -11.90966796875, -10.938232421875, -9.966796875, -8.995361328125, -8.02392578125, -7.052490234375, -6.0810546875, -5.109619140625, -4.13818359375, -3.166748046875, -2.1953125, -1.223876953125, -0.25244140625, 0.718994140625, 1.6904296875, 2.661865234375, 3.63330078125, 4.604736328125, 5.576171875, 6.547607421875, 7.51904296875, 8.490478515625, 9.4619140625, 10.433349609375, 11.40478515625, 12.376220703125, 13.34765625, 14.319091796875, 15.29052734375, 16.261962890625, 17.2333984375, 18.204833984375, 19.17626953125, 20.147705078125, 21.119140625, 22.090576171875, 23.06201171875, 24.033447265625, 25.0048828125, 25.976318359375, 26.94775390625, 27.919189453125, 28.890625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 13.0, 10.0, 9.0, 24.0, 27.0, 27.0, 56.0, 52.0, 63.0, 67.0, 69.0, 77.0, 71.0, 73.0, 65.0, 65.0, 58.0, 40.0, 37.0, 22.0, 19.0, 14.0, 12.0, 6.0, 7.0, 3.0, 4.0, 1.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.90625, -49.4580078125, -48.009765625, -46.5615234375, -45.11328125, -43.6650390625, -42.216796875, -40.7685546875, -39.3203125, -37.8720703125, -36.423828125, -34.9755859375, -33.52734375, -32.0791015625, -30.630859375, -29.1826171875, -27.734375, -26.2861328125, -24.837890625, -23.3896484375, -21.94140625, -20.4931640625, -19.044921875, -17.5966796875, -16.1484375, -14.7001953125, -13.251953125, -11.8037109375, -10.35546875, -8.9072265625, -7.458984375, -6.0107421875, -4.5625, -3.1142578125, -1.666015625, -0.2177734375, 1.23046875, 2.6787109375, 4.126953125, 5.5751953125, 7.0234375, 8.4716796875, 9.919921875, 11.3681640625, 12.81640625, 14.2646484375, 15.712890625, 17.1611328125, 18.609375, 20.0576171875, 21.505859375, 22.9541015625, 24.40234375, 25.8505859375, 27.298828125, 28.7470703125, 30.1953125, 31.6435546875, 33.091796875, 34.5400390625, 35.98828125, 37.4365234375, 38.884765625, 40.3330078125, 41.78125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 5.0, 2.0, 5.0, 11.0, 20.0, 28.0, 50.0, 70.0, 131.0, 273.0, 492.0, 1127.0, 3129.0, 10531.0, 46155.0, 211390.0, 493313.0, 217507.0, 47823.0, 11025.0, 3174.0, 1121.0, 515.0, 289.0, 153.0, 77.0, 43.0, 26.0, 26.0, 16.0, 12.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.90625, -11.5028076171875, -11.099365234375, -10.6959228515625, -10.29248046875, -9.8890380859375, -9.485595703125, -9.0821533203125, -8.6787109375, -8.2752685546875, -7.871826171875, -7.4683837890625, -7.06494140625, -6.6614990234375, -6.258056640625, -5.8546142578125, -5.451171875, -5.0477294921875, -4.644287109375, -4.2408447265625, -3.83740234375, -3.4339599609375, -3.030517578125, -2.6270751953125, -2.2236328125, -1.8201904296875, -1.416748046875, -1.0133056640625, -0.60986328125, -0.2064208984375, 0.197021484375, 0.6004638671875, 1.00390625, 1.4073486328125, 1.810791015625, 2.2142333984375, 2.61767578125, 3.0211181640625, 3.424560546875, 3.8280029296875, 4.2314453125, 4.6348876953125, 5.038330078125, 5.4417724609375, 5.84521484375, 6.2486572265625, 6.652099609375, 7.0555419921875, 7.458984375, 7.8624267578125, 8.265869140625, 8.6693115234375, 9.07275390625, 9.4761962890625, 9.879638671875, 10.2830810546875, 10.6865234375, 11.0899658203125, 11.493408203125, 11.8968505859375, 12.30029296875, 12.7037353515625, 13.107177734375, 13.5106201171875, 13.9140625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 9.0, 5.0, 6.0, 4.0, 16.0, 11.0, 22.0, 34.0, 48.0, 57.0, 68.0, 87.0, 101.0, 105.0, 99.0, 82.0, 62.0, 45.0, 33.0, 33.0, 17.0, 17.0, 19.0, 8.0, 5.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0024433135986328125, -0.002375677227973938, -0.0023080408573150635, -0.002240404486656189, -0.0021727681159973145, -0.00210513174533844, -0.0020374953746795654, -0.001969859004020691, -0.0019022226333618164, -0.001834586262702942, -0.0017669498920440674, -0.0016993135213851929, -0.0016316771507263184, -0.0015640407800674438, -0.0014964044094085693, -0.0014287680387496948, -0.0013611316680908203, -0.0012934952974319458, -0.0012258589267730713, -0.0011582225561141968, -0.0010905861854553223, -0.0010229498147964478, -0.0009553134441375732, -0.0008876770734786987, -0.0008200407028198242, -0.0007524043321609497, -0.0006847679615020752, -0.0006171315908432007, -0.0005494952201843262, -0.00048185884952545166, -0.00041422247886657715, -0.00034658610820770264, -0.0002789497375488281, -0.0002113133668899536, -0.0001436769962310791, -7.604062557220459e-05, -8.404254913330078e-06, 5.9232115745544434e-05, 0.00012686848640441895, 0.00019450485706329346, 0.00026214122772216797, 0.0003297775983810425, 0.000397413969039917, 0.0004650503396987915, 0.000532686710357666, 0.0006003230810165405, 0.000667959451675415, 0.0007355958223342896, 0.0008032321929931641, 0.0008708685636520386, 0.0009385049343109131, 0.0010061413049697876, 0.0010737776756286621, 0.0011414140462875366, 0.0012090504169464111, 0.0012766867876052856, 0.0013443231582641602, 0.0014119595289230347, 0.0014795958995819092, 0.0015472322702407837, 0.0016148686408996582, 0.0016825050115585327, 0.0017501413822174072, 0.0018177777528762817, 0.0018854141235351562]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 9.0, 12.0, 11.0, 27.0, 42.0, 68.0, 105.0, 193.0, 402.0, 834.0, 2343.0, 8385.0, 49269.0, 328292.0, 530738.0, 105891.0, 15986.0, 3665.0, 1222.0, 528.0, 245.0, 131.0, 66.0, 31.0, 25.0, 17.0, 6.0, 3.0, 1.0, 4.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.75, -19.218994140625, -18.68798828125, -18.156982421875, -17.6259765625, -17.094970703125, -16.56396484375, -16.032958984375, -15.501953125, -14.970947265625, -14.43994140625, -13.908935546875, -13.3779296875, -12.846923828125, -12.31591796875, -11.784912109375, -11.25390625, -10.722900390625, -10.19189453125, -9.660888671875, -9.1298828125, -8.598876953125, -8.06787109375, -7.536865234375, -7.005859375, -6.474853515625, -5.94384765625, -5.412841796875, -4.8818359375, -4.350830078125, -3.81982421875, -3.288818359375, -2.7578125, -2.226806640625, -1.69580078125, -1.164794921875, -0.6337890625, -0.102783203125, 0.42822265625, 0.959228515625, 1.490234375, 2.021240234375, 2.55224609375, 3.083251953125, 3.6142578125, 4.145263671875, 4.67626953125, 5.207275390625, 5.73828125, 6.269287109375, 6.80029296875, 7.331298828125, 7.8623046875, 8.393310546875, 8.92431640625, 9.455322265625, 9.986328125, 10.517333984375, 11.04833984375, 11.579345703125, 12.1103515625, 12.641357421875, 13.17236328125, 13.703369140625, 14.234375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 7.0, 11.0, 14.0, 25.0, 21.0, 27.0, 46.0, 45.0, 57.0, 65.0, 74.0, 87.0, 86.0, 80.0, 82.0, 66.0, 46.0, 44.0, 24.0, 23.0, 22.0, 10.0, 11.0, 8.0, 6.0, 3.0, 6.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-15.765625, -15.3804931640625, -14.995361328125, -14.6102294921875, -14.22509765625, -13.8399658203125, -13.454833984375, -13.0697021484375, -12.6845703125, -12.2994384765625, -11.914306640625, -11.5291748046875, -11.14404296875, -10.7589111328125, -10.373779296875, -9.9886474609375, -9.603515625, -9.2183837890625, -8.833251953125, -8.4481201171875, -8.06298828125, -7.6778564453125, -7.292724609375, -6.9075927734375, -6.5224609375, -6.1373291015625, -5.752197265625, -5.3670654296875, -4.98193359375, -4.5968017578125, -4.211669921875, -3.8265380859375, -3.44140625, -3.0562744140625, -2.671142578125, -2.2860107421875, -1.90087890625, -1.5157470703125, -1.130615234375, -0.7454833984375, -0.3603515625, 0.0247802734375, 0.409912109375, 0.7950439453125, 1.18017578125, 1.5653076171875, 1.950439453125, 2.3355712890625, 2.720703125, 3.1058349609375, 3.490966796875, 3.8760986328125, 4.26123046875, 4.6463623046875, 5.031494140625, 5.4166259765625, 5.8017578125, 6.1868896484375, 6.572021484375, 6.9571533203125, 7.34228515625, 7.7274169921875, 8.112548828125, 8.4976806640625, 8.8828125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 16.0, 27.0, 53.0, 150.0, 198.0, 237.0, 153.0, 92.0, 38.0, 22.0, 11.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-533.4025268554688, -522.0223388671875, -510.64215087890625, -499.2619934082031, -487.8818054199219, -476.5016174316406, -465.1214294433594, -453.74127197265625, -442.361083984375, -430.98089599609375, -419.6007080078125, -408.2205505371094, -396.8403625488281, -385.4601745605469, -374.0799865722656, -362.6998291015625, -351.31964111328125, -339.939453125, -328.55926513671875, -317.1791076660156, -305.7989196777344, -294.4187316894531, -283.0385437011719, -271.65838623046875, -260.2781677246094, -248.89797973632812, -237.51780700683594, -226.1376190185547, -214.7574462890625, -203.37725830078125, -191.9970703125, -180.6168975830078, -169.23672485351562, -157.85653686523438, -146.4763641357422, -135.09617614746094, -123.71600341796875, -112.3358154296875, -100.95563507080078, -89.57545471191406, -78.19527435302734, -66.81509399414062, -55.434913635253906, -44.05472946166992, -32.6745491027832, -21.294368743896484, -9.9141845703125, 1.4659957885742188, 12.846176147460938, 24.226356506347656, 35.606536865234375, 46.98672103881836, 58.36690139770508, 69.74708557128906, 81.12726593017578, 92.5074462890625, 103.88762664794922, 115.26780700683594, 126.64798736572266, 138.02816772460938, 149.40835571289062, 160.7885284423828, 172.16871643066406, 183.54888916015625, 194.9290771484375]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 9.0, 10.0, 16.0, 15.0, 18.0, 11.0, 21.0, 26.0, 23.0, 32.0, 36.0, 31.0, 32.0, 46.0, 51.0, 44.0, 42.0, 50.0, 40.0, 32.0, 39.0, 43.0, 34.0, 33.0, 28.0, 25.0, 31.0, 24.0, 29.0, 17.0, 16.0, 11.0, 17.0, 11.0, 9.0, 14.0, 7.0, 2.0, 2.0, 4.0, 5.0, 4.0, 3.0, 1.0, 3.0], "bins": [-155.40689086914062, -151.18545532226562, -146.9640350341797, -142.74261474609375, -138.52117919921875, -134.29974365234375, -130.0783233642578, -125.85689544677734, -121.63546752929688, -117.4140396118164, -113.19261169433594, -108.97118377685547, -104.749755859375, -100.52832794189453, -96.30690002441406, -92.0854721069336, -87.86404418945312, -83.64261627197266, -79.42118835449219, -75.19976043701172, -70.97833251953125, -66.75690460205078, -62.53547668457031, -58.314048767089844, -54.092620849609375, -49.871192932128906, -45.64976501464844, -41.42833709716797, -37.2069091796875, -32.98548126220703, -28.764053344726562, -24.542625427246094, -20.321197509765625, -16.099769592285156, -11.878341674804688, -7.656913757324219, -3.43548583984375, 0.7859420776367188, 5.0073699951171875, 9.228797912597656, 13.450225830078125, 17.671653747558594, 21.893081665039062, 26.11450958251953, 30.3359375, 34.55736541748047, 38.77879333496094, 43.000221252441406, 47.221649169921875, 51.443077087402344, 55.66450500488281, 59.88593292236328, 64.10736083984375, 68.32878875732422, 72.55021667480469, 76.77164459228516, 80.99307250976562, 85.2145004272461, 89.43592834472656, 93.65735626220703, 97.8787841796875, 102.10021209716797, 106.32164001464844, 110.5430679321289, 114.76449584960938]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 1.0, 4.0, 7.0, 8.0, 13.0, 11.0, 16.0, 24.0, 48.0, 42.0, 65.0, 94.0, 151.0, 241.0, 421.0, 580.0, 1130.0, 2224.0, 4987.0, 13776.0, 61908.0, 3994759.0, 86150.0, 16382.0, 5662.0, 2518.0, 1253.0, 621.0, 424.0, 242.0, 164.0, 107.0, 47.0, 45.0, 32.0, 38.0, 23.0, 12.0, 12.0, 10.0, 10.0, 4.0, 3.0, 3.0, 2.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.59375, -52.68310546875, -50.7724609375, -48.86181640625, -46.951171875, -45.04052734375, -43.1298828125, -41.21923828125, -39.30859375, -37.39794921875, -35.4873046875, -33.57666015625, -31.666015625, -29.75537109375, -27.8447265625, -25.93408203125, -24.0234375, -22.11279296875, -20.2021484375, -18.29150390625, -16.380859375, -14.47021484375, -12.5595703125, -10.64892578125, -8.73828125, -6.82763671875, -4.9169921875, -3.00634765625, -1.095703125, 0.81494140625, 2.7255859375, 4.63623046875, 6.546875, 8.45751953125, 10.3681640625, 12.27880859375, 14.189453125, 16.10009765625, 18.0107421875, 19.92138671875, 21.83203125, 23.74267578125, 25.6533203125, 27.56396484375, 29.474609375, 31.38525390625, 33.2958984375, 35.20654296875, 37.1171875, 39.02783203125, 40.9384765625, 42.84912109375, 44.759765625, 46.67041015625, 48.5810546875, 50.49169921875, 52.40234375, 54.31298828125, 56.2236328125, 58.13427734375, 60.044921875, 61.95556640625, 63.8662109375, 65.77685546875, 67.6875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 14.0, 12.0, 12.0, 24.0, 20.0, 15.0, 26.0, 31.0, 45.0, 54.0, 52.0, 66.0, 75.0, 67.0, 80.0, 59.0, 69.0, 46.0, 52.0, 39.0, 39.0, 20.0, 22.0, 15.0, 12.0, 14.0, 3.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.75, -10.3966064453125, -10.043212890625, -9.6898193359375, -9.33642578125, -8.9830322265625, -8.629638671875, -8.2762451171875, -7.9228515625, -7.5694580078125, -7.216064453125, -6.8626708984375, -6.50927734375, -6.1558837890625, -5.802490234375, -5.4490966796875, -5.095703125, -4.7423095703125, -4.388916015625, -4.0355224609375, -3.68212890625, -3.3287353515625, -2.975341796875, -2.6219482421875, -2.2685546875, -1.9151611328125, -1.561767578125, -1.2083740234375, -0.85498046875, -0.5015869140625, -0.148193359375, 0.2052001953125, 0.55859375, 0.9119873046875, 1.265380859375, 1.6187744140625, 1.97216796875, 2.3255615234375, 2.678955078125, 3.0323486328125, 3.3857421875, 3.7391357421875, 4.092529296875, 4.4459228515625, 4.79931640625, 5.1527099609375, 5.506103515625, 5.8594970703125, 6.212890625, 6.5662841796875, 6.919677734375, 7.2730712890625, 7.62646484375, 7.9798583984375, 8.333251953125, 8.6866455078125, 9.0400390625, 9.3934326171875, 9.746826171875, 10.1002197265625, 10.45361328125, 10.8070068359375, 11.160400390625, 11.5137939453125, 11.8671875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 10.0, 12.0, 19.0, 25.0, 44.0, 65.0, 117.0, 181.0, 302.0, 490.0, 805.0, 1431.0, 2386.0, 4594.0, 9377.0, 21949.0, 70700.0, 3549525.0, 441991.0, 54236.0, 18287.0, 8235.0, 4132.0, 2214.0, 1235.0, 745.0, 452.0, 267.0, 166.0, 102.0, 59.0, 42.0, 28.0, 18.0, 16.0, 7.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.109375, -28.224609375, -27.33984375, -26.455078125, -25.5703125, -24.685546875, -23.80078125, -22.916015625, -22.03125, -21.146484375, -20.26171875, -19.376953125, -18.4921875, -17.607421875, -16.72265625, -15.837890625, -14.953125, -14.068359375, -13.18359375, -12.298828125, -11.4140625, -10.529296875, -9.64453125, -8.759765625, -7.875, -6.990234375, -6.10546875, -5.220703125, -4.3359375, -3.451171875, -2.56640625, -1.681640625, -0.796875, 0.087890625, 0.97265625, 1.857421875, 2.7421875, 3.626953125, 4.51171875, 5.396484375, 6.28125, 7.166015625, 8.05078125, 8.935546875, 9.8203125, 10.705078125, 11.58984375, 12.474609375, 13.359375, 14.244140625, 15.12890625, 16.013671875, 16.8984375, 17.783203125, 18.66796875, 19.552734375, 20.4375, 21.322265625, 22.20703125, 23.091796875, 23.9765625, 24.861328125, 25.74609375, 26.630859375, 27.515625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 6.0, 4.0, 9.0, 10.0, 2.0, 12.0, 12.0, 21.0, 40.0, 71.0, 132.0, 404.0, 2924.0, 168.0, 72.0, 63.0, 23.0, 29.0, 15.0, 9.0, 11.0, 6.0, 9.0, 8.0, 10.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.98046875, -5.7889404296875, -5.597412109375, -5.4058837890625, -5.21435546875, -5.0228271484375, -4.831298828125, -4.6397705078125, -4.4482421875, -4.2567138671875, -4.065185546875, -3.8736572265625, -3.68212890625, -3.4906005859375, -3.299072265625, -3.1075439453125, -2.916015625, -2.7244873046875, -2.532958984375, -2.3414306640625, -2.14990234375, -1.9583740234375, -1.766845703125, -1.5753173828125, -1.3837890625, -1.1922607421875, -1.000732421875, -0.8092041015625, -0.61767578125, -0.4261474609375, -0.234619140625, -0.0430908203125, 0.1484375, 0.3399658203125, 0.531494140625, 0.7230224609375, 0.91455078125, 1.1060791015625, 1.297607421875, 1.4891357421875, 1.6806640625, 1.8721923828125, 2.063720703125, 2.2552490234375, 2.44677734375, 2.6383056640625, 2.829833984375, 3.0213623046875, 3.212890625, 3.4044189453125, 3.595947265625, 3.7874755859375, 3.97900390625, 4.1705322265625, 4.362060546875, 4.5535888671875, 4.7451171875, 4.9366455078125, 5.128173828125, 5.3197021484375, 5.51123046875, 5.7027587890625, 5.894287109375, 6.0858154296875, 6.27734375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 12.0, 13.0, 33.0, 63.0, 101.0, 160.0, 159.0, 167.0, 124.0, 94.0, 36.0, 14.0, 19.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.821247100830078, -20.340980529785156, -18.860713958740234, -17.38044548034668, -15.900178909301758, -14.419912338256836, -12.939644813537598, -11.45937728881836, -9.979110717773438, -8.498844146728516, -7.018576622009277, -5.538309574127197, -4.058042526245117, -2.577775478363037, -1.097508430480957, 0.38275909423828125, 1.8630256652832031, 3.343292713165283, 4.823559761047363, 6.303826808929443, 7.784093856811523, 9.264360427856445, 10.744627952575684, 12.224895477294922, 13.705162048339844, 15.185428619384766, 16.665695190429688, 18.145963668823242, 19.626230239868164, 21.106496810913086, 22.58676528930664, 24.067031860351562, 25.54730224609375, 27.027568817138672, 28.507835388183594, 29.98810386657715, 31.46837043762207, 32.948638916015625, 34.42890548706055, 35.90917205810547, 37.38943862915039, 38.86970520019531, 40.349971771240234, 41.830238342285156, 43.310508728027344, 44.790775299072266, 46.27104187011719, 47.75130844116211, 49.23157501220703, 50.71184158325195, 52.192108154296875, 53.6723747253418, 55.15264129638672, 56.632911682128906, 58.11317825317383, 59.59344482421875, 61.07371139526367, 62.553977966308594, 64.03424835205078, 65.51451110839844, 66.99478149414062, 68.47504425048828, 69.95531463623047, 71.43557739257812, 72.91584777832031]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 4.0, 10.0, 7.0, 6.0, 11.0, 22.0, 13.0, 19.0, 15.0, 21.0, 26.0, 25.0, 37.0, 36.0, 35.0, 40.0, 40.0, 56.0, 36.0, 46.0, 40.0, 58.0, 32.0, 33.0, 35.0, 42.0, 38.0, 38.0, 25.0, 24.0, 29.0, 15.0, 12.0, 18.0, 12.0, 16.0, 4.0, 5.0, 7.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.061873435974121, -14.571001052856445, -14.080129623413086, -13.58925724029541, -13.098384857177734, -12.607513427734375, -12.1166410446167, -11.625768661499023, -11.134897232055664, -10.644024848937988, -10.153153419494629, -9.662281036376953, -9.171408653259277, -8.680536270141602, -8.189664840698242, -7.698792457580566, -7.207920074462891, -6.717048168182373, -6.226175785064697, -5.73530387878418, -5.244431495666504, -4.753559589385986, -4.262687683105469, -3.771815538406372, -3.2809433937072754, -2.7900712490081787, -2.299199104309082, -1.8083271980285645, -1.3174550533294678, -0.8265829086303711, -0.3357110023498535, 0.15516114234924316, 0.6460323333740234, 1.1369044780731201, 1.6277765035629272, 2.1186485290527344, 2.609520673751831, 3.1003928184509277, 3.5912647247314453, 4.082137107849121, 4.573009014129639, 5.063880920410156, 5.554753303527832, 6.04562520980835, 6.536497116088867, 7.027369499206543, 7.5182414054870605, 8.009113311767578, 8.499985694885254, 8.99085807800293, 9.481729507446289, 9.972601890563965, 10.46347427368164, 10.954345703125, 11.445218086242676, 11.936090469360352, 12.426961898803711, 12.917834281921387, 13.408705711364746, 13.899578094482422, 14.390450477600098, 14.881322860717773, 15.372194290161133, 15.863066673278809, 16.353939056396484]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 9.0, 12.0, 14.0, 38.0, 39.0, 109.0, 150.0, 249.0, 477.0, 1059.0, 2420.0, 6828.0, 22608.0, 83682.0, 313563.0, 429174.0, 136043.0, 35465.0, 10477.0, 3481.0, 1266.0, 647.0, 313.0, 160.0, 89.0, 65.0, 33.0, 32.0, 18.0, 12.0, 8.0, 8.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-38.3125, -37.281982421875, -36.25146484375, -35.220947265625, -34.1904296875, -33.159912109375, -32.12939453125, -31.098876953125, -30.068359375, -29.037841796875, -28.00732421875, -26.976806640625, -25.9462890625, -24.915771484375, -23.88525390625, -22.854736328125, -21.82421875, -20.793701171875, -19.76318359375, -18.732666015625, -17.7021484375, -16.671630859375, -15.64111328125, -14.610595703125, -13.580078125, -12.549560546875, -11.51904296875, -10.488525390625, -9.4580078125, -8.427490234375, -7.39697265625, -6.366455078125, -5.3359375, -4.305419921875, -3.27490234375, -2.244384765625, -1.2138671875, -0.183349609375, 0.84716796875, 1.877685546875, 2.908203125, 3.938720703125, 4.96923828125, 5.999755859375, 7.0302734375, 8.060791015625, 9.09130859375, 10.121826171875, 11.15234375, 12.182861328125, 13.21337890625, 14.243896484375, 15.2744140625, 16.304931640625, 17.33544921875, 18.365966796875, 19.396484375, 20.427001953125, 21.45751953125, 22.488037109375, 23.5185546875, 24.549072265625, 25.57958984375, 26.610107421875, 27.640625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 0.0, 5.0, 17.0, 7.0, 7.0, 18.0, 16.0, 22.0, 23.0, 33.0, 37.0, 32.0, 54.0, 54.0, 47.0, 69.0, 60.0, 70.0, 65.0, 55.0, 47.0, 44.0, 47.0, 35.0, 29.0, 25.0, 17.0, 19.0, 11.0, 12.0, 4.0, 6.0, 3.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7734375, -9.4317626953125, -9.090087890625, -8.7484130859375, -8.40673828125, -8.0650634765625, -7.723388671875, -7.3817138671875, -7.0400390625, -6.6983642578125, -6.356689453125, -6.0150146484375, -5.67333984375, -5.3316650390625, -4.989990234375, -4.6483154296875, -4.306640625, -3.9649658203125, -3.623291015625, -3.2816162109375, -2.93994140625, -2.5982666015625, -2.256591796875, -1.9149169921875, -1.5732421875, -1.2315673828125, -0.889892578125, -0.5482177734375, -0.20654296875, 0.1351318359375, 0.476806640625, 0.8184814453125, 1.16015625, 1.5018310546875, 1.843505859375, 2.1851806640625, 2.52685546875, 2.8685302734375, 3.210205078125, 3.5518798828125, 3.8935546875, 4.2352294921875, 4.576904296875, 4.9185791015625, 5.26025390625, 5.6019287109375, 5.943603515625, 6.2852783203125, 6.626953125, 6.9686279296875, 7.310302734375, 7.6519775390625, 7.99365234375, 8.3353271484375, 8.677001953125, 9.0186767578125, 9.3603515625, 9.7020263671875, 10.043701171875, 10.3853759765625, 10.72705078125, 11.0687255859375, 11.410400390625, 11.7520751953125, 12.09375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 4.0, 12.0, 18.0, 31.0, 35.0, 51.0, 107.0, 163.0, 248.0, 408.0, 705.0, 1337.0, 3571.0, 13932.0, 79777.0, 539730.0, 345493.0, 48394.0, 9225.0, 2643.0, 1149.0, 611.0, 357.0, 188.0, 139.0, 82.0, 42.0, 42.0, 21.0, 10.0, 8.0, 7.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-45.375, -44.20751953125, -43.0400390625, -41.87255859375, -40.705078125, -39.53759765625, -38.3701171875, -37.20263671875, -36.03515625, -34.86767578125, -33.7001953125, -32.53271484375, -31.365234375, -30.19775390625, -29.0302734375, -27.86279296875, -26.6953125, -25.52783203125, -24.3603515625, -23.19287109375, -22.025390625, -20.85791015625, -19.6904296875, -18.52294921875, -17.35546875, -16.18798828125, -15.0205078125, -13.85302734375, -12.685546875, -11.51806640625, -10.3505859375, -9.18310546875, -8.015625, -6.84814453125, -5.6806640625, -4.51318359375, -3.345703125, -2.17822265625, -1.0107421875, 0.15673828125, 1.32421875, 2.49169921875, 3.6591796875, 4.82666015625, 5.994140625, 7.16162109375, 8.3291015625, 9.49658203125, 10.6640625, 11.83154296875, 12.9990234375, 14.16650390625, 15.333984375, 16.50146484375, 17.6689453125, 18.83642578125, 20.00390625, 21.17138671875, 22.3388671875, 23.50634765625, 24.673828125, 25.84130859375, 27.0087890625, 28.17626953125, 29.34375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 9.0, 5.0, 9.0, 11.0, 20.0, 22.0, 25.0, 37.0, 45.0, 53.0, 57.0, 58.0, 74.0, 70.0, 58.0, 72.0, 71.0, 57.0, 73.0, 45.0, 37.0, 21.0, 19.0, 15.0, 8.0, 10.0, 5.0, 9.0, 8.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.5, -43.7412109375, -41.982421875, -40.2236328125, -38.46484375, -36.7060546875, -34.947265625, -33.1884765625, -31.4296875, -29.6708984375, -27.912109375, -26.1533203125, -24.39453125, -22.6357421875, -20.876953125, -19.1181640625, -17.359375, -15.6005859375, -13.841796875, -12.0830078125, -10.32421875, -8.5654296875, -6.806640625, -5.0478515625, -3.2890625, -1.5302734375, 0.228515625, 1.9873046875, 3.74609375, 5.5048828125, 7.263671875, 9.0224609375, 10.78125, 12.5400390625, 14.298828125, 16.0576171875, 17.81640625, 19.5751953125, 21.333984375, 23.0927734375, 24.8515625, 26.6103515625, 28.369140625, 30.1279296875, 31.88671875, 33.6455078125, 35.404296875, 37.1630859375, 38.921875, 40.6806640625, 42.439453125, 44.1982421875, 45.95703125, 47.7158203125, 49.474609375, 51.2333984375, 52.9921875, 54.7509765625, 56.509765625, 58.2685546875, 60.02734375, 61.7861328125, 63.544921875, 65.3037109375, 67.0625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 9.0, 24.0, 20.0, 48.0, 80.0, 141.0, 240.0, 594.0, 1889.0, 7727.0, 55964.0, 666447.0, 285193.0, 23915.0, 4171.0, 1212.0, 426.0, 190.0, 88.0, 52.0, 48.0, 25.0, 13.0, 7.0, 10.0, 7.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.15625, -19.45654296875, -18.7568359375, -18.05712890625, -17.357421875, -16.65771484375, -15.9580078125, -15.25830078125, -14.55859375, -13.85888671875, -13.1591796875, -12.45947265625, -11.759765625, -11.06005859375, -10.3603515625, -9.66064453125, -8.9609375, -8.26123046875, -7.5615234375, -6.86181640625, -6.162109375, -5.46240234375, -4.7626953125, -4.06298828125, -3.36328125, -2.66357421875, -1.9638671875, -1.26416015625, -0.564453125, 0.13525390625, 0.8349609375, 1.53466796875, 2.234375, 2.93408203125, 3.6337890625, 4.33349609375, 5.033203125, 5.73291015625, 6.4326171875, 7.13232421875, 7.83203125, 8.53173828125, 9.2314453125, 9.93115234375, 10.630859375, 11.33056640625, 12.0302734375, 12.72998046875, 13.4296875, 14.12939453125, 14.8291015625, 15.52880859375, 16.228515625, 16.92822265625, 17.6279296875, 18.32763671875, 19.02734375, 19.72705078125, 20.4267578125, 21.12646484375, 21.826171875, 22.52587890625, 23.2255859375, 23.92529296875, 24.625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 8.0, 8.0, 7.0, 12.0, 19.0, 16.0, 25.0, 35.0, 42.0, 61.0, 57.0, 100.0, 90.0, 97.0, 100.0, 81.0, 66.0, 47.0, 29.0, 21.0, 16.0, 10.0, 5.0, 7.0, 8.0, 6.0, 7.0, 2.0, 5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0017881393432617188, -0.0017286986112594604, -0.0016692578792572021, -0.0016098171472549438, -0.0015503764152526855, -0.0014909356832504272, -0.001431494951248169, -0.0013720542192459106, -0.0013126134872436523, -0.001253172755241394, -0.0011937320232391357, -0.0011342912912368774, -0.0010748505592346191, -0.0010154098272323608, -0.0009559690952301025, -0.0008965283632278442, -0.0008370876312255859, -0.0007776468992233276, -0.0007182061672210693, -0.000658765435218811, -0.0005993247032165527, -0.0005398839712142944, -0.00048044323921203613, -0.00042100250720977783, -0.00036156177520751953, -0.00030212104320526123, -0.00024268031120300293, -0.00018323957920074463, -0.00012379884719848633, -6.435811519622803e-05, -4.9173831939697266e-06, 5.4523348808288574e-05, 0.00011396408081054688, 0.00017340481281280518, 0.00023284554481506348, 0.0002922862768173218, 0.0003517270088195801, 0.0004111677408218384, 0.0004706084728240967, 0.000530049204826355, 0.0005894899368286133, 0.0006489306688308716, 0.0007083714008331299, 0.0007678121328353882, 0.0008272528648376465, 0.0008866935968399048, 0.0009461343288421631, 0.0010055750608444214, 0.0010650157928466797, 0.001124456524848938, 0.0011838972568511963, 0.0012433379888534546, 0.0013027787208557129, 0.0013622194528579712, 0.0014216601848602295, 0.0014811009168624878, 0.001540541648864746, 0.0015999823808670044, 0.0016594231128692627, 0.001718863844871521, 0.0017783045768737793, 0.0018377453088760376, 0.001897186040878296, 0.001956626772880554, 0.0020160675048828125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 7.0, 6.0, 8.0, 17.0, 18.0, 35.0, 60.0, 104.0, 236.0, 576.0, 1799.0, 9962.0, 183686.0, 807592.0, 38576.0, 4129.0, 985.0, 369.0, 183.0, 81.0, 47.0, 29.0, 22.0, 10.0, 3.0, 7.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.34375, -19.38720703125, -18.4306640625, -17.47412109375, -16.517578125, -15.56103515625, -14.6044921875, -13.64794921875, -12.69140625, -11.73486328125, -10.7783203125, -9.82177734375, -8.865234375, -7.90869140625, -6.9521484375, -5.99560546875, -5.0390625, -4.08251953125, -3.1259765625, -2.16943359375, -1.212890625, -0.25634765625, 0.7001953125, 1.65673828125, 2.61328125, 3.56982421875, 4.5263671875, 5.48291015625, 6.439453125, 7.39599609375, 8.3525390625, 9.30908203125, 10.265625, 11.22216796875, 12.1787109375, 13.13525390625, 14.091796875, 15.04833984375, 16.0048828125, 16.96142578125, 17.91796875, 18.87451171875, 19.8310546875, 20.78759765625, 21.744140625, 22.70068359375, 23.6572265625, 24.61376953125, 25.5703125, 26.52685546875, 27.4833984375, 28.43994140625, 29.396484375, 30.35302734375, 31.3095703125, 32.26611328125, 33.22265625, 34.17919921875, 35.1357421875, 36.09228515625, 37.048828125, 38.00537109375, 38.9619140625, 39.91845703125, 40.875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 9.0, 21.0, 29.0, 58.0, 138.0, 291.0, 230.0, 114.0, 62.0, 18.0, 21.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.78125, -57.52490234375, -56.2685546875, -55.01220703125, -53.755859375, -52.49951171875, -51.2431640625, -49.98681640625, -48.73046875, -47.47412109375, -46.2177734375, -44.96142578125, -43.705078125, -42.44873046875, -41.1923828125, -39.93603515625, -38.6796875, -37.42333984375, -36.1669921875, -34.91064453125, -33.654296875, -32.39794921875, -31.1416015625, -29.88525390625, -28.62890625, -27.37255859375, -26.1162109375, -24.85986328125, -23.603515625, -22.34716796875, -21.0908203125, -19.83447265625, -18.578125, -17.32177734375, -16.0654296875, -14.80908203125, -13.552734375, -12.29638671875, -11.0400390625, -9.78369140625, -8.52734375, -7.27099609375, -6.0146484375, -4.75830078125, -3.501953125, -2.24560546875, -0.9892578125, 0.26708984375, 1.5234375, 2.77978515625, 4.0361328125, 5.29248046875, 6.548828125, 7.80517578125, 9.0615234375, 10.31787109375, 11.57421875, 12.83056640625, 14.0869140625, 15.34326171875, 16.599609375, 17.85595703125, 19.1123046875, 20.36865234375, 21.625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 27.0, 27.0, 83.0, 122.0, 200.0, 208.0, 154.0, 85.0, 46.0, 23.0, 17.0, 12.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-285.73980712890625, -273.4122009277344, -261.0846252441406, -248.75701904296875, -236.42942810058594, -224.10183715820312, -211.77423095703125, -199.44664001464844, -187.11904907226562, -174.7914581298828, -162.4638671875, -150.13626098632812, -137.8086700439453, -125.4810791015625, -113.15348052978516, -100.82588195800781, -88.498291015625, -76.17070007324219, -63.843101501464844, -51.515506744384766, -39.18791198730469, -26.86031723022461, -14.532722473144531, -2.2051239013671875, 10.122467041015625, 22.450061798095703, 34.77765655517578, 47.10525131225586, 59.43284606933594, 71.76043701171875, 84.0880355834961, 96.41563415527344, 108.74325561523438, 121.07084655761719, 133.3984375, 145.72604370117188, 158.0536346435547, 170.3812255859375, 182.70883178710938, 195.0364227294922, 207.364013671875, 219.6916046142578, 232.01919555664062, 244.3468017578125, 256.67437744140625, 269.0019836425781, 281.32958984375, 293.65716552734375, 305.9847717285156, 318.3123779296875, 330.63995361328125, 342.9675598144531, 355.295166015625, 367.62274169921875, 379.9503479003906, 392.2779541015625, 404.60552978515625, 416.9331359863281, 429.2607116699219, 441.58831787109375, 453.9158935546875, 466.2434997558594, 478.57110595703125, 490.898681640625, 503.2262878417969]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 10.0, 9.0, 16.0, 6.0, 16.0, 13.0, 21.0, 26.0, 24.0, 32.0, 24.0, 36.0, 42.0, 50.0, 45.0, 53.0, 42.0, 50.0, 49.0, 45.0, 42.0, 41.0, 38.0, 40.0, 33.0, 35.0, 22.0, 18.0, 17.0, 26.0, 15.0, 11.0, 11.0, 8.0, 2.0, 8.0, 8.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.52256774902344, -165.47189331054688, -159.42120361328125, -153.37051391601562, -147.31983947753906, -141.2691650390625, -135.21847534179688, -129.16778564453125, -123.11711120605469, -117.0664291381836, -111.0157470703125, -104.9650650024414, -98.91438293457031, -92.86370086669922, -86.81301879882812, -80.76233673095703, -74.71165466308594, -68.66097259521484, -62.61029052734375, -56.559608459472656, -50.50892639160156, -44.45824432373047, -38.407562255859375, -32.35688018798828, -26.306198120117188, -20.255516052246094, -14.204833984375, -8.154151916503906, -2.1034698486328125, 3.9472122192382812, 9.997894287109375, 16.04857635498047, 22.099273681640625, 28.14995574951172, 34.20063781738281, 40.251319885253906, 46.302001953125, 52.352684020996094, 58.40336608886719, 64.45404815673828, 70.50473022460938, 76.55541229248047, 82.60609436035156, 88.65677642822266, 94.70745849609375, 100.75814056396484, 106.80882263183594, 112.85950469970703, 118.91018676757812, 124.96086883544922, 131.0115509033203, 137.06222534179688, 143.1129150390625, 149.16360473632812, 155.2142791748047, 161.26495361328125, 167.31564331054688, 173.3663330078125, 179.41700744628906, 185.46768188476562, 191.51837158203125, 197.56906127929688, 203.61973571777344, 209.67041015625, 215.72109985351562]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 7.0, 11.0, 6.0, 18.0, 23.0, 29.0, 56.0, 75.0, 113.0, 158.0, 316.0, 474.0, 897.0, 1705.0, 4105.0, 12298.0, 62134.0, 3975148.0, 110311.0, 16735.0, 5137.0, 2082.0, 975.0, 528.0, 323.0, 204.0, 121.0, 80.0, 46.0, 36.0, 30.0, 26.0, 15.0, 15.0, 8.0, 8.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-61.65625, -59.822265625, -57.98828125, -56.154296875, -54.3203125, -52.486328125, -50.65234375, -48.818359375, -46.984375, -45.150390625, -43.31640625, -41.482421875, -39.6484375, -37.814453125, -35.98046875, -34.146484375, -32.3125, -30.478515625, -28.64453125, -26.810546875, -24.9765625, -23.142578125, -21.30859375, -19.474609375, -17.640625, -15.806640625, -13.97265625, -12.138671875, -10.3046875, -8.470703125, -6.63671875, -4.802734375, -2.96875, -1.134765625, 0.69921875, 2.533203125, 4.3671875, 6.201171875, 8.03515625, 9.869140625, 11.703125, 13.537109375, 15.37109375, 17.205078125, 19.0390625, 20.873046875, 22.70703125, 24.541015625, 26.375, 28.208984375, 30.04296875, 31.876953125, 33.7109375, 35.544921875, 37.37890625, 39.212890625, 41.046875, 42.880859375, 44.71484375, 46.548828125, 48.3828125, 50.216796875, 52.05078125, 53.884765625, 55.71875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 5.0, 6.0, 15.0, 10.0, 11.0, 23.0, 20.0, 19.0, 29.0, 27.0, 39.0, 47.0, 53.0, 61.0, 51.0, 56.0, 67.0, 61.0, 55.0, 55.0, 42.0, 46.0, 43.0, 34.0, 24.0, 19.0, 24.0, 14.0, 11.0, 9.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9609375, -9.616455078125, -9.27197265625, -8.927490234375, -8.5830078125, -8.238525390625, -7.89404296875, -7.549560546875, -7.205078125, -6.860595703125, -6.51611328125, -6.171630859375, -5.8271484375, -5.482666015625, -5.13818359375, -4.793701171875, -4.44921875, -4.104736328125, -3.76025390625, -3.415771484375, -3.0712890625, -2.726806640625, -2.38232421875, -2.037841796875, -1.693359375, -1.348876953125, -1.00439453125, -0.659912109375, -0.3154296875, 0.029052734375, 0.37353515625, 0.718017578125, 1.0625, 1.406982421875, 1.75146484375, 2.095947265625, 2.4404296875, 2.784912109375, 3.12939453125, 3.473876953125, 3.818359375, 4.162841796875, 4.50732421875, 4.851806640625, 5.1962890625, 5.540771484375, 5.88525390625, 6.229736328125, 6.57421875, 6.918701171875, 7.26318359375, 7.607666015625, 7.9521484375, 8.296630859375, 8.64111328125, 8.985595703125, 9.330078125, 9.674560546875, 10.01904296875, 10.363525390625, 10.7080078125, 11.052490234375, 11.39697265625, 11.741455078125, 12.0859375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 10.0, 6.0, 9.0, 15.0, 18.0, 29.0, 48.0, 50.0, 76.0, 110.0, 142.0, 224.0, 317.0, 523.0, 815.0, 1351.0, 2556.0, 5226.0, 12386.0, 36958.0, 172228.0, 3738484.0, 163419.0, 35970.0, 12142.0, 5092.0, 2525.0, 1257.0, 761.0, 507.0, 321.0, 215.0, 144.0, 93.0, 78.0, 52.0, 35.0, 31.0, 18.0, 15.0, 6.0, 7.0, 3.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.21875, -24.30126953125, -23.3837890625, -22.46630859375, -21.548828125, -20.63134765625, -19.7138671875, -18.79638671875, -17.87890625, -16.96142578125, -16.0439453125, -15.12646484375, -14.208984375, -13.29150390625, -12.3740234375, -11.45654296875, -10.5390625, -9.62158203125, -8.7041015625, -7.78662109375, -6.869140625, -5.95166015625, -5.0341796875, -4.11669921875, -3.19921875, -2.28173828125, -1.3642578125, -0.44677734375, 0.470703125, 1.38818359375, 2.3056640625, 3.22314453125, 4.140625, 5.05810546875, 5.9755859375, 6.89306640625, 7.810546875, 8.72802734375, 9.6455078125, 10.56298828125, 11.48046875, 12.39794921875, 13.3154296875, 14.23291015625, 15.150390625, 16.06787109375, 16.9853515625, 17.90283203125, 18.8203125, 19.73779296875, 20.6552734375, 21.57275390625, 22.490234375, 23.40771484375, 24.3251953125, 25.24267578125, 26.16015625, 27.07763671875, 27.9951171875, 28.91259765625, 29.830078125, 30.74755859375, 31.6650390625, 32.58251953125, 33.5]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 15.0, 11.0, 21.0, 34.0, 63.0, 108.0, 203.0, 2800.0, 440.0, 145.0, 66.0, 53.0, 30.0, 23.0, 13.0, 16.0, 7.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.859375, -7.59521484375, -7.3310546875, -7.06689453125, -6.802734375, -6.53857421875, -6.2744140625, -6.01025390625, -5.74609375, -5.48193359375, -5.2177734375, -4.95361328125, -4.689453125, -4.42529296875, -4.1611328125, -3.89697265625, -3.6328125, -3.36865234375, -3.1044921875, -2.84033203125, -2.576171875, -2.31201171875, -2.0478515625, -1.78369140625, -1.51953125, -1.25537109375, -0.9912109375, -0.72705078125, -0.462890625, -0.19873046875, 0.0654296875, 0.32958984375, 0.59375, 0.85791015625, 1.1220703125, 1.38623046875, 1.650390625, 1.91455078125, 2.1787109375, 2.44287109375, 2.70703125, 2.97119140625, 3.2353515625, 3.49951171875, 3.763671875, 4.02783203125, 4.2919921875, 4.55615234375, 4.8203125, 5.08447265625, 5.3486328125, 5.61279296875, 5.876953125, 6.14111328125, 6.4052734375, 6.66943359375, 6.93359375, 7.19775390625, 7.4619140625, 7.72607421875, 7.990234375, 8.25439453125, 8.5185546875, 8.78271484375, 9.046875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 5.0, 12.0, 13.0, 14.0, 28.0, 20.0, 45.0, 37.0, 57.0, 67.0, 74.0, 79.0, 78.0, 91.0, 74.0, 83.0, 56.0, 43.0, 34.0, 21.0, 19.0, 19.0, 15.0, 4.0, 6.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.86351776123047, -22.810800552368164, -21.75808334350586, -20.705366134643555, -19.65264892578125, -18.599933624267578, -17.547216415405273, -16.49449920654297, -15.441781997680664, -14.38906478881836, -13.336347579956055, -12.283631324768066, -11.230914115905762, -10.178196907043457, -9.125480651855469, -8.072763442993164, -7.020046234130859, -5.967329025268555, -4.914612293243408, -3.8618953227996826, -2.809178352355957, -1.7564611434936523, -0.7037444114685059, 0.3489723205566406, 1.4016895294189453, 2.454406499862671, 3.5071234703063965, 4.559840202331543, 5.612557411193848, 6.665274620056152, 7.717991352081299, 8.770708084106445, 9.82342529296875, 10.876142501831055, 11.92885971069336, 12.981575965881348, 14.034293174743652, 15.087010383605957, 16.139726638793945, 17.19244384765625, 18.245161056518555, 19.29787826538086, 20.350595474243164, 21.40331268310547, 22.45602798461914, 23.508747100830078, 24.56146240234375, 25.614179611206055, 26.66689682006836, 27.719614028930664, 28.77233123779297, 29.825048446655273, 30.877765655517578, 31.93048095703125, 32.98320007324219, 34.03591537475586, 35.08863067626953, 36.1413459777832, 37.19406509399414, 38.24678039550781, 39.29949951171875, 40.35221481323242, 41.40493392944336, 42.45764923095703, 43.51036834716797]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 1.0, 6.0, 3.0, 7.0, 8.0, 8.0, 13.0, 20.0, 17.0, 19.0, 17.0, 20.0, 18.0, 28.0, 23.0, 39.0, 28.0, 33.0, 36.0, 27.0, 35.0, 40.0, 33.0, 41.0, 41.0, 47.0, 33.0, 34.0, 36.0, 31.0, 34.0, 27.0, 35.0, 24.0, 27.0, 15.0, 17.0, 19.0, 10.0, 8.0, 7.0, 11.0, 7.0, 5.0, 1.0, 2.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0], "bins": [-20.44688606262207, -19.838655471801758, -19.230424880981445, -18.6221923828125, -18.013961791992188, -17.405731201171875, -16.797500610351562, -16.18927001953125, -15.581038475036621, -14.972807884216309, -14.36457633972168, -13.756345748901367, -13.148115158081055, -12.539883613586426, -11.931653022766113, -11.323421478271484, -10.715190887451172, -10.10696029663086, -9.49872875213623, -8.890498161315918, -8.282266616821289, -7.674036026000977, -7.065805435180664, -6.457574367523193, -5.849343299865723, -5.241112232208252, -4.632881164550781, -4.024650573730469, -3.416419506072998, -2.8081884384155273, -2.1999576091766357, -1.5917267799377441, -0.9834938049316406, -0.3752628564834595, 0.23296809196472168, 0.8411990404129028, 1.449429988861084, 2.0576610565185547, 2.6658918857574463, 3.274122714996338, 3.8823537826538086, 4.490584850311279, 5.09881591796875, 5.7070465087890625, 6.315277576446533, 6.923508644104004, 7.531739234924316, 8.139970779418945, 8.748201370239258, 9.35643196105957, 9.9646635055542, 10.572894096374512, 11.18112564086914, 11.789356231689453, 12.397586822509766, 13.005817413330078, 13.614048957824707, 14.22227954864502, 14.830511093139648, 15.438741683959961, 16.046972274780273, 16.65520477294922, 17.26343536376953, 17.871665954589844, 18.479896545410156]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 5.0, 7.0, 11.0, 11.0, 13.0, 23.0, 35.0, 33.0, 54.0, 98.0, 163.0, 226.0, 386.0, 714.0, 1307.0, 2392.0, 4898.0, 10575.0, 24868.0, 61761.0, 160364.0, 330136.0, 265697.0, 109294.0, 42368.0, 17463.0, 7788.0, 3700.0, 1773.0, 954.0, 549.0, 328.0, 171.0, 138.0, 83.0, 58.0, 45.0, 23.0, 12.0, 12.0, 9.0, 7.0, 4.0, 3.0, 3.0, 5.0], "bins": [-23.265625, -22.6810302734375, -22.096435546875, -21.5118408203125, -20.92724609375, -20.3426513671875, -19.758056640625, -19.1734619140625, -18.5888671875, -18.0042724609375, -17.419677734375, -16.8350830078125, -16.25048828125, -15.6658935546875, -15.081298828125, -14.4967041015625, -13.912109375, -13.3275146484375, -12.742919921875, -12.1583251953125, -11.57373046875, -10.9891357421875, -10.404541015625, -9.8199462890625, -9.2353515625, -8.6507568359375, -8.066162109375, -7.4815673828125, -6.89697265625, -6.3123779296875, -5.727783203125, -5.1431884765625, -4.55859375, -3.9739990234375, -3.389404296875, -2.8048095703125, -2.22021484375, -1.6356201171875, -1.051025390625, -0.4664306640625, 0.1181640625, 0.7027587890625, 1.287353515625, 1.8719482421875, 2.45654296875, 3.0411376953125, 3.625732421875, 4.2103271484375, 4.794921875, 5.3795166015625, 5.964111328125, 6.5487060546875, 7.13330078125, 7.7178955078125, 8.302490234375, 8.8870849609375, 9.4716796875, 10.0562744140625, 10.640869140625, 11.2254638671875, 11.81005859375, 12.3946533203125, 12.979248046875, 13.5638427734375, 14.1484375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 5.0, 6.0, 6.0, 13.0, 14.0, 17.0, 13.0, 18.0, 43.0, 23.0, 32.0, 40.0, 44.0, 43.0, 38.0, 49.0, 55.0, 71.0, 56.0, 53.0, 52.0, 45.0, 46.0, 49.0, 30.0, 30.0, 29.0, 17.0, 13.0, 12.0, 13.0, 4.0, 4.0, 2.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.671875, -10.3175048828125, -9.963134765625, -9.6087646484375, -9.25439453125, -8.9000244140625, -8.545654296875, -8.1912841796875, -7.8369140625, -7.4825439453125, -7.128173828125, -6.7738037109375, -6.41943359375, -6.0650634765625, -5.710693359375, -5.3563232421875, -5.001953125, -4.6475830078125, -4.293212890625, -3.9388427734375, -3.58447265625, -3.2301025390625, -2.875732421875, -2.5213623046875, -2.1669921875, -1.8126220703125, -1.458251953125, -1.1038818359375, -0.74951171875, -0.3951416015625, -0.040771484375, 0.3135986328125, 0.66796875, 1.0223388671875, 1.376708984375, 1.7310791015625, 2.08544921875, 2.4398193359375, 2.794189453125, 3.1485595703125, 3.5029296875, 3.8572998046875, 4.211669921875, 4.5660400390625, 4.92041015625, 5.2747802734375, 5.629150390625, 5.9835205078125, 6.337890625, 6.6922607421875, 7.046630859375, 7.4010009765625, 7.75537109375, 8.1097412109375, 8.464111328125, 8.8184814453125, 9.1728515625, 9.5272216796875, 9.881591796875, 10.2359619140625, 10.59033203125, 10.9447021484375, 11.299072265625, 11.6534423828125, 12.0078125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 6.0, 5.0, 7.0, 14.0, 17.0, 25.0, 38.0, 51.0, 109.0, 154.0, 286.0, 443.0, 807.0, 1514.0, 3996.0, 20550.0, 223846.0, 708073.0, 74141.0, 9319.0, 2496.0, 1097.0, 609.0, 362.0, 222.0, 130.0, 85.0, 58.0, 32.0, 19.0, 18.0, 15.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.09375, -38.77001953125, -37.4462890625, -36.12255859375, -34.798828125, -33.47509765625, -32.1513671875, -30.82763671875, -29.50390625, -28.18017578125, -26.8564453125, -25.53271484375, -24.208984375, -22.88525390625, -21.5615234375, -20.23779296875, -18.9140625, -17.59033203125, -16.2666015625, -14.94287109375, -13.619140625, -12.29541015625, -10.9716796875, -9.64794921875, -8.32421875, -7.00048828125, -5.6767578125, -4.35302734375, -3.029296875, -1.70556640625, -0.3818359375, 0.94189453125, 2.265625, 3.58935546875, 4.9130859375, 6.23681640625, 7.560546875, 8.88427734375, 10.2080078125, 11.53173828125, 12.85546875, 14.17919921875, 15.5029296875, 16.82666015625, 18.150390625, 19.47412109375, 20.7978515625, 22.12158203125, 23.4453125, 24.76904296875, 26.0927734375, 27.41650390625, 28.740234375, 30.06396484375, 31.3876953125, 32.71142578125, 34.03515625, 35.35888671875, 36.6826171875, 38.00634765625, 39.330078125, 40.65380859375, 41.9775390625, 43.30126953125, 44.625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 10.0, 15.0, 11.0, 24.0, 28.0, 36.0, 47.0, 68.0, 68.0, 81.0, 97.0, 92.0, 82.0, 74.0, 74.0, 60.0, 46.0, 39.0, 12.0, 19.0, 8.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.125, -94.6435546875, -92.162109375, -89.6806640625, -87.19921875, -84.7177734375, -82.236328125, -79.7548828125, -77.2734375, -74.7919921875, -72.310546875, -69.8291015625, -67.34765625, -64.8662109375, -62.384765625, -59.9033203125, -57.421875, -54.9404296875, -52.458984375, -49.9775390625, -47.49609375, -45.0146484375, -42.533203125, -40.0517578125, -37.5703125, -35.0888671875, -32.607421875, -30.1259765625, -27.64453125, -25.1630859375, -22.681640625, -20.2001953125, -17.71875, -15.2373046875, -12.755859375, -10.2744140625, -7.79296875, -5.3115234375, -2.830078125, -0.3486328125, 2.1328125, 4.6142578125, 7.095703125, 9.5771484375, 12.05859375, 14.5400390625, 17.021484375, 19.5029296875, 21.984375, 24.4658203125, 26.947265625, 29.4287109375, 31.91015625, 34.3916015625, 36.873046875, 39.3544921875, 41.8359375, 44.3173828125, 46.798828125, 49.2802734375, 51.76171875, 54.2431640625, 56.724609375, 59.2060546875, 61.6875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 2.0, 3.0, 4.0, 5.0, 5.0, 9.0, 9.0, 20.0, 24.0, 36.0, 33.0, 46.0, 87.0, 165.0, 320.0, 830.0, 2377.0, 10241.0, 72716.0, 685320.0, 244919.0, 24460.0, 4593.0, 1227.0, 469.0, 236.0, 130.0, 79.0, 62.0, 28.0, 20.0, 23.0, 16.0, 12.0, 8.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.90625, -14.4366455078125, -13.967041015625, -13.4974365234375, -13.02783203125, -12.5582275390625, -12.088623046875, -11.6190185546875, -11.1494140625, -10.6798095703125, -10.210205078125, -9.7406005859375, -9.27099609375, -8.8013916015625, -8.331787109375, -7.8621826171875, -7.392578125, -6.9229736328125, -6.453369140625, -5.9837646484375, -5.51416015625, -5.0445556640625, -4.574951171875, -4.1053466796875, -3.6357421875, -3.1661376953125, -2.696533203125, -2.2269287109375, -1.75732421875, -1.2877197265625, -0.818115234375, -0.3485107421875, 0.12109375, 0.5906982421875, 1.060302734375, 1.5299072265625, 1.99951171875, 2.4691162109375, 2.938720703125, 3.4083251953125, 3.8779296875, 4.3475341796875, 4.817138671875, 5.2867431640625, 5.75634765625, 6.2259521484375, 6.695556640625, 7.1651611328125, 7.634765625, 8.1043701171875, 8.573974609375, 9.0435791015625, 9.51318359375, 9.9827880859375, 10.452392578125, 10.9219970703125, 11.3916015625, 11.8612060546875, 12.330810546875, 12.8004150390625, 13.27001953125, 13.7396240234375, 14.209228515625, 14.6788330078125, 15.1484375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 1.0, 4.0, 1.0, 3.0, 7.0, 12.0, 14.0, 14.0, 23.0, 23.0, 26.0, 38.0, 49.0, 61.0, 86.0, 92.0, 97.0, 77.0, 94.0, 74.0, 52.0, 40.0, 21.0, 15.0, 27.0, 12.0, 6.0, 3.0, 7.0, 7.0, 3.0, 6.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015344619750976562, -0.001486077904701233, -0.0014376938343048096, -0.0013893097639083862, -0.0013409256935119629, -0.0012925416231155396, -0.0012441575527191162, -0.0011957734823226929, -0.0011473894119262695, -0.0010990053415298462, -0.0010506212711334229, -0.0010022372007369995, -0.0009538531303405762, -0.0009054690599441528, -0.0008570849895477295, -0.0008087009191513062, -0.0007603168487548828, -0.0007119327783584595, -0.0006635487079620361, -0.0006151646375656128, -0.0005667805671691895, -0.0005183964967727661, -0.0004700124263763428, -0.00042162835597991943, -0.0003732442855834961, -0.00032486021518707275, -0.0002764761447906494, -0.00022809207439422607, -0.00017970800399780273, -0.0001313239336013794, -8.293986320495605e-05, -3.4555792808532715e-05, 1.3828277587890625e-05, 6.221234798431396e-05, 0.0001105964183807373, 0.00015898048877716064, 0.00020736455917358398, 0.0002557486295700073, 0.00030413269996643066, 0.000352516770362854, 0.00040090084075927734, 0.0004492849111557007, 0.000497668981552124, 0.0005460530519485474, 0.0005944371223449707, 0.000642821192741394, 0.0006912052631378174, 0.0007395893335342407, 0.0007879734039306641, 0.0008363574743270874, 0.0008847415447235107, 0.0009331256151199341, 0.0009815096855163574, 0.0010298937559127808, 0.001078277826309204, 0.0011266618967056274, 0.0011750459671020508, 0.0012234300374984741, 0.0012718141078948975, 0.0013201981782913208, 0.0013685822486877441, 0.0014169663190841675, 0.0014653503894805908, 0.0015137344598770142, 0.0015621185302734375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 8.0, 12.0, 18.0, 39.0, 64.0, 96.0, 148.0, 340.0, 870.0, 2642.0, 15790.0, 292222.0, 693800.0, 35941.0, 4480.0, 1144.0, 420.0, 207.0, 125.0, 66.0, 45.0, 22.0, 17.0, 10.0, 6.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.984375, -22.365966796875, -21.74755859375, -21.129150390625, -20.5107421875, -19.892333984375, -19.27392578125, -18.655517578125, -18.037109375, -17.418701171875, -16.80029296875, -16.181884765625, -15.5634765625, -14.945068359375, -14.32666015625, -13.708251953125, -13.08984375, -12.471435546875, -11.85302734375, -11.234619140625, -10.6162109375, -9.997802734375, -9.37939453125, -8.760986328125, -8.142578125, -7.524169921875, -6.90576171875, -6.287353515625, -5.6689453125, -5.050537109375, -4.43212890625, -3.813720703125, -3.1953125, -2.576904296875, -1.95849609375, -1.340087890625, -0.7216796875, -0.103271484375, 0.51513671875, 1.133544921875, 1.751953125, 2.370361328125, 2.98876953125, 3.607177734375, 4.2255859375, 4.843994140625, 5.46240234375, 6.080810546875, 6.69921875, 7.317626953125, 7.93603515625, 8.554443359375, 9.1728515625, 9.791259765625, 10.40966796875, 11.028076171875, 11.646484375, 12.264892578125, 12.88330078125, 13.501708984375, 14.1201171875, 14.738525390625, 15.35693359375, 15.975341796875, 16.59375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 16.0, 18.0, 29.0, 62.0, 116.0, 174.0, 212.0, 161.0, 82.0, 46.0, 35.0, 18.0, 11.0, 10.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.53125, -12.74658203125, -11.9619140625, -11.17724609375, -10.392578125, -9.60791015625, -8.8232421875, -8.03857421875, -7.25390625, -6.46923828125, -5.6845703125, -4.89990234375, -4.115234375, -3.33056640625, -2.5458984375, -1.76123046875, -0.9765625, -0.19189453125, 0.5927734375, 1.37744140625, 2.162109375, 2.94677734375, 3.7314453125, 4.51611328125, 5.30078125, 6.08544921875, 6.8701171875, 7.65478515625, 8.439453125, 9.22412109375, 10.0087890625, 10.79345703125, 11.578125, 12.36279296875, 13.1474609375, 13.93212890625, 14.716796875, 15.50146484375, 16.2861328125, 17.07080078125, 17.85546875, 18.64013671875, 19.4248046875, 20.20947265625, 20.994140625, 21.77880859375, 22.5634765625, 23.34814453125, 24.1328125, 24.91748046875, 25.7021484375, 26.48681640625, 27.271484375, 28.05615234375, 28.8408203125, 29.62548828125, 30.41015625, 31.19482421875, 31.9794921875, 32.76416015625, 33.548828125, 34.33349609375, 35.1181640625, 35.90283203125, 36.6875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 4.0, 10.0, 25.0, 62.0, 113.0, 178.0, 186.0, 198.0, 104.0, 67.0, 29.0, 16.0, 5.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-238.80343627929688, -229.04330444335938, -219.28317260742188, -209.52304077148438, -199.76290893554688, -190.00277709960938, -180.24266052246094, -170.48252868652344, -160.72239685058594, -150.96226501464844, -141.20213317871094, -131.44200134277344, -121.68187713623047, -111.92174530029297, -102.16162109375, -92.4014892578125, -82.641357421875, -72.8812255859375, -63.121097564697266, -53.36096954345703, -43.60083770751953, -33.84070587158203, -24.080577850341797, -14.320449829101562, -4.5603179931640625, 5.199811935424805, 14.959941864013672, 24.72007179260254, 34.480201721191406, 44.240333557128906, 54.00046157836914, 63.760589599609375, 73.520751953125, 83.2808837890625, 93.041015625, 102.80113983154297, 112.56127166748047, 122.32140350341797, 132.08152770996094, 141.84165954589844, 151.60179138183594, 161.36192321777344, 171.12205505371094, 180.88218688964844, 190.64230346679688, 200.40243530273438, 210.16256713867188, 219.92269897460938, 229.68283081054688, 239.44296264648438, 249.20309448242188, 258.9632263183594, 268.7233581542969, 278.4834899902344, 288.2436218261719, 298.00372314453125, 307.76385498046875, 317.52398681640625, 327.28411865234375, 337.04425048828125, 346.80438232421875, 356.56451416015625, 366.32464599609375, 376.08477783203125, 385.84490966796875]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 7.0, 8.0, 7.0, 6.0, 6.0, 9.0, 14.0, 20.0, 18.0, 19.0, 16.0, 25.0, 30.0, 30.0, 35.0, 39.0, 38.0, 69.0, 42.0, 46.0, 42.0, 49.0, 42.0, 61.0, 54.0, 39.0, 30.0, 26.0, 27.0, 29.0, 21.0, 22.0, 18.0, 14.0, 13.0, 6.0, 10.0, 4.0, 1.0, 5.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.62432861328125, -136.12173461914062, -130.619140625, -125.11654663085938, -119.61395263671875, -114.11135864257812, -108.60877227783203, -103.1061782836914, -97.60358428955078, -92.10099029541016, -86.59839630126953, -81.09580993652344, -75.59321594238281, -70.09062194824219, -64.58802795410156, -59.08543395996094, -53.58283996582031, -48.08024597167969, -42.57765197753906, -37.0750617980957, -31.572467803955078, -26.069873809814453, -20.567283630371094, -15.064689636230469, -9.562095642089844, -4.059502601623535, 1.4430904388427734, 6.945682525634766, 12.44827651977539, 17.950870513916016, 23.453460693359375, 28.9560546875, 34.458648681640625, 39.96124267578125, 45.463836669921875, 50.966426849365234, 56.46902084350586, 61.971614837646484, 67.47420501708984, 72.97679901123047, 78.4793930053711, 83.98198699951172, 89.48458099365234, 94.98716735839844, 100.48976135253906, 105.99235534667969, 111.49494934082031, 116.99754333496094, 122.50013732910156, 128.0027313232422, 133.5053253173828, 139.00791931152344, 144.51051330566406, 150.0131072998047, 155.51568603515625, 161.01828002929688, 166.5208740234375, 172.02346801757812, 177.52606201171875, 183.02865600585938, 188.53125, 194.03384399414062, 199.53643798828125, 205.03903198242188, 210.5416259765625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 2.0, 14.0, 26.0, 29.0, 53.0, 47.0, 66.0, 127.0, 218.0, 303.0, 536.0, 921.0, 1679.0, 3633.0, 9746.0, 70909.0, 4076140.0, 19210.0, 5362.0, 2359.0, 1141.0, 627.0, 378.0, 244.0, 152.0, 105.0, 77.0, 44.0, 35.0, 20.0, 20.0, 19.0, 9.0, 13.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-59.28125, -57.54931640625, -55.8173828125, -54.08544921875, -52.353515625, -50.62158203125, -48.8896484375, -47.15771484375, -45.42578125, -43.69384765625, -41.9619140625, -40.22998046875, -38.498046875, -36.76611328125, -35.0341796875, -33.30224609375, -31.5703125, -29.83837890625, -28.1064453125, -26.37451171875, -24.642578125, -22.91064453125, -21.1787109375, -19.44677734375, -17.71484375, -15.98291015625, -14.2509765625, -12.51904296875, -10.787109375, -9.05517578125, -7.3232421875, -5.59130859375, -3.859375, -2.12744140625, -0.3955078125, 1.33642578125, 3.068359375, 4.80029296875, 6.5322265625, 8.26416015625, 9.99609375, 11.72802734375, 13.4599609375, 15.19189453125, 16.923828125, 18.65576171875, 20.3876953125, 22.11962890625, 23.8515625, 25.58349609375, 27.3154296875, 29.04736328125, 30.779296875, 32.51123046875, 34.2431640625, 35.97509765625, 37.70703125, 39.43896484375, 41.1708984375, 42.90283203125, 44.634765625, 46.36669921875, 48.0986328125, 49.83056640625, 51.5625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 8.0, 6.0, 6.0, 8.0, 11.0, 13.0, 24.0, 18.0, 25.0, 22.0, 32.0, 36.0, 58.0, 46.0, 48.0, 62.0, 69.0, 57.0, 66.0, 54.0, 45.0, 51.0, 46.0, 38.0, 28.0, 32.0, 25.0, 20.0, 14.0, 9.0, 12.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.859375, -11.4774169921875, -11.095458984375, -10.7135009765625, -10.33154296875, -9.9495849609375, -9.567626953125, -9.1856689453125, -8.8037109375, -8.4217529296875, -8.039794921875, -7.6578369140625, -7.27587890625, -6.8939208984375, -6.511962890625, -6.1300048828125, -5.748046875, -5.3660888671875, -4.984130859375, -4.6021728515625, -4.22021484375, -3.8382568359375, -3.456298828125, -3.0743408203125, -2.6923828125, -2.3104248046875, -1.928466796875, -1.5465087890625, -1.16455078125, -0.7825927734375, -0.400634765625, -0.0186767578125, 0.36328125, 0.7452392578125, 1.127197265625, 1.5091552734375, 1.89111328125, 2.2730712890625, 2.655029296875, 3.0369873046875, 3.4189453125, 3.8009033203125, 4.182861328125, 4.5648193359375, 4.94677734375, 5.3287353515625, 5.710693359375, 6.0926513671875, 6.474609375, 6.8565673828125, 7.238525390625, 7.6204833984375, 8.00244140625, 8.3843994140625, 8.766357421875, 9.1483154296875, 9.5302734375, 9.9122314453125, 10.294189453125, 10.6761474609375, 11.05810546875, 11.4400634765625, 11.822021484375, 12.2039794921875, 12.5859375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 6.0, 8.0, 15.0, 11.0, 26.0, 52.0, 42.0, 104.0, 135.0, 170.0, 258.0, 414.0, 679.0, 1214.0, 2261.0, 4717.0, 11633.0, 54635.0, 4044434.0, 52344.0, 11318.0, 4549.0, 2177.0, 1162.0, 696.0, 424.0, 248.0, 175.0, 103.0, 95.0, 68.0, 39.0, 24.0, 18.0, 17.0, 11.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.25, -38.0419921875, -36.833984375, -35.6259765625, -34.41796875, -33.2099609375, -32.001953125, -30.7939453125, -29.5859375, -28.3779296875, -27.169921875, -25.9619140625, -24.75390625, -23.5458984375, -22.337890625, -21.1298828125, -19.921875, -18.7138671875, -17.505859375, -16.2978515625, -15.08984375, -13.8818359375, -12.673828125, -11.4658203125, -10.2578125, -9.0498046875, -7.841796875, -6.6337890625, -5.42578125, -4.2177734375, -3.009765625, -1.8017578125, -0.59375, 0.6142578125, 1.822265625, 3.0302734375, 4.23828125, 5.4462890625, 6.654296875, 7.8623046875, 9.0703125, 10.2783203125, 11.486328125, 12.6943359375, 13.90234375, 15.1103515625, 16.318359375, 17.5263671875, 18.734375, 19.9423828125, 21.150390625, 22.3583984375, 23.56640625, 24.7744140625, 25.982421875, 27.1904296875, 28.3984375, 29.6064453125, 30.814453125, 32.0224609375, 33.23046875, 34.4384765625, 35.646484375, 36.8544921875, 38.0625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 1.0, 3.0, 11.0, 10.0, 10.0, 19.0, 34.0, 50.0, 169.0, 3543.0, 112.0, 38.0, 21.0, 14.0, 8.0, 4.0, 2.0, 4.0, 4.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3671875, -7.1163330078125, -6.865478515625, -6.6146240234375, -6.36376953125, -6.1129150390625, -5.862060546875, -5.6112060546875, -5.3603515625, -5.1094970703125, -4.858642578125, -4.6077880859375, -4.35693359375, -4.1060791015625, -3.855224609375, -3.6043701171875, -3.353515625, -3.1026611328125, -2.851806640625, -2.6009521484375, -2.35009765625, -2.0992431640625, -1.848388671875, -1.5975341796875, -1.3466796875, -1.0958251953125, -0.844970703125, -0.5941162109375, -0.34326171875, -0.0924072265625, 0.158447265625, 0.4093017578125, 0.66015625, 0.9110107421875, 1.161865234375, 1.4127197265625, 1.66357421875, 1.9144287109375, 2.165283203125, 2.4161376953125, 2.6669921875, 2.9178466796875, 3.168701171875, 3.4195556640625, 3.67041015625, 3.9212646484375, 4.172119140625, 4.4229736328125, 4.673828125, 4.9246826171875, 5.175537109375, 5.4263916015625, 5.67724609375, 5.9281005859375, 6.178955078125, 6.4298095703125, 6.6806640625, 6.9315185546875, 7.182373046875, 7.4332275390625, 7.68408203125, 7.9349365234375, 8.185791015625, 8.4366455078125, 8.6875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 7.0, 9.0, 7.0, 21.0, 32.0, 52.0, 76.0, 99.0, 165.0, 156.0, 145.0, 80.0, 56.0, 48.0, 21.0, 10.0, 8.0, 4.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.23912811279297, -28.971227645874023, -27.703327178955078, -26.435426712036133, -25.167526245117188, -23.89962387084961, -22.631723403930664, -21.36382293701172, -20.095922470092773, -18.828022003173828, -17.560121536254883, -16.292221069335938, -15.024319648742676, -13.75641918182373, -12.488517761230469, -11.220617294311523, -9.952716827392578, -8.684816360473633, -7.416915416717529, -6.149014472961426, -4.8811140060424805, -3.613213539123535, -2.3453125953674316, -1.0774116516113281, 0.1904888153076172, 1.4583895206451416, 2.726290225982666, 3.9941909313201904, 5.262091636657715, 6.52999210357666, 7.797893047332764, 9.065793991088867, 10.333694458007812, 11.601594924926758, 12.869495391845703, 14.137396812438965, 15.40529727935791, 16.673198699951172, 17.941099166870117, 19.208999633789062, 20.476900100708008, 21.744800567626953, 23.0127010345459, 24.280601501464844, 25.548503875732422, 26.816402435302734, 28.084304809570312, 29.352205276489258, 30.620105743408203, 31.88800621032715, 33.155906677246094, 34.42380905151367, 35.691707611083984, 36.95960998535156, 38.227508544921875, 39.49541091918945, 40.76331329345703, 42.03121566772461, 43.29911422729492, 44.5670166015625, 45.83491516113281, 47.10281753540039, 48.3707160949707, 49.63861846923828, 50.906517028808594]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 12.0, 5.0, 9.0, 12.0, 11.0, 24.0, 30.0, 36.0, 24.0, 44.0, 34.0, 48.0, 51.0, 34.0, 55.0, 45.0, 49.0, 48.0, 48.0, 44.0, 56.0, 40.0, 34.0, 37.0, 38.0, 27.0, 19.0, 17.0, 21.0, 15.0, 8.0, 5.0, 5.0, 6.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.48516845703125, -16.885601043701172, -16.286035537719727, -15.686468124389648, -15.086901664733887, -14.487335205078125, -13.887767791748047, -13.288201332092285, -12.688634872436523, -12.089068412780762, -11.489500999450684, -10.889934539794922, -10.29036808013916, -9.690801620483398, -9.09123420715332, -8.491667747497559, -7.8921003341674805, -7.2925333976745605, -6.692966938018799, -6.093400001525879, -5.493833541870117, -4.894266605377197, -4.294699668884277, -3.6951332092285156, -3.0955662727355957, -2.495999574661255, -1.8964327573776245, -1.2968659400939941, -0.6972992420196533, -0.0977325439453125, 0.5018343925476074, 1.1014008522033691, 1.700967788696289, 2.30053448677063, 2.9001011848449707, 3.4996681213378906, 4.099234580993652, 4.698801517486572, 5.298368453979492, 5.897934913635254, 6.497501850128174, 7.097068786621094, 7.6966352462768555, 8.296201705932617, 8.895769119262695, 9.495335578918457, 10.094902038574219, 10.694469451904297, 11.294035911560059, 11.89360237121582, 12.493169784545898, 13.09273624420166, 13.692302703857422, 14.2918701171875, 14.891436576843262, 15.491003036499023, 16.0905704498291, 16.69013786315918, 17.289703369140625, 17.889270782470703, 18.48883819580078, 19.088403701782227, 19.687971115112305, 20.28753662109375, 20.887104034423828]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 14.0, 13.0, 24.0, 22.0, 35.0, 50.0, 69.0, 98.0, 165.0, 271.0, 370.0, 609.0, 992.0, 1791.0, 3120.0, 5748.0, 10670.0, 21807.0, 44177.0, 91865.0, 181555.0, 271511.0, 203803.0, 106014.0, 51348.0, 24798.0, 12461.0, 6518.0, 3571.0, 1976.0, 1129.0, 670.0, 427.0, 283.0, 193.0, 122.0, 87.0, 41.0, 32.0, 27.0, 20.0, 18.0, 9.0, 10.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 2.0], "bins": [-13.5078125, -13.117431640625, -12.72705078125, -12.336669921875, -11.9462890625, -11.555908203125, -11.16552734375, -10.775146484375, -10.384765625, -9.994384765625, -9.60400390625, -9.213623046875, -8.8232421875, -8.432861328125, -8.04248046875, -7.652099609375, -7.26171875, -6.871337890625, -6.48095703125, -6.090576171875, -5.7001953125, -5.309814453125, -4.91943359375, -4.529052734375, -4.138671875, -3.748291015625, -3.35791015625, -2.967529296875, -2.5771484375, -2.186767578125, -1.79638671875, -1.406005859375, -1.015625, -0.625244140625, -0.23486328125, 0.155517578125, 0.5458984375, 0.936279296875, 1.32666015625, 1.717041015625, 2.107421875, 2.497802734375, 2.88818359375, 3.278564453125, 3.6689453125, 4.059326171875, 4.44970703125, 4.840087890625, 5.23046875, 5.620849609375, 6.01123046875, 6.401611328125, 6.7919921875, 7.182373046875, 7.57275390625, 7.963134765625, 8.353515625, 8.743896484375, 9.13427734375, 9.524658203125, 9.9150390625, 10.305419921875, 10.69580078125, 11.086181640625, 11.4765625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 7.0, 5.0, 11.0, 12.0, 14.0, 12.0, 25.0, 32.0, 23.0, 37.0, 40.0, 29.0, 55.0, 57.0, 65.0, 69.0, 59.0, 61.0, 59.0, 46.0, 53.0, 50.0, 28.0, 40.0, 31.0, 18.0, 13.0, 11.0, 18.0, 7.0, 2.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.6640625, -12.268310546875, -11.87255859375, -11.476806640625, -11.0810546875, -10.685302734375, -10.28955078125, -9.893798828125, -9.498046875, -9.102294921875, -8.70654296875, -8.310791015625, -7.9150390625, -7.519287109375, -7.12353515625, -6.727783203125, -6.33203125, -5.936279296875, -5.54052734375, -5.144775390625, -4.7490234375, -4.353271484375, -3.95751953125, -3.561767578125, -3.166015625, -2.770263671875, -2.37451171875, -1.978759765625, -1.5830078125, -1.187255859375, -0.79150390625, -0.395751953125, 0.0, 0.395751953125, 0.79150390625, 1.187255859375, 1.5830078125, 1.978759765625, 2.37451171875, 2.770263671875, 3.166015625, 3.561767578125, 3.95751953125, 4.353271484375, 4.7490234375, 5.144775390625, 5.54052734375, 5.936279296875, 6.33203125, 6.727783203125, 7.12353515625, 7.519287109375, 7.9150390625, 8.310791015625, 8.70654296875, 9.102294921875, 9.498046875, 9.893798828125, 10.28955078125, 10.685302734375, 11.0810546875, 11.476806640625, 11.87255859375, 12.268310546875, 12.6640625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 9.0, 16.0, 22.0, 22.0, 31.0, 48.0, 68.0, 110.0, 122.0, 163.0, 213.0, 293.0, 414.0, 591.0, 893.0, 1678.0, 4011.0, 16330.0, 101031.0, 630230.0, 245837.0, 33594.0, 6824.0, 2324.0, 1179.0, 727.0, 509.0, 328.0, 242.0, 203.0, 122.0, 97.0, 64.0, 56.0, 29.0, 48.0, 21.0, 15.0, 13.0, 9.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-27.0, -26.120849609375, -25.24169921875, -24.362548828125, -23.4833984375, -22.604248046875, -21.72509765625, -20.845947265625, -19.966796875, -19.087646484375, -18.20849609375, -17.329345703125, -16.4501953125, -15.571044921875, -14.69189453125, -13.812744140625, -12.93359375, -12.054443359375, -11.17529296875, -10.296142578125, -9.4169921875, -8.537841796875, -7.65869140625, -6.779541015625, -5.900390625, -5.021240234375, -4.14208984375, -3.262939453125, -2.3837890625, -1.504638671875, -0.62548828125, 0.253662109375, 1.1328125, 2.011962890625, 2.89111328125, 3.770263671875, 4.6494140625, 5.528564453125, 6.40771484375, 7.286865234375, 8.166015625, 9.045166015625, 9.92431640625, 10.803466796875, 11.6826171875, 12.561767578125, 13.44091796875, 14.320068359375, 15.19921875, 16.078369140625, 16.95751953125, 17.836669921875, 18.7158203125, 19.594970703125, 20.47412109375, 21.353271484375, 22.232421875, 23.111572265625, 23.99072265625, 24.869873046875, 25.7490234375, 26.628173828125, 27.50732421875, 28.386474609375, 29.265625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 11.0, 6.0, 8.0, 11.0, 15.0, 23.0, 18.0, 24.0, 44.0, 32.0, 38.0, 40.0, 50.0, 46.0, 43.0, 55.0, 60.0, 51.0, 50.0, 47.0, 46.0, 41.0, 34.0, 29.0, 30.0, 27.0, 22.0, 20.0, 17.0, 16.0, 9.0, 8.0, 8.0, 5.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-53.03125, -51.62548828125, -50.2197265625, -48.81396484375, -47.408203125, -46.00244140625, -44.5966796875, -43.19091796875, -41.78515625, -40.37939453125, -38.9736328125, -37.56787109375, -36.162109375, -34.75634765625, -33.3505859375, -31.94482421875, -30.5390625, -29.13330078125, -27.7275390625, -26.32177734375, -24.916015625, -23.51025390625, -22.1044921875, -20.69873046875, -19.29296875, -17.88720703125, -16.4814453125, -15.07568359375, -13.669921875, -12.26416015625, -10.8583984375, -9.45263671875, -8.046875, -6.64111328125, -5.2353515625, -3.82958984375, -2.423828125, -1.01806640625, 0.3876953125, 1.79345703125, 3.19921875, 4.60498046875, 6.0107421875, 7.41650390625, 8.822265625, 10.22802734375, 11.6337890625, 13.03955078125, 14.4453125, 15.85107421875, 17.2568359375, 18.66259765625, 20.068359375, 21.47412109375, 22.8798828125, 24.28564453125, 25.69140625, 27.09716796875, 28.5029296875, 29.90869140625, 31.314453125, 32.72021484375, 34.1259765625, 35.53173828125, 36.9375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 3.0, 8.0, 9.0, 10.0, 13.0, 15.0, 23.0, 32.0, 48.0, 54.0, 80.0, 168.0, 350.0, 797.0, 2456.0, 10813.0, 120345.0, 844161.0, 58879.0, 7101.0, 1822.0, 648.0, 317.0, 161.0, 80.0, 53.0, 26.0, 23.0, 12.0, 11.0, 12.0, 10.0, 3.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.84375, -17.275146484375, -16.70654296875, -16.137939453125, -15.5693359375, -15.000732421875, -14.43212890625, -13.863525390625, -13.294921875, -12.726318359375, -12.15771484375, -11.589111328125, -11.0205078125, -10.451904296875, -9.88330078125, -9.314697265625, -8.74609375, -8.177490234375, -7.60888671875, -7.040283203125, -6.4716796875, -5.903076171875, -5.33447265625, -4.765869140625, -4.197265625, -3.628662109375, -3.06005859375, -2.491455078125, -1.9228515625, -1.354248046875, -0.78564453125, -0.217041015625, 0.3515625, 0.920166015625, 1.48876953125, 2.057373046875, 2.6259765625, 3.194580078125, 3.76318359375, 4.331787109375, 4.900390625, 5.468994140625, 6.03759765625, 6.606201171875, 7.1748046875, 7.743408203125, 8.31201171875, 8.880615234375, 9.44921875, 10.017822265625, 10.58642578125, 11.155029296875, 11.7236328125, 12.292236328125, 12.86083984375, 13.429443359375, 13.998046875, 14.566650390625, 15.13525390625, 15.703857421875, 16.2724609375, 16.841064453125, 17.40966796875, 17.978271484375, 18.546875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 2.0, 3.0, 4.0, 3.0, 4.0, 6.0, 11.0, 11.0, 21.0, 25.0, 30.0, 64.0, 81.0, 104.0, 127.0, 141.0, 104.0, 82.0, 46.0, 35.0, 32.0, 23.0, 10.0, 5.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015468597412109375, -0.001484990119934082, -0.0014231204986572266, -0.001361250877380371, -0.0012993812561035156, -0.0012375116348266602, -0.0011756420135498047, -0.0011137723922729492, -0.0010519027709960938, -0.0009900331497192383, -0.0009281635284423828, -0.0008662939071655273, -0.0008044242858886719, -0.0007425546646118164, -0.0006806850433349609, -0.0006188154220581055, -0.00055694580078125, -0.0004950761795043945, -0.00043320655822753906, -0.0003713369369506836, -0.0003094673156738281, -0.00024759769439697266, -0.0001857280731201172, -0.00012385845184326172, -6.198883056640625e-05, -1.1920928955078125e-07, 6.175041198730469e-05, 0.00012362003326416016, 0.00018548965454101562, 0.0002473592758178711, 0.00030922889709472656, 0.00037109851837158203, 0.0004329681396484375, 0.000494837760925293, 0.0005567073822021484, 0.0006185770034790039, 0.0006804466247558594, 0.0007423162460327148, 0.0008041858673095703, 0.0008660554885864258, 0.0009279251098632812, 0.0009897947311401367, 0.0010516643524169922, 0.0011135339736938477, 0.0011754035949707031, 0.0012372732162475586, 0.001299142837524414, 0.0013610124588012695, 0.001422882080078125, 0.0014847517013549805, 0.001546621322631836, 0.0016084909439086914, 0.0016703605651855469, 0.0017322301864624023, 0.0017940998077392578, 0.0018559694290161133, 0.0019178390502929688, 0.0019797086715698242, 0.0020415782928466797, 0.002103447914123535, 0.0021653175354003906, 0.002227187156677246, 0.0022890567779541016, 0.002350926399230957, 0.0024127960205078125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 8.0, 16.0, 24.0, 27.0, 69.0, 81.0, 123.0, 245.0, 426.0, 873.0, 2245.0, 7613.0, 40742.0, 548306.0, 404706.0, 32699.0, 6515.0, 2045.0, 803.0, 373.0, 208.0, 151.0, 86.0, 64.0, 37.0, 19.0, 12.0, 10.0, 3.0, 8.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.734375, -9.246337890625, -8.75830078125, -8.270263671875, -7.7822265625, -7.294189453125, -6.80615234375, -6.318115234375, -5.830078125, -5.342041015625, -4.85400390625, -4.365966796875, -3.8779296875, -3.389892578125, -2.90185546875, -2.413818359375, -1.92578125, -1.437744140625, -0.94970703125, -0.461669921875, 0.0263671875, 0.514404296875, 1.00244140625, 1.490478515625, 1.978515625, 2.466552734375, 2.95458984375, 3.442626953125, 3.9306640625, 4.418701171875, 4.90673828125, 5.394775390625, 5.8828125, 6.370849609375, 6.85888671875, 7.346923828125, 7.8349609375, 8.322998046875, 8.81103515625, 9.299072265625, 9.787109375, 10.275146484375, 10.76318359375, 11.251220703125, 11.7392578125, 12.227294921875, 12.71533203125, 13.203369140625, 13.69140625, 14.179443359375, 14.66748046875, 15.155517578125, 15.6435546875, 16.131591796875, 16.61962890625, 17.107666015625, 17.595703125, 18.083740234375, 18.57177734375, 19.059814453125, 19.5478515625, 20.035888671875, 20.52392578125, 21.011962890625, 21.5]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 11.0, 12.0, 9.0, 14.0, 26.0, 30.0, 40.0, 61.0, 116.0, 142.0, 163.0, 131.0, 76.0, 50.0, 44.0, 25.0, 11.0, 14.0, 8.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.453125, -10.8818359375, -10.310546875, -9.7392578125, -9.16796875, -8.5966796875, -8.025390625, -7.4541015625, -6.8828125, -6.3115234375, -5.740234375, -5.1689453125, -4.59765625, -4.0263671875, -3.455078125, -2.8837890625, -2.3125, -1.7412109375, -1.169921875, -0.5986328125, -0.02734375, 0.5439453125, 1.115234375, 1.6865234375, 2.2578125, 2.8291015625, 3.400390625, 3.9716796875, 4.54296875, 5.1142578125, 5.685546875, 6.2568359375, 6.828125, 7.3994140625, 7.970703125, 8.5419921875, 9.11328125, 9.6845703125, 10.255859375, 10.8271484375, 11.3984375, 11.9697265625, 12.541015625, 13.1123046875, 13.68359375, 14.2548828125, 14.826171875, 15.3974609375, 15.96875, 16.5400390625, 17.111328125, 17.6826171875, 18.25390625, 18.8251953125, 19.396484375, 19.9677734375, 20.5390625, 21.1103515625, 21.681640625, 22.2529296875, 22.82421875, 23.3955078125, 23.966796875, 24.5380859375, 25.109375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 12.0, 21.0, 37.0, 94.0, 211.0, 248.0, 191.0, 113.0, 44.0, 16.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-439.4387512207031, -428.66754150390625, -417.89630126953125, -407.1250915527344, -396.3538818359375, -385.5826416015625, -374.8114318847656, -364.04022216796875, -353.26898193359375, -342.4977722167969, -331.7265319824219, -320.955322265625, -310.18408203125, -299.4128723144531, -288.64166259765625, -277.87042236328125, -267.0992126464844, -256.3280029296875, -245.5567626953125, -234.78555297851562, -224.0143280029297, -213.24310302734375, -202.47189331054688, -191.70066833496094, -180.929443359375, -170.15821838378906, -159.38699340820312, -148.61578369140625, -137.8445587158203, -127.07333374023438, -116.30211639404297, -105.53089904785156, -94.7596435546875, -83.98841857910156, -73.21720123291016, -62.445980072021484, -51.67475891113281, -40.90353775024414, -30.13231658935547, -19.361099243164062, -8.589874267578125, 2.181346893310547, 12.952568054199219, 23.72378921508789, 34.49501037597656, 45.266231536865234, 56.037452697753906, 66.80867004394531, 77.57989501953125, 88.35111999511719, 99.1223373413086, 109.8935546875, 120.66477966308594, 131.43600463867188, 142.20721435546875, 152.9784393310547, 163.74966430664062, 174.52088928222656, 185.2921142578125, 196.06332397460938, 206.8345489501953, 217.60577392578125, 228.37698364257812, 239.14820861816406, 249.91943359375]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 9.0, 5.0, 8.0, 10.0, 11.0, 19.0, 20.0, 20.0, 28.0, 20.0, 31.0, 48.0, 41.0, 45.0, 56.0, 53.0, 51.0, 61.0, 50.0, 43.0, 56.0, 37.0, 43.0, 48.0, 38.0, 32.0, 23.0, 19.0, 10.0, 16.0, 9.0, 10.0, 11.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.14907836914062, -163.138427734375, -157.12777709960938, -151.11712646484375, -145.10647583007812, -139.0958251953125, -133.08517456054688, -127.07450866699219, -121.06385803222656, -115.05320739746094, -109.04255676269531, -103.03190612792969, -97.02124786376953, -91.0105972290039, -84.99994659423828, -78.98928833007812, -72.97864532470703, -66.9679946899414, -60.957340240478516, -54.94668960571289, -48.93603515625, -42.925384521484375, -36.91473388671875, -30.90407943725586, -24.893428802490234, -18.882776260375977, -12.872124671936035, -6.861473083496094, -0.8508205413818359, 5.159832000732422, 11.170482635498047, 17.181137084960938, 23.191787719726562, 29.20244026184082, 35.21309280395508, 41.2237434387207, 47.234397888183594, 53.24504852294922, 59.255699157714844, 65.266357421875, 71.27700805664062, 77.28765869140625, 83.29830932617188, 89.3089599609375, 95.31961822509766, 101.33026885986328, 107.3409194946289, 113.35157775878906, 119.36222076416016, 125.37287139892578, 131.38352966308594, 137.39418029785156, 143.4048309326172, 149.4154815673828, 155.42613220214844, 161.43678283691406, 167.4474334716797, 173.4580841064453, 179.46873474121094, 185.47938537597656, 191.4900360107422, 197.50070190429688, 203.5113525390625, 209.52200317382812, 215.53265380859375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 8.0, 20.0, 13.0, 21.0, 35.0, 44.0, 71.0, 143.0, 194.0, 419.0, 885.0, 1903.0, 5232.0, 20951.0, 360612.0, 3768590.0, 25309.0, 5836.0, 1995.0, 898.0, 471.0, 245.0, 116.0, 85.0, 52.0, 36.0, 28.0, 16.0, 17.0, 10.0, 11.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.28125, -34.888671875, -33.49609375, -32.103515625, -30.7109375, -29.318359375, -27.92578125, -26.533203125, -25.140625, -23.748046875, -22.35546875, -20.962890625, -19.5703125, -18.177734375, -16.78515625, -15.392578125, -14.0, -12.607421875, -11.21484375, -9.822265625, -8.4296875, -7.037109375, -5.64453125, -4.251953125, -2.859375, -1.466796875, -0.07421875, 1.318359375, 2.7109375, 4.103515625, 5.49609375, 6.888671875, 8.28125, 9.673828125, 11.06640625, 12.458984375, 13.8515625, 15.244140625, 16.63671875, 18.029296875, 19.421875, 20.814453125, 22.20703125, 23.599609375, 24.9921875, 26.384765625, 27.77734375, 29.169921875, 30.5625, 31.955078125, 33.34765625, 34.740234375, 36.1328125, 37.525390625, 38.91796875, 40.310546875, 41.703125, 43.095703125, 44.48828125, 45.880859375, 47.2734375, 48.666015625, 50.05859375, 51.451171875, 52.84375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 5.0, 12.0, 8.0, 9.0, 18.0, 33.0, 47.0, 65.0, 80.0, 94.0, 92.0, 88.0, 96.0, 94.0, 82.0, 52.0, 43.0, 24.0, 24.0, 10.0, 6.0, 9.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.9375, -21.33203125, -20.7265625, -20.12109375, -19.515625, -18.91015625, -18.3046875, -17.69921875, -17.09375, -16.48828125, -15.8828125, -15.27734375, -14.671875, -14.06640625, -13.4609375, -12.85546875, -12.25, -11.64453125, -11.0390625, -10.43359375, -9.828125, -9.22265625, -8.6171875, -8.01171875, -7.40625, -6.80078125, -6.1953125, -5.58984375, -4.984375, -4.37890625, -3.7734375, -3.16796875, -2.5625, -1.95703125, -1.3515625, -0.74609375, -0.140625, 0.46484375, 1.0703125, 1.67578125, 2.28125, 2.88671875, 3.4921875, 4.09765625, 4.703125, 5.30859375, 5.9140625, 6.51953125, 7.125, 7.73046875, 8.3359375, 8.94140625, 9.546875, 10.15234375, 10.7578125, 11.36328125, 11.96875, 12.57421875, 13.1796875, 13.78515625, 14.390625, 14.99609375, 15.6015625, 16.20703125, 16.8125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 10.0, 8.0, 3.0, 7.0, 15.0, 17.0, 23.0, 42.0, 52.0, 70.0, 158.0, 240.0, 388.0, 725.0, 1497.0, 3144.0, 8743.0, 38268.0, 3855783.0, 251240.0, 22400.0, 6307.0, 2453.0, 1164.0, 603.0, 325.0, 195.0, 129.0, 86.0, 42.0, 34.0, 36.0, 24.0, 19.0, 9.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-41.875, -40.7685546875, -39.662109375, -38.5556640625, -37.44921875, -36.3427734375, -35.236328125, -34.1298828125, -33.0234375, -31.9169921875, -30.810546875, -29.7041015625, -28.59765625, -27.4912109375, -26.384765625, -25.2783203125, -24.171875, -23.0654296875, -21.958984375, -20.8525390625, -19.74609375, -18.6396484375, -17.533203125, -16.4267578125, -15.3203125, -14.2138671875, -13.107421875, -12.0009765625, -10.89453125, -9.7880859375, -8.681640625, -7.5751953125, -6.46875, -5.3623046875, -4.255859375, -3.1494140625, -2.04296875, -0.9365234375, 0.169921875, 1.2763671875, 2.3828125, 3.4892578125, 4.595703125, 5.7021484375, 6.80859375, 7.9150390625, 9.021484375, 10.1279296875, 11.234375, 12.3408203125, 13.447265625, 14.5537109375, 15.66015625, 16.7666015625, 17.873046875, 18.9794921875, 20.0859375, 21.1923828125, 22.298828125, 23.4052734375, 24.51171875, 25.6181640625, 26.724609375, 27.8310546875, 28.9375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 11.0, 11.0, 13.0, 16.0, 23.0, 37.0, 71.0, 126.0, 646.0, 2746.0, 152.0, 59.0, 38.0, 33.0, 21.0, 9.0, 11.0, 4.0, 8.0, 4.0, 2.0, 6.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0], "bins": [-12.3671875, -12.06622314453125, -11.7652587890625, -11.46429443359375, -11.163330078125, -10.86236572265625, -10.5614013671875, -10.26043701171875, -9.95947265625, -9.65850830078125, -9.3575439453125, -9.05657958984375, -8.755615234375, -8.45465087890625, -8.1536865234375, -7.85272216796875, -7.5517578125, -7.25079345703125, -6.9498291015625, -6.64886474609375, -6.347900390625, -6.04693603515625, -5.7459716796875, -5.44500732421875, -5.14404296875, -4.84307861328125, -4.5421142578125, -4.24114990234375, -3.940185546875, -3.63922119140625, -3.3382568359375, -3.03729248046875, -2.736328125, -2.43536376953125, -2.1343994140625, -1.83343505859375, -1.532470703125, -1.23150634765625, -0.9305419921875, -0.62957763671875, -0.32861328125, -0.02764892578125, 0.2733154296875, 0.57427978515625, 0.875244140625, 1.17620849609375, 1.4771728515625, 1.77813720703125, 2.0791015625, 2.38006591796875, 2.6810302734375, 2.98199462890625, 3.282958984375, 3.58392333984375, 3.8848876953125, 4.18585205078125, 4.48681640625, 4.78778076171875, 5.0887451171875, 5.38970947265625, 5.690673828125, 5.99163818359375, 6.2926025390625, 6.59356689453125, 6.89453125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 6.0, 17.0, 32.0, 59.0, 74.0, 131.0, 154.0, 161.0, 141.0, 95.0, 62.0, 29.0, 13.0, 9.0, 7.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.1380844116211, -75.88655853271484, -73.63502502441406, -71.38349914550781, -69.13196563720703, -66.88043975830078, -64.62890625, -62.37738037109375, -60.125850677490234, -57.87432098388672, -55.6227912902832, -53.37126159667969, -51.11973571777344, -48.868202209472656, -46.616676330566406, -44.36514663696289, -42.113616943359375, -39.86208724975586, -37.610557556152344, -35.35902786254883, -33.10749816894531, -30.85597038269043, -28.604442596435547, -26.35291290283203, -24.101383209228516, -21.849853515625, -19.598323822021484, -17.3467960357666, -15.095266342163086, -12.84373664855957, -10.592207908630371, -8.340679168701172, -6.0891571044921875, -3.83762788772583, -1.5860986709594727, 0.6654305458068848, 2.916959762573242, 5.168489456176758, 7.420018196105957, 9.671546936035156, 11.923076629638672, 14.174606323242188, 16.426136016845703, 18.677663803100586, 20.9291934967041, 23.180723190307617, 25.4322509765625, 27.683780670166016, 29.93531036376953, 32.18684005737305, 34.43836975097656, 36.68989944458008, 38.941429138183594, 41.192955017089844, 43.44448471069336, 45.696014404296875, 47.94754409790039, 50.199073791503906, 52.45060348510742, 54.70213317871094, 56.95365905761719, 59.20519256591797, 61.45671844482422, 63.708248138427734, 65.95977783203125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 6.0, 7.0, 6.0, 8.0, 6.0, 12.0, 19.0, 13.0, 21.0, 24.0, 28.0, 33.0, 35.0, 52.0, 34.0, 36.0, 49.0, 31.0, 45.0, 46.0, 46.0, 36.0, 40.0, 38.0, 37.0, 43.0, 24.0, 32.0, 35.0, 32.0, 18.0, 15.0, 19.0, 23.0, 8.0, 6.0, 9.0, 6.0, 5.0, 2.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-24.679134368896484, -23.871896743774414, -23.06465721130371, -22.25741958618164, -21.450180053710938, -20.642942428588867, -19.835704803466797, -19.028465270996094, -18.221227645874023, -17.413990020751953, -16.60675048828125, -15.79951286315918, -14.992274284362793, -14.185035705566406, -13.37779712677002, -12.570558547973633, -11.763319969177246, -10.95608139038086, -10.148842811584473, -9.341604232788086, -8.534366607666016, -7.727128028869629, -6.919889450073242, -6.112651348114014, -5.305412769317627, -4.49817419052124, -3.6909360885620117, -2.883697509765625, -2.0764591693878174, -1.2692208290100098, -0.46198225021362305, 0.34525585174560547, 1.1524944305419922, 1.9597327709197998, 2.7669711112976074, 3.574209690093994, 4.381447792053223, 5.188686370849609, 5.995924949645996, 6.803163051605225, 7.610401630401611, 8.41763973236084, 9.224878311157227, 10.032116889953613, 10.83935546875, 11.64659309387207, 12.453832626342773, 13.261070251464844, 14.06830883026123, 14.875547409057617, 15.682785987854004, 16.49002456665039, 17.29726219177246, 18.10449981689453, 18.911739349365234, 19.718976974487305, 20.526216506958008, 21.333454132080078, 22.14069366455078, 22.94793128967285, 23.755170822143555, 24.562408447265625, 25.369647979736328, 26.1768856048584, 26.98412322998047]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 4.0, 6.0, 11.0, 15.0, 12.0, 10.0, 22.0, 45.0, 52.0, 76.0, 103.0, 173.0, 262.0, 445.0, 811.0, 1405.0, 2711.0, 5983.0, 13357.0, 33453.0, 84438.0, 211461.0, 366751.0, 194291.0, 78263.0, 30621.0, 12460.0, 5443.0, 2571.0, 1351.0, 767.0, 415.0, 275.0, 142.0, 116.0, 70.0, 43.0, 39.0, 30.0, 18.0, 15.0, 11.0, 0.0, 6.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.40625, -20.703369140625, -20.00048828125, -19.297607421875, -18.5947265625, -17.891845703125, -17.18896484375, -16.486083984375, -15.783203125, -15.080322265625, -14.37744140625, -13.674560546875, -12.9716796875, -12.268798828125, -11.56591796875, -10.863037109375, -10.16015625, -9.457275390625, -8.75439453125, -8.051513671875, -7.3486328125, -6.645751953125, -5.94287109375, -5.239990234375, -4.537109375, -3.834228515625, -3.13134765625, -2.428466796875, -1.7255859375, -1.022705078125, -0.31982421875, 0.383056640625, 1.0859375, 1.788818359375, 2.49169921875, 3.194580078125, 3.8974609375, 4.600341796875, 5.30322265625, 6.006103515625, 6.708984375, 7.411865234375, 8.11474609375, 8.817626953125, 9.5205078125, 10.223388671875, 10.92626953125, 11.629150390625, 12.33203125, 13.034912109375, 13.73779296875, 14.440673828125, 15.1435546875, 15.846435546875, 16.54931640625, 17.252197265625, 17.955078125, 18.657958984375, 19.36083984375, 20.063720703125, 20.7666015625, 21.469482421875, 22.17236328125, 22.875244140625, 23.578125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 2.0, 6.0, 7.0, 6.0, 11.0, 10.0, 15.0, 24.0, 28.0, 49.0, 60.0, 73.0, 72.0, 77.0, 96.0, 72.0, 84.0, 76.0, 52.0, 43.0, 38.0, 27.0, 22.0, 21.0, 9.0, 5.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-19.953125, -19.436279296875, -18.91943359375, -18.402587890625, -17.8857421875, -17.368896484375, -16.85205078125, -16.335205078125, -15.818359375, -15.301513671875, -14.78466796875, -14.267822265625, -13.7509765625, -13.234130859375, -12.71728515625, -12.200439453125, -11.68359375, -11.166748046875, -10.64990234375, -10.133056640625, -9.6162109375, -9.099365234375, -8.58251953125, -8.065673828125, -7.548828125, -7.031982421875, -6.51513671875, -5.998291015625, -5.4814453125, -4.964599609375, -4.44775390625, -3.930908203125, -3.4140625, -2.897216796875, -2.38037109375, -1.863525390625, -1.3466796875, -0.829833984375, -0.31298828125, 0.203857421875, 0.720703125, 1.237548828125, 1.75439453125, 2.271240234375, 2.7880859375, 3.304931640625, 3.82177734375, 4.338623046875, 4.85546875, 5.372314453125, 5.88916015625, 6.406005859375, 6.9228515625, 7.439697265625, 7.95654296875, 8.473388671875, 8.990234375, 9.507080078125, 10.02392578125, 10.540771484375, 11.0576171875, 11.574462890625, 12.09130859375, 12.608154296875, 13.125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 6.0, 9.0, 7.0, 16.0, 20.0, 22.0, 33.0, 59.0, 74.0, 102.0, 144.0, 207.0, 353.0, 629.0, 1192.0, 2735.0, 9321.0, 56398.0, 520188.0, 399974.0, 44054.0, 8010.0, 2440.0, 1062.0, 562.0, 341.0, 197.0, 122.0, 79.0, 67.0, 37.0, 34.0, 13.0, 11.0, 12.0, 14.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-44.1875, -42.9580078125, -41.728515625, -40.4990234375, -39.26953125, -38.0400390625, -36.810546875, -35.5810546875, -34.3515625, -33.1220703125, -31.892578125, -30.6630859375, -29.43359375, -28.2041015625, -26.974609375, -25.7451171875, -24.515625, -23.2861328125, -22.056640625, -20.8271484375, -19.59765625, -18.3681640625, -17.138671875, -15.9091796875, -14.6796875, -13.4501953125, -12.220703125, -10.9912109375, -9.76171875, -8.5322265625, -7.302734375, -6.0732421875, -4.84375, -3.6142578125, -2.384765625, -1.1552734375, 0.07421875, 1.3037109375, 2.533203125, 3.7626953125, 4.9921875, 6.2216796875, 7.451171875, 8.6806640625, 9.91015625, 11.1396484375, 12.369140625, 13.5986328125, 14.828125, 16.0576171875, 17.287109375, 18.5166015625, 19.74609375, 20.9755859375, 22.205078125, 23.4345703125, 24.6640625, 25.8935546875, 27.123046875, 28.3525390625, 29.58203125, 30.8115234375, 32.041015625, 33.2705078125, 34.5]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 8.0, 8.0, 8.0, 5.0, 10.0, 10.0, 11.0, 22.0, 16.0, 25.0, 21.0, 37.0, 30.0, 33.0, 48.0, 48.0, 57.0, 49.0, 43.0, 54.0, 56.0, 48.0, 46.0, 46.0, 49.0, 34.0, 24.0, 30.0, 24.0, 20.0, 15.0, 18.0, 9.0, 16.0, 5.0, 9.0, 4.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.78125, -34.5146484375, -33.248046875, -31.9814453125, -30.71484375, -29.4482421875, -28.181640625, -26.9150390625, -25.6484375, -24.3818359375, -23.115234375, -21.8486328125, -20.58203125, -19.3154296875, -18.048828125, -16.7822265625, -15.515625, -14.2490234375, -12.982421875, -11.7158203125, -10.44921875, -9.1826171875, -7.916015625, -6.6494140625, -5.3828125, -4.1162109375, -2.849609375, -1.5830078125, -0.31640625, 0.9501953125, 2.216796875, 3.4833984375, 4.75, 6.0166015625, 7.283203125, 8.5498046875, 9.81640625, 11.0830078125, 12.349609375, 13.6162109375, 14.8828125, 16.1494140625, 17.416015625, 18.6826171875, 19.94921875, 21.2158203125, 22.482421875, 23.7490234375, 25.015625, 26.2822265625, 27.548828125, 28.8154296875, 30.08203125, 31.3486328125, 32.615234375, 33.8818359375, 35.1484375, 36.4150390625, 37.681640625, 38.9482421875, 40.21484375, 41.4814453125, 42.748046875, 44.0146484375, 45.28125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 10.0, 13.0, 29.0, 46.0, 56.0, 99.0, 161.0, 263.0, 574.0, 1259.0, 3455.0, 13267.0, 72578.0, 498860.0, 384502.0, 57273.0, 10977.0, 3026.0, 1000.0, 476.0, 246.0, 130.0, 94.0, 53.0, 36.0, 19.0, 17.0, 7.0, 8.0, 7.0, 2.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.015625, -6.709716796875, -6.40380859375, -6.097900390625, -5.7919921875, -5.486083984375, -5.18017578125, -4.874267578125, -4.568359375, -4.262451171875, -3.95654296875, -3.650634765625, -3.3447265625, -3.038818359375, -2.73291015625, -2.427001953125, -2.12109375, -1.815185546875, -1.50927734375, -1.203369140625, -0.8974609375, -0.591552734375, -0.28564453125, 0.020263671875, 0.326171875, 0.632080078125, 0.93798828125, 1.243896484375, 1.5498046875, 1.855712890625, 2.16162109375, 2.467529296875, 2.7734375, 3.079345703125, 3.38525390625, 3.691162109375, 3.9970703125, 4.302978515625, 4.60888671875, 4.914794921875, 5.220703125, 5.526611328125, 5.83251953125, 6.138427734375, 6.4443359375, 6.750244140625, 7.05615234375, 7.362060546875, 7.66796875, 7.973876953125, 8.27978515625, 8.585693359375, 8.8916015625, 9.197509765625, 9.50341796875, 9.809326171875, 10.115234375, 10.421142578125, 10.72705078125, 11.032958984375, 11.3388671875, 11.644775390625, 11.95068359375, 12.256591796875, 12.5625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 3.0, 4.0, 6.0, 4.0, 15.0, 12.0, 12.0, 15.0, 19.0, 20.0, 35.0, 41.0, 63.0, 59.0, 87.0, 121.0, 102.0, 95.0, 65.0, 50.0, 37.0, 27.0, 22.0, 21.0, 16.0, 6.0, 8.0, 10.0, 5.0, 5.0, 6.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002079010009765625, -0.002019554376602173, -0.0019600987434387207, -0.0019006431102752686, -0.0018411874771118164, -0.0017817318439483643, -0.0017222762107849121, -0.00166282057762146, -0.0016033649444580078, -0.0015439093112945557, -0.0014844536781311035, -0.0014249980449676514, -0.0013655424118041992, -0.001306086778640747, -0.001246631145477295, -0.0011871755123138428, -0.0011277198791503906, -0.0010682642459869385, -0.0010088086128234863, -0.0009493529796600342, -0.000889897346496582, -0.0008304417133331299, -0.0007709860801696777, -0.0007115304470062256, -0.0006520748138427734, -0.0005926191806793213, -0.0005331635475158691, -0.000473707914352417, -0.00041425228118896484, -0.0003547966480255127, -0.00029534101486206055, -0.0002358853816986084, -0.00017642974853515625, -0.0001169741153717041, -5.751848220825195e-05, 1.9371509552001953e-06, 6.139278411865234e-05, 0.00012084841728210449, 0.00018030405044555664, 0.0002397596836090088, 0.00029921531677246094, 0.0003586709499359131, 0.00041812658309936523, 0.0004775822162628174, 0.0005370378494262695, 0.0005964934825897217, 0.0006559491157531738, 0.000715404748916626, 0.0007748603820800781, 0.0008343160152435303, 0.0008937716484069824, 0.0009532272815704346, 0.0010126829147338867, 0.0010721385478973389, 0.001131594181060791, 0.0011910498142242432, 0.0012505054473876953, 0.0013099610805511475, 0.0013694167137145996, 0.0014288723468780518, 0.001488327980041504, 0.001547783613204956, 0.0016072392463684082, 0.0016666948795318604, 0.0017261505126953125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 11.0, 26.0, 37.0, 78.0, 189.0, 454.0, 1234.0, 5123.0, 58338.0, 833656.0, 138192.0, 8523.0, 1689.0, 545.0, 226.0, 110.0, 43.0, 36.0, 13.0, 11.0, 5.0, 8.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.078125, -19.498291015625, -18.91845703125, -18.338623046875, -17.7587890625, -17.178955078125, -16.59912109375, -16.019287109375, -15.439453125, -14.859619140625, -14.27978515625, -13.699951171875, -13.1201171875, -12.540283203125, -11.96044921875, -11.380615234375, -10.80078125, -10.220947265625, -9.64111328125, -9.061279296875, -8.4814453125, -7.901611328125, -7.32177734375, -6.741943359375, -6.162109375, -5.582275390625, -5.00244140625, -4.422607421875, -3.8427734375, -3.262939453125, -2.68310546875, -2.103271484375, -1.5234375, -0.943603515625, -0.36376953125, 0.216064453125, 0.7958984375, 1.375732421875, 1.95556640625, 2.535400390625, 3.115234375, 3.695068359375, 4.27490234375, 4.854736328125, 5.4345703125, 6.014404296875, 6.59423828125, 7.174072265625, 7.75390625, 8.333740234375, 8.91357421875, 9.493408203125, 10.0732421875, 10.653076171875, 11.23291015625, 11.812744140625, 12.392578125, 12.972412109375, 13.55224609375, 14.132080078125, 14.7119140625, 15.291748046875, 15.87158203125, 16.451416015625, 17.03125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 14.0, 15.0, 35.0, 28.0, 50.0, 53.0, 94.0, 91.0, 96.0, 101.0, 99.0, 91.0, 74.0, 43.0, 36.0, 21.0, 19.0, 16.0, 4.0, 5.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1328125, -7.7264404296875, -7.320068359375, -6.9136962890625, -6.50732421875, -6.1009521484375, -5.694580078125, -5.2882080078125, -4.8818359375, -4.4754638671875, -4.069091796875, -3.6627197265625, -3.25634765625, -2.8499755859375, -2.443603515625, -2.0372314453125, -1.630859375, -1.2244873046875, -0.818115234375, -0.4117431640625, -0.00537109375, 0.4010009765625, 0.807373046875, 1.2137451171875, 1.6201171875, 2.0264892578125, 2.432861328125, 2.8392333984375, 3.24560546875, 3.6519775390625, 4.058349609375, 4.4647216796875, 4.87109375, 5.2774658203125, 5.683837890625, 6.0902099609375, 6.49658203125, 6.9029541015625, 7.309326171875, 7.7156982421875, 8.1220703125, 8.5284423828125, 8.934814453125, 9.3411865234375, 9.74755859375, 10.1539306640625, 10.560302734375, 10.9666748046875, 11.373046875, 11.7794189453125, 12.185791015625, 12.5921630859375, 12.99853515625, 13.4049072265625, 13.811279296875, 14.2176513671875, 14.6240234375, 15.0303955078125, 15.436767578125, 15.8431396484375, 16.24951171875, 16.6558837890625, 17.062255859375, 17.4686279296875, 17.875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 8.0, 15.0, 12.0, 24.0, 27.0, 45.0, 62.0, 82.0, 93.0, 88.0, 123.0, 112.0, 82.0, 76.0, 57.0, 22.0, 20.0, 18.0, 7.0, 4.0, 0.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-195.87744140625, -189.8155975341797, -183.75375366210938, -177.69190979003906, -171.63006591796875, -165.56820678710938, -159.50637817382812, -153.44451904296875, -147.38267517089844, -141.32083129882812, -135.2589874267578, -129.1971435546875, -123.13529205322266, -117.07344818115234, -111.01160430908203, -104.94975280761719, -98.8879165649414, -92.8260726928711, -86.76422882080078, -80.70237731933594, -74.64053344726562, -68.57868957519531, -62.516845703125, -56.45499801635742, -50.39315414428711, -44.3313102722168, -38.26946258544922, -32.207618713378906, -26.14577293395996, -20.083927154541016, -14.022083282470703, -7.960235595703125, -1.8983917236328125, 4.163453578948975, 10.225298881530762, 16.28714370727539, 22.348989486694336, 28.41083526611328, 34.472679138183594, 40.53452682495117, 46.596370697021484, 52.6582145690918, 58.720062255859375, 64.78190612792969, 70.84375, 76.90559387207031, 82.96743774414062, 89.02928924560547, 95.09113311767578, 101.1529769897461, 107.2148208618164, 113.27667236328125, 119.33851623535156, 125.40036010742188, 131.4622039794922, 137.5240478515625, 143.5858917236328, 149.64773559570312, 155.70957946777344, 161.77142333984375, 167.83326721191406, 173.89511108398438, 179.95697021484375, 186.01881408691406, 192.08065795898438]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 5.0, 19.0, 4.0, 13.0, 20.0, 28.0, 30.0, 27.0, 37.0, 42.0, 42.0, 55.0, 39.0, 70.0, 53.0, 61.0, 73.0, 53.0, 44.0, 42.0, 48.0, 35.0, 37.0, 20.0, 24.0, 19.0, 16.0, 9.0, 13.0, 6.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-174.36550903320312, -168.04466247558594, -161.7238311767578, -155.40298461914062, -149.0821533203125, -142.7613067626953, -136.44046020507812, -130.11962890625, -123.79878997802734, -117.47795104980469, -111.15711212158203, -104.83627319335938, -98.51542663574219, -92.19459533691406, -85.87374877929688, -79.55290985107422, -73.23207092285156, -66.9112319946289, -60.59039306640625, -54.26955032348633, -47.94871139526367, -41.627872467041016, -35.307029724121094, -28.986190795898438, -22.66535186767578, -16.344512939453125, -10.023672103881836, -3.702831268310547, 2.6180076599121094, 8.938846588134766, 15.259689331054688, 21.580528259277344, 27.9013671875, 34.222206115722656, 40.54304504394531, 46.863887786865234, 53.18472671508789, 59.50556564331055, 65.82640838623047, 72.14724731445312, 78.46808624267578, 84.78892517089844, 91.1097640991211, 97.43060302734375, 103.75144958496094, 110.07228088378906, 116.39312744140625, 122.7139663696289, 129.03480529785156, 135.35565185546875, 141.67648315429688, 147.99732971191406, 154.3181610107422, 160.63900756835938, 166.9598388671875, 173.2806854248047, 179.60153198242188, 185.92237854003906, 192.2432098388672, 198.56405639648438, 204.8848876953125, 211.2057342529297, 217.52658081054688, 223.847412109375, 230.16824340820312]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 11.0, 9.0, 9.0, 15.0, 11.0, 28.0, 39.0, 47.0, 84.0, 149.0, 217.0, 383.0, 621.0, 1054.0, 2076.0, 3858.0, 8071.0, 18163.0, 47180.0, 167764.0, 1662907.0, 2010443.0, 185059.0, 49489.0, 18966.0, 8336.0, 4118.0, 2178.0, 1191.0, 675.0, 420.0, 235.0, 160.0, 101.0, 58.0, 46.0, 40.0, 11.0, 14.0, 10.0, 11.0, 2.0, 8.0, 4.0, 5.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.125, -13.62109375, -13.1171875, -12.61328125, -12.109375, -11.60546875, -11.1015625, -10.59765625, -10.09375, -9.58984375, -9.0859375, -8.58203125, -8.078125, -7.57421875, -7.0703125, -6.56640625, -6.0625, -5.55859375, -5.0546875, -4.55078125, -4.046875, -3.54296875, -3.0390625, -2.53515625, -2.03125, -1.52734375, -1.0234375, -0.51953125, -0.015625, 0.48828125, 0.9921875, 1.49609375, 2.0, 2.50390625, 3.0078125, 3.51171875, 4.015625, 4.51953125, 5.0234375, 5.52734375, 6.03125, 6.53515625, 7.0390625, 7.54296875, 8.046875, 8.55078125, 9.0546875, 9.55859375, 10.0625, 10.56640625, 11.0703125, 11.57421875, 12.078125, 12.58203125, 13.0859375, 13.58984375, 14.09375, 14.59765625, 15.1015625, 15.60546875, 16.109375, 16.61328125, 17.1171875, 17.62109375, 18.125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 10.0, 4.0, 3.0, 14.0, 14.0, 20.0, 18.0, 32.0, 19.0, 35.0, 47.0, 55.0, 64.0, 61.0, 64.0, 68.0, 72.0, 55.0, 48.0, 47.0, 45.0, 49.0, 33.0, 22.0, 24.0, 21.0, 8.0, 9.0, 8.0, 6.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2578125, -8.9197998046875, -8.581787109375, -8.2437744140625, -7.90576171875, -7.5677490234375, -7.229736328125, -6.8917236328125, -6.5537109375, -6.2156982421875, -5.877685546875, -5.5396728515625, -5.20166015625, -4.8636474609375, -4.525634765625, -4.1876220703125, -3.849609375, -3.5115966796875, -3.173583984375, -2.8355712890625, -2.49755859375, -2.1595458984375, -1.821533203125, -1.4835205078125, -1.1455078125, -0.8074951171875, -0.469482421875, -0.1314697265625, 0.20654296875, 0.5445556640625, 0.882568359375, 1.2205810546875, 1.55859375, 1.8966064453125, 2.234619140625, 2.5726318359375, 2.91064453125, 3.2486572265625, 3.586669921875, 3.9246826171875, 4.2626953125, 4.6007080078125, 4.938720703125, 5.2767333984375, 5.61474609375, 5.9527587890625, 6.290771484375, 6.6287841796875, 6.966796875, 7.3048095703125, 7.642822265625, 7.9808349609375, 8.31884765625, 8.6568603515625, 8.994873046875, 9.3328857421875, 9.6708984375, 10.0089111328125, 10.346923828125, 10.6849365234375, 11.02294921875, 11.3609619140625, 11.698974609375, 12.0369873046875, 12.375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 1.0, 6.0, 5.0, 2.0, 4.0, 9.0, 6.0, 13.0, 18.0, 38.0, 43.0, 63.0, 128.0, 243.0, 455.0, 1178.0, 2871.0, 8084.0, 27439.0, 142782.0, 3095730.0, 818667.0, 70819.0, 16977.0, 5269.0, 1870.0, 785.0, 331.0, 172.0, 85.0, 52.0, 41.0, 23.0, 15.0, 10.0, 7.0, 5.0, 7.0, 5.0, 4.0, 7.0, 5.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.046875, -25.2529296875, -24.458984375, -23.6650390625, -22.87109375, -22.0771484375, -21.283203125, -20.4892578125, -19.6953125, -18.9013671875, -18.107421875, -17.3134765625, -16.51953125, -15.7255859375, -14.931640625, -14.1376953125, -13.34375, -12.5498046875, -11.755859375, -10.9619140625, -10.16796875, -9.3740234375, -8.580078125, -7.7861328125, -6.9921875, -6.1982421875, -5.404296875, -4.6103515625, -3.81640625, -3.0224609375, -2.228515625, -1.4345703125, -0.640625, 0.1533203125, 0.947265625, 1.7412109375, 2.53515625, 3.3291015625, 4.123046875, 4.9169921875, 5.7109375, 6.5048828125, 7.298828125, 8.0927734375, 8.88671875, 9.6806640625, 10.474609375, 11.2685546875, 12.0625, 12.8564453125, 13.650390625, 14.4443359375, 15.23828125, 16.0322265625, 16.826171875, 17.6201171875, 18.4140625, 19.2080078125, 20.001953125, 20.7958984375, 21.58984375, 22.3837890625, 23.177734375, 23.9716796875, 24.765625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 2.0, 4.0, 6.0, 4.0, 8.0, 9.0, 8.0, 23.0, 23.0, 39.0, 50.0, 113.0, 191.0, 415.0, 932.0, 1104.0, 494.0, 247.0, 142.0, 89.0, 51.0, 32.0, 21.0, 23.0, 13.0, 6.0, 4.0, 6.0, 3.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.9375, -27.068359375, -26.19921875, -25.330078125, -24.4609375, -23.591796875, -22.72265625, -21.853515625, -20.984375, -20.115234375, -19.24609375, -18.376953125, -17.5078125, -16.638671875, -15.76953125, -14.900390625, -14.03125, -13.162109375, -12.29296875, -11.423828125, -10.5546875, -9.685546875, -8.81640625, -7.947265625, -7.078125, -6.208984375, -5.33984375, -4.470703125, -3.6015625, -2.732421875, -1.86328125, -0.994140625, -0.125, 0.744140625, 1.61328125, 2.482421875, 3.3515625, 4.220703125, 5.08984375, 5.958984375, 6.828125, 7.697265625, 8.56640625, 9.435546875, 10.3046875, 11.173828125, 12.04296875, 12.912109375, 13.78125, 14.650390625, 15.51953125, 16.388671875, 17.2578125, 18.126953125, 18.99609375, 19.865234375, 20.734375, 21.603515625, 22.47265625, 23.341796875, 24.2109375, 25.080078125, 25.94921875, 26.818359375, 27.6875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 6.0, 15.0, 39.0, 88.0, 143.0, 199.0, 206.0, 152.0, 77.0, 21.0, 19.0, 12.0, 8.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-301.9026794433594, -292.92535400390625, -283.947998046875, -274.9706726074219, -265.99334716796875, -257.0159912109375, -248.03866577148438, -239.06134033203125, -230.08399963378906, -221.10665893554688, -212.12933349609375, -203.15199279785156, -194.17465209960938, -185.19732666015625, -176.21998596191406, -167.24264526367188, -158.26531982421875, -149.28797912597656, -140.31065368652344, -131.33331298828125, -122.3559799194336, -113.37864685058594, -104.40130615234375, -95.4239730834961, -86.44664001464844, -77.46930694580078, -68.49197387695312, -59.51463317871094, -50.53730010986328, -41.559967041015625, -32.5826301574707, -23.60529327392578, -14.6279296875, -5.650594711303711, 3.326740264892578, 12.304075241088867, 21.281410217285156, 30.258743286132812, 39.236080169677734, 48.213417053222656, 57.19075012207031, 66.16808319091797, 75.14541625976562, 84.12275695800781, 93.10009002685547, 102.07742309570312, 111.05476379394531, 120.03209686279297, 129.00942993164062, 137.9867706298828, 146.96409606933594, 155.94143676757812, 164.91876220703125, 173.89610290527344, 182.87344360351562, 191.85076904296875, 200.82810974121094, 209.80545043945312, 218.78277587890625, 227.76011657714844, 236.73745727539062, 245.71478271484375, 254.69212341308594, 263.6694641113281, 272.64678955078125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 7.0, 12.0, 10.0, 17.0, 19.0, 14.0, 29.0, 31.0, 26.0, 33.0, 38.0, 27.0, 43.0, 52.0, 57.0, 40.0, 59.0, 45.0, 37.0, 48.0, 53.0, 41.0, 28.0, 46.0, 37.0, 24.0, 20.0, 19.0, 22.0, 15.0, 9.0, 10.0, 15.0, 6.0, 6.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.10187530517578, -110.51746368408203, -106.93305969238281, -103.34864807128906, -99.76424407958984, -96.1798324584961, -92.59542846679688, -89.01101684570312, -85.42660522460938, -81.84219360351562, -78.2577896118164, -74.67337799072266, -71.08897399902344, -67.50456237792969, -63.9201545715332, -60.33574676513672, -56.751338958740234, -53.16693115234375, -49.582523345947266, -45.99811553955078, -42.41370391845703, -38.82929611206055, -35.24488830566406, -31.660478591918945, -28.07607078552246, -24.491662979125977, -20.90725326538086, -17.322845458984375, -13.738436698913574, -10.154027938842773, -6.569620132446289, -2.985210418701172, 0.5991973876953125, 4.183606147766113, 7.768014430999756, 11.352422714233398, 14.9368314743042, 18.521240234375, 22.105648040771484, 25.6900577545166, 29.274465560913086, 32.8588752746582, 36.44328308105469, 40.02769088745117, 43.612098693847656, 47.196510314941406, 50.780914306640625, 54.365325927734375, 57.94973373413086, 61.534141540527344, 65.1185531616211, 68.70295715332031, 72.28736877441406, 75.87178039550781, 79.45618438720703, 83.04059600830078, 86.625, 90.20941162109375, 93.79381561279297, 97.37822723388672, 100.96263122558594, 104.54704284667969, 108.13145446777344, 111.71585845947266, 115.3002700805664]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 13.0, 14.0, 10.0, 21.0, 32.0, 57.0, 88.0, 135.0, 249.0, 359.0, 620.0, 1065.0, 1764.0, 3469.0, 6736.0, 13940.0, 31028.0, 70192.0, 173650.0, 367271.0, 219828.0, 86220.0, 37702.0, 17084.0, 7905.0, 3950.0, 2142.0, 1234.0, 667.0, 359.0, 242.0, 180.0, 111.0, 55.0, 48.0, 37.0, 25.0, 17.0, 8.0, 8.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.984375, -17.449462890625, -16.91455078125, -16.379638671875, -15.8447265625, -15.309814453125, -14.77490234375, -14.239990234375, -13.705078125, -13.170166015625, -12.63525390625, -12.100341796875, -11.5654296875, -11.030517578125, -10.49560546875, -9.960693359375, -9.42578125, -8.890869140625, -8.35595703125, -7.821044921875, -7.2861328125, -6.751220703125, -6.21630859375, -5.681396484375, -5.146484375, -4.611572265625, -4.07666015625, -3.541748046875, -3.0068359375, -2.471923828125, -1.93701171875, -1.402099609375, -0.8671875, -0.332275390625, 0.20263671875, 0.737548828125, 1.2724609375, 1.807373046875, 2.34228515625, 2.877197265625, 3.412109375, 3.947021484375, 4.48193359375, 5.016845703125, 5.5517578125, 6.086669921875, 6.62158203125, 7.156494140625, 7.69140625, 8.226318359375, 8.76123046875, 9.296142578125, 9.8310546875, 10.365966796875, 10.90087890625, 11.435791015625, 11.970703125, 12.505615234375, 13.04052734375, 13.575439453125, 14.1103515625, 14.645263671875, 15.18017578125, 15.715087890625, 16.25]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 12.0, 7.0, 17.0, 17.0, 23.0, 28.0, 19.0, 29.0, 33.0, 47.0, 52.0, 53.0, 59.0, 64.0, 72.0, 65.0, 59.0, 43.0, 53.0, 37.0, 40.0, 31.0, 28.0, 26.0, 21.0, 16.0, 8.0, 9.0, 8.0, 4.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.3125, -8.9705810546875, -8.628662109375, -8.2867431640625, -7.94482421875, -7.6029052734375, -7.260986328125, -6.9190673828125, -6.5771484375, -6.2352294921875, -5.893310546875, -5.5513916015625, -5.20947265625, -4.8675537109375, -4.525634765625, -4.1837158203125, -3.841796875, -3.4998779296875, -3.157958984375, -2.8160400390625, -2.47412109375, -2.1322021484375, -1.790283203125, -1.4483642578125, -1.1064453125, -0.7645263671875, -0.422607421875, -0.0806884765625, 0.26123046875, 0.6031494140625, 0.945068359375, 1.2869873046875, 1.62890625, 1.9708251953125, 2.312744140625, 2.6546630859375, 2.99658203125, 3.3385009765625, 3.680419921875, 4.0223388671875, 4.3642578125, 4.7061767578125, 5.048095703125, 5.3900146484375, 5.73193359375, 6.0738525390625, 6.415771484375, 6.7576904296875, 7.099609375, 7.4415283203125, 7.783447265625, 8.1253662109375, 8.46728515625, 8.8092041015625, 9.151123046875, 9.4930419921875, 9.8349609375, 10.1768798828125, 10.518798828125, 10.8607177734375, 11.20263671875, 11.5445556640625, 11.886474609375, 12.2283935546875, 12.5703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 6.0, 7.0, 10.0, 16.0, 20.0, 22.0, 45.0, 60.0, 111.0, 178.0, 354.0, 711.0, 1603.0, 4796.0, 32380.0, 682445.0, 301532.0, 18270.0, 3380.0, 1215.0, 614.0, 290.0, 176.0, 94.0, 83.0, 51.0, 36.0, 19.0, 12.0, 4.0, 5.0, 2.0, 3.0, 0.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.59375, -47.0693359375, -45.544921875, -44.0205078125, -42.49609375, -40.9716796875, -39.447265625, -37.9228515625, -36.3984375, -34.8740234375, -33.349609375, -31.8251953125, -30.30078125, -28.7763671875, -27.251953125, -25.7275390625, -24.203125, -22.6787109375, -21.154296875, -19.6298828125, -18.10546875, -16.5810546875, -15.056640625, -13.5322265625, -12.0078125, -10.4833984375, -8.958984375, -7.4345703125, -5.91015625, -4.3857421875, -2.861328125, -1.3369140625, 0.1875, 1.7119140625, 3.236328125, 4.7607421875, 6.28515625, 7.8095703125, 9.333984375, 10.8583984375, 12.3828125, 13.9072265625, 15.431640625, 16.9560546875, 18.48046875, 20.0048828125, 21.529296875, 23.0537109375, 24.578125, 26.1025390625, 27.626953125, 29.1513671875, 30.67578125, 32.2001953125, 33.724609375, 35.2490234375, 36.7734375, 38.2978515625, 39.822265625, 41.3466796875, 42.87109375, 44.3955078125, 45.919921875, 47.4443359375, 48.96875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 12.0, 15.0, 22.0, 18.0, 24.0, 23.0, 26.0, 40.0, 37.0, 53.0, 49.0, 48.0, 60.0, 48.0, 62.0, 55.0, 51.0, 50.0, 50.0, 48.0, 25.0, 37.0, 32.0, 24.0, 18.0, 14.0, 20.0, 10.0, 8.0, 6.0, 5.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.53125, -41.2861328125, -40.041015625, -38.7958984375, -37.55078125, -36.3056640625, -35.060546875, -33.8154296875, -32.5703125, -31.3251953125, -30.080078125, -28.8349609375, -27.58984375, -26.3447265625, -25.099609375, -23.8544921875, -22.609375, -21.3642578125, -20.119140625, -18.8740234375, -17.62890625, -16.3837890625, -15.138671875, -13.8935546875, -12.6484375, -11.4033203125, -10.158203125, -8.9130859375, -7.66796875, -6.4228515625, -5.177734375, -3.9326171875, -2.6875, -1.4423828125, -0.197265625, 1.0478515625, 2.29296875, 3.5380859375, 4.783203125, 6.0283203125, 7.2734375, 8.5185546875, 9.763671875, 11.0087890625, 12.25390625, 13.4990234375, 14.744140625, 15.9892578125, 17.234375, 18.4794921875, 19.724609375, 20.9697265625, 22.21484375, 23.4599609375, 24.705078125, 25.9501953125, 27.1953125, 28.4404296875, 29.685546875, 30.9306640625, 32.17578125, 33.4208984375, 34.666015625, 35.9111328125, 37.15625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 5.0, 2.0, 2.0, 8.0, 6.0, 15.0, 19.0, 33.0, 46.0, 74.0, 133.0, 242.0, 621.0, 2135.0, 12394.0, 185781.0, 800742.0, 39773.0, 4548.0, 1122.0, 419.0, 165.0, 88.0, 57.0, 38.0, 26.0, 18.0, 16.0, 5.0, 5.0, 4.0, 1.0, 1.0, 5.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.703125, -16.15087890625, -15.5986328125, -15.04638671875, -14.494140625, -13.94189453125, -13.3896484375, -12.83740234375, -12.28515625, -11.73291015625, -11.1806640625, -10.62841796875, -10.076171875, -9.52392578125, -8.9716796875, -8.41943359375, -7.8671875, -7.31494140625, -6.7626953125, -6.21044921875, -5.658203125, -5.10595703125, -4.5537109375, -4.00146484375, -3.44921875, -2.89697265625, -2.3447265625, -1.79248046875, -1.240234375, -0.68798828125, -0.1357421875, 0.41650390625, 0.96875, 1.52099609375, 2.0732421875, 2.62548828125, 3.177734375, 3.72998046875, 4.2822265625, 4.83447265625, 5.38671875, 5.93896484375, 6.4912109375, 7.04345703125, 7.595703125, 8.14794921875, 8.7001953125, 9.25244140625, 9.8046875, 10.35693359375, 10.9091796875, 11.46142578125, 12.013671875, 12.56591796875, 13.1181640625, 13.67041015625, 14.22265625, 14.77490234375, 15.3271484375, 15.87939453125, 16.431640625, 16.98388671875, 17.5361328125, 18.08837890625, 18.640625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 6.0, 2.0, 4.0, 3.0, 8.0, 9.0, 7.0, 7.0, 14.0, 13.0, 10.0, 15.0, 15.0, 25.0, 27.0, 42.0, 59.0, 74.0, 96.0, 120.0, 124.0, 65.0, 55.0, 31.0, 33.0, 20.0, 21.0, 19.0, 7.0, 9.0, 5.0, 17.0, 9.0, 9.0, 10.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016498565673828125, -0.0015919506549835205, -0.0015340447425842285, -0.0014761388301849365, -0.0014182329177856445, -0.0013603270053863525, -0.0013024210929870605, -0.0012445151805877686, -0.0011866092681884766, -0.0011287033557891846, -0.0010707974433898926, -0.0010128915309906006, -0.0009549856185913086, -0.0008970797061920166, -0.0008391737937927246, -0.0007812678813934326, -0.0007233619689941406, -0.0006654560565948486, -0.0006075501441955566, -0.0005496442317962646, -0.0004917383193969727, -0.00043383240699768066, -0.00037592649459838867, -0.0003180205821990967, -0.0002601146697998047, -0.0002022087574005127, -0.0001443028450012207, -8.639693260192871e-05, -2.849102020263672e-05, 2.9414892196655273e-05, 8.732080459594727e-05, 0.00014522671699523926, 0.00020313262939453125, 0.00026103854179382324, 0.00031894445419311523, 0.0003768503665924072, 0.0004347562789916992, 0.0004926621913909912, 0.0005505681037902832, 0.0006084740161895752, 0.0006663799285888672, 0.0007242858409881592, 0.0007821917533874512, 0.0008400976657867432, 0.0008980035781860352, 0.0009559094905853271, 0.0010138154029846191, 0.0010717213153839111, 0.0011296272277832031, 0.0011875331401824951, 0.0012454390525817871, 0.001303344964981079, 0.001361250877380371, 0.001419156789779663, 0.001477062702178955, 0.001534968614578247, 0.001592874526977539, 0.001650780439376831, 0.001708686351776123, 0.001766592264175415, 0.001824498176574707, 0.001882404088973999, 0.001940310001373291, 0.001998215913772583, 0.002056121826171875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 9.0, 7.0, 16.0, 19.0, 33.0, 41.0, 54.0, 95.0, 150.0, 281.0, 485.0, 991.0, 2321.0, 7314.0, 44921.0, 604526.0, 348179.0, 29451.0, 5822.0, 1909.0, 900.0, 430.0, 216.0, 142.0, 69.0, 48.0, 31.0, 23.0, 15.0, 11.0, 8.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.5703125, -11.1556396484375, -10.740966796875, -10.3262939453125, -9.91162109375, -9.4969482421875, -9.082275390625, -8.6676025390625, -8.2529296875, -7.8382568359375, -7.423583984375, -7.0089111328125, -6.59423828125, -6.1795654296875, -5.764892578125, -5.3502197265625, -4.935546875, -4.5208740234375, -4.106201171875, -3.6915283203125, -3.27685546875, -2.8621826171875, -2.447509765625, -2.0328369140625, -1.6181640625, -1.2034912109375, -0.788818359375, -0.3741455078125, 0.04052734375, 0.4552001953125, 0.869873046875, 1.2845458984375, 1.69921875, 2.1138916015625, 2.528564453125, 2.9432373046875, 3.35791015625, 3.7725830078125, 4.187255859375, 4.6019287109375, 5.0166015625, 5.4312744140625, 5.845947265625, 6.2606201171875, 6.67529296875, 7.0899658203125, 7.504638671875, 7.9193115234375, 8.333984375, 8.7486572265625, 9.163330078125, 9.5780029296875, 9.99267578125, 10.4073486328125, 10.822021484375, 11.2366943359375, 11.6513671875, 12.0660400390625, 12.480712890625, 12.8953857421875, 13.31005859375, 13.7247314453125, 14.139404296875, 14.5540771484375, 14.96875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 8.0, 6.0, 14.0, 18.0, 27.0, 37.0, 35.0, 74.0, 86.0, 101.0, 123.0, 112.0, 103.0, 78.0, 50.0, 44.0, 30.0, 22.0, 10.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.0625, -15.6256103515625, -15.188720703125, -14.7518310546875, -14.31494140625, -13.8780517578125, -13.441162109375, -13.0042724609375, -12.5673828125, -12.1304931640625, -11.693603515625, -11.2567138671875, -10.81982421875, -10.3829345703125, -9.946044921875, -9.5091552734375, -9.072265625, -8.6353759765625, -8.198486328125, -7.7615966796875, -7.32470703125, -6.8878173828125, -6.450927734375, -6.0140380859375, -5.5771484375, -5.1402587890625, -4.703369140625, -4.2664794921875, -3.82958984375, -3.3927001953125, -2.955810546875, -2.5189208984375, -2.08203125, -1.6451416015625, -1.208251953125, -0.7713623046875, -0.33447265625, 0.1024169921875, 0.539306640625, 0.9761962890625, 1.4130859375, 1.8499755859375, 2.286865234375, 2.7237548828125, 3.16064453125, 3.5975341796875, 4.034423828125, 4.4713134765625, 4.908203125, 5.3450927734375, 5.781982421875, 6.2188720703125, 6.65576171875, 7.0926513671875, 7.529541015625, 7.9664306640625, 8.4033203125, 8.8402099609375, 9.277099609375, 9.7139892578125, 10.15087890625, 10.5877685546875, 11.024658203125, 11.4615478515625, 11.8984375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 6.0, 2.0, 4.0, 18.0, 22.0, 62.0, 81.0, 126.0, 159.0, 170.0, 131.0, 91.0, 48.0, 28.0, 11.0, 14.0, 12.0, 4.0, 1.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-216.178466796875, -209.62818908691406, -203.07791137695312, -196.5276336669922, -189.97735595703125, -183.42709350585938, -176.87680053710938, -170.3265380859375, -163.77626037597656, -157.22598266601562, -150.6757049560547, -144.12542724609375, -137.5751495361328, -131.02487182617188, -124.47460174560547, -117.92433166503906, -111.3740463256836, -104.82376861572266, -98.27349090576172, -91.72322082519531, -85.17294311523438, -78.62266540527344, -72.0723876953125, -65.52210998535156, -58.97183609008789, -52.42155838012695, -45.87128448486328, -39.321006774902344, -32.770729064941406, -26.220455169677734, -19.670177459716797, -13.119903564453125, -6.5696258544921875, -0.01934957504272461, 6.530926704406738, 13.08120346069336, 19.631479263305664, 26.18175506591797, 32.732032775878906, 39.28230667114258, 45.832584381103516, 52.38286209106445, 58.933135986328125, 65.48341369628906, 72.03369140625, 78.58396911621094, 85.13424682617188, 91.68451690673828, 98.23479461669922, 104.78507232666016, 111.3353500366211, 117.8856201171875, 124.43589782714844, 130.98617553710938, 137.5364532470703, 144.08673095703125, 150.6370086669922, 157.18728637695312, 163.73756408691406, 170.287841796875, 176.83811950683594, 183.38839721679688, 189.93865966796875, 196.4889373779297, 203.03921508789062]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 9.0, 6.0, 11.0, 18.0, 16.0, 25.0, 26.0, 38.0, 43.0, 41.0, 48.0, 64.0, 69.0, 81.0, 73.0, 76.0, 63.0, 57.0, 41.0, 41.0, 33.0, 32.0, 22.0, 15.0, 13.0, 12.0, 10.0, 7.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.09713745117188, -134.03933715820312, -127.98152160644531, -121.92372131347656, -115.86591339111328, -109.80810546875, -103.75030517578125, -97.69249725341797, -91.63468933105469, -85.5768814086914, -79.51907348632812, -73.46127319335938, -67.4034652709961, -61.34565734863281, -55.2878532409668, -49.23004913330078, -43.1722412109375, -37.11443328857422, -31.056629180908203, -24.998823165893555, -18.941017150878906, -12.883211135864258, -6.825405120849609, -0.7676010131835938, 5.2902069091796875, 11.348012924194336, 17.405818939208984, 23.463624954223633, 29.52143096923828, 35.57923889160156, 41.63704299926758, 47.694847106933594, 53.752655029296875, 59.810462951660156, 65.86827087402344, 71.92607116699219, 77.98387908935547, 84.04168701171875, 90.0994873046875, 96.15729522705078, 102.21510314941406, 108.27291107177734, 114.33071899414062, 120.38851928710938, 126.44632720947266, 132.50413513183594, 138.5619354248047, 144.6197509765625, 150.67755126953125, 156.7353515625, 162.7931671142578, 168.85096740722656, 174.90878295898438, 180.96658325195312, 187.02438354492188, 193.08218383789062, 199.13999938964844, 205.1977996826172, 211.255615234375, 217.31341552734375, 223.3712158203125, 229.4290313720703, 235.48683166503906, 241.54464721679688, 247.60244750976562]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [5.0, 1.0, 4.0, 2.0, 7.0, 10.0, 14.0, 27.0, 39.0, 63.0, 119.0, 250.0, 505.0, 1063.0, 2503.0, 6068.0, 17955.0, 66859.0, 721727.0, 3155161.0, 173419.0, 31791.0, 9914.0, 3668.0, 1574.0, 705.0, 313.0, 190.0, 126.0, 65.0, 35.0, 25.0, 17.0, 23.0, 8.0, 13.0, 9.0, 3.0, 2.0, 6.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.703125, -10.147216796875, -9.59130859375, -9.035400390625, -8.4794921875, -7.923583984375, -7.36767578125, -6.811767578125, -6.255859375, -5.699951171875, -5.14404296875, -4.588134765625, -4.0322265625, -3.476318359375, -2.92041015625, -2.364501953125, -1.80859375, -1.252685546875, -0.69677734375, -0.140869140625, 0.4150390625, 0.970947265625, 1.52685546875, 2.082763671875, 2.638671875, 3.194580078125, 3.75048828125, 4.306396484375, 4.8623046875, 5.418212890625, 5.97412109375, 6.530029296875, 7.0859375, 7.641845703125, 8.19775390625, 8.753662109375, 9.3095703125, 9.865478515625, 10.42138671875, 10.977294921875, 11.533203125, 12.089111328125, 12.64501953125, 13.200927734375, 13.7568359375, 14.312744140625, 14.86865234375, 15.424560546875, 15.98046875, 16.536376953125, 17.09228515625, 17.648193359375, 18.2041015625, 18.760009765625, 19.31591796875, 19.871826171875, 20.427734375, 20.983642578125, 21.53955078125, 22.095458984375, 22.6513671875, 23.207275390625, 23.76318359375, 24.319091796875, 24.875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 7.0, 7.0, 9.0, 12.0, 25.0, 33.0, 37.0, 73.0, 64.0, 94.0, 88.0, 101.0, 91.0, 90.0, 73.0, 74.0, 44.0, 36.0, 15.0, 11.0, 10.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3125, -8.77880859375, -8.2451171875, -7.71142578125, -7.177734375, -6.64404296875, -6.1103515625, -5.57666015625, -5.04296875, -4.50927734375, -3.9755859375, -3.44189453125, -2.908203125, -2.37451171875, -1.8408203125, -1.30712890625, -0.7734375, -0.23974609375, 0.2939453125, 0.82763671875, 1.361328125, 1.89501953125, 2.4287109375, 2.96240234375, 3.49609375, 4.02978515625, 4.5634765625, 5.09716796875, 5.630859375, 6.16455078125, 6.6982421875, 7.23193359375, 7.765625, 8.29931640625, 8.8330078125, 9.36669921875, 9.900390625, 10.43408203125, 10.9677734375, 11.50146484375, 12.03515625, 12.56884765625, 13.1025390625, 13.63623046875, 14.169921875, 14.70361328125, 15.2373046875, 15.77099609375, 16.3046875, 16.83837890625, 17.3720703125, 17.90576171875, 18.439453125, 18.97314453125, 19.5068359375, 20.04052734375, 20.57421875, 21.10791015625, 21.6416015625, 22.17529296875, 22.708984375, 23.24267578125, 23.7763671875, 24.31005859375, 24.84375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 3.0, 5.0, 7.0, 11.0, 10.0, 27.0, 32.0, 40.0, 51.0, 97.0, 192.0, 334.0, 730.0, 1574.0, 3764.0, 9842.0, 32750.0, 175578.0, 3078958.0, 789752.0, 72434.0, 17892.0, 5961.0, 2314.0, 1001.0, 439.0, 218.0, 107.0, 51.0, 36.0, 27.0, 22.0, 10.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-25.375, -24.720458984375, -24.06591796875, -23.411376953125, -22.7568359375, -22.102294921875, -21.44775390625, -20.793212890625, -20.138671875, -19.484130859375, -18.82958984375, -18.175048828125, -17.5205078125, -16.865966796875, -16.21142578125, -15.556884765625, -14.90234375, -14.247802734375, -13.59326171875, -12.938720703125, -12.2841796875, -11.629638671875, -10.97509765625, -10.320556640625, -9.666015625, -9.011474609375, -8.35693359375, -7.702392578125, -7.0478515625, -6.393310546875, -5.73876953125, -5.084228515625, -4.4296875, -3.775146484375, -3.12060546875, -2.466064453125, -1.8115234375, -1.156982421875, -0.50244140625, 0.152099609375, 0.806640625, 1.461181640625, 2.11572265625, 2.770263671875, 3.4248046875, 4.079345703125, 4.73388671875, 5.388427734375, 6.04296875, 6.697509765625, 7.35205078125, 8.006591796875, 8.6611328125, 9.315673828125, 9.97021484375, 10.624755859375, 11.279296875, 11.933837890625, 12.58837890625, 13.242919921875, 13.8974609375, 14.552001953125, 15.20654296875, 15.861083984375, 16.515625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 1.0, 4.0, 3.0, 10.0, 5.0, 11.0, 16.0, 15.0, 37.0, 60.0, 116.0, 179.0, 379.0, 835.0, 1163.0, 605.0, 275.0, 135.0, 81.0, 45.0, 32.0, 21.0, 11.0, 6.0, 14.0, 9.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-32.65625, -31.88427734375, -31.1123046875, -30.34033203125, -29.568359375, -28.79638671875, -28.0244140625, -27.25244140625, -26.48046875, -25.70849609375, -24.9365234375, -24.16455078125, -23.392578125, -22.62060546875, -21.8486328125, -21.07666015625, -20.3046875, -19.53271484375, -18.7607421875, -17.98876953125, -17.216796875, -16.44482421875, -15.6728515625, -14.90087890625, -14.12890625, -13.35693359375, -12.5849609375, -11.81298828125, -11.041015625, -10.26904296875, -9.4970703125, -8.72509765625, -7.953125, -7.18115234375, -6.4091796875, -5.63720703125, -4.865234375, -4.09326171875, -3.3212890625, -2.54931640625, -1.77734375, -1.00537109375, -0.2333984375, 0.53857421875, 1.310546875, 2.08251953125, 2.8544921875, 3.62646484375, 4.3984375, 5.17041015625, 5.9423828125, 6.71435546875, 7.486328125, 8.25830078125, 9.0302734375, 9.80224609375, 10.57421875, 11.34619140625, 12.1181640625, 12.89013671875, 13.662109375, 14.43408203125, 15.2060546875, 15.97802734375, 16.75]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 12.0, 17.0, 54.0, 94.0, 191.0, 230.0, 183.0, 118.0, 53.0, 26.0, 7.0, 6.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-209.417236328125, -202.32986450195312, -195.24249267578125, -188.15512084960938, -181.0677490234375, -173.98037719726562, -166.89300537109375, -159.80563354492188, -152.71826171875, -145.63088989257812, -138.54351806640625, -131.45614624023438, -124.3687744140625, -117.28140258789062, -110.19403076171875, -103.10665893554688, -96.019287109375, -88.93191528320312, -81.84454345703125, -74.75717163085938, -67.6697998046875, -60.582427978515625, -53.49505615234375, -46.407684326171875, -39.3203125, -32.232940673828125, -25.14556884765625, -18.058197021484375, -10.9708251953125, -3.883453369140625, 3.20391845703125, 10.291290283203125, 17.378662109375, 24.466033935546875, 31.55340576171875, 38.640777587890625, 45.7281494140625, 52.815521240234375, 59.90289306640625, 66.99026489257812, 74.07763671875, 81.16500854492188, 88.25238037109375, 95.33975219726562, 102.4271240234375, 109.51449584960938, 116.60186767578125, 123.68923950195312, 130.776611328125, 137.86398315429688, 144.95135498046875, 152.03872680664062, 159.1260986328125, 166.21347045898438, 173.30084228515625, 180.38821411132812, 187.4755859375, 194.56295776367188, 201.65032958984375, 208.73770141601562, 215.8250732421875, 222.91244506835938, 229.99981689453125, 237.08718872070312, 244.174560546875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 10.0, 11.0, 8.0, 15.0, 19.0, 23.0, 22.0, 39.0, 39.0, 36.0, 52.0, 56.0, 68.0, 72.0, 58.0, 72.0, 67.0, 59.0, 45.0, 42.0, 42.0, 23.0, 24.0, 28.0, 18.0, 14.0, 12.0, 8.0, 6.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.9265365600586, -117.66624450683594, -114.40595245361328, -111.14566040039062, -107.8853759765625, -104.62508392333984, -101.36479187011719, -98.10449981689453, -94.84420776367188, -91.58391571044922, -88.32362365722656, -85.06333923339844, -81.80304718017578, -78.54275512695312, -75.28246307373047, -72.02217102050781, -68.76188659667969, -65.50159454345703, -62.24130630493164, -58.981014251708984, -55.720726013183594, -52.46043395996094, -49.20014190673828, -45.939849853515625, -42.679561614990234, -39.41926956176758, -36.15898132324219, -32.89868927001953, -29.638399124145508, -26.378108978271484, -23.117816925048828, -19.857526779174805, -16.597244262695312, -13.336954116821289, -10.07666301727295, -6.816371917724609, -3.556081771850586, -0.2957916259765625, 2.9645004272460938, 6.224790573120117, 9.48508071899414, 12.745370864868164, 16.005661010742188, 19.265953063964844, 22.526243209838867, 25.78653335571289, 29.046825408935547, 32.30711364746094, 35.567405700683594, 38.82769775390625, 42.08798599243164, 45.3482780456543, 48.60856628417969, 51.868858337402344, 55.129150390625, 58.389442443847656, 61.64973068237305, 64.91001892089844, 68.1703109741211, 71.43060302734375, 74.6908950805664, 77.95118713378906, 81.21147155761719, 84.47176361083984, 87.7320556640625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 5.0, 7.0, 14.0, 32.0, 34.0, 63.0, 98.0, 167.0, 292.0, 486.0, 855.0, 1618.0, 3098.0, 6175.0, 12384.0, 26965.0, 62128.0, 160510.0, 367629.0, 243384.0, 91021.0, 37652.0, 17175.0, 7991.0, 4000.0, 2184.0, 1112.0, 609.0, 365.0, 176.0, 120.0, 78.0, 49.0, 22.0, 21.0, 8.0, 7.0, 7.0, 6.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-19.046875, -18.541748046875, -18.03662109375, -17.531494140625, -17.0263671875, -16.521240234375, -16.01611328125, -15.510986328125, -15.005859375, -14.500732421875, -13.99560546875, -13.490478515625, -12.9853515625, -12.480224609375, -11.97509765625, -11.469970703125, -10.96484375, -10.459716796875, -9.95458984375, -9.449462890625, -8.9443359375, -8.439208984375, -7.93408203125, -7.428955078125, -6.923828125, -6.418701171875, -5.91357421875, -5.408447265625, -4.9033203125, -4.398193359375, -3.89306640625, -3.387939453125, -2.8828125, -2.377685546875, -1.87255859375, -1.367431640625, -0.8623046875, -0.357177734375, 0.14794921875, 0.653076171875, 1.158203125, 1.663330078125, 2.16845703125, 2.673583984375, 3.1787109375, 3.683837890625, 4.18896484375, 4.694091796875, 5.19921875, 5.704345703125, 6.20947265625, 6.714599609375, 7.2197265625, 7.724853515625, 8.22998046875, 8.735107421875, 9.240234375, 9.745361328125, 10.25048828125, 10.755615234375, 11.2607421875, 11.765869140625, 12.27099609375, 12.776123046875, 13.28125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 7.0, 15.0, 11.0, 16.0, 16.0, 17.0, 19.0, 37.0, 55.0, 38.0, 42.0, 47.0, 56.0, 61.0, 66.0, 68.0, 61.0, 63.0, 51.0, 49.0, 40.0, 44.0, 23.0, 19.0, 17.0, 15.0, 13.0, 12.0, 4.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.4140625, -9.0723876953125, -8.730712890625, -8.3890380859375, -8.04736328125, -7.7056884765625, -7.364013671875, -7.0223388671875, -6.6806640625, -6.3389892578125, -5.997314453125, -5.6556396484375, -5.31396484375, -4.9722900390625, -4.630615234375, -4.2889404296875, -3.947265625, -3.6055908203125, -3.263916015625, -2.9222412109375, -2.58056640625, -2.2388916015625, -1.897216796875, -1.5555419921875, -1.2138671875, -0.8721923828125, -0.530517578125, -0.1888427734375, 0.15283203125, 0.4945068359375, 0.836181640625, 1.1778564453125, 1.51953125, 1.8612060546875, 2.202880859375, 2.5445556640625, 2.88623046875, 3.2279052734375, 3.569580078125, 3.9112548828125, 4.2529296875, 4.5946044921875, 4.936279296875, 5.2779541015625, 5.61962890625, 5.9613037109375, 6.302978515625, 6.6446533203125, 6.986328125, 7.3280029296875, 7.669677734375, 8.0113525390625, 8.35302734375, 8.6947021484375, 9.036376953125, 9.3780517578125, 9.7197265625, 10.0614013671875, 10.403076171875, 10.7447509765625, 11.08642578125, 11.4281005859375, 11.769775390625, 12.1114501953125, 12.453125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 4.0, 7.0, 10.0, 15.0, 17.0, 24.0, 38.0, 35.0, 58.0, 101.0, 129.0, 168.0, 286.0, 509.0, 850.0, 1675.0, 3610.0, 9543.0, 30482.0, 126131.0, 606141.0, 202810.0, 44058.0, 12770.0, 4489.0, 1931.0, 996.0, 584.0, 348.0, 223.0, 156.0, 106.0, 73.0, 46.0, 36.0, 25.0, 22.0, 11.0, 8.0, 10.0, 6.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.984375, -23.226318359375, -22.46826171875, -21.710205078125, -20.9521484375, -20.194091796875, -19.43603515625, -18.677978515625, -17.919921875, -17.161865234375, -16.40380859375, -15.645751953125, -14.8876953125, -14.129638671875, -13.37158203125, -12.613525390625, -11.85546875, -11.097412109375, -10.33935546875, -9.581298828125, -8.8232421875, -8.065185546875, -7.30712890625, -6.549072265625, -5.791015625, -5.032958984375, -4.27490234375, -3.516845703125, -2.7587890625, -2.000732421875, -1.24267578125, -0.484619140625, 0.2734375, 1.031494140625, 1.78955078125, 2.547607421875, 3.3056640625, 4.063720703125, 4.82177734375, 5.579833984375, 6.337890625, 7.095947265625, 7.85400390625, 8.612060546875, 9.3701171875, 10.128173828125, 10.88623046875, 11.644287109375, 12.40234375, 13.160400390625, 13.91845703125, 14.676513671875, 15.4345703125, 16.192626953125, 16.95068359375, 17.708740234375, 18.466796875, 19.224853515625, 19.98291015625, 20.740966796875, 21.4990234375, 22.257080078125, 23.01513671875, 23.773193359375, 24.53125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 3.0, 6.0, 8.0, 7.0, 5.0, 5.0, 13.0, 11.0, 10.0, 13.0, 20.0, 22.0, 29.0, 38.0, 52.0, 60.0, 59.0, 43.0, 61.0, 45.0, 70.0, 57.0, 54.0, 43.0, 45.0, 32.0, 51.0, 36.0, 18.0, 23.0, 18.0, 5.0, 10.0, 5.0, 7.0, 4.0, 6.0, 1.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.8125, -36.65087890625, -35.4892578125, -34.32763671875, -33.166015625, -32.00439453125, -30.8427734375, -29.68115234375, -28.51953125, -27.35791015625, -26.1962890625, -25.03466796875, -23.873046875, -22.71142578125, -21.5498046875, -20.38818359375, -19.2265625, -18.06494140625, -16.9033203125, -15.74169921875, -14.580078125, -13.41845703125, -12.2568359375, -11.09521484375, -9.93359375, -8.77197265625, -7.6103515625, -6.44873046875, -5.287109375, -4.12548828125, -2.9638671875, -1.80224609375, -0.640625, 0.52099609375, 1.6826171875, 2.84423828125, 4.005859375, 5.16748046875, 6.3291015625, 7.49072265625, 8.65234375, 9.81396484375, 10.9755859375, 12.13720703125, 13.298828125, 14.46044921875, 15.6220703125, 16.78369140625, 17.9453125, 19.10693359375, 20.2685546875, 21.43017578125, 22.591796875, 23.75341796875, 24.9150390625, 26.07666015625, 27.23828125, 28.39990234375, 29.5615234375, 30.72314453125, 31.884765625, 33.04638671875, 34.2080078125, 35.36962890625, 36.53125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 7.0, 11.0, 7.0, 12.0, 20.0, 25.0, 43.0, 107.0, 325.0, 1028.0, 7801.0, 287122.0, 735056.0, 14669.0, 1614.0, 416.0, 138.0, 69.0, 31.0, 18.0, 9.0, 10.0, 6.0, 2.0, 3.0, 0.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.1875, -20.459716796875, -19.73193359375, -19.004150390625, -18.2763671875, -17.548583984375, -16.82080078125, -16.093017578125, -15.365234375, -14.637451171875, -13.90966796875, -13.181884765625, -12.4541015625, -11.726318359375, -10.99853515625, -10.270751953125, -9.54296875, -8.815185546875, -8.08740234375, -7.359619140625, -6.6318359375, -5.904052734375, -5.17626953125, -4.448486328125, -3.720703125, -2.992919921875, -2.26513671875, -1.537353515625, -0.8095703125, -0.081787109375, 0.64599609375, 1.373779296875, 2.1015625, 2.829345703125, 3.55712890625, 4.284912109375, 5.0126953125, 5.740478515625, 6.46826171875, 7.196044921875, 7.923828125, 8.651611328125, 9.37939453125, 10.107177734375, 10.8349609375, 11.562744140625, 12.29052734375, 13.018310546875, 13.74609375, 14.473876953125, 15.20166015625, 15.929443359375, 16.6572265625, 17.385009765625, 18.11279296875, 18.840576171875, 19.568359375, 20.296142578125, 21.02392578125, 21.751708984375, 22.4794921875, 23.207275390625, 23.93505859375, 24.662841796875, 25.390625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 6.0, 3.0, 2.0, 4.0, 8.0, 8.0, 6.0, 9.0, 18.0, 18.0, 25.0, 16.0, 19.0, 31.0, 38.0, 56.0, 63.0, 82.0, 82.0, 79.0, 76.0, 68.0, 46.0, 50.0, 29.0, 25.0, 24.0, 21.0, 14.0, 11.0, 16.0, 9.0, 7.0, 7.0, 8.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0017986297607421875, -0.0017469674348831177, -0.0016953051090240479, -0.001643642783164978, -0.0015919804573059082, -0.0015403181314468384, -0.0014886558055877686, -0.0014369934797286987, -0.001385331153869629, -0.001333668828010559, -0.0012820065021514893, -0.0012303441762924194, -0.0011786818504333496, -0.0011270195245742798, -0.00107535719871521, -0.0010236948728561401, -0.0009720325469970703, -0.0009203702211380005, -0.0008687078952789307, -0.0008170455694198608, -0.000765383243560791, -0.0007137209177017212, -0.0006620585918426514, -0.0006103962659835815, -0.0005587339401245117, -0.0005070716142654419, -0.00045540928840637207, -0.00040374696254730225, -0.0003520846366882324, -0.0003004223108291626, -0.0002487599849700928, -0.00019709765911102295, -0.00014543533325195312, -9.37730073928833e-05, -4.2110681533813477e-05, 9.551644325256348e-06, 6.121397018432617e-05, 0.000112876296043396, 0.00016453862190246582, 0.00021620094776153564, 0.00026786327362060547, 0.0003195255994796753, 0.0003711879253387451, 0.00042285025119781494, 0.00047451257705688477, 0.0005261749029159546, 0.0005778372287750244, 0.0006294995546340942, 0.0006811618804931641, 0.0007328242063522339, 0.0007844865322113037, 0.0008361488580703735, 0.0008878111839294434, 0.0009394735097885132, 0.000991135835647583, 0.0010427981615066528, 0.0010944604873657227, 0.0011461228132247925, 0.0011977851390838623, 0.0012494474649429321, 0.001301109790802002, 0.0013527721166610718, 0.0014044344425201416, 0.0014560967683792114, 0.0015077590942382812]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 7.0, 13.0, 20.0, 25.0, 51.0, 79.0, 133.0, 247.0, 440.0, 1042.0, 2641.0, 9569.0, 60542.0, 634637.0, 298529.0, 30936.0, 6091.0, 1897.0, 763.0, 384.0, 209.0, 109.0, 53.0, 41.0, 37.0, 17.0, 10.0, 4.0, 6.0, 2.0, 5.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.7578125, -10.384765625, -10.01171875, -9.638671875, -9.265625, -8.892578125, -8.51953125, -8.146484375, -7.7734375, -7.400390625, -7.02734375, -6.654296875, -6.28125, -5.908203125, -5.53515625, -5.162109375, -4.7890625, -4.416015625, -4.04296875, -3.669921875, -3.296875, -2.923828125, -2.55078125, -2.177734375, -1.8046875, -1.431640625, -1.05859375, -0.685546875, -0.3125, 0.060546875, 0.43359375, 0.806640625, 1.1796875, 1.552734375, 1.92578125, 2.298828125, 2.671875, 3.044921875, 3.41796875, 3.791015625, 4.1640625, 4.537109375, 4.91015625, 5.283203125, 5.65625, 6.029296875, 6.40234375, 6.775390625, 7.1484375, 7.521484375, 7.89453125, 8.267578125, 8.640625, 9.013671875, 9.38671875, 9.759765625, 10.1328125, 10.505859375, 10.87890625, 11.251953125, 11.625, 11.998046875, 12.37109375, 12.744140625, 13.1171875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 6.0, 13.0, 23.0, 31.0, 38.0, 66.0, 77.0, 95.0, 106.0, 139.0, 103.0, 87.0, 60.0, 39.0, 31.0, 17.0, 22.0, 12.0, 14.0, 7.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3359375, -7.959716796875, -7.58349609375, -7.207275390625, -6.8310546875, -6.454833984375, -6.07861328125, -5.702392578125, -5.326171875, -4.949951171875, -4.57373046875, -4.197509765625, -3.8212890625, -3.445068359375, -3.06884765625, -2.692626953125, -2.31640625, -1.940185546875, -1.56396484375, -1.187744140625, -0.8115234375, -0.435302734375, -0.05908203125, 0.317138671875, 0.693359375, 1.069580078125, 1.44580078125, 1.822021484375, 2.1982421875, 2.574462890625, 2.95068359375, 3.326904296875, 3.703125, 4.079345703125, 4.45556640625, 4.831787109375, 5.2080078125, 5.584228515625, 5.96044921875, 6.336669921875, 6.712890625, 7.089111328125, 7.46533203125, 7.841552734375, 8.2177734375, 8.593994140625, 8.97021484375, 9.346435546875, 9.72265625, 10.098876953125, 10.47509765625, 10.851318359375, 11.2275390625, 11.603759765625, 11.97998046875, 12.356201171875, 12.732421875, 13.108642578125, 13.48486328125, 13.861083984375, 14.2373046875, 14.613525390625, 14.98974609375, 15.365966796875, 15.7421875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 4.0, 9.0, 30.0, 78.0, 149.0, 309.0, 214.0, 118.0, 53.0, 22.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-381.7818908691406, -371.64874267578125, -361.515625, -351.38250732421875, -341.2493591308594, -331.1162109375, -320.98309326171875, -310.8499755859375, -300.7168273925781, -290.58367919921875, -280.4505615234375, -270.31744384765625, -260.1842956542969, -250.05116271972656, -239.91802978515625, -229.78489685058594, -219.65176391601562, -209.5186309814453, -199.385498046875, -189.2523651123047, -179.11923217773438, -168.98609924316406, -158.85296630859375, -148.71983337402344, -138.58670043945312, -128.4535675048828, -118.3204345703125, -108.18730163574219, -98.05416870117188, -87.92103576660156, -77.78790283203125, -67.65476989746094, -57.52166748046875, -47.38853454589844, -37.255401611328125, -27.122268676757812, -16.9891357421875, -6.8560028076171875, 3.277130126953125, 13.410263061523438, 23.54339599609375, 33.67652893066406, 43.809661865234375, 53.94279479980469, 64.075927734375, 74.20906066894531, 84.34219360351562, 94.47532653808594, 104.60845947265625, 114.74159240722656, 124.87472534179688, 135.0078582763672, 145.1409912109375, 155.2741241455078, 165.40725708007812, 175.54039001464844, 185.67352294921875, 195.80665588378906, 205.93978881835938, 216.0729217529297, 226.2060546875, 236.3391876220703, 246.47232055664062, 256.60546875, 266.73858642578125]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 1.0, 5.0, 5.0, 11.0, 8.0, 15.0, 21.0, 29.0, 32.0, 30.0, 30.0, 28.0, 38.0, 49.0, 57.0, 60.0, 67.0, 69.0, 60.0, 62.0, 49.0, 41.0, 43.0, 40.0, 31.0, 24.0, 28.0, 21.0, 11.0, 10.0, 6.0, 2.0, 5.0, 3.0, 2.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-198.1376495361328, -192.92897033691406, -187.7202911376953, -182.51161193847656, -177.3029327392578, -172.09425354003906, -166.8855743408203, -161.67689514160156, -156.4682159423828, -151.25953674316406, -146.0508575439453, -140.84217834472656, -135.6334991455078, -130.42481994628906, -125.21614074707031, -120.00746154785156, -114.79878234863281, -109.59010314941406, -104.38142395019531, -99.17274475097656, -93.96406555175781, -88.75538635253906, -83.54670715332031, -78.33802795410156, -73.12934875488281, -67.92066955566406, -62.71199035644531, -57.50331115722656, -52.29463195800781, -47.08595275878906, -41.87727355957031, -36.66859436035156, -31.45989990234375, -26.251220703125, -21.04254150390625, -15.8338623046875, -10.62518310546875, -5.41650390625, -0.20782470703125, 5.0008544921875, 10.20953369140625, 15.418212890625, 20.62689208984375, 25.8355712890625, 31.04425048828125, 36.2529296875, 41.46160888671875, 46.6702880859375, 51.87896728515625, 57.087646484375, 62.29632568359375, 67.5050048828125, 72.71368408203125, 77.92236328125, 83.13104248046875, 88.3397216796875, 93.54840087890625, 98.757080078125, 103.96575927734375, 109.1744384765625, 114.38311767578125, 119.591796875, 124.80047607421875, 130.0091552734375, 135.21783447265625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 5.0, 6.0, 11.0, 8.0, 18.0, 23.0, 23.0, 46.0, 89.0, 119.0, 235.0, 517.0, 972.0, 2392.0, 6096.0, 17196.0, 59320.0, 286144.0, 2010203.0, 1526092.0, 213865.0, 47577.0, 14299.0, 5121.0, 2048.0, 929.0, 425.0, 203.0, 126.0, 59.0, 46.0, 13.0, 20.0, 13.0, 5.0, 6.0, 1.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0], "bins": [-15.34375, -14.949462890625, -14.55517578125, -14.160888671875, -13.7666015625, -13.372314453125, -12.97802734375, -12.583740234375, -12.189453125, -11.795166015625, -11.40087890625, -11.006591796875, -10.6123046875, -10.218017578125, -9.82373046875, -9.429443359375, -9.03515625, -8.640869140625, -8.24658203125, -7.852294921875, -7.4580078125, -7.063720703125, -6.66943359375, -6.275146484375, -5.880859375, -5.486572265625, -5.09228515625, -4.697998046875, -4.3037109375, -3.909423828125, -3.51513671875, -3.120849609375, -2.7265625, -2.332275390625, -1.93798828125, -1.543701171875, -1.1494140625, -0.755126953125, -0.36083984375, 0.033447265625, 0.427734375, 0.822021484375, 1.21630859375, 1.610595703125, 2.0048828125, 2.399169921875, 2.79345703125, 3.187744140625, 3.58203125, 3.976318359375, 4.37060546875, 4.764892578125, 5.1591796875, 5.553466796875, 5.94775390625, 6.342041015625, 6.736328125, 7.130615234375, 7.52490234375, 7.919189453125, 8.3134765625, 8.707763671875, 9.10205078125, 9.496337890625, 9.890625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 9.0, 5.0, 15.0, 21.0, 29.0, 34.0, 46.0, 59.0, 80.0, 113.0, 107.0, 91.0, 85.0, 71.0, 71.0, 53.0, 39.0, 34.0, 18.0, 12.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.734375, -18.2535400390625, -17.772705078125, -17.2918701171875, -16.81103515625, -16.3302001953125, -15.849365234375, -15.3685302734375, -14.8876953125, -14.4068603515625, -13.926025390625, -13.4451904296875, -12.96435546875, -12.4835205078125, -12.002685546875, -11.5218505859375, -11.041015625, -10.5601806640625, -10.079345703125, -9.5985107421875, -9.11767578125, -8.6368408203125, -8.156005859375, -7.6751708984375, -7.1943359375, -6.7135009765625, -6.232666015625, -5.7518310546875, -5.27099609375, -4.7901611328125, -4.309326171875, -3.8284912109375, -3.34765625, -2.8668212890625, -2.385986328125, -1.9051513671875, -1.42431640625, -0.9434814453125, -0.462646484375, 0.0181884765625, 0.4990234375, 0.9798583984375, 1.460693359375, 1.9415283203125, 2.42236328125, 2.9031982421875, 3.384033203125, 3.8648681640625, 4.345703125, 4.8265380859375, 5.307373046875, 5.7882080078125, 6.26904296875, 6.7498779296875, 7.230712890625, 7.7115478515625, 8.1923828125, 8.6732177734375, 9.154052734375, 9.6348876953125, 10.11572265625, 10.5965576171875, 11.077392578125, 11.5582275390625, 12.0390625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 8.0, 1.0, 6.0, 8.0, 22.0, 23.0, 14.0, 34.0, 63.0, 79.0, 106.0, 196.0, 352.0, 630.0, 1044.0, 2184.0, 4654.0, 10877.0, 28988.0, 93930.0, 455404.0, 2632134.0, 770028.0, 134387.0, 36985.0, 12671.0, 5001.0, 2147.0, 1004.0, 497.0, 298.0, 181.0, 110.0, 70.0, 52.0, 27.0, 17.0, 20.0, 8.0, 7.0, 8.0, 5.0, 0.0, 7.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-15.7890625, -15.35791015625, -14.9267578125, -14.49560546875, -14.064453125, -13.63330078125, -13.2021484375, -12.77099609375, -12.33984375, -11.90869140625, -11.4775390625, -11.04638671875, -10.615234375, -10.18408203125, -9.7529296875, -9.32177734375, -8.890625, -8.45947265625, -8.0283203125, -7.59716796875, -7.166015625, -6.73486328125, -6.3037109375, -5.87255859375, -5.44140625, -5.01025390625, -4.5791015625, -4.14794921875, -3.716796875, -3.28564453125, -2.8544921875, -2.42333984375, -1.9921875, -1.56103515625, -1.1298828125, -0.69873046875, -0.267578125, 0.16357421875, 0.5947265625, 1.02587890625, 1.45703125, 1.88818359375, 2.3193359375, 2.75048828125, 3.181640625, 3.61279296875, 4.0439453125, 4.47509765625, 4.90625, 5.33740234375, 5.7685546875, 6.19970703125, 6.630859375, 7.06201171875, 7.4931640625, 7.92431640625, 8.35546875, 8.78662109375, 9.2177734375, 9.64892578125, 10.080078125, 10.51123046875, 10.9423828125, 11.37353515625, 11.8046875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 7.0, 5.0, 13.0, 19.0, 31.0, 25.0, 23.0, 36.0, 40.0, 61.0, 65.0, 114.0, 156.0, 258.0, 377.0, 502.0, 565.0, 488.0, 370.0, 264.0, 179.0, 108.0, 85.0, 65.0, 52.0, 42.0, 20.0, 25.0, 14.0, 13.0, 10.0, 5.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 3.0], "bins": [-20.359375, -19.8297119140625, -19.300048828125, -18.7703857421875, -18.24072265625, -17.7110595703125, -17.181396484375, -16.6517333984375, -16.1220703125, -15.5924072265625, -15.062744140625, -14.5330810546875, -14.00341796875, -13.4737548828125, -12.944091796875, -12.4144287109375, -11.884765625, -11.3551025390625, -10.825439453125, -10.2957763671875, -9.76611328125, -9.2364501953125, -8.706787109375, -8.1771240234375, -7.6474609375, -7.1177978515625, -6.588134765625, -6.0584716796875, -5.52880859375, -4.9991455078125, -4.469482421875, -3.9398193359375, -3.41015625, -2.8804931640625, -2.350830078125, -1.8211669921875, -1.29150390625, -0.7618408203125, -0.232177734375, 0.2974853515625, 0.8271484375, 1.3568115234375, 1.886474609375, 2.4161376953125, 2.94580078125, 3.4754638671875, 4.005126953125, 4.5347900390625, 5.064453125, 5.5941162109375, 6.123779296875, 6.6534423828125, 7.18310546875, 7.7127685546875, 8.242431640625, 8.7720947265625, 9.3017578125, 9.8314208984375, 10.361083984375, 10.8907470703125, 11.42041015625, 11.9500732421875, 12.479736328125, 13.0093994140625, 13.5390625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 6.0, 7.0, 14.0, 20.0, 67.0, 149.0, 299.0, 247.0, 124.0, 43.0, 16.0, 5.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-235.4140625, -224.6109619140625, -213.807861328125, -203.0047607421875, -192.20166015625, -181.3985595703125, -170.59544372558594, -159.79234313964844, -148.98924255371094, -138.18614196777344, -127.38304138183594, -116.5799331665039, -105.7768325805664, -94.9737319946289, -84.17062377929688, -73.36752319335938, -62.564422607421875, -51.761322021484375, -40.95821762084961, -30.155113220214844, -19.352012634277344, -8.548912048339844, 2.2541961669921875, 13.057296752929688, 23.860397338867188, 34.66349792480469, 45.46660232543945, 56.26970672607422, 67.07280731201172, 77.87590789794922, 88.67901611328125, 99.48211669921875, 110.28518676757812, 121.08828735351562, 131.89138793945312, 142.69448852539062, 153.49758911132812, 164.30068969726562, 175.1038055419922, 185.9069061279297, 196.7100067138672, 207.5131072998047, 218.3162078857422, 229.11932373046875, 239.92242431640625, 250.72552490234375, 261.52862548828125, 272.33172607421875, 283.13482666015625, 293.93792724609375, 304.74102783203125, 315.54412841796875, 326.34722900390625, 337.15032958984375, 347.95343017578125, 358.75653076171875, 369.55963134765625, 380.36273193359375, 391.16583251953125, 401.96893310546875, 412.77203369140625, 423.57513427734375, 434.37823486328125, 445.18133544921875, 455.9844665527344]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 9.0, 6.0, 10.0, 19.0, 10.0, 26.0, 21.0, 32.0, 48.0, 50.0, 54.0, 67.0, 61.0, 75.0, 53.0, 87.0, 56.0, 55.0, 50.0, 52.0, 31.0, 21.0, 25.0, 33.0, 21.0, 11.0, 9.0, 9.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.06410217285156, -92.57223510742188, -88.08036041259766, -83.58848571777344, -79.09661865234375, -74.60475158691406, -70.11287689208984, -65.62100219726562, -61.12913513183594, -56.637264251708984, -52.14539337158203, -47.65352249145508, -43.161651611328125, -38.66978073120117, -34.17790985107422, -29.686038970947266, -25.194168090820312, -20.70229721069336, -16.210426330566406, -11.718555450439453, -7.2266845703125, -2.734813690185547, 1.7570571899414062, 6.248928070068359, 10.740798950195312, 15.232669830322266, 19.72454071044922, 24.216411590576172, 28.708282470703125, 33.20015335083008, 37.69202423095703, 42.183895111083984, 46.67578125, 51.16765213012695, 55.659523010253906, 60.15139389038086, 64.64326477050781, 69.1351318359375, 73.62700653076172, 78.11888122558594, 82.61074829101562, 87.10261535644531, 91.59449005126953, 96.08636474609375, 100.57823181152344, 105.07009887695312, 109.56197357177734, 114.05384826660156, 118.54571533203125, 123.03758239746094, 127.52945709228516, 132.02133178710938, 136.51319885253906, 141.00506591796875, 145.4969482421875, 149.9888153076172, 154.48068237304688, 158.97254943847656, 163.46441650390625, 167.956298828125, 172.4481658935547, 176.94003295898438, 181.43191528320312, 185.9237823486328, 190.4156494140625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 5.0, 2.0, 9.0, 7.0, 24.0, 15.0, 27.0, 32.0, 60.0, 61.0, 101.0, 157.0, 216.0, 373.0, 584.0, 942.0, 1725.0, 3162.0, 5898.0, 11932.0, 25070.0, 51958.0, 107479.0, 224456.0, 299694.0, 162129.0, 77564.0, 37724.0, 18106.0, 8868.0, 4389.0, 2356.0, 1294.0, 803.0, 432.0, 316.0, 201.0, 131.0, 72.0, 48.0, 47.0, 23.0, 17.0, 22.0, 8.0, 8.0, 4.0, 3.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0], "bins": [-14.1640625, -13.7508544921875, -13.337646484375, -12.9244384765625, -12.51123046875, -12.0980224609375, -11.684814453125, -11.2716064453125, -10.8583984375, -10.4451904296875, -10.031982421875, -9.6187744140625, -9.20556640625, -8.7923583984375, -8.379150390625, -7.9659423828125, -7.552734375, -7.1395263671875, -6.726318359375, -6.3131103515625, -5.89990234375, -5.4866943359375, -5.073486328125, -4.6602783203125, -4.2470703125, -3.8338623046875, -3.420654296875, -3.0074462890625, -2.59423828125, -2.1810302734375, -1.767822265625, -1.3546142578125, -0.94140625, -0.5281982421875, -0.114990234375, 0.2982177734375, 0.71142578125, 1.1246337890625, 1.537841796875, 1.9510498046875, 2.3642578125, 2.7774658203125, 3.190673828125, 3.6038818359375, 4.01708984375, 4.4302978515625, 4.843505859375, 5.2567138671875, 5.669921875, 6.0831298828125, 6.496337890625, 6.9095458984375, 7.32275390625, 7.7359619140625, 8.149169921875, 8.5623779296875, 8.9755859375, 9.3887939453125, 9.802001953125, 10.2152099609375, 10.62841796875, 11.0416259765625, 11.454833984375, 11.8680419921875, 12.28125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 9.0, 11.0, 16.0, 20.0, 18.0, 14.0, 49.0, 48.0, 38.0, 51.0, 68.0, 68.0, 65.0, 82.0, 65.0, 64.0, 49.0, 45.0, 36.0, 36.0, 29.0, 29.0, 20.0, 16.0, 15.0, 8.0, 8.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.4140625, -9.0787353515625, -8.743408203125, -8.4080810546875, -8.07275390625, -7.7374267578125, -7.402099609375, -7.0667724609375, -6.7314453125, -6.3961181640625, -6.060791015625, -5.7254638671875, -5.39013671875, -5.0548095703125, -4.719482421875, -4.3841552734375, -4.048828125, -3.7135009765625, -3.378173828125, -3.0428466796875, -2.70751953125, -2.3721923828125, -2.036865234375, -1.7015380859375, -1.3662109375, -1.0308837890625, -0.695556640625, -0.3602294921875, -0.02490234375, 0.3104248046875, 0.645751953125, 0.9810791015625, 1.31640625, 1.6517333984375, 1.987060546875, 2.3223876953125, 2.65771484375, 2.9930419921875, 3.328369140625, 3.6636962890625, 3.9990234375, 4.3343505859375, 4.669677734375, 5.0050048828125, 5.34033203125, 5.6756591796875, 6.010986328125, 6.3463134765625, 6.681640625, 7.0169677734375, 7.352294921875, 7.6876220703125, 8.02294921875, 8.3582763671875, 8.693603515625, 9.0289306640625, 9.3642578125, 9.6995849609375, 10.034912109375, 10.3702392578125, 10.70556640625, 11.0408935546875, 11.376220703125, 11.7115478515625, 12.046875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 8.0, 16.0, 9.0, 16.0, 20.0, 34.0, 61.0, 62.0, 102.0, 178.0, 253.0, 377.0, 629.0, 1044.0, 1921.0, 4267.0, 15119.0, 112119.0, 757066.0, 129376.0, 16702.0, 4307.0, 1935.0, 1094.0, 657.0, 410.0, 257.0, 172.0, 121.0, 61.0, 47.0, 29.0, 19.0, 18.0, 7.0, 12.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-38.0, -36.86669921875, -35.7333984375, -34.60009765625, -33.466796875, -32.33349609375, -31.2001953125, -30.06689453125, -28.93359375, -27.80029296875, -26.6669921875, -25.53369140625, -24.400390625, -23.26708984375, -22.1337890625, -21.00048828125, -19.8671875, -18.73388671875, -17.6005859375, -16.46728515625, -15.333984375, -14.20068359375, -13.0673828125, -11.93408203125, -10.80078125, -9.66748046875, -8.5341796875, -7.40087890625, -6.267578125, -5.13427734375, -4.0009765625, -2.86767578125, -1.734375, -0.60107421875, 0.5322265625, 1.66552734375, 2.798828125, 3.93212890625, 5.0654296875, 6.19873046875, 7.33203125, 8.46533203125, 9.5986328125, 10.73193359375, 11.865234375, 12.99853515625, 14.1318359375, 15.26513671875, 16.3984375, 17.53173828125, 18.6650390625, 19.79833984375, 20.931640625, 22.06494140625, 23.1982421875, 24.33154296875, 25.46484375, 26.59814453125, 27.7314453125, 28.86474609375, 29.998046875, 31.13134765625, 32.2646484375, 33.39794921875, 34.53125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 12.0, 10.0, 12.0, 12.0, 10.0, 11.0, 22.0, 20.0, 37.0, 30.0, 37.0, 47.0, 40.0, 54.0, 50.0, 56.0, 49.0, 49.0, 48.0, 42.0, 37.0, 30.0, 41.0, 32.0, 43.0, 22.0, 23.0, 23.0, 28.0, 16.0, 10.0, 10.0, 10.0, 5.0, 6.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.75, -33.69677734375, -32.6435546875, -31.59033203125, -30.537109375, -29.48388671875, -28.4306640625, -27.37744140625, -26.32421875, -25.27099609375, -24.2177734375, -23.16455078125, -22.111328125, -21.05810546875, -20.0048828125, -18.95166015625, -17.8984375, -16.84521484375, -15.7919921875, -14.73876953125, -13.685546875, -12.63232421875, -11.5791015625, -10.52587890625, -9.47265625, -8.41943359375, -7.3662109375, -6.31298828125, -5.259765625, -4.20654296875, -3.1533203125, -2.10009765625, -1.046875, 0.00634765625, 1.0595703125, 2.11279296875, 3.166015625, 4.21923828125, 5.2724609375, 6.32568359375, 7.37890625, 8.43212890625, 9.4853515625, 10.53857421875, 11.591796875, 12.64501953125, 13.6982421875, 14.75146484375, 15.8046875, 16.85791015625, 17.9111328125, 18.96435546875, 20.017578125, 21.07080078125, 22.1240234375, 23.17724609375, 24.23046875, 25.28369140625, 26.3369140625, 27.39013671875, 28.443359375, 29.49658203125, 30.5498046875, 31.60302734375, 32.65625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 10.0, 15.0, 12.0, 22.0, 48.0, 85.0, 138.0, 383.0, 1035.0, 6214.0, 105058.0, 875517.0, 54526.0, 4073.0, 795.0, 290.0, 132.0, 89.0, 55.0, 19.0, 13.0, 10.0, 2.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6328125, -14.1175537109375, -13.602294921875, -13.0870361328125, -12.57177734375, -12.0565185546875, -11.541259765625, -11.0260009765625, -10.5107421875, -9.9954833984375, -9.480224609375, -8.9649658203125, -8.44970703125, -7.9344482421875, -7.419189453125, -6.9039306640625, -6.388671875, -5.8734130859375, -5.358154296875, -4.8428955078125, -4.32763671875, -3.8123779296875, -3.297119140625, -2.7818603515625, -2.2666015625, -1.7513427734375, -1.236083984375, -0.7208251953125, -0.20556640625, 0.3096923828125, 0.824951171875, 1.3402099609375, 1.85546875, 2.3707275390625, 2.885986328125, 3.4012451171875, 3.91650390625, 4.4317626953125, 4.947021484375, 5.4622802734375, 5.9775390625, 6.4927978515625, 7.008056640625, 7.5233154296875, 8.03857421875, 8.5538330078125, 9.069091796875, 9.5843505859375, 10.099609375, 10.6148681640625, 11.130126953125, 11.6453857421875, 12.16064453125, 12.6759033203125, 13.191162109375, 13.7064208984375, 14.2216796875, 14.7369384765625, 15.252197265625, 15.7674560546875, 16.28271484375, 16.7979736328125, 17.313232421875, 17.8284912109375, 18.34375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 1.0, 4.0, 11.0, 8.0, 10.0, 13.0, 14.0, 19.0, 21.0, 18.0, 19.0, 24.0, 20.0, 35.0, 28.0, 51.0, 78.0, 84.0, 110.0, 99.0, 54.0, 41.0, 25.0, 28.0, 25.0, 24.0, 19.0, 14.0, 13.0, 11.0, 12.0, 9.0, 8.0, 10.0, 4.0, 6.0, 7.0, 4.0, 6.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0], "bins": [-0.0017766952514648438, -0.0017218589782714844, -0.001667022705078125, -0.0016121864318847656, -0.0015573501586914062, -0.0015025138854980469, -0.0014476776123046875, -0.0013928413391113281, -0.0013380050659179688, -0.0012831687927246094, -0.00122833251953125, -0.0011734962463378906, -0.0011186599731445312, -0.0010638236999511719, -0.0010089874267578125, -0.0009541511535644531, -0.0008993148803710938, -0.0008444786071777344, -0.000789642333984375, -0.0007348060607910156, -0.0006799697875976562, -0.0006251335144042969, -0.0005702972412109375, -0.0005154609680175781, -0.00046062469482421875, -0.0004057884216308594, -0.0003509521484375, -0.0002961158752441406, -0.00024127960205078125, -0.00018644332885742188, -0.0001316070556640625, -7.677078247070312e-05, -2.193450927734375e-05, 3.2901763916015625e-05, 8.7738037109375e-05, 0.00014257431030273438, 0.00019741058349609375, 0.0002522468566894531, 0.0003070831298828125, 0.0003619194030761719, 0.00041675567626953125, 0.0004715919494628906, 0.00052642822265625, 0.0005812644958496094, 0.0006361007690429688, 0.0006909370422363281, 0.0007457733154296875, 0.0008006095886230469, 0.0008554458618164062, 0.0009102821350097656, 0.000965118408203125, 0.0010199546813964844, 0.0010747909545898438, 0.0011296272277832031, 0.0011844635009765625, 0.0012392997741699219, 0.0012941360473632812, 0.0013489723205566406, 0.00140380859375, 0.0014586448669433594, 0.0015134811401367188, 0.0015683174133300781, 0.0016231536865234375, 0.0016779899597167969, 0.0017328262329101562]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 7.0, 11.0, 28.0, 61.0, 84.0, 168.0, 426.0, 959.0, 2873.0, 13586.0, 212112.0, 774183.0, 36348.0, 5124.0, 1485.0, 568.0, 236.0, 141.0, 66.0, 30.0, 17.0, 16.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.9765625, -14.55126953125, -14.1259765625, -13.70068359375, -13.275390625, -12.85009765625, -12.4248046875, -11.99951171875, -11.57421875, -11.14892578125, -10.7236328125, -10.29833984375, -9.873046875, -9.44775390625, -9.0224609375, -8.59716796875, -8.171875, -7.74658203125, -7.3212890625, -6.89599609375, -6.470703125, -6.04541015625, -5.6201171875, -5.19482421875, -4.76953125, -4.34423828125, -3.9189453125, -3.49365234375, -3.068359375, -2.64306640625, -2.2177734375, -1.79248046875, -1.3671875, -0.94189453125, -0.5166015625, -0.09130859375, 0.333984375, 0.75927734375, 1.1845703125, 1.60986328125, 2.03515625, 2.46044921875, 2.8857421875, 3.31103515625, 3.736328125, 4.16162109375, 4.5869140625, 5.01220703125, 5.4375, 5.86279296875, 6.2880859375, 6.71337890625, 7.138671875, 7.56396484375, 7.9892578125, 8.41455078125, 8.83984375, 9.26513671875, 9.6904296875, 10.11572265625, 10.541015625, 10.96630859375, 11.3916015625, 11.81689453125, 12.2421875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 3.0, 2.0, 7.0, 9.0, 16.0, 16.0, 11.0, 23.0, 18.0, 42.0, 41.0, 48.0, 54.0, 71.0, 71.0, 84.0, 84.0, 63.0, 68.0, 45.0, 50.0, 33.0, 34.0, 25.0, 25.0, 15.0, 15.0, 6.0, 3.0, 4.0, 8.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7109375, -6.48797607421875, -6.2650146484375, -6.04205322265625, -5.819091796875, -5.59613037109375, -5.3731689453125, -5.15020751953125, -4.92724609375, -4.70428466796875, -4.4813232421875, -4.25836181640625, -4.035400390625, -3.81243896484375, -3.5894775390625, -3.36651611328125, -3.1435546875, -2.92059326171875, -2.6976318359375, -2.47467041015625, -2.251708984375, -2.02874755859375, -1.8057861328125, -1.58282470703125, -1.35986328125, -1.13690185546875, -0.9139404296875, -0.69097900390625, -0.468017578125, -0.24505615234375, -0.0220947265625, 0.20086669921875, 0.423828125, 0.64678955078125, 0.8697509765625, 1.09271240234375, 1.315673828125, 1.53863525390625, 1.7615966796875, 1.98455810546875, 2.20751953125, 2.43048095703125, 2.6534423828125, 2.87640380859375, 3.099365234375, 3.32232666015625, 3.5452880859375, 3.76824951171875, 3.9912109375, 4.21417236328125, 4.4371337890625, 4.66009521484375, 4.883056640625, 5.10601806640625, 5.3289794921875, 5.55194091796875, 5.77490234375, 5.99786376953125, 6.2208251953125, 6.44378662109375, 6.666748046875, 6.88970947265625, 7.1126708984375, 7.33563232421875, 7.55859375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 5.0, 7.0, 13.0, 31.0, 66.0, 102.0, 165.0, 231.0, 147.0, 76.0, 70.0, 32.0, 16.0, 10.0, 8.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-219.60125732421875, -212.82029724121094, -206.0393524169922, -199.25839233398438, -192.47744750976562, -185.6964874267578, -178.91554260253906, -172.13458251953125, -165.3536376953125, -158.5726776123047, -151.79173278808594, -145.01077270507812, -138.22982788085938, -131.44886779785156, -124.66792297363281, -117.886962890625, -111.10601043701172, -104.32505798339844, -97.54410552978516, -90.76315307617188, -83.9822006225586, -77.20124816894531, -70.4202880859375, -63.639339447021484, -56.8583869934082, -50.07743453979492, -43.29648208618164, -36.515525817871094, -29.734575271606445, -22.95362091064453, -16.17266845703125, -9.391716003417969, -2.6107635498046875, 4.170189380645752, 10.951142311096191, 17.73209571838379, 24.51304817199707, 31.294002532958984, 38.074954986572266, 44.85590744018555, 51.63685989379883, 58.41781234741211, 65.19876861572266, 71.97972106933594, 78.76067352294922, 85.5416259765625, 92.32257843017578, 99.10353088378906, 105.88448333740234, 112.66543579101562, 119.4463882446289, 126.22734069824219, 133.00830078125, 139.78924560546875, 146.57020568847656, 153.3511505126953, 160.13211059570312, 166.91307067871094, 173.6940155029297, 180.4749755859375, 187.25592041015625, 194.03688049316406, 200.8178253173828, 207.59878540039062, 214.37973022460938]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 7.0, 3.0, 9.0, 9.0, 12.0, 17.0, 24.0, 19.0, 21.0, 27.0, 28.0, 37.0, 26.0, 35.0, 37.0, 43.0, 58.0, 81.0, 76.0, 52.0, 45.0, 60.0, 42.0, 34.0, 28.0, 29.0, 26.0, 17.0, 22.0, 15.0, 11.0, 6.0, 11.0, 10.0, 3.0, 3.0, 3.0, 8.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-145.24365234375, -140.96322631835938, -136.6827850341797, -132.40235900878906, -128.12193298339844, -123.84149932861328, -119.56106567382812, -115.2806396484375, -111.00021362304688, -106.71977996826172, -102.4393539428711, -98.15892028808594, -93.87849426269531, -89.59806060791016, -85.317626953125, -81.03720092773438, -76.75676727294922, -72.47633361816406, -68.19590759277344, -63.91547393798828, -59.635047912597656, -55.3546142578125, -51.07418441772461, -46.79375457763672, -42.51332473754883, -38.23289489746094, -33.95246505737305, -29.672033309936523, -25.391603469848633, -21.111173629760742, -16.83074188232422, -12.550312042236328, -8.269882202148438, -3.9894518852233887, 0.29097843170166016, 4.571409225463867, 8.851839065551758, 13.132268905639648, 17.412700653076172, 21.693130493164062, 25.973560333251953, 30.253990173339844, 34.534420013427734, 38.814849853515625, 43.09528350830078, 47.375709533691406, 51.65614318847656, 55.93657302856445, 60.217002868652344, 64.4974365234375, 68.77786254882812, 73.05829620361328, 77.3387222290039, 81.61915588378906, 85.89958190917969, 90.18001556396484, 94.46044921875, 98.74088287353516, 103.02130889892578, 107.30174255371094, 111.58216857910156, 115.86260223388672, 120.14303588867188, 124.4234619140625, 128.70388793945312]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 4.0, 9.0, 15.0, 13.0, 17.0, 34.0, 51.0, 84.0, 107.0, 217.0, 436.0, 767.0, 1524.0, 3615.0, 8955.0, 26043.0, 92947.0, 566098.0, 2564079.0, 765033.0, 117773.0, 29447.0, 9750.0, 3832.0, 1630.0, 745.0, 428.0, 229.0, 123.0, 91.0, 60.0, 48.0, 21.0, 16.0, 7.0, 7.0, 4.0, 3.0, 7.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.921875, -9.5745849609375, -9.227294921875, -8.8800048828125, -8.53271484375, -8.1854248046875, -7.838134765625, -7.4908447265625, -7.1435546875, -6.7962646484375, -6.448974609375, -6.1016845703125, -5.75439453125, -5.4071044921875, -5.059814453125, -4.7125244140625, -4.365234375, -4.0179443359375, -3.670654296875, -3.3233642578125, -2.97607421875, -2.6287841796875, -2.281494140625, -1.9342041015625, -1.5869140625, -1.2396240234375, -0.892333984375, -0.5450439453125, -0.19775390625, 0.1495361328125, 0.496826171875, 0.8441162109375, 1.19140625, 1.5386962890625, 1.885986328125, 2.2332763671875, 2.58056640625, 2.9278564453125, 3.275146484375, 3.6224365234375, 3.9697265625, 4.3170166015625, 4.664306640625, 5.0115966796875, 5.35888671875, 5.7061767578125, 6.053466796875, 6.4007568359375, 6.748046875, 7.0953369140625, 7.442626953125, 7.7899169921875, 8.13720703125, 8.4844970703125, 8.831787109375, 9.1790771484375, 9.5263671875, 9.8736572265625, 10.220947265625, 10.5682373046875, 10.91552734375, 11.2628173828125, 11.610107421875, 11.9573974609375, 12.3046875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 2.0, 5.0, 6.0, 15.0, 14.0, 15.0, 19.0, 22.0, 27.0, 44.0, 41.0, 64.0, 49.0, 69.0, 64.0, 60.0, 62.0, 62.0, 65.0, 59.0, 49.0, 44.0, 33.0, 21.0, 24.0, 19.0, 9.0, 12.0, 10.0, 3.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.9609375, -8.6356201171875, -8.310302734375, -7.9849853515625, -7.65966796875, -7.3343505859375, -7.009033203125, -6.6837158203125, -6.3583984375, -6.0330810546875, -5.707763671875, -5.3824462890625, -5.05712890625, -4.7318115234375, -4.406494140625, -4.0811767578125, -3.755859375, -3.4305419921875, -3.105224609375, -2.7799072265625, -2.45458984375, -2.1292724609375, -1.803955078125, -1.4786376953125, -1.1533203125, -0.8280029296875, -0.502685546875, -0.1773681640625, 0.14794921875, 0.4732666015625, 0.798583984375, 1.1239013671875, 1.44921875, 1.7745361328125, 2.099853515625, 2.4251708984375, 2.75048828125, 3.0758056640625, 3.401123046875, 3.7264404296875, 4.0517578125, 4.3770751953125, 4.702392578125, 5.0277099609375, 5.35302734375, 5.6783447265625, 6.003662109375, 6.3289794921875, 6.654296875, 6.9796142578125, 7.304931640625, 7.6302490234375, 7.95556640625, 8.2808837890625, 8.606201171875, 8.9315185546875, 9.2568359375, 9.5821533203125, 9.907470703125, 10.2327880859375, 10.55810546875, 10.8834228515625, 11.208740234375, 11.5340576171875, 11.859375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 5.0, 7.0, 6.0, 10.0, 18.0, 36.0, 38.0, 58.0, 106.0, 186.0, 359.0, 742.0, 1878.0, 5512.0, 18748.0, 86441.0, 1010641.0, 2862775.0, 169224.0, 27368.0, 6617.0, 2064.0, 759.0, 343.0, 172.0, 70.0, 42.0, 22.0, 13.0, 14.0, 9.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-26.296875, -25.673583984375, -25.05029296875, -24.427001953125, -23.8037109375, -23.180419921875, -22.55712890625, -21.933837890625, -21.310546875, -20.687255859375, -20.06396484375, -19.440673828125, -18.8173828125, -18.194091796875, -17.57080078125, -16.947509765625, -16.32421875, -15.700927734375, -15.07763671875, -14.454345703125, -13.8310546875, -13.207763671875, -12.58447265625, -11.961181640625, -11.337890625, -10.714599609375, -10.09130859375, -9.468017578125, -8.8447265625, -8.221435546875, -7.59814453125, -6.974853515625, -6.3515625, -5.728271484375, -5.10498046875, -4.481689453125, -3.8583984375, -3.235107421875, -2.61181640625, -1.988525390625, -1.365234375, -0.741943359375, -0.11865234375, 0.504638671875, 1.1279296875, 1.751220703125, 2.37451171875, 2.997802734375, 3.62109375, 4.244384765625, 4.86767578125, 5.490966796875, 6.1142578125, 6.737548828125, 7.36083984375, 7.984130859375, 8.607421875, 9.230712890625, 9.85400390625, 10.477294921875, 11.1005859375, 11.723876953125, 12.34716796875, 12.970458984375, 13.59375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 3.0, 2.0, 4.0, 12.0, 6.0, 12.0, 13.0, 22.0, 20.0, 28.0, 41.0, 44.0, 65.0, 103.0, 170.0, 296.0, 513.0, 755.0, 749.0, 472.0, 311.0, 148.0, 94.0, 54.0, 35.0, 31.0, 19.0, 17.0, 14.0, 11.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.828125, -26.156494140625, -25.48486328125, -24.813232421875, -24.1416015625, -23.469970703125, -22.79833984375, -22.126708984375, -21.455078125, -20.783447265625, -20.11181640625, -19.440185546875, -18.7685546875, -18.096923828125, -17.42529296875, -16.753662109375, -16.08203125, -15.410400390625, -14.73876953125, -14.067138671875, -13.3955078125, -12.723876953125, -12.05224609375, -11.380615234375, -10.708984375, -10.037353515625, -9.36572265625, -8.694091796875, -8.0224609375, -7.350830078125, -6.67919921875, -6.007568359375, -5.3359375, -4.664306640625, -3.99267578125, -3.321044921875, -2.6494140625, -1.977783203125, -1.30615234375, -0.634521484375, 0.037109375, 0.708740234375, 1.38037109375, 2.052001953125, 2.7236328125, 3.395263671875, 4.06689453125, 4.738525390625, 5.41015625, 6.081787109375, 6.75341796875, 7.425048828125, 8.0966796875, 8.768310546875, 9.43994140625, 10.111572265625, 10.783203125, 11.454833984375, 12.12646484375, 12.798095703125, 13.4697265625, 14.141357421875, 14.81298828125, 15.484619140625, 16.15625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 7.0, 15.0, 32.0, 82.0, 195.0, 280.0, 214.0, 100.0, 36.0, 16.0, 5.0, 5.0, 3.0, 6.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-180.15786743164062, -171.47311401367188, -162.78836059570312, -154.10360717773438, -145.41885375976562, -136.73410034179688, -128.0493621826172, -119.36460876464844, -110.67985534667969, -101.99510192871094, -93.31034851074219, -84.62560272216797, -75.94084930419922, -67.25609588623047, -58.571346282958984, -49.8865966796875, -41.20184326171875, -32.51708984375, -23.832340240478516, -15.147588729858398, -6.462837219238281, 2.2219161987304688, 10.906665802001953, 19.591415405273438, 28.276168823242188, 36.96092224121094, 45.64567184448242, 54.330421447753906, 63.015174865722656, 71.6999282836914, 80.38467407226562, 89.06942749023438, 97.75421142578125, 106.43896484375, 115.12371826171875, 123.80846405029297, 132.49322509765625, 141.177978515625, 149.8627166748047, 158.54747009277344, 167.2322235107422, 175.91697692871094, 184.6017303466797, 193.28648376464844, 201.97122192382812, 210.65597534179688, 219.34072875976562, 228.02548217773438, 236.71023559570312, 245.39498901367188, 254.07974243164062, 262.7644958496094, 271.4492492675781, 280.1340026855469, 288.8187561035156, 297.50347900390625, 306.188232421875, 314.87298583984375, 323.5577392578125, 332.24249267578125, 340.92724609375, 349.61199951171875, 358.2967529296875, 366.98150634765625, 375.666259765625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 1.0, 6.0, 3.0, 5.0, 11.0, 18.0, 20.0, 24.0, 25.0, 40.0, 38.0, 35.0, 49.0, 52.0, 59.0, 45.0, 46.0, 55.0, 77.0, 45.0, 51.0, 46.0, 46.0, 38.0, 30.0, 22.0, 22.0, 23.0, 17.0, 15.0, 9.0, 9.0, 12.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.65245819091797, -122.11328125, -118.57410430908203, -115.03492736816406, -111.49575805664062, -107.95658111572266, -104.41740417480469, -100.87822723388672, -97.33905029296875, -93.79987335205078, -90.26069641113281, -86.72152709960938, -83.1823501586914, -79.64317321777344, -76.10399627685547, -72.5648193359375, -69.02565002441406, -65.4864730834961, -61.94729995727539, -58.40812301635742, -54.86894989013672, -51.32977294921875, -47.79059600830078, -44.25141906738281, -40.71224594116211, -37.17306900024414, -33.63389587402344, -30.09471893310547, -26.555543899536133, -23.016368865966797, -19.477191925048828, -15.938016891479492, -12.398834228515625, -8.859659194946289, -5.320483207702637, -1.7813072204589844, 1.7578678131103516, 5.2970428466796875, 8.836219787597656, 12.375394821166992, 15.914569854736328, 19.453744888305664, 22.992919921875, 26.53209686279297, 30.071271896362305, 33.61044692993164, 37.14962387084961, 40.68879699707031, 44.22797393798828, 47.76715087890625, 51.30632400512695, 54.84550094604492, 58.384674072265625, 61.923851013183594, 65.46302795410156, 69.00220489501953, 72.5413818359375, 76.08055877685547, 79.61973571777344, 83.15890502929688, 86.69808197021484, 90.23725891113281, 93.77643585205078, 97.31561279296875, 100.85478210449219]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 4.0, 1.0, 3.0, 8.0, 7.0, 9.0, 11.0, 26.0, 28.0, 55.0, 74.0, 86.0, 185.0, 228.0, 379.0, 556.0, 902.0, 1479.0, 2428.0, 3966.0, 6731.0, 11830.0, 21297.0, 38661.0, 74579.0, 155603.0, 282237.0, 222408.0, 106181.0, 52859.0, 28181.0, 15573.0, 8714.0, 5136.0, 3059.0, 1880.0, 1148.0, 753.0, 434.0, 267.0, 184.0, 131.0, 81.0, 63.0, 37.0, 27.0, 16.0, 17.0, 10.0, 10.0, 6.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.421875, -10.0828857421875, -9.743896484375, -9.4049072265625, -9.06591796875, -8.7269287109375, -8.387939453125, -8.0489501953125, -7.7099609375, -7.3709716796875, -7.031982421875, -6.6929931640625, -6.35400390625, -6.0150146484375, -5.676025390625, -5.3370361328125, -4.998046875, -4.6590576171875, -4.320068359375, -3.9810791015625, -3.64208984375, -3.3031005859375, -2.964111328125, -2.6251220703125, -2.2861328125, -1.9471435546875, -1.608154296875, -1.2691650390625, -0.93017578125, -0.5911865234375, -0.252197265625, 0.0867919921875, 0.42578125, 0.7647705078125, 1.103759765625, 1.4427490234375, 1.78173828125, 2.1207275390625, 2.459716796875, 2.7987060546875, 3.1376953125, 3.4766845703125, 3.815673828125, 4.1546630859375, 4.49365234375, 4.8326416015625, 5.171630859375, 5.5106201171875, 5.849609375, 6.1885986328125, 6.527587890625, 6.8665771484375, 7.20556640625, 7.5445556640625, 7.883544921875, 8.2225341796875, 8.5615234375, 8.9005126953125, 9.239501953125, 9.5784912109375, 9.91748046875, 10.2564697265625, 10.595458984375, 10.9344482421875, 11.2734375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 11.0, 13.0, 7.0, 10.0, 18.0, 15.0, 28.0, 26.0, 37.0, 47.0, 46.0, 51.0, 47.0, 57.0, 59.0, 58.0, 56.0, 58.0, 39.0, 60.0, 44.0, 41.0, 37.0, 32.0, 21.0, 22.0, 10.0, 13.0, 13.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.171875, -8.86767578125, -8.5634765625, -8.25927734375, -7.955078125, -7.65087890625, -7.3466796875, -7.04248046875, -6.73828125, -6.43408203125, -6.1298828125, -5.82568359375, -5.521484375, -5.21728515625, -4.9130859375, -4.60888671875, -4.3046875, -4.00048828125, -3.6962890625, -3.39208984375, -3.087890625, -2.78369140625, -2.4794921875, -2.17529296875, -1.87109375, -1.56689453125, -1.2626953125, -0.95849609375, -0.654296875, -0.35009765625, -0.0458984375, 0.25830078125, 0.5625, 0.86669921875, 1.1708984375, 1.47509765625, 1.779296875, 2.08349609375, 2.3876953125, 2.69189453125, 2.99609375, 3.30029296875, 3.6044921875, 3.90869140625, 4.212890625, 4.51708984375, 4.8212890625, 5.12548828125, 5.4296875, 5.73388671875, 6.0380859375, 6.34228515625, 6.646484375, 6.95068359375, 7.2548828125, 7.55908203125, 7.86328125, 8.16748046875, 8.4716796875, 8.77587890625, 9.080078125, 9.38427734375, 9.6884765625, 9.99267578125, 10.296875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 6.0, 3.0, 16.0, 16.0, 23.0, 45.0, 52.0, 70.0, 106.0, 163.0, 236.0, 339.0, 619.0, 1016.0, 1801.0, 4431.0, 16592.0, 110744.0, 769012.0, 116949.0, 17181.0, 4565.0, 1786.0, 1015.0, 591.0, 372.0, 261.0, 176.0, 98.0, 93.0, 47.0, 41.0, 28.0, 20.0, 15.0, 8.0, 7.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-41.125, -40.05712890625, -38.9892578125, -37.92138671875, -36.853515625, -35.78564453125, -34.7177734375, -33.64990234375, -32.58203125, -31.51416015625, -30.4462890625, -29.37841796875, -28.310546875, -27.24267578125, -26.1748046875, -25.10693359375, -24.0390625, -22.97119140625, -21.9033203125, -20.83544921875, -19.767578125, -18.69970703125, -17.6318359375, -16.56396484375, -15.49609375, -14.42822265625, -13.3603515625, -12.29248046875, -11.224609375, -10.15673828125, -9.0888671875, -8.02099609375, -6.953125, -5.88525390625, -4.8173828125, -3.74951171875, -2.681640625, -1.61376953125, -0.5458984375, 0.52197265625, 1.58984375, 2.65771484375, 3.7255859375, 4.79345703125, 5.861328125, 6.92919921875, 7.9970703125, 9.06494140625, 10.1328125, 11.20068359375, 12.2685546875, 13.33642578125, 14.404296875, 15.47216796875, 16.5400390625, 17.60791015625, 18.67578125, 19.74365234375, 20.8115234375, 21.87939453125, 22.947265625, 24.01513671875, 25.0830078125, 26.15087890625, 27.21875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 13.0, 16.0, 16.0, 19.0, 29.0, 27.0, 28.0, 32.0, 40.0, 44.0, 52.0, 50.0, 58.0, 63.0, 58.0, 57.0, 50.0, 50.0, 41.0, 44.0, 30.0, 25.0, 27.0, 23.0, 20.0, 11.0, 15.0, 13.0, 6.0, 8.0, 0.0, 3.0, 3.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.734375, -29.636474609375, -28.53857421875, -27.440673828125, -26.3427734375, -25.244873046875, -24.14697265625, -23.049072265625, -21.951171875, -20.853271484375, -19.75537109375, -18.657470703125, -17.5595703125, -16.461669921875, -15.36376953125, -14.265869140625, -13.16796875, -12.070068359375, -10.97216796875, -9.874267578125, -8.7763671875, -7.678466796875, -6.58056640625, -5.482666015625, -4.384765625, -3.286865234375, -2.18896484375, -1.091064453125, 0.0068359375, 1.104736328125, 2.20263671875, 3.300537109375, 4.3984375, 5.496337890625, 6.59423828125, 7.692138671875, 8.7900390625, 9.887939453125, 10.98583984375, 12.083740234375, 13.181640625, 14.279541015625, 15.37744140625, 16.475341796875, 17.5732421875, 18.671142578125, 19.76904296875, 20.866943359375, 21.96484375, 23.062744140625, 24.16064453125, 25.258544921875, 26.3564453125, 27.454345703125, 28.55224609375, 29.650146484375, 30.748046875, 31.845947265625, 32.94384765625, 34.041748046875, 35.1396484375, 36.237548828125, 37.33544921875, 38.433349609375, 39.53125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 6.0, 7.0, 6.0, 11.0, 29.0, 42.0, 91.0, 162.0, 486.0, 2137.0, 33712.0, 945882.0, 62081.0, 2959.0, 571.0, 193.0, 79.0, 47.0, 23.0, 17.0, 7.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.9375, -17.3310546875, -16.724609375, -16.1181640625, -15.51171875, -14.9052734375, -14.298828125, -13.6923828125, -13.0859375, -12.4794921875, -11.873046875, -11.2666015625, -10.66015625, -10.0537109375, -9.447265625, -8.8408203125, -8.234375, -7.6279296875, -7.021484375, -6.4150390625, -5.80859375, -5.2021484375, -4.595703125, -3.9892578125, -3.3828125, -2.7763671875, -2.169921875, -1.5634765625, -0.95703125, -0.3505859375, 0.255859375, 0.8623046875, 1.46875, 2.0751953125, 2.681640625, 3.2880859375, 3.89453125, 4.5009765625, 5.107421875, 5.7138671875, 6.3203125, 6.9267578125, 7.533203125, 8.1396484375, 8.74609375, 9.3525390625, 9.958984375, 10.5654296875, 11.171875, 11.7783203125, 12.384765625, 12.9912109375, 13.59765625, 14.2041015625, 14.810546875, 15.4169921875, 16.0234375, 16.6298828125, 17.236328125, 17.8427734375, 18.44921875, 19.0556640625, 19.662109375, 20.2685546875, 20.875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 7.0, 1.0, 10.0, 6.0, 12.0, 15.0, 17.0, 15.0, 21.0, 22.0, 34.0, 49.0, 46.0, 80.0, 87.0, 96.0, 82.0, 85.0, 57.0, 54.0, 34.0, 29.0, 19.0, 21.0, 13.0, 15.0, 13.0, 12.0, 10.0, 10.0, 4.0, 8.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016641616821289062, -0.0016119331121444702, -0.0015597045421600342, -0.0015074759721755981, -0.0014552474021911621, -0.001403018832206726, -0.00135079026222229, -0.001298561692237854, -0.001246333122253418, -0.001194104552268982, -0.001141875982284546, -0.0010896474123001099, -0.0010374188423156738, -0.0009851902723312378, -0.0009329617023468018, -0.0008807331323623657, -0.0008285045623779297, -0.0007762759923934937, -0.0007240474224090576, -0.0006718188524246216, -0.0006195902824401855, -0.0005673617124557495, -0.0005151331424713135, -0.00046290457248687744, -0.0004106760025024414, -0.00035844743251800537, -0.00030621886253356934, -0.0002539902925491333, -0.00020176172256469727, -0.00014953315258026123, -9.73045825958252e-05, -4.507601261138916e-05, 7.152557373046875e-06, 5.938112735748291e-05, 0.00011160969734191895, 0.00016383826732635498, 0.00021606683731079102, 0.00026829540729522705, 0.0003205239772796631, 0.0003727525472640991, 0.00042498111724853516, 0.0004772096872329712, 0.0005294382572174072, 0.0005816668272018433, 0.0006338953971862793, 0.0006861239671707153, 0.0007383525371551514, 0.0007905811071395874, 0.0008428096771240234, 0.0008950382471084595, 0.0009472668170928955, 0.0009994953870773315, 0.0010517239570617676, 0.0011039525270462036, 0.0011561810970306396, 0.0012084096670150757, 0.0012606382369995117, 0.0013128668069839478, 0.0013650953769683838, 0.0014173239469528198, 0.0014695525169372559, 0.001521781086921692, 0.001574009656906128, 0.001626238226890564, 0.001678466796875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 11.0, 6.0, 14.0, 9.0, 28.0, 27.0, 60.0, 88.0, 141.0, 287.0, 567.0, 1206.0, 2936.0, 9110.0, 54995.0, 718321.0, 230033.0, 21752.0, 5215.0, 1971.0, 850.0, 420.0, 202.0, 104.0, 80.0, 35.0, 30.0, 17.0, 14.0, 8.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1640625, -5.8934326171875, -5.622802734375, -5.3521728515625, -5.08154296875, -4.8109130859375, -4.540283203125, -4.2696533203125, -3.9990234375, -3.7283935546875, -3.457763671875, -3.1871337890625, -2.91650390625, -2.6458740234375, -2.375244140625, -2.1046142578125, -1.833984375, -1.5633544921875, -1.292724609375, -1.0220947265625, -0.75146484375, -0.4808349609375, -0.210205078125, 0.0604248046875, 0.3310546875, 0.6016845703125, 0.872314453125, 1.1429443359375, 1.41357421875, 1.6842041015625, 1.954833984375, 2.2254638671875, 2.49609375, 2.7667236328125, 3.037353515625, 3.3079833984375, 3.57861328125, 3.8492431640625, 4.119873046875, 4.3905029296875, 4.6611328125, 4.9317626953125, 5.202392578125, 5.4730224609375, 5.74365234375, 6.0142822265625, 6.284912109375, 6.5555419921875, 6.826171875, 7.0968017578125, 7.367431640625, 7.6380615234375, 7.90869140625, 8.1793212890625, 8.449951171875, 8.7205810546875, 8.9912109375, 9.2618408203125, 9.532470703125, 9.8031005859375, 10.07373046875, 10.3443603515625, 10.614990234375, 10.8856201171875, 11.15625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 8.0, 6.0, 14.0, 11.0, 18.0, 28.0, 26.0, 34.0, 43.0, 67.0, 55.0, 65.0, 89.0, 91.0, 82.0, 89.0, 58.0, 46.0, 39.0, 27.0, 20.0, 21.0, 11.0, 9.0, 7.0, 9.0, 3.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.578125, -5.398681640625, -5.21923828125, -5.039794921875, -4.8603515625, -4.680908203125, -4.50146484375, -4.322021484375, -4.142578125, -3.963134765625, -3.78369140625, -3.604248046875, -3.4248046875, -3.245361328125, -3.06591796875, -2.886474609375, -2.70703125, -2.527587890625, -2.34814453125, -2.168701171875, -1.9892578125, -1.809814453125, -1.63037109375, -1.450927734375, -1.271484375, -1.092041015625, -0.91259765625, -0.733154296875, -0.5537109375, -0.374267578125, -0.19482421875, -0.015380859375, 0.1640625, 0.343505859375, 0.52294921875, 0.702392578125, 0.8818359375, 1.061279296875, 1.24072265625, 1.420166015625, 1.599609375, 1.779052734375, 1.95849609375, 2.137939453125, 2.3173828125, 2.496826171875, 2.67626953125, 2.855712890625, 3.03515625, 3.214599609375, 3.39404296875, 3.573486328125, 3.7529296875, 3.932373046875, 4.11181640625, 4.291259765625, 4.470703125, 4.650146484375, 4.82958984375, 5.009033203125, 5.1884765625, 5.367919921875, 5.54736328125, 5.726806640625, 5.90625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 6.0, 9.0, 16.0, 34.0, 99.0, 244.0, 348.0, 146.0, 64.0, 19.0, 9.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-213.90438842773438, -203.83253479003906, -193.76068115234375, -183.68882751464844, -173.61697387695312, -163.5451202392578, -153.4732666015625, -143.40142822265625, -133.32955932617188, -123.25770568847656, -113.18585205078125, -103.11399841308594, -93.04214477539062, -82.97029113769531, -72.89844512939453, -62.82659149169922, -52.75474548339844, -42.682891845703125, -32.61103820800781, -22.539188385009766, -12.467334747314453, -2.3954811096191406, 7.676368713378906, 17.74822235107422, 27.82007598876953, 37.891929626464844, 47.963783264160156, 58.0356330871582, 68.10748291015625, 78.17933654785156, 88.25119018554688, 98.32304382324219, 108.3948974609375, 118.46675109863281, 128.53860473632812, 138.61045837402344, 148.68231201171875, 158.75416564941406, 168.82601928710938, 178.89785766601562, 188.9697265625, 199.0415802001953, 209.11343383789062, 219.18528747558594, 229.25714111328125, 239.32899475097656, 249.40084838867188, 259.4726867675781, 269.5445556640625, 279.61639404296875, 289.6882629394531, 299.7601013183594, 309.83197021484375, 319.90380859375, 329.9756774902344, 340.0475158691406, 350.1193542480469, 360.1911926269531, 370.2630615234375, 380.33489990234375, 390.4067687988281, 400.4786071777344, 410.55047607421875, 420.622314453125, 430.6941833496094]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 6.0, 6.0, 14.0, 8.0, 15.0, 14.0, 24.0, 10.0, 10.0, 19.0, 22.0, 30.0, 21.0, 23.0, 26.0, 30.0, 40.0, 48.0, 59.0, 69.0, 53.0, 51.0, 54.0, 28.0, 41.0, 50.0, 31.0, 25.0, 15.0, 23.0, 16.0, 18.0, 16.0, 12.0, 16.0, 9.0, 12.0, 10.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0], "bins": [-128.56396484375, -125.0047836303711, -121.44560241699219, -117.88642120361328, -114.32723999023438, -110.76805877685547, -107.20887756347656, -103.64969635009766, -100.09051513671875, -96.53133392333984, -92.97215270996094, -89.41297149658203, -85.85379028320312, -82.29460906982422, -78.73542785644531, -75.1762466430664, -71.6170654296875, -68.0578842163086, -64.49870300292969, -60.93952178955078, -57.380340576171875, -53.82115936279297, -50.26197814941406, -46.702796936035156, -43.14362335205078, -39.584442138671875, -36.02526092529297, -32.46607971191406, -28.906898498535156, -25.347719192504883, -21.788537979125977, -18.22935676574707, -14.670173645019531, -11.110992431640625, -7.551811695098877, -3.992630958557129, -0.43344974517822266, 3.125730514526367, 6.684911727905273, 10.24409294128418, 13.803274154663086, 17.362455368041992, 20.9216365814209, 24.480815887451172, 28.039997100830078, 31.599178314208984, 35.15835952758789, 38.7175407409668, 42.2767219543457, 45.83590316772461, 49.395084381103516, 52.95426559448242, 56.51344680786133, 60.07262420654297, 63.631805419921875, 67.19098663330078, 70.75016784667969, 74.3093490600586, 77.8685302734375, 81.4277114868164, 84.98689270019531, 88.54607391357422, 92.10525512695312, 95.66443634033203, 99.22361755371094]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 10.0, 10.0, 18.0, 21.0, 43.0, 75.0, 112.0, 162.0, 279.0, 492.0, 1068.0, 2122.0, 5110.0, 15876.0, 69730.0, 753155.0, 2873665.0, 406002.0, 47325.0, 11280.0, 4038.0, 1717.0, 857.0, 451.0, 242.0, 139.0, 94.0, 67.0, 40.0, 26.0, 17.0, 9.0, 3.0, 4.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.1875, -11.772705078125, -11.35791015625, -10.943115234375, -10.5283203125, -10.113525390625, -9.69873046875, -9.283935546875, -8.869140625, -8.454345703125, -8.03955078125, -7.624755859375, -7.2099609375, -6.795166015625, -6.38037109375, -5.965576171875, -5.55078125, -5.135986328125, -4.72119140625, -4.306396484375, -3.8916015625, -3.476806640625, -3.06201171875, -2.647216796875, -2.232421875, -1.817626953125, -1.40283203125, -0.988037109375, -0.5732421875, -0.158447265625, 0.25634765625, 0.671142578125, 1.0859375, 1.500732421875, 1.91552734375, 2.330322265625, 2.7451171875, 3.159912109375, 3.57470703125, 3.989501953125, 4.404296875, 4.819091796875, 5.23388671875, 5.648681640625, 6.0634765625, 6.478271484375, 6.89306640625, 7.307861328125, 7.72265625, 8.137451171875, 8.55224609375, 8.967041015625, 9.3818359375, 9.796630859375, 10.21142578125, 10.626220703125, 11.041015625, 11.455810546875, 11.87060546875, 12.285400390625, 12.7001953125, 13.114990234375, 13.52978515625, 13.944580078125, 14.359375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 4.0, 5.0, 8.0, 5.0, 14.0, 13.0, 15.0, 18.0, 25.0, 29.0, 33.0, 46.0, 48.0, 60.0, 57.0, 71.0, 50.0, 57.0, 57.0, 38.0, 53.0, 60.0, 43.0, 43.0, 38.0, 27.0, 20.0, 20.0, 11.0, 5.0, 12.0, 6.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.0625, -8.7608642578125, -8.459228515625, -8.1575927734375, -7.85595703125, -7.5543212890625, -7.252685546875, -6.9510498046875, -6.6494140625, -6.3477783203125, -6.046142578125, -5.7445068359375, -5.44287109375, -5.1412353515625, -4.839599609375, -4.5379638671875, -4.236328125, -3.9346923828125, -3.633056640625, -3.3314208984375, -3.02978515625, -2.7281494140625, -2.426513671875, -2.1248779296875, -1.8232421875, -1.5216064453125, -1.219970703125, -0.9183349609375, -0.61669921875, -0.3150634765625, -0.013427734375, 0.2882080078125, 0.58984375, 0.8914794921875, 1.193115234375, 1.4947509765625, 1.79638671875, 2.0980224609375, 2.399658203125, 2.7012939453125, 3.0029296875, 3.3045654296875, 3.606201171875, 3.9078369140625, 4.20947265625, 4.5111083984375, 4.812744140625, 5.1143798828125, 5.416015625, 5.7176513671875, 6.019287109375, 6.3209228515625, 6.62255859375, 6.9241943359375, 7.225830078125, 7.5274658203125, 7.8291015625, 8.1307373046875, 8.432373046875, 8.7340087890625, 9.03564453125, 9.3372802734375, 9.638916015625, 9.9405517578125, 10.2421875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 6.0, 11.0, 10.0, 21.0, 38.0, 42.0, 84.0, 150.0, 312.0, 782.0, 1974.0, 6371.0, 25541.0, 192882.0, 3356710.0, 547018.0, 46153.0, 10565.0, 3205.0, 1294.0, 488.0, 248.0, 150.0, 73.0, 45.0, 25.0, 23.0, 13.0, 10.0, 8.0, 6.0, 4.0, 1.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.90625, -19.277587890625, -18.64892578125, -18.020263671875, -17.3916015625, -16.762939453125, -16.13427734375, -15.505615234375, -14.876953125, -14.248291015625, -13.61962890625, -12.990966796875, -12.3623046875, -11.733642578125, -11.10498046875, -10.476318359375, -9.84765625, -9.218994140625, -8.59033203125, -7.961669921875, -7.3330078125, -6.704345703125, -6.07568359375, -5.447021484375, -4.818359375, -4.189697265625, -3.56103515625, -2.932373046875, -2.3037109375, -1.675048828125, -1.04638671875, -0.417724609375, 0.2109375, 0.839599609375, 1.46826171875, 2.096923828125, 2.7255859375, 3.354248046875, 3.98291015625, 4.611572265625, 5.240234375, 5.868896484375, 6.49755859375, 7.126220703125, 7.7548828125, 8.383544921875, 9.01220703125, 9.640869140625, 10.26953125, 10.898193359375, 11.52685546875, 12.155517578125, 12.7841796875, 13.412841796875, 14.04150390625, 14.670166015625, 15.298828125, 15.927490234375, 16.55615234375, 17.184814453125, 17.8134765625, 18.442138671875, 19.07080078125, 19.699462890625, 20.328125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 7.0, 7.0, 8.0, 6.0, 12.0, 17.0, 28.0, 21.0, 48.0, 68.0, 113.0, 172.0, 300.0, 494.0, 739.0, 705.0, 469.0, 322.0, 169.0, 122.0, 86.0, 38.0, 34.0, 19.0, 13.0, 13.0, 10.0, 7.0, 6.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.203125, -18.6201171875, -18.037109375, -17.4541015625, -16.87109375, -16.2880859375, -15.705078125, -15.1220703125, -14.5390625, -13.9560546875, -13.373046875, -12.7900390625, -12.20703125, -11.6240234375, -11.041015625, -10.4580078125, -9.875, -9.2919921875, -8.708984375, -8.1259765625, -7.54296875, -6.9599609375, -6.376953125, -5.7939453125, -5.2109375, -4.6279296875, -4.044921875, -3.4619140625, -2.87890625, -2.2958984375, -1.712890625, -1.1298828125, -0.546875, 0.0361328125, 0.619140625, 1.2021484375, 1.78515625, 2.3681640625, 2.951171875, 3.5341796875, 4.1171875, 4.7001953125, 5.283203125, 5.8662109375, 6.44921875, 7.0322265625, 7.615234375, 8.1982421875, 8.78125, 9.3642578125, 9.947265625, 10.5302734375, 11.11328125, 11.6962890625, 12.279296875, 12.8623046875, 13.4453125, 14.0283203125, 14.611328125, 15.1943359375, 15.77734375, 16.3603515625, 16.943359375, 17.5263671875, 18.109375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 15.0, 53.0, 211.0, 466.0, 187.0, 50.0, 7.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-395.7889404296875, -381.8563232421875, -367.9237365722656, -353.9911193847656, -340.05853271484375, -326.12591552734375, -312.19329833984375, -298.2607116699219, -284.328125, -270.3955078125, -256.4629211425781, -242.53030395507812, -228.59771728515625, -214.66510009765625, -200.7324981689453, -186.79989624023438, -172.86727905273438, -158.93467712402344, -145.0020751953125, -131.0694580078125, -117.1368637084961, -103.20426177978516, -89.27165222167969, -75.33905029296875, -61.40644836425781, -47.473846435546875, -33.54124069213867, -19.60863494873047, -5.676033020019531, 8.256568908691406, 22.189178466796875, 36.12178039550781, 50.054412841796875, 63.98701477050781, 77.91961669921875, 91.85222625732422, 105.78482818603516, 119.7174301147461, 133.65003967285156, 147.5826416015625, 161.51524353027344, 175.44784545898438, 189.3804473876953, 203.31304931640625, 217.24566650390625, 231.17825317382812, 245.11087036132812, 259.04345703125, 272.97607421875, 286.90869140625, 300.8412780761719, 314.7738952636719, 328.70648193359375, 342.63909912109375, 356.57171630859375, 370.5043029785156, 384.4368896484375, 398.3695068359375, 412.3020935058594, 426.2347106933594, 440.16729736328125, 454.09991455078125, 468.03253173828125, 481.9651184082031, 495.8977355957031]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 8.0, 10.0, 9.0, 10.0, 27.0, 16.0, 12.0, 37.0, 28.0, 39.0, 44.0, 38.0, 38.0, 52.0, 45.0, 51.0, 52.0, 52.0, 50.0, 53.0, 37.0, 37.0, 36.0, 29.0, 44.0, 30.0, 25.0, 17.0, 13.0, 5.0, 15.0, 7.0, 8.0, 4.0, 3.0, 8.0, 6.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-95.1252670288086, -92.31668853759766, -89.50811004638672, -86.69953918457031, -83.89096069335938, -81.08238220214844, -78.2738037109375, -75.46522521972656, -72.65664672851562, -69.84806823730469, -67.03948974609375, -64.23091125488281, -61.422340393066406, -58.61376190185547, -55.80518341064453, -52.996604919433594, -50.18803405761719, -47.37945556640625, -44.57088088989258, -41.76230239868164, -38.95372772216797, -36.14514923095703, -33.336570739746094, -30.52799415588379, -27.719417572021484, -24.91084098815918, -22.102264404296875, -19.293685913085938, -16.485109329223633, -13.676532745361328, -10.86795425415039, -8.059377670288086, -5.2508087158203125, -2.4422316551208496, 0.3663454055786133, 3.1749229431152344, 5.983499526977539, 8.792076110839844, 11.600654602050781, 14.409231185913086, 17.21780776977539, 20.026384353637695, 22.8349609375, 25.643539428710938, 28.452116012573242, 31.260692596435547, 34.069271087646484, 36.877845764160156, 39.686424255371094, 42.49500274658203, 45.3035774230957, 48.11215591430664, 50.92073059082031, 53.72930908203125, 56.53788757324219, 59.346466064453125, 62.1550407409668, 64.96361541748047, 67.7721939086914, 70.58077239990234, 73.38935089111328, 76.19792175292969, 79.00650024414062, 81.81507873535156, 84.6236572265625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 8.0, 8.0, 9.0, 10.0, 29.0, 33.0, 45.0, 75.0, 110.0, 164.0, 305.0, 521.0, 800.0, 1407.0, 2541.0, 4910.0, 9540.0, 20308.0, 46357.0, 110041.0, 235925.0, 298216.0, 176768.0, 77195.0, 32541.0, 14838.0, 7143.0, 3735.0, 1960.0, 1190.0, 703.0, 393.0, 252.0, 162.0, 99.0, 68.0, 52.0, 31.0, 22.0, 11.0, 10.0, 7.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-10.046875, -9.75390625, -9.4609375, -9.16796875, -8.875, -8.58203125, -8.2890625, -7.99609375, -7.703125, -7.41015625, -7.1171875, -6.82421875, -6.53125, -6.23828125, -5.9453125, -5.65234375, -5.359375, -5.06640625, -4.7734375, -4.48046875, -4.1875, -3.89453125, -3.6015625, -3.30859375, -3.015625, -2.72265625, -2.4296875, -2.13671875, -1.84375, -1.55078125, -1.2578125, -0.96484375, -0.671875, -0.37890625, -0.0859375, 0.20703125, 0.5, 0.79296875, 1.0859375, 1.37890625, 1.671875, 1.96484375, 2.2578125, 2.55078125, 2.84375, 3.13671875, 3.4296875, 3.72265625, 4.015625, 4.30859375, 4.6015625, 4.89453125, 5.1875, 5.48046875, 5.7734375, 6.06640625, 6.359375, 6.65234375, 6.9453125, 7.23828125, 7.53125, 7.82421875, 8.1171875, 8.41015625, 8.703125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 6.0, 8.0, 19.0, 14.0, 10.0, 27.0, 17.0, 19.0, 36.0, 35.0, 49.0, 42.0, 53.0, 61.0, 50.0, 64.0, 58.0, 49.0, 57.0, 42.0, 45.0, 38.0, 54.0, 29.0, 19.0, 22.0, 18.0, 10.0, 11.0, 11.0, 9.0, 9.0, 3.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.8984375, -8.600830078125, -8.30322265625, -8.005615234375, -7.7080078125, -7.410400390625, -7.11279296875, -6.815185546875, -6.517578125, -6.219970703125, -5.92236328125, -5.624755859375, -5.3271484375, -5.029541015625, -4.73193359375, -4.434326171875, -4.13671875, -3.839111328125, -3.54150390625, -3.243896484375, -2.9462890625, -2.648681640625, -2.35107421875, -2.053466796875, -1.755859375, -1.458251953125, -1.16064453125, -0.863037109375, -0.5654296875, -0.267822265625, 0.02978515625, 0.327392578125, 0.625, 0.922607421875, 1.22021484375, 1.517822265625, 1.8154296875, 2.113037109375, 2.41064453125, 2.708251953125, 3.005859375, 3.303466796875, 3.60107421875, 3.898681640625, 4.1962890625, 4.493896484375, 4.79150390625, 5.089111328125, 5.38671875, 5.684326171875, 5.98193359375, 6.279541015625, 6.5771484375, 6.874755859375, 7.17236328125, 7.469970703125, 7.767578125, 8.065185546875, 8.36279296875, 8.660400390625, 8.9580078125, 9.255615234375, 9.55322265625, 9.850830078125, 10.1484375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 4.0, 4.0, 7.0, 8.0, 16.0, 20.0, 27.0, 30.0, 56.0, 80.0, 162.0, 291.0, 664.0, 1642.0, 4895.0, 18732.0, 105401.0, 687303.0, 189633.0, 28814.0, 6902.0, 2157.0, 848.0, 361.0, 172.0, 116.0, 70.0, 36.0, 28.0, 13.0, 11.0, 13.0, 8.0, 8.0, 5.0, 5.0, 5.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-24.875, -24.156982421875, -23.43896484375, -22.720947265625, -22.0029296875, -21.284912109375, -20.56689453125, -19.848876953125, -19.130859375, -18.412841796875, -17.69482421875, -16.976806640625, -16.2587890625, -15.540771484375, -14.82275390625, -14.104736328125, -13.38671875, -12.668701171875, -11.95068359375, -11.232666015625, -10.5146484375, -9.796630859375, -9.07861328125, -8.360595703125, -7.642578125, -6.924560546875, -6.20654296875, -5.488525390625, -4.7705078125, -4.052490234375, -3.33447265625, -2.616455078125, -1.8984375, -1.180419921875, -0.46240234375, 0.255615234375, 0.9736328125, 1.691650390625, 2.40966796875, 3.127685546875, 3.845703125, 4.563720703125, 5.28173828125, 5.999755859375, 6.7177734375, 7.435791015625, 8.15380859375, 8.871826171875, 9.58984375, 10.307861328125, 11.02587890625, 11.743896484375, 12.4619140625, 13.179931640625, 13.89794921875, 14.615966796875, 15.333984375, 16.052001953125, 16.77001953125, 17.488037109375, 18.2060546875, 18.924072265625, 19.64208984375, 20.360107421875, 21.078125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 11.0, 13.0, 7.0, 7.0, 14.0, 14.0, 21.0, 32.0, 26.0, 31.0, 37.0, 44.0, 39.0, 46.0, 45.0, 54.0, 58.0, 53.0, 33.0, 41.0, 58.0, 40.0, 31.0, 30.0, 29.0, 17.0, 29.0, 20.0, 19.0, 16.0, 9.0, 11.0, 7.0, 8.0, 8.0, 10.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-27.53125, -26.6123046875, -25.693359375, -24.7744140625, -23.85546875, -22.9365234375, -22.017578125, -21.0986328125, -20.1796875, -19.2607421875, -18.341796875, -17.4228515625, -16.50390625, -15.5849609375, -14.666015625, -13.7470703125, -12.828125, -11.9091796875, -10.990234375, -10.0712890625, -9.15234375, -8.2333984375, -7.314453125, -6.3955078125, -5.4765625, -4.5576171875, -3.638671875, -2.7197265625, -1.80078125, -0.8818359375, 0.037109375, 0.9560546875, 1.875, 2.7939453125, 3.712890625, 4.6318359375, 5.55078125, 6.4697265625, 7.388671875, 8.3076171875, 9.2265625, 10.1455078125, 11.064453125, 11.9833984375, 12.90234375, 13.8212890625, 14.740234375, 15.6591796875, 16.578125, 17.4970703125, 18.416015625, 19.3349609375, 20.25390625, 21.1728515625, 22.091796875, 23.0107421875, 23.9296875, 24.8486328125, 25.767578125, 26.6865234375, 27.60546875, 28.5244140625, 29.443359375, 30.3623046875, 31.28125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 7.0, 13.0, 9.0, 12.0, 22.0, 31.0, 49.0, 100.0, 146.0, 267.0, 432.0, 983.0, 2235.0, 6011.0, 18059.0, 63369.0, 261488.0, 553748.0, 100501.0, 27031.0, 8411.0, 3090.0, 1236.0, 520.0, 305.0, 132.0, 103.0, 76.0, 52.0, 30.0, 18.0, 13.0, 11.0, 5.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.744140625, -3.620025634765625, -3.49591064453125, -3.371795654296875, -3.2476806640625, -3.123565673828125, -2.99945068359375, -2.875335693359375, -2.751220703125, -2.627105712890625, -2.50299072265625, -2.378875732421875, -2.2547607421875, -2.130645751953125, -2.00653076171875, -1.882415771484375, -1.75830078125, -1.634185791015625, -1.51007080078125, -1.385955810546875, -1.2618408203125, -1.137725830078125, -1.01361083984375, -0.889495849609375, -0.765380859375, -0.641265869140625, -0.51715087890625, -0.393035888671875, -0.2689208984375, -0.144805908203125, -0.02069091796875, 0.103424072265625, 0.2275390625, 0.351654052734375, 0.47576904296875, 0.599884033203125, 0.7239990234375, 0.848114013671875, 0.97222900390625, 1.096343994140625, 1.220458984375, 1.344573974609375, 1.46868896484375, 1.592803955078125, 1.7169189453125, 1.841033935546875, 1.96514892578125, 2.089263916015625, 2.21337890625, 2.337493896484375, 2.46160888671875, 2.585723876953125, 2.7098388671875, 2.833953857421875, 2.95806884765625, 3.082183837890625, 3.206298828125, 3.330413818359375, 3.45452880859375, 3.578643798828125, 3.7027587890625, 3.826873779296875, 3.95098876953125, 4.075103759765625, 4.19921875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 10.0, 7.0, 5.0, 17.0, 26.0, 45.0, 40.0, 76.0, 109.0, 133.0, 105.0, 116.0, 71.0, 56.0, 52.0, 37.0, 17.0, 17.0, 17.0, 11.0, 4.0, 4.0, 6.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0016069412231445312, -0.0015649795532226562, -0.0015230178833007812, -0.0014810562133789062, -0.0014390945434570312, -0.0013971328735351562, -0.0013551712036132812, -0.0013132095336914062, -0.0012712478637695312, -0.0012292861938476562, -0.0011873245239257812, -0.0011453628540039062, -0.0011034011840820312, -0.0010614395141601562, -0.0010194778442382812, -0.0009775161743164062, -0.0009355545043945312, -0.0008935928344726562, -0.0008516311645507812, -0.0008096694946289062, -0.0007677078247070312, -0.0007257461547851562, -0.0006837844848632812, -0.0006418228149414062, -0.0005998611450195312, -0.0005578994750976562, -0.0005159378051757812, -0.00047397613525390625, -0.00043201446533203125, -0.00039005279541015625, -0.00034809112548828125, -0.00030612945556640625, -0.00026416778564453125, -0.00022220611572265625, -0.00018024444580078125, -0.00013828277587890625, -9.632110595703125e-05, -5.435943603515625e-05, -1.239776611328125e-05, 2.956390380859375e-05, 7.152557373046875e-05, 0.00011348724365234375, 0.00015544891357421875, 0.00019741058349609375, 0.00023937225341796875, 0.00028133392333984375, 0.00032329559326171875, 0.00036525726318359375, 0.00040721893310546875, 0.00044918060302734375, 0.0004911422729492188, 0.0005331039428710938, 0.0005750656127929688, 0.0006170272827148438, 0.0006589889526367188, 0.0007009506225585938, 0.0007429122924804688, 0.0007848739624023438, 0.0008268356323242188, 0.0008687973022460938, 0.0009107589721679688, 0.0009527206420898438, 0.0009946823120117188, 0.0010366439819335938, 0.0010786056518554688]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 6.0, 2.0, 1.0, 6.0, 17.0, 14.0, 28.0, 55.0, 112.0, 198.0, 417.0, 946.0, 2824.0, 11237.0, 70192.0, 669841.0, 252526.0, 31086.0, 6070.0, 1741.0, 623.0, 299.0, 125.0, 78.0, 45.0, 26.0, 15.0, 14.0, 5.0, 7.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.06640625, -5.86279296875, -5.6591796875, -5.45556640625, -5.251953125, -5.04833984375, -4.8447265625, -4.64111328125, -4.4375, -4.23388671875, -4.0302734375, -3.82666015625, -3.623046875, -3.41943359375, -3.2158203125, -3.01220703125, -2.80859375, -2.60498046875, -2.4013671875, -2.19775390625, -1.994140625, -1.79052734375, -1.5869140625, -1.38330078125, -1.1796875, -0.97607421875, -0.7724609375, -0.56884765625, -0.365234375, -0.16162109375, 0.0419921875, 0.24560546875, 0.44921875, 0.65283203125, 0.8564453125, 1.06005859375, 1.263671875, 1.46728515625, 1.6708984375, 1.87451171875, 2.078125, 2.28173828125, 2.4853515625, 2.68896484375, 2.892578125, 3.09619140625, 3.2998046875, 3.50341796875, 3.70703125, 3.91064453125, 4.1142578125, 4.31787109375, 4.521484375, 4.72509765625, 4.9287109375, 5.13232421875, 5.3359375, 5.53955078125, 5.7431640625, 5.94677734375, 6.150390625, 6.35400390625, 6.5576171875, 6.76123046875, 6.96484375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 3.0, 9.0, 9.0, 11.0, 17.0, 24.0, 38.0, 57.0, 63.0, 92.0, 99.0, 129.0, 122.0, 90.0, 65.0, 60.0, 34.0, 23.0, 17.0, 15.0, 9.0, 7.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.5078125, -7.28411865234375, -7.0604248046875, -6.83673095703125, -6.613037109375, -6.38934326171875, -6.1656494140625, -5.94195556640625, -5.71826171875, -5.49456787109375, -5.2708740234375, -5.04718017578125, -4.823486328125, -4.59979248046875, -4.3760986328125, -4.15240478515625, -3.9287109375, -3.70501708984375, -3.4813232421875, -3.25762939453125, -3.033935546875, -2.81024169921875, -2.5865478515625, -2.36285400390625, -2.13916015625, -1.91546630859375, -1.6917724609375, -1.46807861328125, -1.244384765625, -1.02069091796875, -0.7969970703125, -0.57330322265625, -0.349609375, -0.12591552734375, 0.0977783203125, 0.32147216796875, 0.545166015625, 0.76885986328125, 0.9925537109375, 1.21624755859375, 1.43994140625, 1.66363525390625, 1.8873291015625, 2.11102294921875, 2.334716796875, 2.55841064453125, 2.7821044921875, 3.00579833984375, 3.2294921875, 3.45318603515625, 3.6768798828125, 3.90057373046875, 4.124267578125, 4.34796142578125, 4.5716552734375, 4.79534912109375, 5.01904296875, 5.24273681640625, 5.4664306640625, 5.69012451171875, 5.913818359375, 6.13751220703125, 6.3612060546875, 6.58489990234375, 6.80859375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 7.0, 25.0, 42.0, 94.0, 206.0, 330.0, 145.0, 72.0, 39.0, 15.0, 9.0, 2.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-273.6329650878906, -267.60498046875, -261.5769958496094, -255.5490264892578, -249.5210418701172, -243.49307250976562, -237.465087890625, -231.43710327148438, -225.4091339111328, -219.3811492919922, -213.35317993164062, -207.3251953125, -201.29721069335938, -195.2692413330078, -189.2412567138672, -183.21328735351562, -177.185302734375, -171.15731811523438, -165.1293487548828, -159.1013641357422, -153.07337951660156, -147.04541015625, -141.01742553710938, -134.98944091796875, -128.96145629882812, -122.93347930908203, -116.9054946899414, -110.87751770019531, -104.84954071044922, -98.82156372070312, -92.7935791015625, -86.7656021118164, -80.73762512207031, -74.70964813232422, -68.6816635131836, -62.6536865234375, -56.625709533691406, -50.59772872924805, -44.56974792480469, -38.541770935058594, -32.513790130615234, -26.485811233520508, -20.45783233642578, -14.429851531982422, -8.401872634887695, -2.3738937377929688, 3.6540870666503906, 9.682064056396484, 15.710044860839844, 21.73802375793457, 27.766002655029297, 33.793983459472656, 39.82196044921875, 45.84994125366211, 51.87792205810547, 57.90589904785156, 63.93387985229492, 69.96186065673828, 75.98983764648438, 82.017822265625, 88.0457992553711, 94.07377624511719, 100.10176086425781, 106.12973022460938, 112.15771484375]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 6.0, 10.0, 3.0, 7.0, 9.0, 12.0, 10.0, 16.0, 21.0, 16.0, 17.0, 26.0, 21.0, 19.0, 33.0, 36.0, 41.0, 62.0, 72.0, 67.0, 51.0, 68.0, 46.0, 40.0, 34.0, 38.0, 22.0, 27.0, 23.0, 22.0, 16.0, 21.0, 12.0, 14.0, 7.0, 8.0, 8.0, 5.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-108.47959899902344, -105.140380859375, -101.80115509033203, -98.4619369506836, -95.12271118164062, -91.78349304199219, -88.44427490234375, -85.10505676269531, -81.76583099365234, -78.4266128540039, -75.08738708496094, -71.7481689453125, -68.40895080566406, -65.0697250366211, -61.730506896972656, -58.39128494262695, -55.05206298828125, -51.71284103393555, -48.373619079589844, -45.034400939941406, -41.6951789855957, -38.35595703125, -35.01673889160156, -31.67751693725586, -28.338294982910156, -24.999073028564453, -21.659852981567383, -18.320632934570312, -14.98141098022461, -11.642189025878906, -8.302968978881836, -4.963748931884766, -1.6245269775390625, 1.7146940231323242, 5.053915023803711, 8.393136024475098, 11.732357025146484, 15.071578979492188, 18.410799026489258, 21.750019073486328, 25.08924102783203, 28.428462982177734, 31.767683029174805, 35.106903076171875, 38.44612503051758, 41.78534698486328, 45.12456512451172, 48.46378707885742, 51.803009033203125, 55.14223098754883, 58.48145294189453, 61.82067108154297, 65.15989685058594, 68.49911499023438, 71.83833312988281, 75.17755126953125, 78.51677703857422, 81.85599517822266, 85.19522094726562, 88.53443908691406, 91.8736572265625, 95.21288299560547, 98.5521011352539, 101.89132690429688, 105.23054504394531]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 1.0, 5.0, 4.0, 8.0, 14.0, 18.0, 25.0, 27.0, 30.0, 63.0, 91.0, 134.0, 223.0, 373.0, 592.0, 1019.0, 2001.0, 4411.0, 9859.0, 25493.0, 83961.0, 340662.0, 1289639.0, 1707301.0, 540164.0, 128724.0, 36343.0, 12671.0, 4990.0, 2342.0, 1216.0, 695.0, 412.0, 268.0, 150.0, 99.0, 75.0, 63.0, 37.0, 23.0, 12.0, 10.0, 6.0, 11.0, 8.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.44921875, -5.24090576171875, -5.0325927734375, -4.82427978515625, -4.615966796875, -4.40765380859375, -4.1993408203125, -3.99102783203125, -3.78271484375, -3.57440185546875, -3.3660888671875, -3.15777587890625, -2.949462890625, -2.74114990234375, -2.5328369140625, -2.32452392578125, -2.1162109375, -1.90789794921875, -1.6995849609375, -1.49127197265625, -1.282958984375, -1.07464599609375, -0.8663330078125, -0.65802001953125, -0.44970703125, -0.24139404296875, -0.0330810546875, 0.17523193359375, 0.383544921875, 0.59185791015625, 0.8001708984375, 1.00848388671875, 1.216796875, 1.42510986328125, 1.6334228515625, 1.84173583984375, 2.050048828125, 2.25836181640625, 2.4666748046875, 2.67498779296875, 2.88330078125, 3.09161376953125, 3.2999267578125, 3.50823974609375, 3.716552734375, 3.92486572265625, 4.1331787109375, 4.34149169921875, 4.5498046875, 4.75811767578125, 4.9664306640625, 5.17474365234375, 5.383056640625, 5.59136962890625, 5.7996826171875, 6.00799560546875, 6.21630859375, 6.42462158203125, 6.6329345703125, 6.84124755859375, 7.049560546875, 7.25787353515625, 7.4661865234375, 7.67449951171875, 7.8828125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 9.0, 10.0, 11.0, 17.0, 24.0, 28.0, 32.0, 54.0, 41.0, 45.0, 46.0, 59.0, 53.0, 55.0, 48.0, 50.0, 42.0, 55.0, 51.0, 45.0, 37.0, 35.0, 39.0, 20.0, 22.0, 12.0, 18.0, 5.0, 13.0, 3.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.984375, -8.68798828125, -8.3916015625, -8.09521484375, -7.798828125, -7.50244140625, -7.2060546875, -6.90966796875, -6.61328125, -6.31689453125, -6.0205078125, -5.72412109375, -5.427734375, -5.13134765625, -4.8349609375, -4.53857421875, -4.2421875, -3.94580078125, -3.6494140625, -3.35302734375, -3.056640625, -2.76025390625, -2.4638671875, -2.16748046875, -1.87109375, -1.57470703125, -1.2783203125, -0.98193359375, -0.685546875, -0.38916015625, -0.0927734375, 0.20361328125, 0.5, 0.79638671875, 1.0927734375, 1.38916015625, 1.685546875, 1.98193359375, 2.2783203125, 2.57470703125, 2.87109375, 3.16748046875, 3.4638671875, 3.76025390625, 4.056640625, 4.35302734375, 4.6494140625, 4.94580078125, 5.2421875, 5.53857421875, 5.8349609375, 6.13134765625, 6.427734375, 6.72412109375, 7.0205078125, 7.31689453125, 7.61328125, 7.90966796875, 8.2060546875, 8.50244140625, 8.798828125, 9.09521484375, 9.3916015625, 9.68798828125, 9.984375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 2.0, 3.0, 9.0, 5.0, 4.0, 9.0, 17.0, 16.0, 39.0, 35.0, 88.0, 144.0, 277.0, 792.0, 2901.0, 16450.0, 260780.0, 3720156.0, 175190.0, 13492.0, 2549.0, 716.0, 279.0, 125.0, 83.0, 35.0, 32.0, 17.0, 7.0, 14.0, 5.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.59375, -17.916259765625, -17.23876953125, -16.561279296875, -15.8837890625, -15.206298828125, -14.52880859375, -13.851318359375, -13.173828125, -12.496337890625, -11.81884765625, -11.141357421875, -10.4638671875, -9.786376953125, -9.10888671875, -8.431396484375, -7.75390625, -7.076416015625, -6.39892578125, -5.721435546875, -5.0439453125, -4.366455078125, -3.68896484375, -3.011474609375, -2.333984375, -1.656494140625, -0.97900390625, -0.301513671875, 0.3759765625, 1.053466796875, 1.73095703125, 2.408447265625, 3.0859375, 3.763427734375, 4.44091796875, 5.118408203125, 5.7958984375, 6.473388671875, 7.15087890625, 7.828369140625, 8.505859375, 9.183349609375, 9.86083984375, 10.538330078125, 11.2158203125, 11.893310546875, 12.57080078125, 13.248291015625, 13.92578125, 14.603271484375, 15.28076171875, 15.958251953125, 16.6357421875, 17.313232421875, 17.99072265625, 18.668212890625, 19.345703125, 20.023193359375, 20.70068359375, 21.378173828125, 22.0556640625, 22.733154296875, 23.41064453125, 24.088134765625, 24.765625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 5.0, 8.0, 6.0, 14.0, 17.0, 43.0, 38.0, 73.0, 138.0, 238.0, 371.0, 634.0, 803.0, 628.0, 451.0, 226.0, 138.0, 80.0, 49.0, 37.0, 25.0, 19.0, 6.0, 5.0, 9.0, 6.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.8125, -20.258056640625, -19.70361328125, -19.149169921875, -18.5947265625, -18.040283203125, -17.48583984375, -16.931396484375, -16.376953125, -15.822509765625, -15.26806640625, -14.713623046875, -14.1591796875, -13.604736328125, -13.05029296875, -12.495849609375, -11.94140625, -11.386962890625, -10.83251953125, -10.278076171875, -9.7236328125, -9.169189453125, -8.61474609375, -8.060302734375, -7.505859375, -6.951416015625, -6.39697265625, -5.842529296875, -5.2880859375, -4.733642578125, -4.17919921875, -3.624755859375, -3.0703125, -2.515869140625, -1.96142578125, -1.406982421875, -0.8525390625, -0.298095703125, 0.25634765625, 0.810791015625, 1.365234375, 1.919677734375, 2.47412109375, 3.028564453125, 3.5830078125, 4.137451171875, 4.69189453125, 5.246337890625, 5.80078125, 6.355224609375, 6.90966796875, 7.464111328125, 8.0185546875, 8.572998046875, 9.12744140625, 9.681884765625, 10.236328125, 10.790771484375, 11.34521484375, 11.899658203125, 12.4541015625, 13.008544921875, 13.56298828125, 14.117431640625, 14.671875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 15.0, 21.0, 96.0, 226.0, 299.0, 217.0, 74.0, 32.0, 9.0, 6.0, 7.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-325.6950988769531, -318.8290100097656, -311.9629211425781, -305.0968322753906, -298.2307434082031, -291.3646545410156, -284.4985656738281, -277.6324768066406, -270.7663879394531, -263.9002990722656, -257.0342102050781, -250.16812133789062, -243.30203247070312, -236.43594360351562, -229.56985473632812, -222.70376586914062, -215.83766174316406, -208.97157287597656, -202.10548400878906, -195.23939514160156, -188.37330627441406, -181.50721740722656, -174.64111328125, -167.7750244140625, -160.908935546875, -154.0428466796875, -147.1767578125, -140.3106689453125, -133.444580078125, -126.5784912109375, -119.71239471435547, -112.84630584716797, -105.980224609375, -99.1141357421875, -92.248046875, -85.3819580078125, -78.515869140625, -71.6497802734375, -64.78368377685547, -57.91759490966797, -51.05150604248047, -44.18541717529297, -37.31932830810547, -30.453235626220703, -23.587146759033203, -16.721057891845703, -9.854965209960938, -2.9888763427734375, 3.8772125244140625, 10.743302345275879, 17.609392166137695, 24.475482940673828, 31.341571807861328, 38.20766067504883, 45.073753356933594, 51.939842224121094, 58.805931091308594, 65.6720199584961, 72.5381088256836, 79.40420532226562, 86.27029418945312, 93.13638305664062, 100.00247192382812, 106.86856079101562, 113.73464965820312]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 5.0, 7.0, 4.0, 7.0, 11.0, 14.0, 11.0, 15.0, 20.0, 21.0, 20.0, 32.0, 30.0, 36.0, 40.0, 44.0, 48.0, 43.0, 55.0, 56.0, 32.0, 45.0, 50.0, 53.0, 46.0, 38.0, 34.0, 29.0, 16.0, 21.0, 17.0, 17.0, 19.0, 14.0, 11.0, 14.0, 8.0, 5.0, 4.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-57.91127014160156, -55.9961051940918, -54.080936431884766, -52.165771484375, -50.250606536865234, -48.33544158935547, -46.42027282714844, -44.50510787963867, -42.589942932128906, -40.67477798461914, -38.75960922241211, -36.844444274902344, -34.92927932739258, -33.01411437988281, -31.09894561767578, -29.183780670166016, -27.268611907958984, -25.353445053100586, -23.43828010559082, -21.523113250732422, -19.607948303222656, -17.692781448364258, -15.77761459350586, -13.862448692321777, -11.947282791137695, -10.032116889953613, -8.116950988769531, -6.201784133911133, -4.286618232727051, -2.3714523315429688, -0.4562854766845703, 1.4588804244995117, 3.3740463256835938, 5.289212226867676, 7.204378604888916, 9.119544982910156, 11.034710884094238, 12.94987678527832, 14.865043640136719, 16.780208587646484, 18.695375442504883, 20.61054229736328, 22.525707244873047, 24.440874099731445, 26.356040954589844, 28.27120590209961, 30.186372756958008, 32.101539611816406, 34.01670455932617, 35.93186950683594, 37.84703826904297, 39.762203216552734, 41.6773681640625, 43.59253692626953, 45.5077018737793, 47.42286682128906, 49.338035583496094, 51.25320053100586, 53.16836929321289, 55.083534240722656, 56.99869918823242, 58.91386413574219, 60.82903289794922, 62.744197845458984, 64.65936279296875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 8.0, 7.0, 16.0, 29.0, 42.0, 72.0, 99.0, 213.0, 342.0, 656.0, 1280.0, 2586.0, 5932.0, 14303.0, 39920.0, 121516.0, 337337.0, 336265.0, 121899.0, 39984.0, 14728.0, 5977.0, 2577.0, 1213.0, 687.0, 338.0, 203.0, 127.0, 68.0, 43.0, 33.0, 17.0, 12.0, 4.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0078125, -8.661376953125, -8.31494140625, -7.968505859375, -7.6220703125, -7.275634765625, -6.92919921875, -6.582763671875, -6.236328125, -5.889892578125, -5.54345703125, -5.197021484375, -4.8505859375, -4.504150390625, -4.15771484375, -3.811279296875, -3.46484375, -3.118408203125, -2.77197265625, -2.425537109375, -2.0791015625, -1.732666015625, -1.38623046875, -1.039794921875, -0.693359375, -0.346923828125, -0.00048828125, 0.345947265625, 0.6923828125, 1.038818359375, 1.38525390625, 1.731689453125, 2.078125, 2.424560546875, 2.77099609375, 3.117431640625, 3.4638671875, 3.810302734375, 4.15673828125, 4.503173828125, 4.849609375, 5.196044921875, 5.54248046875, 5.888916015625, 6.2353515625, 6.581787109375, 6.92822265625, 7.274658203125, 7.62109375, 7.967529296875, 8.31396484375, 8.660400390625, 9.0068359375, 9.353271484375, 9.69970703125, 10.046142578125, 10.392578125, 10.739013671875, 11.08544921875, 11.431884765625, 11.7783203125, 12.124755859375, 12.47119140625, 12.817626953125, 13.1640625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 9.0, 9.0, 7.0, 10.0, 12.0, 22.0, 23.0, 28.0, 30.0, 29.0, 40.0, 50.0, 45.0, 59.0, 41.0, 52.0, 64.0, 60.0, 56.0, 46.0, 39.0, 50.0, 42.0, 37.0, 28.0, 25.0, 21.0, 13.0, 12.0, 12.0, 5.0, 11.0, 5.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.0546875, -8.75732421875, -8.4599609375, -8.16259765625, -7.865234375, -7.56787109375, -7.2705078125, -6.97314453125, -6.67578125, -6.37841796875, -6.0810546875, -5.78369140625, -5.486328125, -5.18896484375, -4.8916015625, -4.59423828125, -4.296875, -3.99951171875, -3.7021484375, -3.40478515625, -3.107421875, -2.81005859375, -2.5126953125, -2.21533203125, -1.91796875, -1.62060546875, -1.3232421875, -1.02587890625, -0.728515625, -0.43115234375, -0.1337890625, 0.16357421875, 0.4609375, 0.75830078125, 1.0556640625, 1.35302734375, 1.650390625, 1.94775390625, 2.2451171875, 2.54248046875, 2.83984375, 3.13720703125, 3.4345703125, 3.73193359375, 4.029296875, 4.32666015625, 4.6240234375, 4.92138671875, 5.21875, 5.51611328125, 5.8134765625, 6.11083984375, 6.408203125, 6.70556640625, 7.0029296875, 7.30029296875, 7.59765625, 7.89501953125, 8.1923828125, 8.48974609375, 8.787109375, 9.08447265625, 9.3818359375, 9.67919921875, 9.9765625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 2.0, 7.0, 14.0, 12.0, 19.0, 32.0, 39.0, 71.0, 127.0, 173.0, 290.0, 432.0, 800.0, 1654.0, 4609.0, 18706.0, 122638.0, 740826.0, 130261.0, 19539.0, 4582.0, 1669.0, 788.0, 457.0, 293.0, 173.0, 111.0, 69.0, 52.0, 37.0, 19.0, 22.0, 16.0, 6.0, 3.0, 8.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.2265625, -14.5789794921875, -13.931396484375, -13.2838134765625, -12.63623046875, -11.9886474609375, -11.341064453125, -10.6934814453125, -10.0458984375, -9.3983154296875, -8.750732421875, -8.1031494140625, -7.45556640625, -6.8079833984375, -6.160400390625, -5.5128173828125, -4.865234375, -4.2176513671875, -3.570068359375, -2.9224853515625, -2.27490234375, -1.6273193359375, -0.979736328125, -0.3321533203125, 0.3154296875, 0.9630126953125, 1.610595703125, 2.2581787109375, 2.90576171875, 3.5533447265625, 4.200927734375, 4.8485107421875, 5.49609375, 6.1436767578125, 6.791259765625, 7.4388427734375, 8.08642578125, 8.7340087890625, 9.381591796875, 10.0291748046875, 10.6767578125, 11.3243408203125, 11.971923828125, 12.6195068359375, 13.26708984375, 13.9146728515625, 14.562255859375, 15.2098388671875, 15.857421875, 16.5050048828125, 17.152587890625, 17.8001708984375, 18.44775390625, 19.0953369140625, 19.742919921875, 20.3905029296875, 21.0380859375, 21.6856689453125, 22.333251953125, 22.9808349609375, 23.62841796875, 24.2760009765625, 24.923583984375, 25.5711669921875, 26.21875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 10.0, 7.0, 16.0, 15.0, 23.0, 22.0, 28.0, 34.0, 31.0, 47.0, 40.0, 43.0, 41.0, 54.0, 42.0, 60.0, 61.0, 50.0, 49.0, 47.0, 41.0, 35.0, 28.0, 26.0, 32.0, 23.0, 20.0, 15.0, 16.0, 10.0, 8.0, 5.0, 1.0, 5.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.609375, -21.690673828125, -20.77197265625, -19.853271484375, -18.9345703125, -18.015869140625, -17.09716796875, -16.178466796875, -15.259765625, -14.341064453125, -13.42236328125, -12.503662109375, -11.5849609375, -10.666259765625, -9.74755859375, -8.828857421875, -7.91015625, -6.991455078125, -6.07275390625, -5.154052734375, -4.2353515625, -3.316650390625, -2.39794921875, -1.479248046875, -0.560546875, 0.358154296875, 1.27685546875, 2.195556640625, 3.1142578125, 4.032958984375, 4.95166015625, 5.870361328125, 6.7890625, 7.707763671875, 8.62646484375, 9.545166015625, 10.4638671875, 11.382568359375, 12.30126953125, 13.219970703125, 14.138671875, 15.057373046875, 15.97607421875, 16.894775390625, 17.8134765625, 18.732177734375, 19.65087890625, 20.569580078125, 21.48828125, 22.406982421875, 23.32568359375, 24.244384765625, 25.1630859375, 26.081787109375, 27.00048828125, 27.919189453125, 28.837890625, 29.756591796875, 30.67529296875, 31.593994140625, 32.5126953125, 33.431396484375, 34.35009765625, 35.268798828125, 36.1875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 1.0, 4.0, 6.0, 8.0, 15.0, 16.0, 21.0, 36.0, 91.0, 158.0, 345.0, 842.0, 2101.0, 6178.0, 23996.0, 151029.0, 762978.0, 78377.0, 15215.0, 4357.0, 1558.0, 611.0, 280.0, 130.0, 84.0, 37.0, 23.0, 9.0, 14.0, 6.0, 6.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.62109375, -5.4705810546875, -5.320068359375, -5.1695556640625, -5.01904296875, -4.8685302734375, -4.718017578125, -4.5675048828125, -4.4169921875, -4.2664794921875, -4.115966796875, -3.9654541015625, -3.81494140625, -3.6644287109375, -3.513916015625, -3.3634033203125, -3.212890625, -3.0623779296875, -2.911865234375, -2.7613525390625, -2.61083984375, -2.4603271484375, -2.309814453125, -2.1593017578125, -2.0087890625, -1.8582763671875, -1.707763671875, -1.5572509765625, -1.40673828125, -1.2562255859375, -1.105712890625, -0.9552001953125, -0.8046875, -0.6541748046875, -0.503662109375, -0.3531494140625, -0.20263671875, -0.0521240234375, 0.098388671875, 0.2489013671875, 0.3994140625, 0.5499267578125, 0.700439453125, 0.8509521484375, 1.00146484375, 1.1519775390625, 1.302490234375, 1.4530029296875, 1.603515625, 1.7540283203125, 1.904541015625, 2.0550537109375, 2.20556640625, 2.3560791015625, 2.506591796875, 2.6571044921875, 2.8076171875, 2.9581298828125, 3.108642578125, 3.2591552734375, 3.40966796875, 3.5601806640625, 3.710693359375, 3.8612060546875, 4.01171875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 8.0, 2.0, 8.0, 13.0, 18.0, 33.0, 38.0, 50.0, 72.0, 131.0, 148.0, 133.0, 106.0, 67.0, 41.0, 25.0, 17.0, 19.0, 17.0, 6.0, 9.0, 4.0, 4.0, 5.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.0014715194702148438, -0.0014325082302093506, -0.0013934969902038574, -0.0013544857501983643, -0.001315474510192871, -0.001276463270187378, -0.0012374520301818848, -0.0011984407901763916, -0.0011594295501708984, -0.0011204183101654053, -0.0010814070701599121, -0.001042395830154419, -0.0010033845901489258, -0.0009643733501434326, -0.0009253621101379395, -0.0008863508701324463, -0.0008473396301269531, -0.00080832839012146, -0.0007693171501159668, -0.0007303059101104736, -0.0006912946701049805, -0.0006522834300994873, -0.0006132721900939941, -0.000574260950088501, -0.0005352497100830078, -0.0004962384700775146, -0.0004572272300720215, -0.0004182159900665283, -0.00037920475006103516, -0.000340193510055542, -0.00030118227005004883, -0.00026217103004455566, -0.0002231597900390625, -0.00018414855003356934, -0.00014513731002807617, -0.00010612607002258301, -6.711483001708984e-05, -2.810359001159668e-05, 1.0907649993896484e-05, 4.991888999938965e-05, 8.893013000488281e-05, 0.00012794137001037598, 0.00016695261001586914, 0.0002059638500213623, 0.00024497509002685547, 0.00028398633003234863, 0.0003229975700378418, 0.00036200881004333496, 0.0004010200500488281, 0.0004400312900543213, 0.00047904253005981445, 0.0005180537700653076, 0.0005570650100708008, 0.0005960762500762939, 0.0006350874900817871, 0.0006740987300872803, 0.0007131099700927734, 0.0007521212100982666, 0.0007911324501037598, 0.0008301436901092529, 0.0008691549301147461, 0.0009081661701202393, 0.0009471774101257324, 0.0009861886501312256, 0.0010251998901367188]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 6.0, 8.0, 24.0, 28.0, 46.0, 51.0, 113.0, 153.0, 276.0, 493.0, 994.0, 2118.0, 5259.0, 16172.0, 61946.0, 561915.0, 320710.0, 54478.0, 14680.0, 4921.0, 2018.0, 921.0, 518.0, 264.0, 160.0, 97.0, 59.0, 38.0, 30.0, 16.0, 11.0, 7.0, 4.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.33984375, -4.2156982421875, -4.091552734375, -3.9674072265625, -3.84326171875, -3.7191162109375, -3.594970703125, -3.4708251953125, -3.3466796875, -3.2225341796875, -3.098388671875, -2.9742431640625, -2.85009765625, -2.7259521484375, -2.601806640625, -2.4776611328125, -2.353515625, -2.2293701171875, -2.105224609375, -1.9810791015625, -1.85693359375, -1.7327880859375, -1.608642578125, -1.4844970703125, -1.3603515625, -1.2362060546875, -1.112060546875, -0.9879150390625, -0.86376953125, -0.7396240234375, -0.615478515625, -0.4913330078125, -0.3671875, -0.2430419921875, -0.118896484375, 0.0052490234375, 0.12939453125, 0.2535400390625, 0.377685546875, 0.5018310546875, 0.6259765625, 0.7501220703125, 0.874267578125, 0.9984130859375, 1.12255859375, 1.2467041015625, 1.370849609375, 1.4949951171875, 1.619140625, 1.7432861328125, 1.867431640625, 1.9915771484375, 2.11572265625, 2.2398681640625, 2.364013671875, 2.4881591796875, 2.6123046875, 2.7364501953125, 2.860595703125, 2.9847412109375, 3.10888671875, 3.2330322265625, 3.357177734375, 3.4813232421875, 3.60546875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 6.0, 1.0, 4.0, 8.0, 9.0, 23.0, 28.0, 33.0, 56.0, 85.0, 115.0, 146.0, 136.0, 109.0, 81.0, 48.0, 39.0, 23.0, 9.0, 7.0, 9.0, 11.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.703125, -6.525390625, -6.34765625, -6.169921875, -5.9921875, -5.814453125, -5.63671875, -5.458984375, -5.28125, -5.103515625, -4.92578125, -4.748046875, -4.5703125, -4.392578125, -4.21484375, -4.037109375, -3.859375, -3.681640625, -3.50390625, -3.326171875, -3.1484375, -2.970703125, -2.79296875, -2.615234375, -2.4375, -2.259765625, -2.08203125, -1.904296875, -1.7265625, -1.548828125, -1.37109375, -1.193359375, -1.015625, -0.837890625, -0.66015625, -0.482421875, -0.3046875, -0.126953125, 0.05078125, 0.228515625, 0.40625, 0.583984375, 0.76171875, 0.939453125, 1.1171875, 1.294921875, 1.47265625, 1.650390625, 1.828125, 2.005859375, 2.18359375, 2.361328125, 2.5390625, 2.716796875, 2.89453125, 3.072265625, 3.25, 3.427734375, 3.60546875, 3.783203125, 3.9609375, 4.138671875, 4.31640625, 4.494140625, 4.671875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 4.0, 8.0, 4.0, 9.0, 8.0, 21.0, 34.0, 43.0, 67.0, 95.0, 224.0, 182.0, 96.0, 65.0, 52.0, 27.0, 13.0, 12.0, 6.0, 12.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-89.23074340820312, -86.33560943603516, -83.44047546386719, -80.54533386230469, -77.65019989013672, -74.75506591796875, -71.85993194580078, -68.96479797363281, -66.06965637207031, -63.174522399902344, -60.27938461303711, -57.38425064086914, -54.489112854003906, -51.59397888183594, -48.69884490966797, -45.803707122802734, -42.908573150634766, -40.0134391784668, -37.11830139160156, -34.223167419433594, -31.32802963256836, -28.43289566040039, -25.53775978088379, -22.642623901367188, -19.747488021850586, -16.852352142333984, -13.957216262817383, -11.062081336975098, -8.166945457458496, -5.2718095779418945, -2.3766746520996094, 0.5184612274169922, 3.4135971069335938, 6.308732986450195, 9.203868865966797, 12.099003791809082, 14.994139671325684, 17.88927459716797, 20.78441047668457, 23.679546356201172, 26.574682235717773, 29.469818115234375, 32.364952087402344, 35.26008987426758, 38.15522384643555, 41.05036163330078, 43.94549560546875, 46.84062957763672, 49.73576736450195, 52.63090133666992, 55.526039123535156, 58.421173095703125, 61.31631088256836, 64.2114486694336, 67.10658264160156, 70.00171661376953, 72.8968505859375, 75.79198455810547, 78.68711853027344, 81.58226013183594, 84.4773941040039, 87.37252807617188, 90.26766204833984, 93.16279602050781, 96.05793762207031]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 2.0, 6.0, 7.0, 2.0, 9.0, 8.0, 13.0, 17.0, 16.0, 43.0, 35.0, 42.0, 33.0, 52.0, 39.0, 87.0, 128.0, 104.0, 61.0, 52.0, 37.0, 36.0, 38.0, 21.0, 27.0, 20.0, 16.0, 12.0, 10.0, 8.0, 6.0, 2.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-130.162353515625, -126.38253784179688, -122.60272216796875, -118.82291412353516, -115.04309844970703, -111.2632827758789, -107.48346710205078, -103.70365905761719, -99.92384338378906, -96.14402770996094, -92.36421203613281, -88.58440399169922, -84.8045883178711, -81.02477264404297, -77.24495697021484, -73.46514892578125, -69.68533325195312, -65.905517578125, -62.12570571899414, -58.345890045166016, -54.566078186035156, -50.78626251220703, -47.006446838378906, -43.22663497924805, -39.446815490722656, -35.66699981689453, -31.887187957763672, -28.107372283935547, -24.327560424804688, -20.547744750976562, -16.76793098449707, -12.988117218017578, -9.208305358886719, -5.428491592407227, -1.6486773490905762, 2.131136894226074, 5.910950660705566, 9.690765380859375, 13.470579147338867, 17.25039291381836, 21.03020668029785, 24.810020446777344, 28.589834213256836, 32.36964797973633, 36.14946365356445, 39.92927551269531, 43.70909118652344, 47.48890686035156, 51.26871871948242, 55.04853439331055, 58.828346252441406, 62.60816192626953, 66.38797760009766, 70.16778564453125, 73.94760131835938, 77.7274169921875, 81.50723266601562, 85.28704833984375, 89.06686401367188, 92.84667205810547, 96.6264877319336, 100.40630340576172, 104.18611907958984, 107.96592712402344, 111.74574279785156]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 11.0, 15.0, 16.0, 18.0, 29.0, 47.0, 83.0, 123.0, 172.0, 304.0, 535.0, 943.0, 1585.0, 2923.0, 5735.0, 11126.0, 23505.0, 55470.0, 152259.0, 467652.0, 1228336.0, 1364614.0, 571907.0, 190445.0, 65875.0, 26120.0, 11771.0, 5710.0, 2974.0, 1621.0, 857.0, 580.0, 314.0, 204.0, 139.0, 89.0, 60.0, 39.0, 24.0, 18.0, 11.0, 7.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.921875, -4.74664306640625, -4.5714111328125, -4.39617919921875, -4.220947265625, -4.04571533203125, -3.8704833984375, -3.69525146484375, -3.52001953125, -3.34478759765625, -3.1695556640625, -2.99432373046875, -2.819091796875, -2.64385986328125, -2.4686279296875, -2.29339599609375, -2.1181640625, -1.94293212890625, -1.7677001953125, -1.59246826171875, -1.417236328125, -1.24200439453125, -1.0667724609375, -0.89154052734375, -0.71630859375, -0.54107666015625, -0.3658447265625, -0.19061279296875, -0.015380859375, 0.15985107421875, 0.3350830078125, 0.51031494140625, 0.685546875, 0.86077880859375, 1.0360107421875, 1.21124267578125, 1.386474609375, 1.56170654296875, 1.7369384765625, 1.91217041015625, 2.08740234375, 2.26263427734375, 2.4378662109375, 2.61309814453125, 2.788330078125, 2.96356201171875, 3.1387939453125, 3.31402587890625, 3.4892578125, 3.66448974609375, 3.8397216796875, 4.01495361328125, 4.190185546875, 4.36541748046875, 4.5406494140625, 4.71588134765625, 4.89111328125, 5.06634521484375, 5.2415771484375, 5.41680908203125, 5.592041015625, 5.76727294921875, 5.9425048828125, 6.11773681640625, 6.29296875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 8.0, 4.0, 5.0, 10.0, 17.0, 18.0, 15.0, 29.0, 31.0, 38.0, 45.0, 47.0, 52.0, 61.0, 67.0, 59.0, 49.0, 55.0, 44.0, 59.0, 63.0, 48.0, 37.0, 40.0, 20.0, 27.0, 14.0, 13.0, 10.0, 5.0, 7.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1171875, -8.8153076171875, -8.513427734375, -8.2115478515625, -7.90966796875, -7.6077880859375, -7.305908203125, -7.0040283203125, -6.7021484375, -6.4002685546875, -6.098388671875, -5.7965087890625, -5.49462890625, -5.1927490234375, -4.890869140625, -4.5889892578125, -4.287109375, -3.9852294921875, -3.683349609375, -3.3814697265625, -3.07958984375, -2.7777099609375, -2.475830078125, -2.1739501953125, -1.8720703125, -1.5701904296875, -1.268310546875, -0.9664306640625, -0.66455078125, -0.3626708984375, -0.060791015625, 0.2410888671875, 0.54296875, 0.8448486328125, 1.146728515625, 1.4486083984375, 1.75048828125, 2.0523681640625, 2.354248046875, 2.6561279296875, 2.9580078125, 3.2598876953125, 3.561767578125, 3.8636474609375, 4.16552734375, 4.4674072265625, 4.769287109375, 5.0711669921875, 5.373046875, 5.6749267578125, 5.976806640625, 6.2786865234375, 6.58056640625, 6.8824462890625, 7.184326171875, 7.4862060546875, 7.7880859375, 8.0899658203125, 8.391845703125, 8.6937255859375, 8.99560546875, 9.2974853515625, 9.599365234375, 9.9012451171875, 10.203125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 1.0, 5.0, 11.0, 9.0, 10.0, 21.0, 27.0, 41.0, 51.0, 93.0, 99.0, 211.0, 424.0, 1111.0, 4124.0, 21850.0, 278432.0, 3553116.0, 305204.0, 23229.0, 4138.0, 1098.0, 406.0, 221.0, 86.0, 79.0, 57.0, 35.0, 21.0, 19.0, 17.0, 5.0, 3.0, 5.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-20.328125, -19.7862548828125, -19.244384765625, -18.7025146484375, -18.16064453125, -17.6187744140625, -17.076904296875, -16.5350341796875, -15.9931640625, -15.4512939453125, -14.909423828125, -14.3675537109375, -13.82568359375, -13.2838134765625, -12.741943359375, -12.2000732421875, -11.658203125, -11.1163330078125, -10.574462890625, -10.0325927734375, -9.49072265625, -8.9488525390625, -8.406982421875, -7.8651123046875, -7.3232421875, -6.7813720703125, -6.239501953125, -5.6976318359375, -5.15576171875, -4.6138916015625, -4.072021484375, -3.5301513671875, -2.98828125, -2.4464111328125, -1.904541015625, -1.3626708984375, -0.82080078125, -0.2789306640625, 0.262939453125, 0.8048095703125, 1.3466796875, 1.8885498046875, 2.430419921875, 2.9722900390625, 3.51416015625, 4.0560302734375, 4.597900390625, 5.1397705078125, 5.681640625, 6.2235107421875, 6.765380859375, 7.3072509765625, 7.84912109375, 8.3909912109375, 8.932861328125, 9.4747314453125, 10.0166015625, 10.5584716796875, 11.100341796875, 11.6422119140625, 12.18408203125, 12.7259521484375, 13.267822265625, 13.8096923828125, 14.3515625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 10.0, 5.0, 9.0, 18.0, 9.0, 10.0, 21.0, 35.0, 51.0, 55.0, 79.0, 101.0, 150.0, 197.0, 358.0, 436.0, 516.0, 505.0, 416.0, 340.0, 226.0, 149.0, 93.0, 68.0, 64.0, 35.0, 24.0, 23.0, 8.0, 19.0, 6.0, 8.0, 10.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-14.046875, -13.6575927734375, -13.268310546875, -12.8790283203125, -12.48974609375, -12.1004638671875, -11.711181640625, -11.3218994140625, -10.9326171875, -10.5433349609375, -10.154052734375, -9.7647705078125, -9.37548828125, -8.9862060546875, -8.596923828125, -8.2076416015625, -7.818359375, -7.4290771484375, -7.039794921875, -6.6505126953125, -6.26123046875, -5.8719482421875, -5.482666015625, -5.0933837890625, -4.7041015625, -4.3148193359375, -3.925537109375, -3.5362548828125, -3.14697265625, -2.7576904296875, -2.368408203125, -1.9791259765625, -1.58984375, -1.2005615234375, -0.811279296875, -0.4219970703125, -0.03271484375, 0.3565673828125, 0.745849609375, 1.1351318359375, 1.5244140625, 1.9136962890625, 2.302978515625, 2.6922607421875, 3.08154296875, 3.4708251953125, 3.860107421875, 4.2493896484375, 4.638671875, 5.0279541015625, 5.417236328125, 5.8065185546875, 6.19580078125, 6.5850830078125, 6.974365234375, 7.3636474609375, 7.7529296875, 8.1422119140625, 8.531494140625, 8.9207763671875, 9.31005859375, 9.6993408203125, 10.088623046875, 10.4779052734375, 10.8671875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 6.0, 5.0, 14.0, 17.0, 50.0, 206.0, 360.0, 232.0, 74.0, 24.0, 12.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-430.3618469238281, -422.3433532714844, -414.3248291015625, -406.30633544921875, -398.2878112792969, -390.2693176269531, -382.25079345703125, -374.2322998046875, -366.21380615234375, -358.1953125, -350.1767883300781, -342.1582946777344, -334.1397705078125, -326.12127685546875, -318.102783203125, -310.0842590332031, -302.06573486328125, -294.0472412109375, -286.0287170410156, -278.0102233886719, -269.99169921875, -261.97320556640625, -253.95469665527344, -245.93618774414062, -237.91769409179688, -229.89918518066406, -221.88067626953125, -213.8621826171875, -205.8436737060547, -197.82516479492188, -189.80665588378906, -181.78814697265625, -173.76963806152344, -165.75112915039062, -157.7326202392578, -149.714111328125, -141.69561767578125, -133.67710876464844, -125.65859985351562, -117.64009094238281, -109.62158966064453, -101.60308074951172, -93.58457946777344, -85.56607055664062, -77.54756164550781, -69.52906036376953, -61.51055145263672, -53.49204635620117, -45.473541259765625, -37.45503616333008, -29.4365291595459, -21.41802215576172, -13.399517059326172, -5.381011962890625, 2.6374969482421875, 10.656002044677734, 18.67450714111328, 26.693012237548828, 34.711517333984375, 42.73002624511719, 50.748531341552734, 58.76703643798828, 66.7855453491211, 74.80404663085938, 82.82255554199219]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 2.0, 4.0, 13.0, 9.0, 15.0, 14.0, 17.0, 16.0, 24.0, 30.0, 30.0, 32.0, 34.0, 30.0, 39.0, 40.0, 50.0, 47.0, 43.0, 31.0, 53.0, 48.0, 42.0, 43.0, 42.0, 34.0, 41.0, 28.0, 28.0, 18.0, 19.0, 19.0, 12.0, 6.0, 11.0, 8.0, 8.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-69.16143798828125, -67.0321044921875, -64.90277099609375, -62.773441314697266, -60.644107818603516, -58.514774322509766, -56.38544464111328, -54.25611114501953, -52.12677764892578, -49.99744415283203, -47.86811065673828, -45.7387809753418, -43.60944747924805, -41.4801139831543, -39.35078430175781, -37.22145080566406, -35.09211730957031, -32.96278381347656, -30.833452224731445, -28.704120635986328, -26.574787139892578, -24.445453643798828, -22.31612205505371, -20.186790466308594, -18.057456970214844, -15.92812442779541, -13.798791885375977, -11.669459342956543, -9.54012680053711, -7.410794258117676, -5.281461715698242, -3.1521291732788086, -1.022796630859375, 1.1065359115600586, 3.235868453979492, 5.365200996398926, 7.494533538818359, 9.623866081237793, 11.753198623657227, 13.88253116607666, 16.011863708496094, 18.141197204589844, 20.27052879333496, 22.399860382080078, 24.529193878173828, 26.658527374267578, 28.787858963012695, 30.917190551757812, 33.04652404785156, 35.17585754394531, 37.30519104003906, 39.43452072143555, 41.5638542175293, 43.69318771362305, 45.82251739501953, 47.95185089111328, 50.08118438720703, 52.21051788330078, 54.33985137939453, 56.469181060791016, 58.598514556884766, 60.727848052978516, 62.857177734375, 64.98651123046875, 67.1158447265625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 4.0, 6.0, 3.0, 12.0, 22.0, 36.0, 35.0, 64.0, 109.0, 167.0, 294.0, 521.0, 956.0, 1841.0, 3736.0, 7966.0, 17899.0, 43648.0, 113997.0, 301374.0, 334631.0, 132835.0, 50285.0, 20670.0, 8907.0, 4131.0, 1932.0, 1073.0, 590.0, 289.0, 181.0, 135.0, 69.0, 54.0, 33.0, 18.0, 18.0, 10.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4375, -9.1129150390625, -8.788330078125, -8.4637451171875, -8.13916015625, -7.8145751953125, -7.489990234375, -7.1654052734375, -6.8408203125, -6.5162353515625, -6.191650390625, -5.8670654296875, -5.54248046875, -5.2178955078125, -4.893310546875, -4.5687255859375, -4.244140625, -3.9195556640625, -3.594970703125, -3.2703857421875, -2.94580078125, -2.6212158203125, -2.296630859375, -1.9720458984375, -1.6474609375, -1.3228759765625, -0.998291015625, -0.6737060546875, -0.34912109375, -0.0245361328125, 0.300048828125, 0.6246337890625, 0.94921875, 1.2738037109375, 1.598388671875, 1.9229736328125, 2.24755859375, 2.5721435546875, 2.896728515625, 3.2213134765625, 3.5458984375, 3.8704833984375, 4.195068359375, 4.5196533203125, 4.84423828125, 5.1688232421875, 5.493408203125, 5.8179931640625, 6.142578125, 6.4671630859375, 6.791748046875, 7.1163330078125, 7.44091796875, 7.7655029296875, 8.090087890625, 8.4146728515625, 8.7392578125, 9.0638427734375, 9.388427734375, 9.7130126953125, 10.03759765625, 10.3621826171875, 10.686767578125, 11.0113525390625, 11.3359375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 10.0, 6.0, 5.0, 10.0, 11.0, 14.0, 21.0, 21.0, 33.0, 32.0, 45.0, 50.0, 41.0, 45.0, 66.0, 64.0, 74.0, 48.0, 53.0, 53.0, 44.0, 38.0, 34.0, 45.0, 32.0, 21.0, 28.0, 14.0, 12.0, 10.0, 6.0, 5.0, 2.0, 7.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1875, -8.88720703125, -8.5869140625, -8.28662109375, -7.986328125, -7.68603515625, -7.3857421875, -7.08544921875, -6.78515625, -6.48486328125, -6.1845703125, -5.88427734375, -5.583984375, -5.28369140625, -4.9833984375, -4.68310546875, -4.3828125, -4.08251953125, -3.7822265625, -3.48193359375, -3.181640625, -2.88134765625, -2.5810546875, -2.28076171875, -1.98046875, -1.68017578125, -1.3798828125, -1.07958984375, -0.779296875, -0.47900390625, -0.1787109375, 0.12158203125, 0.421875, 0.72216796875, 1.0224609375, 1.32275390625, 1.623046875, 1.92333984375, 2.2236328125, 2.52392578125, 2.82421875, 3.12451171875, 3.4248046875, 3.72509765625, 4.025390625, 4.32568359375, 4.6259765625, 4.92626953125, 5.2265625, 5.52685546875, 5.8271484375, 6.12744140625, 6.427734375, 6.72802734375, 7.0283203125, 7.32861328125, 7.62890625, 7.92919921875, 8.2294921875, 8.52978515625, 8.830078125, 9.13037109375, 9.4306640625, 9.73095703125, 10.03125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 4.0, 9.0, 14.0, 14.0, 26.0, 27.0, 51.0, 62.0, 96.0, 115.0, 165.0, 254.0, 410.0, 633.0, 1105.0, 1989.0, 4755.0, 15513.0, 89334.0, 778773.0, 125332.0, 19513.0, 5398.0, 2080.0, 1050.0, 598.0, 401.0, 262.0, 152.0, 110.0, 94.0, 66.0, 42.0, 32.0, 16.0, 15.0, 12.0, 9.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.03125, -21.39404296875, -20.7568359375, -20.11962890625, -19.482421875, -18.84521484375, -18.2080078125, -17.57080078125, -16.93359375, -16.29638671875, -15.6591796875, -15.02197265625, -14.384765625, -13.74755859375, -13.1103515625, -12.47314453125, -11.8359375, -11.19873046875, -10.5615234375, -9.92431640625, -9.287109375, -8.64990234375, -8.0126953125, -7.37548828125, -6.73828125, -6.10107421875, -5.4638671875, -4.82666015625, -4.189453125, -3.55224609375, -2.9150390625, -2.27783203125, -1.640625, -1.00341796875, -0.3662109375, 0.27099609375, 0.908203125, 1.54541015625, 2.1826171875, 2.81982421875, 3.45703125, 4.09423828125, 4.7314453125, 5.36865234375, 6.005859375, 6.64306640625, 7.2802734375, 7.91748046875, 8.5546875, 9.19189453125, 9.8291015625, 10.46630859375, 11.103515625, 11.74072265625, 12.3779296875, 13.01513671875, 13.65234375, 14.28955078125, 14.9267578125, 15.56396484375, 16.201171875, 16.83837890625, 17.4755859375, 18.11279296875, 18.75]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 5.0, 7.0, 5.0, 15.0, 15.0, 14.0, 18.0, 32.0, 25.0, 39.0, 49.0, 60.0, 64.0, 60.0, 57.0, 49.0, 62.0, 68.0, 70.0, 54.0, 41.0, 37.0, 25.0, 25.0, 21.0, 17.0, 14.0, 13.0, 12.0, 6.0, 5.0, 2.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.90625, -35.849609375, -34.79296875, -33.736328125, -32.6796875, -31.623046875, -30.56640625, -29.509765625, -28.453125, -27.396484375, -26.33984375, -25.283203125, -24.2265625, -23.169921875, -22.11328125, -21.056640625, -20.0, -18.943359375, -17.88671875, -16.830078125, -15.7734375, -14.716796875, -13.66015625, -12.603515625, -11.546875, -10.490234375, -9.43359375, -8.376953125, -7.3203125, -6.263671875, -5.20703125, -4.150390625, -3.09375, -2.037109375, -0.98046875, 0.076171875, 1.1328125, 2.189453125, 3.24609375, 4.302734375, 5.359375, 6.416015625, 7.47265625, 8.529296875, 9.5859375, 10.642578125, 11.69921875, 12.755859375, 13.8125, 14.869140625, 15.92578125, 16.982421875, 18.0390625, 19.095703125, 20.15234375, 21.208984375, 22.265625, 23.322265625, 24.37890625, 25.435546875, 26.4921875, 27.548828125, 28.60546875, 29.662109375, 30.71875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 5.0, 4.0, 12.0, 13.0, 15.0, 24.0, 22.0, 37.0, 37.0, 62.0, 77.0, 102.0, 148.0, 257.0, 426.0, 704.0, 1405.0, 2967.0, 7148.0, 21369.0, 87257.0, 731170.0, 147576.0, 30481.0, 9523.0, 3735.0, 1696.0, 887.0, 480.0, 278.0, 176.0, 115.0, 68.0, 70.0, 44.0, 41.0, 34.0, 18.0, 16.0, 10.0, 8.0, 9.0, 4.0, 6.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.93359375, -2.843719482421875, -2.75384521484375, -2.663970947265625, -2.5740966796875, -2.484222412109375, -2.39434814453125, -2.304473876953125, -2.214599609375, -2.124725341796875, -2.03485107421875, -1.944976806640625, -1.8551025390625, -1.765228271484375, -1.67535400390625, -1.585479736328125, -1.49560546875, -1.405731201171875, -1.31585693359375, -1.225982666015625, -1.1361083984375, -1.046234130859375, -0.95635986328125, -0.866485595703125, -0.776611328125, -0.686737060546875, -0.59686279296875, -0.506988525390625, -0.4171142578125, -0.327239990234375, -0.23736572265625, -0.147491455078125, -0.0576171875, 0.032257080078125, 0.12213134765625, 0.212005615234375, 0.3018798828125, 0.391754150390625, 0.48162841796875, 0.571502685546875, 0.661376953125, 0.751251220703125, 0.84112548828125, 0.930999755859375, 1.0208740234375, 1.110748291015625, 1.20062255859375, 1.290496826171875, 1.38037109375, 1.470245361328125, 1.56011962890625, 1.649993896484375, 1.7398681640625, 1.829742431640625, 1.91961669921875, 2.009490966796875, 2.099365234375, 2.189239501953125, 2.27911376953125, 2.368988037109375, 2.4588623046875, 2.548736572265625, 2.63861083984375, 2.728485107421875, 2.818359375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 3.0, 6.0, 5.0, 9.0, 6.0, 11.0, 14.0, 27.0, 28.0, 40.0, 58.0, 102.0, 136.0, 143.0, 128.0, 65.0, 51.0, 31.0, 27.0, 18.0, 19.0, 8.0, 9.0, 6.0, 8.0, 4.0, 5.0, 4.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0008645057678222656, -0.0008338764309883118, -0.0008032470941543579, -0.000772617757320404, -0.0007419884204864502, -0.0007113590836524963, -0.0006807297468185425, -0.0006501004099845886, -0.0006194710731506348, -0.0005888417363166809, -0.000558212399482727, -0.0005275830626487732, -0.0004969537258148193, -0.0004663243889808655, -0.0004356950521469116, -0.00040506571531295776, -0.0003744363784790039, -0.00034380704164505005, -0.0003131777048110962, -0.00028254836797714233, -0.0002519190311431885, -0.00022128969430923462, -0.00019066035747528076, -0.0001600310206413269, -0.00012940168380737305, -9.877234697341919e-05, -6.814301013946533e-05, -3.7513673305511475e-05, -6.884336471557617e-06, 2.374500036239624e-05, 5.43743371963501e-05, 8.500367403030396e-05, 0.00011563301086425781, 0.00014626234769821167, 0.00017689168453216553, 0.00020752102136611938, 0.00023815035820007324, 0.0002687796950340271, 0.00029940903186798096, 0.0003300383687019348, 0.00036066770553588867, 0.00039129704236984253, 0.0004219263792037964, 0.00045255571603775024, 0.0004831850528717041, 0.000513814389705658, 0.0005444437265396118, 0.0005750730633735657, 0.0006057024002075195, 0.0006363317370414734, 0.0006669610738754272, 0.0006975904107093811, 0.000728219747543335, 0.0007588490843772888, 0.0007894784212112427, 0.0008201077580451965, 0.0008507370948791504, 0.0008813664317131042, 0.0009119957685470581, 0.000942625105381012, 0.0009732544422149658, 0.0010038837790489197, 0.0010345131158828735, 0.0010651424527168274, 0.0010957717895507812]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 9.0, 9.0, 13.0, 27.0, 41.0, 52.0, 85.0, 87.0, 135.0, 210.0, 301.0, 552.0, 964.0, 1802.0, 3889.0, 9427.0, 29483.0, 134686.0, 706339.0, 117205.0, 26585.0, 8697.0, 3673.0, 1814.0, 993.0, 549.0, 329.0, 183.0, 136.0, 76.0, 62.0, 40.0, 28.0, 16.0, 18.0, 6.0, 7.0, 10.0, 5.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.201171875, -3.113372802734375, -3.02557373046875, -2.937774658203125, -2.8499755859375, -2.762176513671875, -2.67437744140625, -2.586578369140625, -2.498779296875, -2.410980224609375, -2.32318115234375, -2.235382080078125, -2.1475830078125, -2.059783935546875, -1.97198486328125, -1.884185791015625, -1.79638671875, -1.708587646484375, -1.62078857421875, -1.532989501953125, -1.4451904296875, -1.357391357421875, -1.26959228515625, -1.181793212890625, -1.093994140625, -1.006195068359375, -0.91839599609375, -0.830596923828125, -0.7427978515625, -0.654998779296875, -0.56719970703125, -0.479400634765625, -0.3916015625, -0.303802490234375, -0.21600341796875, -0.128204345703125, -0.0404052734375, 0.047393798828125, 0.13519287109375, 0.222991943359375, 0.310791015625, 0.398590087890625, 0.48638916015625, 0.574188232421875, 0.6619873046875, 0.749786376953125, 0.83758544921875, 0.925384521484375, 1.01318359375, 1.100982666015625, 1.18878173828125, 1.276580810546875, 1.3643798828125, 1.452178955078125, 1.53997802734375, 1.627777099609375, 1.715576171875, 1.803375244140625, 1.89117431640625, 1.978973388671875, 2.0667724609375, 2.154571533203125, 2.24237060546875, 2.330169677734375, 2.41796875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 5.0, 9.0, 1.0, 8.0, 15.0, 11.0, 23.0, 19.0, 27.0, 39.0, 41.0, 55.0, 53.0, 65.0, 94.0, 88.0, 72.0, 58.0, 62.0, 43.0, 29.0, 35.0, 31.0, 28.0, 17.0, 14.0, 16.0, 9.0, 5.0, 10.0, 6.0, 7.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.23828125, -3.14105224609375, -3.0438232421875, -2.94659423828125, -2.849365234375, -2.75213623046875, -2.6549072265625, -2.55767822265625, -2.46044921875, -2.36322021484375, -2.2659912109375, -2.16876220703125, -2.071533203125, -1.97430419921875, -1.8770751953125, -1.77984619140625, -1.6826171875, -1.58538818359375, -1.4881591796875, -1.39093017578125, -1.293701171875, -1.19647216796875, -1.0992431640625, -1.00201416015625, -0.90478515625, -0.80755615234375, -0.7103271484375, -0.61309814453125, -0.515869140625, -0.41864013671875, -0.3214111328125, -0.22418212890625, -0.126953125, -0.02972412109375, 0.0675048828125, 0.16473388671875, 0.261962890625, 0.35919189453125, 0.4564208984375, 0.55364990234375, 0.65087890625, 0.74810791015625, 0.8453369140625, 0.94256591796875, 1.039794921875, 1.13702392578125, 1.2342529296875, 1.33148193359375, 1.4287109375, 1.52593994140625, 1.6231689453125, 1.72039794921875, 1.817626953125, 1.91485595703125, 2.0120849609375, 2.10931396484375, 2.20654296875, 2.30377197265625, 2.4010009765625, 2.49822998046875, 2.595458984375, 2.69268798828125, 2.7899169921875, 2.88714599609375, 2.984375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 7.0, 8.0, 23.0, 48.0, 128.0, 373.0, 262.0, 93.0, 34.0, 16.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.67706298828125, -138.86956787109375, -133.06207275390625, -127.25458526611328, -121.44709777832031, -115.63960266113281, -109.83210754394531, -104.02461242675781, -98.21712493896484, -92.40962982177734, -86.60214233398438, -80.79464721679688, -74.98715209960938, -69.1796646118164, -63.372169494628906, -57.56467819213867, -51.75718688964844, -45.9496955871582, -40.14220428466797, -34.33470916748047, -28.527217864990234, -22.7197265625, -16.9122314453125, -11.104740142822266, -5.297248840332031, 0.5102434158325195, 6.31773567199707, 12.125228881835938, 17.932720184326172, 23.740211486816406, 29.547706604003906, 35.35519790649414, 41.162689208984375, 46.97018051147461, 52.777671813964844, 58.585166931152344, 64.39265441894531, 70.20014953613281, 76.00764465332031, 81.81513977050781, 87.62262725830078, 93.43012237548828, 99.23760986328125, 105.04510498046875, 110.85260009765625, 116.66008758544922, 122.46758270263672, 128.2750701904297, 134.0825653076172, 139.8900604248047, 145.6975555419922, 151.50503540039062, 157.31253051757812, 163.12002563476562, 168.92752075195312, 174.73501586914062, 180.54251098632812, 186.35000610351562, 192.15750122070312, 197.96499633789062, 203.77247619628906, 209.57997131347656, 215.38746643066406, 221.19496154785156, 227.00244140625]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 0.0, 3.0, 3.0, 4.0, 4.0, 7.0, 13.0, 8.0, 15.0, 12.0, 22.0, 24.0, 38.0, 31.0, 32.0, 46.0, 47.0, 80.0, 123.0, 123.0, 78.0, 45.0, 47.0, 38.0, 21.0, 26.0, 20.0, 18.0, 12.0, 13.0, 12.0, 9.0, 6.0, 4.0, 8.0, 8.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-124.669677734375, -121.20639038085938, -117.74310302734375, -114.27981567382812, -110.8165283203125, -107.35324096679688, -103.88995361328125, -100.42666625976562, -96.96337890625, -93.50009155273438, -90.03680419921875, -86.57351684570312, -83.1102294921875, -79.64694213867188, -76.18365478515625, -72.72036743164062, -69.257080078125, -65.79379272460938, -62.33050537109375, -58.867218017578125, -55.4039306640625, -51.940643310546875, -48.47735595703125, -45.014068603515625, -41.55078125, -38.087493896484375, -34.62420654296875, -31.160919189453125, -27.6976318359375, -24.234344482421875, -20.77105712890625, -17.307769775390625, -13.844490051269531, -10.381202697753906, -6.917915344238281, -3.4546279907226562, 0.00865936279296875, 3.4719467163085938, 6.935234069824219, 10.398521423339844, 13.861808776855469, 17.325096130371094, 20.78838348388672, 24.251670837402344, 27.71495819091797, 31.178245544433594, 34.64153289794922, 38.104820251464844, 41.56810760498047, 45.031394958496094, 48.49468231201172, 51.957969665527344, 55.42125701904297, 58.884544372558594, 62.34783172607422, 65.81111907958984, 69.27440643310547, 72.7376937866211, 76.20098114013672, 79.66426849365234, 83.12755584716797, 86.5908432006836, 90.05413055419922, 93.51741790771484, 96.98070526123047]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 2.0, 6.0, 21.0, 19.0, 19.0, 31.0, 39.0, 71.0, 97.0, 151.0, 187.0, 361.0, 581.0, 1122.0, 2499.0, 7288.0, 23337.0, 114692.0, 714617.0, 2202311.0, 931879.0, 156166.0, 26354.0, 7059.0, 2476.0, 1150.0, 676.0, 376.0, 200.0, 153.0, 98.0, 55.0, 63.0, 40.0, 22.0, 17.0, 10.0, 10.0, 9.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.7421875, -10.390869140625, -10.03955078125, -9.688232421875, -9.3369140625, -8.985595703125, -8.63427734375, -8.282958984375, -7.931640625, -7.580322265625, -7.22900390625, -6.877685546875, -6.5263671875, -6.175048828125, -5.82373046875, -5.472412109375, -5.12109375, -4.769775390625, -4.41845703125, -4.067138671875, -3.7158203125, -3.364501953125, -3.01318359375, -2.661865234375, -2.310546875, -1.959228515625, -1.60791015625, -1.256591796875, -0.9052734375, -0.553955078125, -0.20263671875, 0.148681640625, 0.5, 0.851318359375, 1.20263671875, 1.553955078125, 1.9052734375, 2.256591796875, 2.60791015625, 2.959228515625, 3.310546875, 3.661865234375, 4.01318359375, 4.364501953125, 4.7158203125, 5.067138671875, 5.41845703125, 5.769775390625, 6.12109375, 6.472412109375, 6.82373046875, 7.175048828125, 7.5263671875, 7.877685546875, 8.22900390625, 8.580322265625, 8.931640625, 9.282958984375, 9.63427734375, 9.985595703125, 10.3369140625, 10.688232421875, 11.03955078125, 11.390869140625, 11.7421875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 5.0, 10.0, 11.0, 13.0, 22.0, 16.0, 28.0, 26.0, 43.0, 49.0, 45.0, 57.0, 60.0, 67.0, 78.0, 49.0, 57.0, 54.0, 59.0, 58.0, 37.0, 35.0, 20.0, 29.0, 17.0, 9.0, 14.0, 8.0, 4.0, 5.0, 3.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1953125, -8.8955078125, -8.595703125, -8.2958984375, -7.99609375, -7.6962890625, -7.396484375, -7.0966796875, -6.796875, -6.4970703125, -6.197265625, -5.8974609375, -5.59765625, -5.2978515625, -4.998046875, -4.6982421875, -4.3984375, -4.0986328125, -3.798828125, -3.4990234375, -3.19921875, -2.8994140625, -2.599609375, -2.2998046875, -2.0, -1.7001953125, -1.400390625, -1.1005859375, -0.80078125, -0.5009765625, -0.201171875, 0.0986328125, 0.3984375, 0.6982421875, 0.998046875, 1.2978515625, 1.59765625, 1.8974609375, 2.197265625, 2.4970703125, 2.796875, 3.0966796875, 3.396484375, 3.6962890625, 3.99609375, 4.2958984375, 4.595703125, 4.8955078125, 5.1953125, 5.4951171875, 5.794921875, 6.0947265625, 6.39453125, 6.6943359375, 6.994140625, 7.2939453125, 7.59375, 7.8935546875, 8.193359375, 8.4931640625, 8.79296875, 9.0927734375, 9.392578125, 9.6923828125, 9.9921875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 2.0, 5.0, 5.0, 12.0, 20.0, 14.0, 35.0, 80.0, 140.0, 244.0, 512.0, 1594.0, 7881.0, 439948.0, 3722576.0, 17075.0, 2566.0, 827.0, 323.0, 170.0, 80.0, 58.0, 37.0, 25.0, 16.0, 8.0, 5.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.28125, -36.87109375, -35.4609375, -34.05078125, -32.640625, -31.23046875, -29.8203125, -28.41015625, -27.0, -25.58984375, -24.1796875, -22.76953125, -21.359375, -19.94921875, -18.5390625, -17.12890625, -15.71875, -14.30859375, -12.8984375, -11.48828125, -10.078125, -8.66796875, -7.2578125, -5.84765625, -4.4375, -3.02734375, -1.6171875, -0.20703125, 1.203125, 2.61328125, 4.0234375, 5.43359375, 6.84375, 8.25390625, 9.6640625, 11.07421875, 12.484375, 13.89453125, 15.3046875, 16.71484375, 18.125, 19.53515625, 20.9453125, 22.35546875, 23.765625, 25.17578125, 26.5859375, 27.99609375, 29.40625, 30.81640625, 32.2265625, 33.63671875, 35.046875, 36.45703125, 37.8671875, 39.27734375, 40.6875, 42.09765625, 43.5078125, 44.91796875, 46.328125, 47.73828125, 49.1484375, 50.55859375, 51.96875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 4.0, 4.0, 3.0, 6.0, 11.0, 16.0, 20.0, 24.0, 40.0, 72.0, 99.0, 173.0, 316.0, 533.0, 709.0, 754.0, 475.0, 304.0, 174.0, 111.0, 74.0, 44.0, 39.0, 20.0, 11.0, 7.0, 6.0, 5.0, 7.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.234375, -20.47216796875, -19.7099609375, -18.94775390625, -18.185546875, -17.42333984375, -16.6611328125, -15.89892578125, -15.13671875, -14.37451171875, -13.6123046875, -12.85009765625, -12.087890625, -11.32568359375, -10.5634765625, -9.80126953125, -9.0390625, -8.27685546875, -7.5146484375, -6.75244140625, -5.990234375, -5.22802734375, -4.4658203125, -3.70361328125, -2.94140625, -2.17919921875, -1.4169921875, -0.65478515625, 0.107421875, 0.86962890625, 1.6318359375, 2.39404296875, 3.15625, 3.91845703125, 4.6806640625, 5.44287109375, 6.205078125, 6.96728515625, 7.7294921875, 8.49169921875, 9.25390625, 10.01611328125, 10.7783203125, 11.54052734375, 12.302734375, 13.06494140625, 13.8271484375, 14.58935546875, 15.3515625, 16.11376953125, 16.8759765625, 17.63818359375, 18.400390625, 19.16259765625, 19.9248046875, 20.68701171875, 21.44921875, 22.21142578125, 22.9736328125, 23.73583984375, 24.498046875, 25.26025390625, 26.0224609375, 26.78466796875, 27.546875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 10.0, 4.0, 29.0, 49.0, 110.0, 234.0, 265.0, 158.0, 68.0, 23.0, 26.0, 8.0, 7.0, 4.0, 2.0, 2.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-179.176513671875, -169.78628540039062, -160.39605712890625, -151.00582885742188, -141.6156005859375, -132.22537231445312, -122.83515930175781, -113.44493103027344, -104.05470275878906, -94.66447448730469, -85.27424621582031, -75.88402557373047, -66.4937973022461, -57.10356903076172, -47.71334457397461, -38.3231201171875, -28.932891845703125, -19.542665481567383, -10.15243911743164, -0.7622127532958984, 8.628013610839844, 18.01824188232422, 27.408466339111328, 36.79869079589844, 46.18891906738281, 55.57914733886719, 64.96937561035156, 74.3595962524414, 83.74982452392578, 93.14005279541016, 102.5302734375, 111.92050170898438, 121.31072998046875, 130.70095825195312, 140.0911865234375, 149.48141479492188, 158.87164306640625, 168.26187133789062, 177.65208435058594, 187.0423126220703, 196.4325408935547, 205.82276916503906, 215.21299743652344, 224.6032257080078, 233.99343872070312, 243.3836669921875, 252.77389526367188, 262.16412353515625, 271.5543518066406, 280.944580078125, 290.3348083496094, 299.72503662109375, 309.1152648925781, 318.5054931640625, 327.8957214355469, 337.28594970703125, 346.6761474609375, 356.0663757324219, 365.45660400390625, 374.8468322753906, 384.237060546875, 393.6272888183594, 403.01751708984375, 412.40771484375, 421.7979736328125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 3.0, 5.0, 6.0, 12.0, 10.0, 9.0, 14.0, 25.0, 24.0, 13.0, 23.0, 20.0, 34.0, 41.0, 34.0, 45.0, 41.0, 43.0, 48.0, 63.0, 63.0, 54.0, 50.0, 43.0, 33.0, 37.0, 43.0, 27.0, 19.0, 31.0, 10.0, 21.0, 14.0, 8.0, 5.0, 3.0, 0.0, 3.0, 4.0, 0.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-120.64923095703125, -117.22179412841797, -113.79436492919922, -110.36692810058594, -106.93949890136719, -103.5120620727539, -100.08462524414062, -96.65719604492188, -93.22976684570312, -89.80233001708984, -86.3749008178711, -82.94746398925781, -79.52003479003906, -76.09259796142578, -72.6651611328125, -69.23773193359375, -65.81029510498047, -62.38286209106445, -58.95542907714844, -55.527992248535156, -52.100563049316406, -48.673126220703125, -45.24569320678711, -41.818260192871094, -38.39082717895508, -34.96339416503906, -31.535961151123047, -28.1085262298584, -24.681093215942383, -21.253660202026367, -17.82622528076172, -14.398792266845703, -10.971359252929688, -7.543925762176514, -4.11649227142334, -0.6890583038330078, 2.738374710083008, 6.165807723999023, 9.593242645263672, 13.020675659179688, 16.448108673095703, 19.87554168701172, 23.302974700927734, 26.730409622192383, 30.1578426361084, 33.58527374267578, 37.01271057128906, 40.44014358520508, 43.867576599121094, 47.29500961303711, 50.722442626953125, 54.149879455566406, 57.577308654785156, 61.00474548339844, 64.43217468261719, 67.85961151123047, 71.28704833984375, 74.71448516845703, 78.14191436767578, 81.56935119628906, 84.99678039550781, 88.4242172241211, 91.85165405273438, 95.27908325195312, 98.70651245117188]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 13.0, 20.0, 31.0, 44.0, 55.0, 88.0, 144.0, 208.0, 358.0, 535.0, 980.0, 1788.0, 3626.0, 7714.0, 19449.0, 55368.0, 186300.0, 480831.0, 196207.0, 58528.0, 19964.0, 8097.0, 3801.0, 1881.0, 1035.0, 527.0, 362.0, 183.0, 125.0, 83.0, 54.0, 40.0, 19.0, 19.0, 12.0, 5.0, 15.0, 10.0, 5.0, 3.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.2890625, -9.962646484375, -9.63623046875, -9.309814453125, -8.9833984375, -8.656982421875, -8.33056640625, -8.004150390625, -7.677734375, -7.351318359375, -7.02490234375, -6.698486328125, -6.3720703125, -6.045654296875, -5.71923828125, -5.392822265625, -5.06640625, -4.739990234375, -4.41357421875, -4.087158203125, -3.7607421875, -3.434326171875, -3.10791015625, -2.781494140625, -2.455078125, -2.128662109375, -1.80224609375, -1.475830078125, -1.1494140625, -0.822998046875, -0.49658203125, -0.170166015625, 0.15625, 0.482666015625, 0.80908203125, 1.135498046875, 1.4619140625, 1.788330078125, 2.11474609375, 2.441162109375, 2.767578125, 3.093994140625, 3.42041015625, 3.746826171875, 4.0732421875, 4.399658203125, 4.72607421875, 5.052490234375, 5.37890625, 5.705322265625, 6.03173828125, 6.358154296875, 6.6845703125, 7.010986328125, 7.33740234375, 7.663818359375, 7.990234375, 8.316650390625, 8.64306640625, 8.969482421875, 9.2958984375, 9.622314453125, 9.94873046875, 10.275146484375, 10.6015625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 4.0, 3.0, 8.0, 9.0, 12.0, 13.0, 15.0, 34.0, 17.0, 19.0, 34.0, 42.0, 56.0, 48.0, 45.0, 57.0, 43.0, 57.0, 66.0, 55.0, 46.0, 58.0, 61.0, 35.0, 34.0, 27.0, 30.0, 19.0, 18.0, 11.0, 6.0, 4.0, 2.0, 3.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.625, -8.3314208984375, -8.037841796875, -7.7442626953125, -7.45068359375, -7.1571044921875, -6.863525390625, -6.5699462890625, -6.2763671875, -5.9827880859375, -5.689208984375, -5.3956298828125, -5.10205078125, -4.8084716796875, -4.514892578125, -4.2213134765625, -3.927734375, -3.6341552734375, -3.340576171875, -3.0469970703125, -2.75341796875, -2.4598388671875, -2.166259765625, -1.8726806640625, -1.5791015625, -1.2855224609375, -0.991943359375, -0.6983642578125, -0.40478515625, -0.1112060546875, 0.182373046875, 0.4759521484375, 0.76953125, 1.0631103515625, 1.356689453125, 1.6502685546875, 1.94384765625, 2.2374267578125, 2.531005859375, 2.8245849609375, 3.1181640625, 3.4117431640625, 3.705322265625, 3.9989013671875, 4.29248046875, 4.5860595703125, 4.879638671875, 5.1732177734375, 5.466796875, 5.7603759765625, 6.053955078125, 6.3475341796875, 6.64111328125, 6.9346923828125, 7.228271484375, 7.5218505859375, 7.8154296875, 8.1090087890625, 8.402587890625, 8.6961669921875, 8.98974609375, 9.2833251953125, 9.576904296875, 9.8704833984375, 10.1640625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 7.0, 7.0, 8.0, 7.0, 14.0, 16.0, 33.0, 41.0, 44.0, 86.0, 122.0, 159.0, 284.0, 526.0, 1114.0, 2999.0, 14886.0, 227806.0, 755578.0, 36545.0, 4992.0, 1568.0, 677.0, 373.0, 201.0, 140.0, 77.0, 57.0, 53.0, 36.0, 24.0, 11.0, 17.0, 14.0, 10.0, 4.0, 4.0, 1.0, 5.0, 4.0, 2.0, 1.0, 1.0], "bins": [-19.046875, -18.5609130859375, -18.074951171875, -17.5889892578125, -17.10302734375, -16.6170654296875, -16.131103515625, -15.6451416015625, -15.1591796875, -14.6732177734375, -14.187255859375, -13.7012939453125, -13.21533203125, -12.7293701171875, -12.243408203125, -11.7574462890625, -11.271484375, -10.7855224609375, -10.299560546875, -9.8135986328125, -9.32763671875, -8.8416748046875, -8.355712890625, -7.8697509765625, -7.3837890625, -6.8978271484375, -6.411865234375, -5.9259033203125, -5.43994140625, -4.9539794921875, -4.468017578125, -3.9820556640625, -3.49609375, -3.0101318359375, -2.524169921875, -2.0382080078125, -1.55224609375, -1.0662841796875, -0.580322265625, -0.0943603515625, 0.3916015625, 0.8775634765625, 1.363525390625, 1.8494873046875, 2.33544921875, 2.8214111328125, 3.307373046875, 3.7933349609375, 4.279296875, 4.7652587890625, 5.251220703125, 5.7371826171875, 6.22314453125, 6.7091064453125, 7.195068359375, 7.6810302734375, 8.1669921875, 8.6529541015625, 9.138916015625, 9.6248779296875, 10.11083984375, 10.5968017578125, 11.082763671875, 11.5687255859375, 12.0546875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 0.0, 6.0, 4.0, 9.0, 11.0, 7.0, 16.0, 13.0, 15.0, 15.0, 19.0, 18.0, 29.0, 24.0, 35.0, 38.0, 38.0, 51.0, 56.0, 66.0, 69.0, 61.0, 54.0, 42.0, 38.0, 36.0, 42.0, 20.0, 36.0, 18.0, 17.0, 12.0, 11.0, 14.0, 9.0, 11.0, 8.0, 7.0, 6.0, 7.0, 5.0, 1.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.0625, -25.207763671875, -24.35302734375, -23.498291015625, -22.6435546875, -21.788818359375, -20.93408203125, -20.079345703125, -19.224609375, -18.369873046875, -17.51513671875, -16.660400390625, -15.8056640625, -14.950927734375, -14.09619140625, -13.241455078125, -12.38671875, -11.531982421875, -10.67724609375, -9.822509765625, -8.9677734375, -8.113037109375, -7.25830078125, -6.403564453125, -5.548828125, -4.694091796875, -3.83935546875, -2.984619140625, -2.1298828125, -1.275146484375, -0.42041015625, 0.434326171875, 1.2890625, 2.143798828125, 2.99853515625, 3.853271484375, 4.7080078125, 5.562744140625, 6.41748046875, 7.272216796875, 8.126953125, 8.981689453125, 9.83642578125, 10.691162109375, 11.5458984375, 12.400634765625, 13.25537109375, 14.110107421875, 14.96484375, 15.819580078125, 16.67431640625, 17.529052734375, 18.3837890625, 19.238525390625, 20.09326171875, 20.947998046875, 21.802734375, 22.657470703125, 23.51220703125, 24.366943359375, 25.2216796875, 26.076416015625, 26.93115234375, 27.785888671875, 28.640625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 10.0, 12.0, 18.0, 18.0, 30.0, 48.0, 86.0, 154.0, 312.0, 829.0, 3101.0, 18170.0, 839739.0, 171347.0, 11164.0, 2213.0, 690.0, 282.0, 125.0, 64.0, 44.0, 27.0, 19.0, 10.0, 13.0, 7.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.205078125, -3.113189697265625, -3.02130126953125, -2.929412841796875, -2.8375244140625, -2.745635986328125, -2.65374755859375, -2.561859130859375, -2.469970703125, -2.378082275390625, -2.28619384765625, -2.194305419921875, -2.1024169921875, -2.010528564453125, -1.91864013671875, -1.826751708984375, -1.73486328125, -1.642974853515625, -1.55108642578125, -1.459197998046875, -1.3673095703125, -1.275421142578125, -1.18353271484375, -1.091644287109375, -0.999755859375, -0.907867431640625, -0.81597900390625, -0.724090576171875, -0.6322021484375, -0.540313720703125, -0.44842529296875, -0.356536865234375, -0.2646484375, -0.172760009765625, -0.08087158203125, 0.011016845703125, 0.1029052734375, 0.194793701171875, 0.28668212890625, 0.378570556640625, 0.470458984375, 0.562347412109375, 0.65423583984375, 0.746124267578125, 0.8380126953125, 0.929901123046875, 1.02178955078125, 1.113677978515625, 1.20556640625, 1.297454833984375, 1.38934326171875, 1.481231689453125, 1.5731201171875, 1.665008544921875, 1.75689697265625, 1.848785400390625, 1.940673828125, 2.032562255859375, 2.12445068359375, 2.216339111328125, 2.3082275390625, 2.400115966796875, 2.49200439453125, 2.583892822265625, 2.67578125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 6.0, 12.0, 5.0, 15.0, 14.0, 27.0, 30.0, 41.0, 60.0, 99.0, 111.0, 134.0, 128.0, 81.0, 62.0, 35.0, 24.0, 26.0, 21.0, 14.0, 9.0, 10.0, 8.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006089210510253906, -0.0005906447768211365, -0.0005723685026168823, -0.0005540922284126282, -0.000535815954208374, -0.0005175396800041199, -0.0004992634057998657, -0.00048098713159561157, -0.0004627108573913574, -0.00044443458318710327, -0.0004261583089828491, -0.00040788203477859497, -0.0003896057605743408, -0.00037132948637008667, -0.0003530532121658325, -0.00033477693796157837, -0.0003165006637573242, -0.00029822438955307007, -0.0002799481153488159, -0.00026167184114456177, -0.00024339556694030762, -0.00022511929273605347, -0.00020684301853179932, -0.00018856674432754517, -0.00017029047012329102, -0.00015201419591903687, -0.00013373792171478271, -0.00011546164751052856, -9.718537330627441e-05, -7.890909910202026e-05, -6.063282489776611e-05, -4.235655069351196e-05, -2.4080276489257812e-05, -5.804002285003662e-06, 1.2472271919250488e-05, 3.074854612350464e-05, 4.902482032775879e-05, 6.730109453201294e-05, 8.557736873626709e-05, 0.00010385364294052124, 0.0001221299171447754, 0.00014040619134902954, 0.0001586824655532837, 0.00017695873975753784, 0.000195235013961792, 0.00021351128816604614, 0.0002317875623703003, 0.00025006383657455444, 0.0002683401107788086, 0.00028661638498306274, 0.0003048926591873169, 0.00032316893339157104, 0.0003414452075958252, 0.00035972148180007935, 0.0003779977560043335, 0.00039627403020858765, 0.0004145503044128418, 0.00043282657861709595, 0.0004511028528213501, 0.00046937912702560425, 0.0004876554012298584, 0.0005059316754341125, 0.0005242079496383667, 0.0005424842238426208, 0.000560760498046875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 13.0, 9.0, 15.0, 27.0, 35.0, 42.0, 65.0, 102.0, 151.0, 262.0, 449.0, 869.0, 1586.0, 3482.0, 8536.0, 24401.0, 106493.0, 766216.0, 97161.0, 23578.0, 8107.0, 3332.0, 1629.0, 765.0, 498.0, 236.0, 173.0, 86.0, 68.0, 36.0, 29.0, 30.0, 18.0, 8.0, 6.0, 9.0, 9.0, 2.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2998046875, -1.2571563720703125, -1.214508056640625, -1.1718597412109375, -1.12921142578125, -1.0865631103515625, -1.043914794921875, -1.0012664794921875, -0.9586181640625, -0.9159698486328125, -0.873321533203125, -0.8306732177734375, -0.78802490234375, -0.7453765869140625, -0.702728271484375, -0.6600799560546875, -0.617431640625, -0.5747833251953125, -0.532135009765625, -0.4894866943359375, -0.44683837890625, -0.4041900634765625, -0.361541748046875, -0.3188934326171875, -0.2762451171875, -0.2335968017578125, -0.190948486328125, -0.1483001708984375, -0.10565185546875, -0.0630035400390625, -0.020355224609375, 0.0222930908203125, 0.06494140625, 0.1075897216796875, 0.150238037109375, 0.1928863525390625, 0.23553466796875, 0.2781829833984375, 0.320831298828125, 0.3634796142578125, 0.4061279296875, 0.4487762451171875, 0.491424560546875, 0.5340728759765625, 0.57672119140625, 0.6193695068359375, 0.662017822265625, 0.7046661376953125, 0.747314453125, 0.7899627685546875, 0.832611083984375, 0.8752593994140625, 0.91790771484375, 0.9605560302734375, 1.003204345703125, 1.0458526611328125, 1.0885009765625, 1.1311492919921875, 1.173797607421875, 1.2164459228515625, 1.25909423828125, 1.3017425537109375, 1.344390869140625, 1.3870391845703125, 1.4296875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 7.0, 2.0, 4.0, 6.0, 10.0, 13.0, 13.0, 22.0, 23.0, 38.0, 42.0, 72.0, 133.0, 129.0, 111.0, 97.0, 85.0, 52.0, 32.0, 25.0, 19.0, 16.0, 13.0, 12.0, 8.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.337890625, -2.270416259765625, -2.20294189453125, -2.135467529296875, -2.0679931640625, -2.000518798828125, -1.93304443359375, -1.865570068359375, -1.798095703125, -1.730621337890625, -1.66314697265625, -1.595672607421875, -1.5281982421875, -1.460723876953125, -1.39324951171875, -1.325775146484375, -1.25830078125, -1.190826416015625, -1.12335205078125, -1.055877685546875, -0.9884033203125, -0.920928955078125, -0.85345458984375, -0.785980224609375, -0.718505859375, -0.651031494140625, -0.58355712890625, -0.516082763671875, -0.4486083984375, -0.381134033203125, -0.31365966796875, -0.246185302734375, -0.1787109375, -0.111236572265625, -0.04376220703125, 0.023712158203125, 0.0911865234375, 0.158660888671875, 0.22613525390625, 0.293609619140625, 0.361083984375, 0.428558349609375, 0.49603271484375, 0.563507080078125, 0.6309814453125, 0.698455810546875, 0.76593017578125, 0.833404541015625, 0.90087890625, 0.968353271484375, 1.03582763671875, 1.103302001953125, 1.1707763671875, 1.238250732421875, 1.30572509765625, 1.373199462890625, 1.440673828125, 1.508148193359375, 1.57562255859375, 1.643096923828125, 1.7105712890625, 1.778045654296875, 1.84552001953125, 1.912994384765625, 1.98046875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 6.0, 13.0, 24.0, 49.0, 106.0, 476.0, 137.0, 70.0, 45.0, 21.0, 14.0, 15.0, 3.0, 5.0, 3.0, 4.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.92178344726562, -66.52570343017578, -63.12963104248047, -59.733551025390625, -56.33747863769531, -52.94139862060547, -49.54532241821289, -46.14924621582031, -42.753170013427734, -39.357093811035156, -35.96101760864258, -32.56494140625, -29.16886329650879, -25.77278709411621, -22.376708984375, -18.980632781982422, -15.584556579589844, -12.188480377197266, -8.792403221130371, -5.396326065063477, -2.0002498626708984, 1.3958263397216797, 4.791904449462891, 8.187980651855469, 11.584056854248047, 14.980133056640625, 18.376209259033203, 21.772287368774414, 25.168363571166992, 28.56443977355957, 31.96051788330078, 35.35659408569336, 38.75267028808594, 42.148746490478516, 45.544822692871094, 48.94090270996094, 52.33697509765625, 55.733055114746094, 59.12913131713867, 62.52520751953125, 65.92127990722656, 69.3173599243164, 72.71343231201172, 76.10951232910156, 79.50558471679688, 82.90166473388672, 86.29774475097656, 89.69381713867188, 93.08989715576172, 96.48597717285156, 99.88204956054688, 103.27812957763672, 106.67420196533203, 110.07028198242188, 113.46635437011719, 116.86243438720703, 120.25851440429688, 123.65459442138672, 127.05066680908203, 130.44674682617188, 133.8428192138672, 137.2388916015625, 140.63497924804688, 144.0310516357422, 147.4271240234375]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 3.0, 8.0, 5.0, 3.0, 9.0, 6.0, 6.0, 17.0, 10.0, 10.0, 19.0, 21.0, 20.0, 21.0, 18.0, 27.0, 56.0, 143.0, 168.0, 148.0, 49.0, 29.0, 29.0, 19.0, 16.0, 16.0, 14.0, 17.0, 16.0, 5.0, 12.0, 12.0, 6.0, 10.0, 3.0, 8.0, 5.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.87934112548828, -67.33285522460938, -64.786376953125, -62.23989486694336, -59.69341278076172, -57.14692687988281, -54.60044479370117, -52.05396270751953, -49.50748062133789, -46.96099853515625, -44.41451644897461, -41.86803436279297, -39.32154846191406, -36.77507019042969, -34.22858428955078, -31.68210220336914, -29.1356201171875, -26.58913803100586, -24.04265594482422, -21.496171951293945, -18.949689865112305, -16.403207778930664, -13.856724739074707, -11.31024169921875, -8.76375961303711, -6.2172770500183105, -3.6707944869995117, -1.124311923980713, 1.422170639038086, 3.9686527252197266, 6.515135765075684, 9.06161880493164, 11.60809326171875, 14.15457534790039, 16.70105743408203, 19.247541427612305, 21.794023513793945, 24.340505599975586, 26.88698959350586, 29.4334716796875, 31.97995376586914, 34.52643585205078, 37.07291793823242, 39.61940002441406, 42.16588592529297, 44.712364196777344, 47.25885009765625, 49.80533218383789, 52.35181427001953, 54.89829635620117, 57.44477844238281, 59.99126052856445, 62.537742614746094, 65.084228515625, 67.63070678710938, 70.17719268798828, 72.72367858886719, 75.2701644897461, 77.81664276123047, 80.36312866210938, 82.90960693359375, 85.45609283447266, 88.00257110595703, 90.54905700683594, 93.09553527832031]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 4.0, 6.0, 4.0, 4.0, 11.0, 8.0, 10.0, 13.0, 16.0, 21.0, 26.0, 23.0, 37.0, 24.0, 44.0, 59.0, 179.0, 229.0, 62.0, 46.0, 31.0, 28.0, 27.0, 17.0, 16.0, 7.0, 17.0, 7.0, 9.0, 4.0, 4.0, 6.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.90625, -9.6236572265625, -9.341064453125, -9.0584716796875, -8.77587890625, -8.4932861328125, -8.210693359375, -7.9281005859375, -7.6455078125, -7.3629150390625, -7.080322265625, -6.7977294921875, -6.51513671875, -6.2325439453125, -5.949951171875, -5.6673583984375, -5.384765625, -5.1021728515625, -4.819580078125, -4.5369873046875, -4.25439453125, -3.9718017578125, -3.689208984375, -3.4066162109375, -3.1240234375, -2.8414306640625, -2.558837890625, -2.2762451171875, -1.99365234375, -1.7110595703125, -1.428466796875, -1.1458740234375, -0.86328125, -0.5806884765625, -0.298095703125, -0.0155029296875, 0.26708984375, 0.5496826171875, 0.832275390625, 1.1148681640625, 1.3974609375, 1.6800537109375, 1.962646484375, 2.2452392578125, 2.52783203125, 2.8104248046875, 3.093017578125, 3.3756103515625, 3.658203125, 3.9407958984375, 4.223388671875, 4.5059814453125, 4.78857421875, 5.0711669921875, 5.353759765625, 5.6363525390625, 5.9189453125, 6.2015380859375, 6.484130859375, 6.7667236328125, 7.04931640625, 7.3319091796875, 7.614501953125, 7.8970947265625, 8.1796875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 2.0, 0.0, 4.0, 1.0, 9.0, 5.0, 17.0, 19.0, 29.0, 78.0, 122.0, 285.0, 807.0, 4174.0, 7604836.0, 773051.0, 3835.0, 776.0, 263.0, 108.0, 47.0, 41.0, 19.0, 19.0, 14.0, 6.0, 6.0, 7.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.76966857910156, -107.41175079345703, -104.0538330078125, -100.69591522216797, -97.33799743652344, -93.9800796508789, -90.62216186523438, -87.26423645019531, -83.90632629394531, -80.54840850830078, -77.19049072265625, -73.83257293701172, -70.47465515136719, -67.11673736572266, -63.75881576538086, -60.40089797973633, -57.04297637939453, -53.68505859375, -50.32714080810547, -46.96922302246094, -43.611305236816406, -40.253387451171875, -36.89546585083008, -33.53754806518555, -30.179630279541016, -26.821712493896484, -23.463794708251953, -20.10587501525879, -16.747957229614258, -13.390039443969727, -10.032119750976562, -6.674201965332031, -3.3162841796875, 0.04163408279418945, 3.399552345275879, 6.757471084594727, 10.115388870239258, 13.473306655883789, 16.831226348876953, 20.189144134521484, 23.547061920166016, 26.904979705810547, 30.262897491455078, 33.620819091796875, 36.978736877441406, 40.33665466308594, 43.69457244873047, 47.052490234375, 50.41040802001953, 53.76832580566406, 57.126243591308594, 60.484161376953125, 63.842079162597656, 67.19999694824219, 70.55792236328125, 73.91583251953125, 77.27375793457031, 80.63167572021484, 83.98959350585938, 87.3475112915039, 90.70542907714844, 94.06334686279297, 97.4212646484375, 100.77919006347656, 104.13710021972656]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 2.0, 2.0, 5.0, 4.0, 3.0, 2.0, 2.0, 6.0, 3.0, 3.0, 4.0, 5.0, 4.0, 8.0, 5.0, 1.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 7.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.20687103271484, -77.32122802734375, -74.43557739257812, -71.54993438720703, -68.6642837524414, -65.77864074707031, -62.89299392700195, -60.007347106933594, -57.1217041015625, -54.23605728149414, -51.35041046142578, -48.46476745605469, -45.57912063598633, -42.69347381591797, -39.80782699584961, -36.92218017578125, -34.03653335571289, -31.15088653564453, -28.265241622924805, -25.379594802856445, -22.49394989013672, -19.60830307006836, -16.72265625, -13.837011337280273, -10.951364517211914, -8.065718650817871, -5.18007230758667, -2.2944259643554688, 0.5912199020385742, 3.476865768432617, 6.362512588500977, 9.248157501220703, 12.133804321289062, 15.019450187683105, 17.90509605407715, 20.790742874145508, 23.676387786865234, 26.562034606933594, 29.447681427001953, 32.33332824707031, 35.218971252441406, 38.104618072509766, 40.990264892578125, 43.87590789794922, 46.76155471801758, 49.64720153808594, 52.5328483581543, 55.418495178222656, 58.304141998291016, 61.189788818359375, 64.07543182373047, 66.9610824584961, 69.84672546386719, 72.73237609863281, 75.6180191040039, 78.503662109375, 81.38931274414062, 84.27495574951172, 87.16060638427734, 90.04624938964844, 92.93190002441406, 95.81754302978516, 98.70318603515625, 101.58883666992188, 104.47447967529297]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 12.0, 10.0, 29.0, 48.0, 78.0, 133.0, 303.0, 585.0, 1293.0, 2864.0, 6498.0, 15555.0, 36810.0, 89011.0, 167120.0, 116824.0, 49659.0, 21010.0, 9070.0, 3810.0, 1808.0, 827.0, 411.0, 204.0, 104.0, 71.0, 45.0, 17.0, 20.0, 10.0, 13.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.5, -35.02001953125, -33.5400390625, -32.06005859375, -30.580078125, -29.10009765625, -27.6201171875, -26.14013671875, -24.66015625, -23.18017578125, -21.7001953125, -20.22021484375, -18.740234375, -17.26025390625, -15.7802734375, -14.30029296875, -12.8203125, -11.34033203125, -9.8603515625, -8.38037109375, -6.900390625, -5.42041015625, -3.9404296875, -2.46044921875, -0.98046875, 0.49951171875, 1.9794921875, 3.45947265625, 4.939453125, 6.41943359375, 7.8994140625, 9.37939453125, 10.859375, 12.33935546875, 13.8193359375, 15.29931640625, 16.779296875, 18.25927734375, 19.7392578125, 21.21923828125, 22.69921875, 24.17919921875, 25.6591796875, 27.13916015625, 28.619140625, 30.09912109375, 31.5791015625, 33.05908203125, 34.5390625, 36.01904296875, 37.4990234375, 38.97900390625, 40.458984375, 41.93896484375, 43.4189453125, 44.89892578125, 46.37890625, 47.85888671875, 49.3388671875, 50.81884765625, 52.298828125, 53.77880859375, 55.2587890625, 56.73876953125, 58.21875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 7.0, 4.0, 3.0, 2.0, 9.0, 10.0, 7.0, 11.0, 16.0, 23.0, 22.0, 20.0, 32.0, 29.0, 37.0, 50.0, 66.0, 54.0, 53.0, 67.0, 71.0, 56.0, 58.0, 48.0, 37.0, 34.0, 37.0, 30.0, 24.0, 8.0, 10.0, 16.0, 14.0, 8.0, 2.0, 8.0, 3.0, 5.0, 5.0, 3.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2109375, -7.94775390625, -7.6845703125, -7.42138671875, -7.158203125, -6.89501953125, -6.6318359375, -6.36865234375, -6.10546875, -5.84228515625, -5.5791015625, -5.31591796875, -5.052734375, -4.78955078125, -4.5263671875, -4.26318359375, -4.0, -3.73681640625, -3.4736328125, -3.21044921875, -2.947265625, -2.68408203125, -2.4208984375, -2.15771484375, -1.89453125, -1.63134765625, -1.3681640625, -1.10498046875, -0.841796875, -0.57861328125, -0.3154296875, -0.05224609375, 0.2109375, 0.47412109375, 0.7373046875, 1.00048828125, 1.263671875, 1.52685546875, 1.7900390625, 2.05322265625, 2.31640625, 2.57958984375, 2.8427734375, 3.10595703125, 3.369140625, 3.63232421875, 3.8955078125, 4.15869140625, 4.421875, 4.68505859375, 4.9482421875, 5.21142578125, 5.474609375, 5.73779296875, 6.0009765625, 6.26416015625, 6.52734375, 6.79052734375, 7.0537109375, 7.31689453125, 7.580078125, 7.84326171875, 8.1064453125, 8.36962890625, 8.6328125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 6.0, 9.0, 9.0, 20.0, 41.0, 76.0, 102.0, 87.0, 67.0, 21.0, 20.0, 9.0, 9.0, 7.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.8221435546875, -34.45989227294922, -32.09764099121094, -29.735387802124023, -27.373136520385742, -25.01088523864746, -22.648632049560547, -20.286380767822266, -17.924129486083984, -15.561878204345703, -13.199625968933105, -10.837373733520508, -8.475122451782227, -6.112871170043945, -3.7506189346313477, -1.38836669921875, 0.9738845825195312, 3.3361363410949707, 5.69838809967041, 8.060640335083008, 10.422891616821289, 12.78514289855957, 15.147395133972168, 17.509647369384766, 19.871898651123047, 22.234149932861328, 24.59640121459961, 26.958654403686523, 29.320905685424805, 31.683156967163086, 34.04541015625, 36.40766143798828, 38.76990509033203, 41.13215637207031, 43.494407653808594, 45.856658935546875, 48.218910217285156, 50.58116149902344, 52.943416595458984, 55.305667877197266, 57.66791915893555, 60.03017044067383, 62.39242172241211, 64.75467681884766, 67.11692810058594, 69.47917938232422, 71.8414306640625, 74.20368194580078, 76.56593322753906, 78.92818450927734, 81.29043579101562, 83.6526870727539, 86.01493835449219, 88.37718963623047, 90.73944091796875, 93.10169982910156, 95.46394348144531, 97.8261947631836, 100.18844604492188, 102.55069732666016, 104.91294860839844, 107.27519989013672, 109.637451171875, 111.99971008300781, 114.3619613647461]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 4.0, 3.0, 5.0, 9.0, 8.0, 10.0, 6.0, 13.0, 35.0, 58.0, 66.0, 72.0, 62.0, 35.0, 26.0, 21.0, 10.0, 15.0, 2.0, 5.0, 3.0, 7.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.15165710449219, -38.915802001953125, -37.67994689941406, -36.444087982177734, -35.20823287963867, -33.97237777709961, -32.73651885986328, -31.50066375732422, -30.264808654785156, -29.028953552246094, -27.7930965423584, -26.557239532470703, -25.32138442993164, -24.085529327392578, -22.849672317504883, -21.613815307617188, -20.377960205078125, -19.142105102539062, -17.906248092651367, -16.670391082763672, -15.43453598022461, -14.19867992401123, -12.962823867797852, -11.726967811584473, -10.491111755371094, -9.255255699157715, -8.019399642944336, -6.783543586730957, -5.547687530517578, -4.311831474304199, -3.0759754180908203, -1.8401193618774414, -0.6042633056640625, 0.6315927505493164, 1.8674488067626953, 3.103304862976074, 4.339160919189453, 5.575016975402832, 6.810873031616211, 8.04672908782959, 9.282585144042969, 10.518441200256348, 11.754297256469727, 12.990153312683105, 14.226009368896484, 15.461865425109863, 16.697721481323242, 17.933578491210938, 19.16943359375, 20.405288696289062, 21.641145706176758, 22.877002716064453, 24.112857818603516, 25.348712921142578, 26.584569931030273, 27.82042694091797, 29.05628204345703, 30.292137145996094, 31.52799415588379, 32.763851165771484, 33.99970626831055, 35.23556137084961, 36.47142028808594, 37.707275390625, 38.94313049316406]}, "eval/loss": 0.9598673582077026, "eval/wer": 0.14415540607575847, "eval/runtime": 868.6571, "eval/samples_per_second": 3.041, "eval/steps_per_second": 0.381} \ No newline at end of file +{"train/loss": 0.292, "train/learning_rate": 8.907363420427554e-09, "train/epoch": 20.0, "train/global_step": 17840, "_runtime": 116020, "_timestamp": 1646777259, "_step": 17851, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 21.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 5.0, 0.0, 5.0, 4.0, 1.0, 2.0, 7.0, 14.0, 29.0, 30270.0, 111.0, 20.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-701.0, -687.619140625, -674.23828125, -660.857421875, -647.4765625, -634.095703125, -620.71484375, -607.333984375, -593.953125, -580.572265625, -567.19140625, -553.810546875, -540.4296875, -527.048828125, -513.66796875, -500.287109375, -486.90625, -473.525390625, -460.14453125, -446.763671875, -433.3828125, -420.001953125, -406.62109375, -393.240234375, -379.859375, -366.478515625, -353.09765625, -339.716796875, -326.3359375, -312.955078125, -299.57421875, -286.193359375, -272.8125, -259.431640625, -246.05078125, -232.669921875, -219.2890625, -205.908203125, -192.52734375, -179.146484375, -165.765625, -152.384765625, -139.00390625, -125.623046875, -112.2421875, -98.861328125, -85.48046875, -72.099609375, -58.71875, -45.337890625, -31.95703125, -18.576171875, -5.1953125, 8.185546875, 21.56640625, 34.947265625, 48.328125, 61.708984375, 75.08984375, 88.470703125, 101.8515625, 115.232421875, 128.61328125, 141.994140625, 155.375]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 12.0, 8.0, 5.0, 20.0, 8.0, 20.0, 29.0, 29.0, 35.0, 42.0, 47.0, 64.0, 55.0, 58.0, 58.0, 55.0, 71.0, 52.0, 41.0, 54.0, 44.0, 29.0, 31.0, 34.0, 16.0, 26.0, 18.0, 15.0, 4.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-213.13580322265625, -208.03428649902344, -202.93275451660156, -197.83123779296875, -192.72970581054688, -187.62818908691406, -182.5266571044922, -177.42514038085938, -172.3236083984375, -167.2220916748047, -162.1205596923828, -157.01904296875, -151.91751098632812, -146.8159942626953, -141.71446228027344, -136.61294555664062, -131.5114288330078, -126.40990447998047, -121.30838012695312, -116.20685577392578, -111.10533142089844, -106.00381469726562, -100.90229034423828, -95.80076599121094, -90.6992416381836, -85.59771728515625, -80.4961929321289, -75.39466857910156, -70.29315185546875, -65.19161987304688, -60.09010314941406, -54.98857879638672, -49.88706970214844, -44.785545349121094, -39.68402099609375, -34.58250045776367, -29.480976104736328, -24.379451751708984, -19.277929306030273, -14.176406860351562, -9.074882507324219, -3.9733591079711914, 1.128164291381836, 6.229687690734863, 11.33121109008789, 16.432735443115234, 21.534257888793945, 26.635780334472656, 31.7373046875, 36.838829040527344, 41.94035339355469, 47.041873931884766, 52.14339828491211, 57.24492263793945, 62.34644317626953, 67.44796752929688, 72.54949188232422, 77.65101623535156, 82.7525405883789, 87.85406494140625, 92.95558166503906, 98.05711364746094, 103.15863037109375, 108.2601547241211, 113.36167907714844]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 1.0, 5.0, 5.0, 8.0, 6.0, 12.0, 7.0, 7.0, 12.0, 14.0, 24.0, 10.0, 25.0, 32.0, 41.0, 31.0, 27.0, 32.0, 44.0, 45.0, 43.0, 42.0, 45.0, 47.0, 49.0, 36.0, 32.0, 32.0, 27.0, 28.0, 30.0, 33.0, 27.0, 22.0, 22.0, 21.0, 14.0, 17.0, 13.0, 10.0, 7.0, 7.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.2356185913086, -120.41963195800781, -116.60365295410156, -112.78766632080078, -108.9716796875, -105.15570068359375, -101.33971405029297, -97.52372741699219, -93.70774841308594, -89.89176177978516, -86.0757827758789, -82.25979614257812, -78.44381713867188, -74.6278305053711, -70.81184387207031, -66.99586486816406, -63.17987823486328, -59.363895416259766, -55.54791259765625, -51.73192596435547, -47.91594314575195, -44.09996032714844, -40.283973693847656, -36.46799087524414, -32.652008056640625, -28.83602523803711, -25.02004051208496, -21.204055786132812, -17.388072967529297, -13.572090148925781, -9.756105422973633, -5.940120697021484, -2.1241378784179688, 1.6918458938598633, 5.507829666137695, 9.323813438415527, 13.13979721069336, 16.955780029296875, 20.771764755249023, 24.587749481201172, 28.403732299804688, 32.2197151184082, 36.03569793701172, 39.8516845703125, 43.667667388916016, 47.48365020751953, 51.29963684082031, 55.11561965942383, 58.931602478027344, 62.74758529663086, 66.56356811523438, 70.37955474853516, 74.19554138183594, 78.01152038574219, 81.82750701904297, 85.64349365234375, 89.45947265625, 93.27545928955078, 97.09143829345703, 100.90742492675781, 104.72340393066406, 108.53939056396484, 112.35537719726562, 116.17135620117188, 119.98734283447266]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 7.0, 18.0, 25.0, 27.0, 50.0, 81.0, 145.0, 194.0, 351.0, 504.0, 780.0, 1315.0, 2016.0, 3131.0, 4959.0, 7612.0, 11577.0, 16624.0, 24222.0, 33958.0, 45803.0, 60119.0, 75042.0, 89462.0, 101695.0, 127668.0, 97477.0, 83977.0, 69542.0, 54968.0, 41591.0, 29967.0, 21211.0, 14441.0, 9894.0, 6441.0, 4196.0, 2752.0, 1717.0, 1086.0, 735.0, 434.0, 274.0, 163.0, 113.0, 77.0, 35.0, 27.0, 14.0, 14.0, 11.0, 10.0, 6.0, 3.0, 1.0, 1.0], "bins": [-404.75, -392.6015625, -380.453125, -368.3046875, -356.15625, -344.0078125, -331.859375, -319.7109375, -307.5625, -295.4140625, -283.265625, -271.1171875, -258.96875, -246.8203125, -234.671875, -222.5234375, -210.375, -198.2265625, -186.078125, -173.9296875, -161.78125, -149.6328125, -137.484375, -125.3359375, -113.1875, -101.0390625, -88.890625, -76.7421875, -64.59375, -52.4453125, -40.296875, -28.1484375, -16.0, -3.8515625, 8.296875, 20.4453125, 32.59375, 44.7421875, 56.890625, 69.0390625, 81.1875, 93.3359375, 105.484375, 117.6328125, 129.78125, 141.9296875, 154.078125, 166.2265625, 178.375, 190.5234375, 202.671875, 214.8203125, 226.96875, 239.1171875, 251.265625, 263.4140625, 275.5625, 287.7109375, 299.859375, 312.0078125, 324.15625, 336.3046875, 348.453125, 360.6015625, 372.75]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 5.0, 1.0, 7.0, 6.0, 8.0, 15.0, 9.0, 12.0, 14.0, 22.0, 18.0, 33.0, 18.0, 33.0, 19.0, 43.0, 42.0, 45.0, 43.0, 41.0, 41.0, 62.0, 42.0, 41.0, 45.0, 38.0, 38.0, 33.0, 27.0, 26.0, 27.0, 24.0, 28.0, 18.0, 12.0, 15.0, 13.0, 10.0, 10.0, 5.0, 6.0, 1.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-188.875, -182.82421875, -176.7734375, -170.72265625, -164.671875, -158.62109375, -152.5703125, -146.51953125, -140.46875, -134.41796875, -128.3671875, -122.31640625, -116.265625, -110.21484375, -104.1640625, -98.11328125, -92.0625, -86.01171875, -79.9609375, -73.91015625, -67.859375, -61.80859375, -55.7578125, -49.70703125, -43.65625, -37.60546875, -31.5546875, -25.50390625, -19.453125, -13.40234375, -7.3515625, -1.30078125, 4.75, 10.80078125, 16.8515625, 22.90234375, 28.953125, 35.00390625, 41.0546875, 47.10546875, 53.15625, 59.20703125, 65.2578125, 71.30859375, 77.359375, 83.41015625, 89.4609375, 95.51171875, 101.5625, 107.61328125, 113.6640625, 119.71484375, 125.765625, 131.81640625, 137.8671875, 143.91796875, 149.96875, 156.01953125, 162.0703125, 168.12109375, 174.171875, 180.22265625, 186.2734375, 192.32421875, 198.375]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 1.0, 7.0, 3.0, 6.0, 8.0, 14.0, 19.0, 13.0, 19.0, 24.0, 44.0, 31.0, 23.0, 44.0, 41.0, 49.0, 42.0, 52.0, 54.0, 43.0, 52.0, 55.0, 45.0, 43.0, 50.0, 36.0, 32.0, 24.0, 26.0, 20.0, 14.0, 20.0, 15.0, 11.0, 12.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-146.77110290527344, -142.3655548095703, -137.96002197265625, -133.55447387695312, -129.14894104003906, -124.74339294433594, -120.33785247802734, -115.93231201171875, -111.52677154541016, -107.12123107910156, -102.71569061279297, -98.31015014648438, -93.90460205078125, -89.49906921386719, -85.09352111816406, -80.68798065185547, -76.28244018554688, -71.87689971923828, -67.47135925292969, -63.06581497192383, -58.660274505615234, -54.25473403930664, -49.84918975830078, -45.44364929199219, -41.038108825683594, -36.632568359375, -32.227027893066406, -27.821483612060547, -23.415943145751953, -19.01040267944336, -14.604860305786133, -10.199317932128906, -5.793792724609375, -1.3882513046264648, 3.0172901153564453, 7.4228315353393555, 11.828372955322266, 16.23391342163086, 20.639455795288086, 25.044998168945312, 29.450538635253906, 33.8560791015625, 38.261619567871094, 42.66716384887695, 47.07270431518555, 51.47824478149414, 55.8837890625, 60.289329528808594, 64.69486999511719, 69.10041046142578, 73.50595092773438, 77.91149139404297, 82.31703186035156, 86.72257995605469, 91.12812042236328, 95.53366088867188, 99.93920135498047, 104.34474182128906, 108.75028228759766, 113.15582275390625, 117.56137084960938, 121.96690368652344, 126.37245178222656, 130.77798461914062, 135.18353271484375]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 7.0, 6.0, 4.0, 9.0, 6.0, 7.0, 19.0, 17.0, 10.0, 24.0, 20.0, 25.0, 19.0, 22.0, 28.0, 40.0, 37.0, 28.0, 42.0, 48.0, 45.0, 38.0, 39.0, 46.0, 39.0, 47.0, 42.0, 35.0, 41.0, 38.0, 28.0, 27.0, 30.0, 16.0, 12.0, 13.0, 12.0, 14.0, 4.0, 8.0, 6.0, 2.0, 0.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-136.23291015625, -132.0714569091797, -127.9100112915039, -123.7485580444336, -119.58710479736328, -115.4256591796875, -111.26420593261719, -107.10275268554688, -102.94129943847656, -98.77984619140625, -94.61840057373047, -90.45694732666016, -86.29549407958984, -82.13404846191406, -77.97259521484375, -73.81114196777344, -69.64969635009766, -65.48824310302734, -61.3267936706543, -57.16534423828125, -53.00389099121094, -48.84244155883789, -44.680992126464844, -40.51953887939453, -36.358089447021484, -32.19664001464844, -28.035186767578125, -23.873737335205078, -19.7122859954834, -15.550834655761719, -11.389385223388672, -7.227933883666992, -3.0664825439453125, 1.094968318939209, 5.2564191818237305, 9.417869567871094, 13.579320907592773, 17.740772247314453, 21.9022216796875, 26.06367301940918, 30.22512435913086, 34.386573791503906, 38.54802703857422, 42.709476470947266, 46.87092590332031, 51.032379150390625, 55.19382858276367, 59.35527801513672, 63.51673126220703, 67.67818450927734, 71.83963012695312, 76.00108337402344, 80.16253662109375, 84.32398986816406, 88.48543548583984, 92.64688873291016, 96.80833435058594, 100.96978759765625, 105.13123321533203, 109.29268646240234, 113.45413970947266, 117.61558532714844, 121.77703857421875, 125.93849182128906, 130.09994506835938]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 7.0, 11.0, 12.0, 18.0, 19.0, 39.0, 56.0, 104.0, 204.0, 300.0, 481.0, 816.0, 1275.0, 2071.0, 3549.0, 5819.0, 9740.0, 16663.0, 28230.0, 47989.0, 82882.0, 144040.0, 251088.0, 432745.0, 714245.0, 885607.0, 642858.0, 385436.0, 224792.0, 130596.0, 75765.0, 43935.0, 25837.0, 15019.0, 8889.0, 5280.0, 3147.0, 1873.0, 1113.0, 662.0, 431.0, 261.0, 168.0, 83.0, 48.0, 31.0, 27.0, 15.0, 6.0, 4.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-208.375, -201.517578125, -194.66015625, -187.802734375, -180.9453125, -174.087890625, -167.23046875, -160.373046875, -153.515625, -146.658203125, -139.80078125, -132.943359375, -126.0859375, -119.228515625, -112.37109375, -105.513671875, -98.65625, -91.798828125, -84.94140625, -78.083984375, -71.2265625, -64.369140625, -57.51171875, -50.654296875, -43.796875, -36.939453125, -30.08203125, -23.224609375, -16.3671875, -9.509765625, -2.65234375, 4.205078125, 11.0625, 17.919921875, 24.77734375, 31.634765625, 38.4921875, 45.349609375, 52.20703125, 59.064453125, 65.921875, 72.779296875, 79.63671875, 86.494140625, 93.3515625, 100.208984375, 107.06640625, 113.923828125, 120.78125, 127.638671875, 134.49609375, 141.353515625, 148.2109375, 155.068359375, 161.92578125, 168.783203125, 175.640625, 182.498046875, 189.35546875, 196.212890625, 203.0703125, 209.927734375, 216.78515625, 223.642578125, 230.5]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 9.0, 6.0, 8.0, 3.0, 6.0, 18.0, 17.0, 16.0, 10.0, 14.0, 24.0, 25.0, 30.0, 24.0, 27.0, 39.0, 48.0, 47.0, 36.0, 33.0, 41.0, 45.0, 44.0, 36.0, 41.0, 26.0, 49.0, 40.0, 35.0, 39.0, 18.0, 27.0, 28.0, 20.0, 11.0, 14.0, 12.0, 11.0, 8.0, 5.0, 6.0, 2.0, 1.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-115.0, -111.431640625, -107.86328125, -104.294921875, -100.7265625, -97.158203125, -93.58984375, -90.021484375, -86.453125, -82.884765625, -79.31640625, -75.748046875, -72.1796875, -68.611328125, -65.04296875, -61.474609375, -57.90625, -54.337890625, -50.76953125, -47.201171875, -43.6328125, -40.064453125, -36.49609375, -32.927734375, -29.359375, -25.791015625, -22.22265625, -18.654296875, -15.0859375, -11.517578125, -7.94921875, -4.380859375, -0.8125, 2.755859375, 6.32421875, 9.892578125, 13.4609375, 17.029296875, 20.59765625, 24.166015625, 27.734375, 31.302734375, 34.87109375, 38.439453125, 42.0078125, 45.576171875, 49.14453125, 52.712890625, 56.28125, 59.849609375, 63.41796875, 66.986328125, 70.5546875, 74.123046875, 77.69140625, 81.259765625, 84.828125, 88.396484375, 91.96484375, 95.533203125, 99.1015625, 102.669921875, 106.23828125, 109.806640625, 113.375]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 6.0, 7.0, 7.0, 14.0, 16.0, 18.0, 34.0, 72.0, 121.0, 154.0, 280.0, 479.0, 819.0, 1399.0, 2416.0, 3963.0, 7097.0, 12505.0, 22166.0, 38226.0, 66934.0, 113626.0, 191997.0, 312977.0, 481061.0, 672622.0, 730343.0, 568556.0, 380966.0, 239674.0, 144990.0, 85483.0, 49339.0, 28158.0, 16106.0, 9226.0, 5097.0, 2875.0, 1788.0, 1085.0, 632.0, 344.0, 221.0, 137.0, 87.0, 54.0, 39.0, 31.0, 19.0, 7.0, 8.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-144.25, -139.7734375, -135.296875, -130.8203125, -126.34375, -121.8671875, -117.390625, -112.9140625, -108.4375, -103.9609375, -99.484375, -95.0078125, -90.53125, -86.0546875, -81.578125, -77.1015625, -72.625, -68.1484375, -63.671875, -59.1953125, -54.71875, -50.2421875, -45.765625, -41.2890625, -36.8125, -32.3359375, -27.859375, -23.3828125, -18.90625, -14.4296875, -9.953125, -5.4765625, -1.0, 3.4765625, 7.953125, 12.4296875, 16.90625, 21.3828125, 25.859375, 30.3359375, 34.8125, 39.2890625, 43.765625, 48.2421875, 52.71875, 57.1953125, 61.671875, 66.1484375, 70.625, 75.1015625, 79.578125, 84.0546875, 88.53125, 93.0078125, 97.484375, 101.9609375, 106.4375, 110.9140625, 115.390625, 119.8671875, 124.34375, 128.8203125, 133.296875, 137.7734375, 142.25]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 7.0, 12.0, 12.0, 12.0, 21.0, 14.0, 22.0, 20.0, 46.0, 57.0, 62.0, 88.0, 98.0, 131.0, 117.0, 153.0, 170.0, 210.0, 266.0, 260.0, 292.0, 290.0, 244.0, 251.0, 191.0, 167.0, 145.0, 164.0, 103.0, 90.0, 80.0, 60.0, 53.0, 38.0, 38.0, 14.0, 20.0, 24.0, 7.0, 12.0, 3.0, 5.0, 0.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.21875, -56.3203125, -54.421875, -52.5234375, -50.625, -48.7265625, -46.828125, -44.9296875, -43.03125, -41.1328125, -39.234375, -37.3359375, -35.4375, -33.5390625, -31.640625, -29.7421875, -27.84375, -25.9453125, -24.046875, -22.1484375, -20.25, -18.3515625, -16.453125, -14.5546875, -12.65625, -10.7578125, -8.859375, -6.9609375, -5.0625, -3.1640625, -1.265625, 0.6328125, 2.53125, 4.4296875, 6.328125, 8.2265625, 10.125, 12.0234375, 13.921875, 15.8203125, 17.71875, 19.6171875, 21.515625, 23.4140625, 25.3125, 27.2109375, 29.109375, 31.0078125, 32.90625, 34.8046875, 36.703125, 38.6015625, 40.5, 42.3984375, 44.296875, 46.1953125, 48.09375, 49.9921875, 51.890625, 53.7890625, 55.6875, 57.5859375, 59.484375, 61.3828125, 63.28125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 9.0, 5.0, 3.0, 8.0, 14.0, 12.0, 20.0, 20.0, 26.0, 26.0, 33.0, 31.0, 43.0, 39.0, 56.0, 50.0, 49.0, 60.0, 62.0, 62.0, 38.0, 45.0, 36.0, 44.0, 32.0, 33.0, 30.0, 24.0, 25.0, 23.0, 11.0, 8.0, 5.0, 8.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-166.92550659179688, -162.397705078125, -157.86990356445312, -153.34210205078125, -148.81430053710938, -144.28648376464844, -139.75868225097656, -135.2308807373047, -130.7030792236328, -126.17527770996094, -121.64747619628906, -117.11966705322266, -112.59186553955078, -108.0640640258789, -103.5362548828125, -99.00845336914062, -94.48065185546875, -89.95285034179688, -85.425048828125, -80.8972396850586, -76.36943817138672, -71.84163665771484, -67.31382751464844, -62.78602600097656, -58.25822448730469, -53.73042297363281, -49.20261764526367, -44.67481231689453, -40.147010803222656, -35.61920928955078, -31.09140396118164, -26.563600540161133, -22.035781860351562, -17.507978439331055, -12.980175018310547, -8.452371597290039, -3.9245681762695312, 0.6032352447509766, 5.131038665771484, 9.658842086791992, 14.1866455078125, 18.714448928833008, 23.242252349853516, 27.770055770874023, 32.29785919189453, 36.825660705566406, 41.35346603393555, 45.88127136230469, 50.40907287597656, 54.93687438964844, 59.46467971801758, 63.99248504638672, 68.5202865600586, 73.04808807373047, 77.57589721679688, 82.10369873046875, 86.63150024414062, 91.1593017578125, 95.68710327148438, 100.21491241455078, 104.74271392822266, 109.27051544189453, 113.79832458496094, 118.32612609863281, 122.85392761230469]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 4.0, 5.0, 6.0, 10.0, 9.0, 7.0, 12.0, 18.0, 13.0, 14.0, 16.0, 15.0, 35.0, 27.0, 23.0, 34.0, 24.0, 49.0, 39.0, 32.0, 42.0, 47.0, 40.0, 43.0, 32.0, 37.0, 45.0, 30.0, 41.0, 32.0, 27.0, 27.0, 34.0, 25.0, 23.0, 19.0, 10.0, 16.0, 13.0, 8.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.46715545654297, -115.53140258789062, -111.59565734863281, -107.65990447998047, -103.72415161132812, -99.78840637207031, -95.85265350341797, -91.91690063476562, -87.98115539550781, -84.04540252685547, -80.10965728759766, -76.17390441894531, -72.23815155029297, -68.30239868164062, -64.36665344238281, -60.43090057373047, -56.495147705078125, -52.55939865112305, -48.6236457824707, -44.687896728515625, -40.75214385986328, -36.8163948059082, -32.880645751953125, -28.944894790649414, -25.009143829345703, -21.073392868041992, -17.13764190673828, -13.201892852783203, -9.266141891479492, -5.330390930175781, -1.3946418762207031, 2.541109085083008, 6.4768524169921875, 10.412603378295898, 14.348353385925293, 18.284103393554688, 22.2198543548584, 26.15560531616211, 30.091354370117188, 34.02710723876953, 37.96285629272461, 41.89860534667969, 45.83435821533203, 49.77010726928711, 53.70585632324219, 57.64160919189453, 61.57735824584961, 65.51310729980469, 69.44886016845703, 73.38461303710938, 77.32035827636719, 81.25611114501953, 85.19186401367188, 89.12760925292969, 93.06336212158203, 96.99911499023438, 100.93486022949219, 104.87061309814453, 108.80635833740234, 112.74211120605469, 116.67786407470703, 120.61361694335938, 124.54936218261719, 128.485107421875, 132.42086791992188]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 7.0, 3.0, 8.0, 6.0, 14.0, 25.0, 46.0, 54.0, 78.0, 123.0, 170.0, 289.0, 426.0, 753.0, 1063.0, 1747.0, 2700.0, 4267.0, 6539.0, 10310.0, 16185.0, 25888.0, 41322.0, 66798.0, 106493.0, 153691.0, 177951.0, 151808.0, 104255.0, 65440.0, 40768.0, 25368.0, 15885.0, 10177.0, 6536.0, 4114.0, 2565.0, 1673.0, 1069.0, 676.0, 444.0, 298.0, 162.0, 124.0, 84.0, 51.0, 36.0, 29.0, 21.0, 7.0, 11.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0], "bins": [-193.75, -187.962890625, -182.17578125, -176.388671875, -170.6015625, -164.814453125, -159.02734375, -153.240234375, -147.453125, -141.666015625, -135.87890625, -130.091796875, -124.3046875, -118.517578125, -112.73046875, -106.943359375, -101.15625, -95.369140625, -89.58203125, -83.794921875, -78.0078125, -72.220703125, -66.43359375, -60.646484375, -54.859375, -49.072265625, -43.28515625, -37.498046875, -31.7109375, -25.923828125, -20.13671875, -14.349609375, -8.5625, -2.775390625, 3.01171875, 8.798828125, 14.5859375, 20.373046875, 26.16015625, 31.947265625, 37.734375, 43.521484375, 49.30859375, 55.095703125, 60.8828125, 66.669921875, 72.45703125, 78.244140625, 84.03125, 89.818359375, 95.60546875, 101.392578125, 107.1796875, 112.966796875, 118.75390625, 124.541015625, 130.328125, 136.115234375, 141.90234375, 147.689453125, 153.4765625, 159.263671875, 165.05078125, 170.837890625, 176.625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 5.0, 10.0, 8.0, 4.0, 10.0, 5.0, 22.0, 23.0, 18.0, 28.0, 25.0, 22.0, 24.0, 27.0, 26.0, 30.0, 36.0, 42.0, 44.0, 42.0, 34.0, 36.0, 30.0, 44.0, 41.0, 44.0, 42.0, 40.0, 35.0, 25.0, 26.0, 25.0, 19.0, 17.0, 16.0, 16.0, 11.0, 6.0, 16.0, 10.0, 4.0, 3.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.4375, -89.125, -85.8125, -82.5, -79.1875, -75.875, -72.5625, -69.25, -65.9375, -62.625, -59.3125, -56.0, -52.6875, -49.375, -46.0625, -42.75, -39.4375, -36.125, -32.8125, -29.5, -26.1875, -22.875, -19.5625, -16.25, -12.9375, -9.625, -6.3125, -3.0, 0.3125, 3.625, 6.9375, 10.25, 13.5625, 16.875, 20.1875, 23.5, 26.8125, 30.125, 33.4375, 36.75, 40.0625, 43.375, 46.6875, 50.0, 53.3125, 56.625, 59.9375, 63.25, 66.5625, 69.875, 73.1875, 76.5, 79.8125, 83.125, 86.4375, 89.75, 93.0625, 96.375, 99.6875, 103.0, 106.3125, 109.625, 112.9375, 116.25, 119.5625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 14.0, 12.0, 20.0, 44.0, 38.0, 68.0, 96.0, 112.0, 182.0, 267.0, 360.0, 517.0, 766.0, 1233.0, 2073.0, 3145.0, 5135.0, 8740.0, 15803.0, 29857.0, 61687.0, 141734.0, 294670.0, 258318.0, 113885.0, 50816.0, 25364.0, 13497.0, 7643.0, 4415.0, 2845.0, 1700.0, 1137.0, 757.0, 506.0, 324.0, 225.0, 190.0, 87.0, 85.0, 53.0, 38.0, 32.0, 24.0, 13.0, 6.0, 8.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-319.0, -308.66796875, -298.3359375, -288.00390625, -277.671875, -267.33984375, -257.0078125, -246.67578125, -236.34375, -226.01171875, -215.6796875, -205.34765625, -195.015625, -184.68359375, -174.3515625, -164.01953125, -153.6875, -143.35546875, -133.0234375, -122.69140625, -112.359375, -102.02734375, -91.6953125, -81.36328125, -71.03125, -60.69921875, -50.3671875, -40.03515625, -29.703125, -19.37109375, -9.0390625, 1.29296875, 11.625, 21.95703125, 32.2890625, 42.62109375, 52.953125, 63.28515625, 73.6171875, 83.94921875, 94.28125, 104.61328125, 114.9453125, 125.27734375, 135.609375, 145.94140625, 156.2734375, 166.60546875, 176.9375, 187.26953125, 197.6015625, 207.93359375, 218.265625, 228.59765625, 238.9296875, 249.26171875, 259.59375, 269.92578125, 280.2578125, 290.58984375, 300.921875, 311.25390625, 321.5859375, 331.91796875, 342.25]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 10.0, 7.0, 8.0, 8.0, 14.0, 15.0, 5.0, 18.0, 12.0, 27.0, 16.0, 23.0, 27.0, 35.0, 41.0, 42.0, 39.0, 41.0, 41.0, 53.0, 44.0, 40.0, 40.0, 42.0, 27.0, 40.0, 33.0, 33.0, 30.0, 25.0, 22.0, 14.0, 22.0, 18.0, 15.0, 19.0, 9.0, 13.0, 13.0, 8.0, 5.0, 1.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.0625, -72.580078125, -70.09765625, -67.615234375, -65.1328125, -62.650390625, -60.16796875, -57.685546875, -55.203125, -52.720703125, -50.23828125, -47.755859375, -45.2734375, -42.791015625, -40.30859375, -37.826171875, -35.34375, -32.861328125, -30.37890625, -27.896484375, -25.4140625, -22.931640625, -20.44921875, -17.966796875, -15.484375, -13.001953125, -10.51953125, -8.037109375, -5.5546875, -3.072265625, -0.58984375, 1.892578125, 4.375, 6.857421875, 9.33984375, 11.822265625, 14.3046875, 16.787109375, 19.26953125, 21.751953125, 24.234375, 26.716796875, 29.19921875, 31.681640625, 34.1640625, 36.646484375, 39.12890625, 41.611328125, 44.09375, 46.576171875, 49.05859375, 51.541015625, 54.0234375, 56.505859375, 58.98828125, 61.470703125, 63.953125, 66.435546875, 68.91796875, 71.400390625, 73.8828125, 76.365234375, 78.84765625, 81.330078125, 83.8125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 11.0, 10.0, 11.0, 15.0, 19.0, 38.0, 51.0, 73.0, 104.0, 154.0, 249.0, 368.0, 640.0, 1245.0, 3131.0, 13068.0, 101937.0, 652468.0, 240525.0, 25595.0, 5021.0, 1667.0, 825.0, 466.0, 276.0, 185.0, 114.0, 81.0, 52.0, 42.0, 26.0, 26.0, 17.0, 7.0, 7.0, 8.0, 1.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-348.5, -337.5, -326.5, -315.5, -304.5, -293.5, -282.5, -271.5, -260.5, -249.5, -238.5, -227.5, -216.5, -205.5, -194.5, -183.5, -172.5, -161.5, -150.5, -139.5, -128.5, -117.5, -106.5, -95.5, -84.5, -73.5, -62.5, -51.5, -40.5, -29.5, -18.5, -7.5, 3.5, 14.5, 25.5, 36.5, 47.5, 58.5, 69.5, 80.5, 91.5, 102.5, 113.5, 124.5, 135.5, 146.5, 157.5, 168.5, 179.5, 190.5, 201.5, 212.5, 223.5, 234.5, 245.5, 256.5, 267.5, 278.5, 289.5, 300.5, 311.5, 322.5, 333.5, 344.5, 355.5]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 9.0, 9.0, 14.0, 25.0, 26.0, 50.0, 141.0, 228.0, 214.0, 147.0, 60.0, 32.0, 14.0, 15.0, 7.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0224151611328125, -0.021712303161621094, -0.021009445190429688, -0.02030658721923828, -0.019603729248046875, -0.01890087127685547, -0.018198013305664062, -0.017495155334472656, -0.01679229736328125, -0.016089439392089844, -0.015386581420898438, -0.014683723449707031, -0.013980865478515625, -0.013278007507324219, -0.012575149536132812, -0.011872291564941406, -0.01116943359375, -0.010466575622558594, -0.009763717651367188, -0.009060859680175781, -0.008358001708984375, -0.007655143737792969, -0.0069522857666015625, -0.006249427795410156, -0.00554656982421875, -0.004843711853027344, -0.0041408538818359375, -0.0034379959106445312, -0.002735137939453125, -0.0020322799682617188, -0.0013294219970703125, -0.0006265640258789062, 7.62939453125e-05, 0.0007791519165039062, 0.0014820098876953125, 0.0021848678588867188, 0.002887725830078125, 0.0035905838012695312, 0.0042934417724609375, 0.004996299743652344, 0.00569915771484375, 0.006402015686035156, 0.0071048736572265625, 0.007807731628417969, 0.008510589599609375, 0.009213447570800781, 0.009916305541992188, 0.010619163513183594, 0.011322021484375, 0.012024879455566406, 0.012727737426757812, 0.013430595397949219, 0.014133453369140625, 0.014836311340332031, 0.015539169311523438, 0.016242027282714844, 0.01694488525390625, 0.017647743225097656, 0.018350601196289062, 0.01905345916748047, 0.019756317138671875, 0.02045917510986328, 0.021162033081054688, 0.021864891052246094, 0.0225677490234375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 8.0, 4.0, 14.0, 9.0, 13.0, 38.0, 39.0, 57.0, 73.0, 77.0, 113.0, 143.0, 153.0, 237.0, 274.0, 452.0, 642.0, 962.0, 1613.0, 3250.0, 7974.0, 23796.0, 78933.0, 222650.0, 355951.0, 228150.0, 81691.0, 24898.0, 8077.0, 3357.0, 1655.0, 868.0, 595.0, 456.0, 324.0, 252.0, 198.0, 139.0, 104.0, 77.0, 53.0, 47.0, 35.0, 31.0, 20.0, 19.0, 13.0, 7.0, 9.0, 6.0, 3.0, 1.0, 1.0, 2.0], "bins": [-213.625, -207.435546875, -201.24609375, -195.056640625, -188.8671875, -182.677734375, -176.48828125, -170.298828125, -164.109375, -157.919921875, -151.73046875, -145.541015625, -139.3515625, -133.162109375, -126.97265625, -120.783203125, -114.59375, -108.404296875, -102.21484375, -96.025390625, -89.8359375, -83.646484375, -77.45703125, -71.267578125, -65.078125, -58.888671875, -52.69921875, -46.509765625, -40.3203125, -34.130859375, -27.94140625, -21.751953125, -15.5625, -9.373046875, -3.18359375, 3.005859375, 9.1953125, 15.384765625, 21.57421875, 27.763671875, 33.953125, 40.142578125, 46.33203125, 52.521484375, 58.7109375, 64.900390625, 71.08984375, 77.279296875, 83.46875, 89.658203125, 95.84765625, 102.037109375, 108.2265625, 114.416015625, 120.60546875, 126.794921875, 132.984375, 139.173828125, 145.36328125, 151.552734375, 157.7421875, 163.931640625, 170.12109375, 176.310546875, 182.5]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 10.0, 18.0, 24.0, 25.0, 28.0, 34.0, 53.0, 52.0, 78.0, 88.0, 71.0, 81.0, 75.0, 80.0, 53.0, 56.0, 39.0, 43.0, 14.0, 14.0, 16.0, 7.0, 6.0, 4.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-60.6875, -58.99365234375, -57.2998046875, -55.60595703125, -53.912109375, -52.21826171875, -50.5244140625, -48.83056640625, -47.13671875, -45.44287109375, -43.7490234375, -42.05517578125, -40.361328125, -38.66748046875, -36.9736328125, -35.27978515625, -33.5859375, -31.89208984375, -30.1982421875, -28.50439453125, -26.810546875, -25.11669921875, -23.4228515625, -21.72900390625, -20.03515625, -18.34130859375, -16.6474609375, -14.95361328125, -13.259765625, -11.56591796875, -9.8720703125, -8.17822265625, -6.484375, -4.79052734375, -3.0966796875, -1.40283203125, 0.291015625, 1.98486328125, 3.6787109375, 5.37255859375, 7.06640625, 8.76025390625, 10.4541015625, 12.14794921875, 13.841796875, 15.53564453125, 17.2294921875, 18.92333984375, 20.6171875, 22.31103515625, 24.0048828125, 25.69873046875, 27.392578125, 29.08642578125, 30.7802734375, 32.47412109375, 34.16796875, 35.86181640625, 37.5556640625, 39.24951171875, 40.943359375, 42.63720703125, 44.3310546875, 46.02490234375, 47.71875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 7.0, 2.0, 7.0, 6.0, 4.0, 9.0, 10.0, 16.0, 16.0, 20.0, 15.0, 21.0, 28.0, 21.0, 48.0, 33.0, 45.0, 53.0, 47.0, 42.0, 43.0, 57.0, 39.0, 47.0, 60.0, 39.0, 37.0, 45.0, 29.0, 24.0, 19.0, 33.0, 11.0, 11.0, 12.0, 12.0, 7.0, 10.0, 6.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-123.48811340332031, -119.9590835571289, -116.43004608154297, -112.90101623535156, -109.37197875976562, -105.84294891357422, -102.31391906738281, -98.78488159179688, -95.25584411621094, -91.72681427001953, -88.1977767944336, -84.66874694824219, -81.13970947265625, -77.61067962646484, -74.08164978027344, -70.5526123046875, -67.0235824584961, -63.49454879760742, -59.96551513671875, -56.436485290527344, -52.907447814941406, -49.37841796875, -45.84938430786133, -42.320350646972656, -38.791316986083984, -35.26228332519531, -31.73324966430664, -28.2042179107666, -24.67518424987793, -21.146150588989258, -17.61711883544922, -14.088085174560547, -10.559043884277344, -7.03001070022583, -3.5009775161743164, 0.028055191040039062, 3.557088851928711, 7.086122512817383, 10.615154266357422, 14.144187927246094, 17.673221588134766, 21.202255249023438, 24.73128890991211, 28.26032066345215, 31.78935432434082, 35.318389892578125, 38.84741973876953, 42.3764533996582, 45.905487060546875, 49.43452072143555, 52.96355438232422, 56.492584228515625, 60.02162170410156, 63.55065155029297, 67.07968139648438, 70.60871887207031, 74.13775634765625, 77.66678619384766, 81.1958236694336, 84.724853515625, 88.25389099121094, 91.78292083740234, 95.31195068359375, 98.84098815917969, 102.3700180053711]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 3.0, 8.0, 8.0, 6.0, 12.0, 11.0, 13.0, 16.0, 17.0, 17.0, 29.0, 29.0, 36.0, 24.0, 35.0, 35.0, 52.0, 40.0, 39.0, 43.0, 29.0, 37.0, 40.0, 43.0, 35.0, 45.0, 34.0, 37.0, 37.0, 23.0, 28.0, 24.0, 14.0, 20.0, 14.0, 15.0, 13.0, 8.0, 9.0, 4.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-114.05889129638672, -110.54922485351562, -107.03955841064453, -103.52989196777344, -100.02022552490234, -96.51055908203125, -93.00089263916016, -89.49122619628906, -85.98155975341797, -82.47189331054688, -78.96222686767578, -75.45256042480469, -71.9428939819336, -68.4332275390625, -64.9235610961914, -61.41389465332031, -57.90422439575195, -54.39455795288086, -50.884891510009766, -47.37522506713867, -43.86555862426758, -40.35588836669922, -36.846221923828125, -33.33655548095703, -29.82689094543457, -26.317224502563477, -22.807558059692383, -19.297889709472656, -15.788224220275879, -12.278556823730469, -8.768890380859375, -5.259223937988281, -1.7495574951171875, 1.7601091861724854, 5.269775867462158, 8.77944278717041, 12.289109230041504, 15.798776626586914, 19.308443069458008, 22.8181095123291, 26.327775955200195, 29.83744239807129, 33.347110748291016, 36.85677719116211, 40.3664436340332, 43.8761100769043, 47.38577651977539, 50.895442962646484, 54.40510940551758, 57.91477584838867, 61.424442291259766, 64.93411254882812, 68.44377899169922, 71.95344543457031, 75.4631118774414, 78.9727783203125, 82.4824447631836, 85.99211120605469, 89.50177764892578, 93.01144409179688, 96.52111053466797, 100.03077697753906, 103.54044342041016, 107.05010986328125, 110.55977630615234]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 10.0, 16.0, 26.0, 45.0, 67.0, 100.0, 162.0, 245.0, 415.0, 665.0, 999.0, 1570.0, 2462.0, 3730.0, 5804.0, 8949.0, 13743.0, 20482.0, 29909.0, 42420.0, 57996.0, 75721.0, 93355.0, 106658.0, 111350.0, 106843.0, 94144.0, 77013.0, 59177.0, 43402.0, 30517.0, 20662.0, 13984.0, 9234.0, 6000.0, 3825.0, 2513.0, 1558.0, 1045.0, 609.0, 388.0, 246.0, 180.0, 120.0, 83.0, 41.0, 38.0, 17.0, 9.0, 6.0, 1.0, 2.0, 2.0, 3.0], "bins": [-128.5, -124.7783203125, -121.056640625, -117.3349609375, -113.61328125, -109.8916015625, -106.169921875, -102.4482421875, -98.7265625, -95.0048828125, -91.283203125, -87.5615234375, -83.83984375, -80.1181640625, -76.396484375, -72.6748046875, -68.953125, -65.2314453125, -61.509765625, -57.7880859375, -54.06640625, -50.3447265625, -46.623046875, -42.9013671875, -39.1796875, -35.4580078125, -31.736328125, -28.0146484375, -24.29296875, -20.5712890625, -16.849609375, -13.1279296875, -9.40625, -5.6845703125, -1.962890625, 1.7587890625, 5.48046875, 9.2021484375, 12.923828125, 16.6455078125, 20.3671875, 24.0888671875, 27.810546875, 31.5322265625, 35.25390625, 38.9755859375, 42.697265625, 46.4189453125, 50.140625, 53.8623046875, 57.583984375, 61.3056640625, 65.02734375, 68.7490234375, 72.470703125, 76.1923828125, 79.9140625, 83.6357421875, 87.357421875, 91.0791015625, 94.80078125, 98.5224609375, 102.244140625, 105.9658203125, 109.6875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 8.0, 3.0, 8.0, 7.0, 3.0, 7.0, 11.0, 10.0, 20.0, 18.0, 18.0, 23.0, 27.0, 26.0, 35.0, 36.0, 36.0, 51.0, 40.0, 42.0, 35.0, 46.0, 37.0, 33.0, 44.0, 41.0, 34.0, 43.0, 33.0, 34.0, 40.0, 25.0, 21.0, 20.0, 16.0, 13.0, 13.0, 11.0, 12.0, 7.0, 4.0, 7.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.3125, -96.953125, -93.59375, -90.234375, -86.875, -83.515625, -80.15625, -76.796875, -73.4375, -70.078125, -66.71875, -63.359375, -60.0, -56.640625, -53.28125, -49.921875, -46.5625, -43.203125, -39.84375, -36.484375, -33.125, -29.765625, -26.40625, -23.046875, -19.6875, -16.328125, -12.96875, -9.609375, -6.25, -2.890625, 0.46875, 3.828125, 7.1875, 10.546875, 13.90625, 17.265625, 20.625, 23.984375, 27.34375, 30.703125, 34.0625, 37.421875, 40.78125, 44.140625, 47.5, 50.859375, 54.21875, 57.578125, 60.9375, 64.296875, 67.65625, 71.015625, 74.375, 77.734375, 81.09375, 84.453125, 87.8125, 91.171875, 94.53125, 97.890625, 101.25, 104.609375, 107.96875, 111.328125, 114.6875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 6.0, 9.0, 16.0, 30.0, 57.0, 78.0, 126.0, 177.0, 329.0, 507.0, 848.0, 1282.0, 2054.0, 3007.0, 4726.0, 7360.0, 11442.0, 17330.0, 26307.0, 37483.0, 53059.0, 70238.0, 88302.0, 104195.0, 112638.0, 110688.0, 100270.0, 83339.0, 64655.0, 47858.0, 33491.0, 23198.0, 15260.0, 10139.0, 6412.0, 4179.0, 2718.0, 1725.0, 1113.0, 690.0, 468.0, 283.0, 167.0, 113.0, 75.0, 42.0, 31.0, 20.0, 6.0, 8.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-120.25, -116.697265625, -113.14453125, -109.591796875, -106.0390625, -102.486328125, -98.93359375, -95.380859375, -91.828125, -88.275390625, -84.72265625, -81.169921875, -77.6171875, -74.064453125, -70.51171875, -66.958984375, -63.40625, -59.853515625, -56.30078125, -52.748046875, -49.1953125, -45.642578125, -42.08984375, -38.537109375, -34.984375, -31.431640625, -27.87890625, -24.326171875, -20.7734375, -17.220703125, -13.66796875, -10.115234375, -6.5625, -3.009765625, 0.54296875, 4.095703125, 7.6484375, 11.201171875, 14.75390625, 18.306640625, 21.859375, 25.412109375, 28.96484375, 32.517578125, 36.0703125, 39.623046875, 43.17578125, 46.728515625, 50.28125, 53.833984375, 57.38671875, 60.939453125, 64.4921875, 68.044921875, 71.59765625, 75.150390625, 78.703125, 82.255859375, 85.80859375, 89.361328125, 92.9140625, 96.466796875, 100.01953125, 103.572265625, 107.125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 6.0, 10.0, 7.0, 17.0, 12.0, 17.0, 24.0, 27.0, 21.0, 22.0, 21.0, 36.0, 29.0, 34.0, 45.0, 41.0, 39.0, 52.0, 54.0, 45.0, 31.0, 43.0, 29.0, 42.0, 31.0, 40.0, 36.0, 23.0, 23.0, 20.0, 21.0, 15.0, 18.0, 13.0, 13.0, 8.0, 8.0, 4.0, 7.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.0625, -67.724609375, -65.38671875, -63.048828125, -60.7109375, -58.373046875, -56.03515625, -53.697265625, -51.359375, -49.021484375, -46.68359375, -44.345703125, -42.0078125, -39.669921875, -37.33203125, -34.994140625, -32.65625, -30.318359375, -27.98046875, -25.642578125, -23.3046875, -20.966796875, -18.62890625, -16.291015625, -13.953125, -11.615234375, -9.27734375, -6.939453125, -4.6015625, -2.263671875, 0.07421875, 2.412109375, 4.75, 7.087890625, 9.42578125, 11.763671875, 14.1015625, 16.439453125, 18.77734375, 21.115234375, 23.453125, 25.791015625, 28.12890625, 30.466796875, 32.8046875, 35.142578125, 37.48046875, 39.818359375, 42.15625, 44.494140625, 46.83203125, 49.169921875, 51.5078125, 53.845703125, 56.18359375, 58.521484375, 60.859375, 63.197265625, 65.53515625, 67.873046875, 70.2109375, 72.548828125, 74.88671875, 77.224609375, 79.5625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 5.0, 12.0, 8.0, 22.0, 26.0, 46.0, 61.0, 95.0, 159.0, 248.0, 437.0, 656.0, 1043.0, 1769.0, 3079.0, 5282.0, 9518.0, 17000.0, 30473.0, 52508.0, 85355.0, 124592.0, 158090.0, 164186.0, 141159.0, 100504.0, 64472.0, 38083.0, 21639.0, 11928.0, 6684.0, 3827.0, 2181.0, 1285.0, 772.0, 463.0, 312.0, 202.0, 129.0, 76.0, 52.0, 39.0, 20.0, 32.0, 7.0, 5.0, 4.0, 2.0, 5.0, 1.0, 5.0, 1.0], "bins": [-55.84375, -54.25732421875, -52.6708984375, -51.08447265625, -49.498046875, -47.91162109375, -46.3251953125, -44.73876953125, -43.15234375, -41.56591796875, -39.9794921875, -38.39306640625, -36.806640625, -35.22021484375, -33.6337890625, -32.04736328125, -30.4609375, -28.87451171875, -27.2880859375, -25.70166015625, -24.115234375, -22.52880859375, -20.9423828125, -19.35595703125, -17.76953125, -16.18310546875, -14.5966796875, -13.01025390625, -11.423828125, -9.83740234375, -8.2509765625, -6.66455078125, -5.078125, -3.49169921875, -1.9052734375, -0.31884765625, 1.267578125, 2.85400390625, 4.4404296875, 6.02685546875, 7.61328125, 9.19970703125, 10.7861328125, 12.37255859375, 13.958984375, 15.54541015625, 17.1318359375, 18.71826171875, 20.3046875, 21.89111328125, 23.4775390625, 25.06396484375, 26.650390625, 28.23681640625, 29.8232421875, 31.40966796875, 32.99609375, 34.58251953125, 36.1689453125, 37.75537109375, 39.341796875, 40.92822265625, 42.5146484375, 44.10107421875, 45.6875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 3.0, 4.0, 5.0, 13.0, 10.0, 12.0, 11.0, 16.0, 30.0, 26.0, 19.0, 43.0, 24.0, 45.0, 58.0, 59.0, 50.0, 56.0, 70.0, 62.0, 46.0, 44.0, 42.0, 36.0, 42.0, 20.0, 24.0, 23.0, 29.0, 16.0, 17.0, 13.0, 8.0, 5.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.005023956298828125, -0.004869401454925537, -0.004714846611022949, -0.004560291767120361, -0.0044057369232177734, -0.0042511820793151855, -0.004096627235412598, -0.00394207239151001, -0.003787517547607422, -0.003632962703704834, -0.003478407859802246, -0.003323853015899658, -0.0031692981719970703, -0.0030147433280944824, -0.0028601884841918945, -0.0027056336402893066, -0.0025510787963867188, -0.002396523952484131, -0.002241969108581543, -0.002087414264678955, -0.0019328594207763672, -0.0017783045768737793, -0.0016237497329711914, -0.0014691948890686035, -0.0013146400451660156, -0.0011600852012634277, -0.0010055303573608398, -0.000850975513458252, -0.0006964206695556641, -0.0005418658256530762, -0.0003873109817504883, -0.0002327561378479004, -7.82012939453125e-05, 7.635354995727539e-05, 0.00023090839385986328, 0.00038546323776245117, 0.0005400180816650391, 0.000694572925567627, 0.0008491277694702148, 0.0010036826133728027, 0.0011582374572753906, 0.0013127923011779785, 0.0014673471450805664, 0.0016219019889831543, 0.0017764568328857422, 0.00193101167678833, 0.002085566520690918, 0.002240121364593506, 0.0023946762084960938, 0.0025492310523986816, 0.0027037858963012695, 0.0028583407402038574, 0.0030128955841064453, 0.003167450428009033, 0.003322005271911621, 0.003476560115814209, 0.003631114959716797, 0.0037856698036193848, 0.003940224647521973, 0.0040947794914245605, 0.0042493343353271484, 0.004403889179229736, 0.004558444023132324, 0.004712998867034912, 0.0048675537109375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 11.0, 11.0, 15.0, 36.0, 57.0, 87.0, 137.0, 224.0, 339.0, 612.0, 945.0, 1485.0, 2461.0, 4082.0, 6315.0, 10539.0, 16916.0, 26703.0, 40596.0, 60094.0, 83482.0, 107337.0, 123756.0, 128587.0, 118232.0, 98046.0, 73392.0, 51555.0, 34181.0, 22071.0, 13922.0, 8645.0, 5290.0, 3233.0, 2011.0, 1208.0, 699.0, 495.0, 291.0, 166.0, 118.0, 61.0, 48.0, 27.0, 17.0, 10.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-40.21875, -39.0458984375, -37.873046875, -36.7001953125, -35.52734375, -34.3544921875, -33.181640625, -32.0087890625, -30.8359375, -29.6630859375, -28.490234375, -27.3173828125, -26.14453125, -24.9716796875, -23.798828125, -22.6259765625, -21.453125, -20.2802734375, -19.107421875, -17.9345703125, -16.76171875, -15.5888671875, -14.416015625, -13.2431640625, -12.0703125, -10.8974609375, -9.724609375, -8.5517578125, -7.37890625, -6.2060546875, -5.033203125, -3.8603515625, -2.6875, -1.5146484375, -0.341796875, 0.8310546875, 2.00390625, 3.1767578125, 4.349609375, 5.5224609375, 6.6953125, 7.8681640625, 9.041015625, 10.2138671875, 11.38671875, 12.5595703125, 13.732421875, 14.9052734375, 16.078125, 17.2509765625, 18.423828125, 19.5966796875, 20.76953125, 21.9423828125, 23.115234375, 24.2880859375, 25.4609375, 26.6337890625, 27.806640625, 28.9794921875, 30.15234375, 31.3251953125, 32.498046875, 33.6708984375, 34.84375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 5.0, 8.0, 7.0, 3.0, 12.0, 10.0, 11.0, 10.0, 16.0, 13.0, 20.0, 22.0, 35.0, 32.0, 38.0, 39.0, 35.0, 27.0, 42.0, 44.0, 43.0, 49.0, 52.0, 45.0, 32.0, 40.0, 36.0, 26.0, 29.0, 23.0, 35.0, 24.0, 23.0, 15.0, 16.0, 14.0, 19.0, 12.0, 10.0, 9.0, 5.0, 5.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.1796875, -12.7508544921875, -12.322021484375, -11.8931884765625, -11.46435546875, -11.0355224609375, -10.606689453125, -10.1778564453125, -9.7490234375, -9.3201904296875, -8.891357421875, -8.4625244140625, -8.03369140625, -7.6048583984375, -7.176025390625, -6.7471923828125, -6.318359375, -5.8895263671875, -5.460693359375, -5.0318603515625, -4.60302734375, -4.1741943359375, -3.745361328125, -3.3165283203125, -2.8876953125, -2.4588623046875, -2.030029296875, -1.6011962890625, -1.17236328125, -0.7435302734375, -0.314697265625, 0.1141357421875, 0.54296875, 0.9718017578125, 1.400634765625, 1.8294677734375, 2.25830078125, 2.6871337890625, 3.115966796875, 3.5447998046875, 3.9736328125, 4.4024658203125, 4.831298828125, 5.2601318359375, 5.68896484375, 6.1177978515625, 6.546630859375, 6.9754638671875, 7.404296875, 7.8331298828125, 8.261962890625, 8.6907958984375, 9.11962890625, 9.5484619140625, 9.977294921875, 10.4061279296875, 10.8349609375, 11.2637939453125, 11.692626953125, 12.1214599609375, 12.55029296875, 12.9791259765625, 13.407958984375, 13.8367919921875, 14.265625]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 4.0, 7.0, 6.0, 3.0, 6.0, 8.0, 9.0, 10.0, 20.0, 8.0, 20.0, 18.0, 20.0, 28.0, 39.0, 32.0, 41.0, 34.0, 52.0, 48.0, 33.0, 50.0, 50.0, 52.0, 32.0, 41.0, 43.0, 31.0, 25.0, 29.0, 35.0, 21.0, 23.0, 20.0, 22.0, 10.0, 13.0, 12.0, 9.0, 10.0, 5.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.63424682617188, -102.45063018798828, -99.26700592041016, -96.08338928222656, -92.89977264404297, -89.71615600585938, -86.53253173828125, -83.34891510009766, -80.16529846191406, -76.98168182373047, -73.79805755615234, -70.61444091796875, -67.43082427978516, -64.24720764160156, -61.06358337402344, -57.879966735839844, -54.69634246826172, -51.51272201538086, -48.329105377197266, -45.145484924316406, -41.96186828613281, -38.77824783325195, -35.594627380371094, -32.4110107421875, -29.22739028930664, -26.043771743774414, -22.860153198242188, -19.676532745361328, -16.4929141998291, -13.309295654296875, -10.125675201416016, -6.942056655883789, -3.7584381103515625, -0.5748190879821777, 2.608799934387207, 5.79241943359375, 8.976037979125977, 12.159656524658203, 15.343276977539062, 18.52689552307129, 21.710514068603516, 24.894132614135742, 28.07775115966797, 31.261371612548828, 34.44499206542969, 37.62860870361328, 40.81222915649414, 43.995849609375, 47.179466247558594, 50.36308670043945, 53.54670333862305, 56.730323791503906, 59.9139404296875, 63.09756088256836, 66.28118133544922, 69.46479797363281, 72.64842224121094, 75.83203887939453, 79.01566314697266, 82.19927978515625, 85.38289642333984, 88.56651306152344, 91.75013732910156, 94.93375396728516, 98.11737060546875]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 4.0, 9.0, 4.0, 15.0, 8.0, 10.0, 5.0, 23.0, 17.0, 27.0, 34.0, 24.0, 28.0, 29.0, 37.0, 25.0, 33.0, 42.0, 42.0, 48.0, 39.0, 45.0, 47.0, 49.0, 34.0, 36.0, 25.0, 35.0, 33.0, 25.0, 28.0, 11.0, 22.0, 19.0, 20.0, 13.0, 8.0, 11.0, 6.0, 10.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-103.10801696777344, -99.7562484741211, -96.40447998046875, -93.0527114868164, -89.70094299316406, -86.34918212890625, -82.9974136352539, -79.64564514160156, -76.29387664794922, -72.94210815429688, -69.59033966064453, -66.23857116699219, -62.88680648803711, -59.535037994384766, -56.18327331542969, -52.831504821777344, -49.479736328125, -46.127967834472656, -42.77619934082031, -39.424434661865234, -36.07266616821289, -32.72089767456055, -29.369131088256836, -26.017364501953125, -22.66559600830078, -19.313827514648438, -15.962060928344727, -12.6102933883667, -9.258525848388672, -5.906757354736328, -2.554990768432617, 0.7967758178710938, 4.148536682128906, 7.500304222106934, 10.852071762084961, 14.203839302062988, 17.555606842041016, 20.90737533569336, 24.25914192199707, 27.61090850830078, 30.962677001953125, 34.31444549560547, 37.66621398925781, 41.01797866821289, 44.369747161865234, 47.72151565551758, 51.073280334472656, 54.425048828125, 57.776817321777344, 61.12858581542969, 64.48035430908203, 67.83212280273438, 71.18388366699219, 74.53565979003906, 77.88742065429688, 81.23918914794922, 84.59095764160156, 87.9427261352539, 91.29449462890625, 94.6462631225586, 97.99803161621094, 101.34979248046875, 104.7015609741211, 108.05332946777344, 111.40509796142578]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 18.0, 16.0, 42.0, 55.0, 82.0, 124.0, 205.0, 284.0, 506.0, 839.0, 1201.0, 1915.0, 3001.0, 4740.0, 7415.0, 11432.0, 18164.0, 28515.0, 45302.0, 72567.0, 116309.0, 186892.0, 301315.0, 479835.0, 685372.0, 728753.0, 553730.0, 359369.0, 222573.0, 137114.0, 84601.0, 53004.0, 33094.0, 20608.0, 12945.0, 8387.0, 5061.0, 3299.0, 2095.0, 1281.0, 884.0, 483.0, 296.0, 198.0, 128.0, 74.0, 69.0, 31.0, 24.0, 12.0, 9.0, 5.0, 0.0, 2.0, 5.0], "bins": [-126.5, -122.7978515625, -119.095703125, -115.3935546875, -111.69140625, -107.9892578125, -104.287109375, -100.5849609375, -96.8828125, -93.1806640625, -89.478515625, -85.7763671875, -82.07421875, -78.3720703125, -74.669921875, -70.9677734375, -67.265625, -63.5634765625, -59.861328125, -56.1591796875, -52.45703125, -48.7548828125, -45.052734375, -41.3505859375, -37.6484375, -33.9462890625, -30.244140625, -26.5419921875, -22.83984375, -19.1376953125, -15.435546875, -11.7333984375, -8.03125, -4.3291015625, -0.626953125, 3.0751953125, 6.77734375, 10.4794921875, 14.181640625, 17.8837890625, 21.5859375, 25.2880859375, 28.990234375, 32.6923828125, 36.39453125, 40.0966796875, 43.798828125, 47.5009765625, 51.203125, 54.9052734375, 58.607421875, 62.3095703125, 66.01171875, 69.7138671875, 73.416015625, 77.1181640625, 80.8203125, 84.5224609375, 88.224609375, 91.9267578125, 95.62890625, 99.3310546875, 103.033203125, 106.7353515625, 110.4375]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 3.0, 7.0, 7.0, 7.0, 14.0, 7.0, 8.0, 19.0, 19.0, 25.0, 24.0, 23.0, 31.0, 31.0, 19.0, 40.0, 38.0, 27.0, 37.0, 37.0, 44.0, 49.0, 41.0, 43.0, 51.0, 40.0, 33.0, 29.0, 35.0, 31.0, 28.0, 22.0, 25.0, 11.0, 19.0, 12.0, 9.0, 9.0, 12.0, 8.0, 9.0, 3.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-78.75, -76.3154296875, -73.880859375, -71.4462890625, -69.01171875, -66.5771484375, -64.142578125, -61.7080078125, -59.2734375, -56.8388671875, -54.404296875, -51.9697265625, -49.53515625, -47.1005859375, -44.666015625, -42.2314453125, -39.796875, -37.3623046875, -34.927734375, -32.4931640625, -30.05859375, -27.6240234375, -25.189453125, -22.7548828125, -20.3203125, -17.8857421875, -15.451171875, -13.0166015625, -10.58203125, -8.1474609375, -5.712890625, -3.2783203125, -0.84375, 1.5908203125, 4.025390625, 6.4599609375, 8.89453125, 11.3291015625, 13.763671875, 16.1982421875, 18.6328125, 21.0673828125, 23.501953125, 25.9365234375, 28.37109375, 30.8056640625, 33.240234375, 35.6748046875, 38.109375, 40.5439453125, 42.978515625, 45.4130859375, 47.84765625, 50.2822265625, 52.716796875, 55.1513671875, 57.5859375, 60.0205078125, 62.455078125, 64.8896484375, 67.32421875, 69.7587890625, 72.193359375, 74.6279296875, 77.0625]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 7.0, 5.0, 15.0, 12.0, 17.0, 41.0, 61.0, 100.0, 147.0, 213.0, 379.0, 598.0, 894.0, 1312.0, 2177.0, 3169.0, 4970.0, 7807.0, 12269.0, 19277.0, 29765.0, 45658.0, 70772.0, 108606.0, 162912.0, 240745.0, 342966.0, 458233.0, 554155.0, 559100.0, 470688.0, 353240.0, 250162.0, 170511.0, 113501.0, 74304.0, 48075.0, 31156.0, 20133.0, 12762.0, 8481.0, 5268.0, 3437.0, 2309.0, 1345.0, 860.0, 566.0, 411.0, 267.0, 165.0, 95.0, 70.0, 40.0, 22.0, 15.0, 19.0, 6.0, 5.0, 1.0, 0.0, 2.0], "bins": [-76.125, -73.75, -71.375, -69.0, -66.625, -64.25, -61.875, -59.5, -57.125, -54.75, -52.375, -50.0, -47.625, -45.25, -42.875, -40.5, -38.125, -35.75, -33.375, -31.0, -28.625, -26.25, -23.875, -21.5, -19.125, -16.75, -14.375, -12.0, -9.625, -7.25, -4.875, -2.5, -0.125, 2.25, 4.625, 7.0, 9.375, 11.75, 14.125, 16.5, 18.875, 21.25, 23.625, 26.0, 28.375, 30.75, 33.125, 35.5, 37.875, 40.25, 42.625, 45.0, 47.375, 49.75, 52.125, 54.5, 56.875, 59.25, 61.625, 64.0, 66.375, 68.75, 71.125, 73.5, 75.875]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 11.0, 6.0, 6.0, 10.0, 13.0, 14.0, 15.0, 35.0, 27.0, 33.0, 43.0, 40.0, 60.0, 69.0, 85.0, 95.0, 128.0, 157.0, 175.0, 186.0, 221.0, 214.0, 247.0, 260.0, 236.0, 214.0, 191.0, 155.0, 163.0, 166.0, 126.0, 115.0, 107.0, 81.0, 78.0, 64.0, 34.0, 37.0, 35.0, 33.0, 26.0, 17.0, 15.0, 8.0, 5.0, 6.0, 3.0, 2.0, 4.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.1875, -36.017578125, -34.84765625, -33.677734375, -32.5078125, -31.337890625, -30.16796875, -28.998046875, -27.828125, -26.658203125, -25.48828125, -24.318359375, -23.1484375, -21.978515625, -20.80859375, -19.638671875, -18.46875, -17.298828125, -16.12890625, -14.958984375, -13.7890625, -12.619140625, -11.44921875, -10.279296875, -9.109375, -7.939453125, -6.76953125, -5.599609375, -4.4296875, -3.259765625, -2.08984375, -0.919921875, 0.25, 1.419921875, 2.58984375, 3.759765625, 4.9296875, 6.099609375, 7.26953125, 8.439453125, 9.609375, 10.779296875, 11.94921875, 13.119140625, 14.2890625, 15.458984375, 16.62890625, 17.798828125, 18.96875, 20.138671875, 21.30859375, 22.478515625, 23.6484375, 24.818359375, 25.98828125, 27.158203125, 28.328125, 29.498046875, 30.66796875, 31.837890625, 33.0078125, 34.177734375, 35.34765625, 36.517578125, 37.6875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 6.0, 6.0, 7.0, 3.0, 14.0, 9.0, 6.0, 11.0, 24.0, 23.0, 30.0, 33.0, 28.0, 34.0, 33.0, 48.0, 56.0, 55.0, 40.0, 48.0, 58.0, 49.0, 66.0, 46.0, 32.0, 40.0, 28.0, 23.0, 29.0, 28.0, 20.0, 29.0, 5.0, 10.0, 7.0, 9.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-107.5115966796875, -104.39836883544922, -101.28514099121094, -98.17191314697266, -95.05868530273438, -91.9454574584961, -88.83222961425781, -85.718994140625, -82.60577392578125, -79.49254608154297, -76.37931823730469, -73.2660903930664, -70.15286254882812, -67.03963470458984, -63.9264030456543, -60.813175201416016, -57.69994354248047, -54.58671569824219, -51.473487854003906, -48.360260009765625, -45.247032165527344, -42.13380432128906, -39.020572662353516, -35.907344818115234, -32.79411697387695, -29.680889129638672, -26.56766128540039, -23.454431533813477, -20.341203689575195, -17.227975845336914, -14.11474609375, -11.001518249511719, -7.888282775878906, -4.775054454803467, -1.6618261337280273, 1.4514026641845703, 4.564630508422852, 7.677858352661133, 10.791088104248047, 13.904315948486328, 17.01754379272461, 20.13077163696289, 23.243999481201172, 26.357229232788086, 29.470457077026367, 32.58368682861328, 35.69691467285156, 38.810142517089844, 41.923370361328125, 45.036598205566406, 48.14982604980469, 51.26305389404297, 54.37628173828125, 57.48950958251953, 60.60274124145508, 63.71596908569336, 66.82919311523438, 69.94242095947266, 73.05564880371094, 76.16887664794922, 79.2821044921875, 82.39533233642578, 85.50856018066406, 88.62179565429688, 91.73502349853516]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 7.0, 17.0, 9.0, 12.0, 18.0, 20.0, 15.0, 21.0, 28.0, 23.0, 29.0, 44.0, 26.0, 36.0, 27.0, 39.0, 38.0, 38.0, 41.0, 45.0, 52.0, 44.0, 35.0, 38.0, 36.0, 25.0, 36.0, 25.0, 23.0, 20.0, 10.0, 21.0, 19.0, 16.0, 12.0, 12.0, 6.0, 9.0, 8.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.69476318359375, -85.98043060302734, -83.26609802246094, -80.55176544189453, -77.83743286132812, -75.12310028076172, -72.40876770019531, -69.69444274902344, -66.9801025390625, -64.2657699584961, -61.55143737792969, -58.83710479736328, -56.122772216796875, -53.40843963623047, -50.69411087036133, -47.97977828979492, -45.26544952392578, -42.551116943359375, -39.83678436279297, -37.12245178222656, -34.408119201660156, -31.693788528442383, -28.97945785522461, -26.265125274658203, -23.550792694091797, -20.83646011352539, -18.122127532958984, -15.407796859741211, -12.693464279174805, -9.979131698608398, -7.264801025390625, -4.550468444824219, -1.8361358642578125, 0.8781962394714355, 3.5925283432006836, 6.306859970092773, 9.02119255065918, 11.735525131225586, 14.44985580444336, 17.164188385009766, 19.878520965576172, 22.592853546142578, 25.307186126708984, 28.021516799926758, 30.735849380493164, 33.45018005371094, 36.164512634277344, 38.87884521484375, 41.593177795410156, 44.30751037597656, 47.02184295654297, 49.736175537109375, 52.45050811767578, 55.16484069824219, 57.87916946411133, 60.593502044677734, 63.30783462524414, 66.02216339111328, 68.73649597167969, 71.4508285522461, 74.1651611328125, 76.8794937133789, 79.59382629394531, 82.30815887451172, 85.02249145507812]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 3.0, 8.0, 13.0, 10.0, 18.0, 24.0, 40.0, 75.0, 110.0, 162.0, 237.0, 319.0, 533.0, 775.0, 1206.0, 1866.0, 2795.0, 4185.0, 6224.0, 9631.0, 14216.0, 21871.0, 32120.0, 45296.0, 63159.0, 83099.0, 101993.0, 114397.0, 116141.0, 106513.0, 89964.0, 70189.0, 51239.0, 36426.0, 24771.0, 16721.0, 11045.0, 7268.0, 4724.0, 3102.0, 2070.0, 1365.0, 881.0, 558.0, 384.0, 272.0, 183.0, 137.0, 75.0, 50.0, 34.0, 20.0, 12.0, 12.0, 10.0, 6.0, 2.0, 1.0, 3.0, 5.0], "bins": [-144.5, -140.0078125, -135.515625, -131.0234375, -126.53125, -122.0390625, -117.546875, -113.0546875, -108.5625, -104.0703125, -99.578125, -95.0859375, -90.59375, -86.1015625, -81.609375, -77.1171875, -72.625, -68.1328125, -63.640625, -59.1484375, -54.65625, -50.1640625, -45.671875, -41.1796875, -36.6875, -32.1953125, -27.703125, -23.2109375, -18.71875, -14.2265625, -9.734375, -5.2421875, -0.75, 3.7421875, 8.234375, 12.7265625, 17.21875, 21.7109375, 26.203125, 30.6953125, 35.1875, 39.6796875, 44.171875, 48.6640625, 53.15625, 57.6484375, 62.140625, 66.6328125, 71.125, 75.6171875, 80.109375, 84.6015625, 89.09375, 93.5859375, 98.078125, 102.5703125, 107.0625, 111.5546875, 116.046875, 120.5390625, 125.03125, 129.5234375, 134.015625, 138.5078125, 143.0]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 6.0, 7.0, 16.0, 16.0, 11.0, 21.0, 20.0, 24.0, 17.0, 27.0, 30.0, 30.0, 33.0, 38.0, 27.0, 30.0, 35.0, 53.0, 49.0, 49.0, 45.0, 40.0, 43.0, 37.0, 37.0, 26.0, 22.0, 27.0, 22.0, 19.0, 22.0, 18.0, 18.0, 15.0, 13.0, 11.0, 8.0, 12.0, 6.0, 2.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.875, -53.9306640625, -51.986328125, -50.0419921875, -48.09765625, -46.1533203125, -44.208984375, -42.2646484375, -40.3203125, -38.3759765625, -36.431640625, -34.4873046875, -32.54296875, -30.5986328125, -28.654296875, -26.7099609375, -24.765625, -22.8212890625, -20.876953125, -18.9326171875, -16.98828125, -15.0439453125, -13.099609375, -11.1552734375, -9.2109375, -7.2666015625, -5.322265625, -3.3779296875, -1.43359375, 0.5107421875, 2.455078125, 4.3994140625, 6.34375, 8.2880859375, 10.232421875, 12.1767578125, 14.12109375, 16.0654296875, 18.009765625, 19.9541015625, 21.8984375, 23.8427734375, 25.787109375, 27.7314453125, 29.67578125, 31.6201171875, 33.564453125, 35.5087890625, 37.453125, 39.3974609375, 41.341796875, 43.2861328125, 45.23046875, 47.1748046875, 49.119140625, 51.0634765625, 53.0078125, 54.9521484375, 56.896484375, 58.8408203125, 60.78515625, 62.7294921875, 64.673828125, 66.6181640625, 68.5625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 4.0, 7.0, 10.0, 13.0, 14.0, 25.0, 25.0, 56.0, 78.0, 113.0, 154.0, 215.0, 333.0, 455.0, 683.0, 1003.0, 1581.0, 2488.0, 3983.0, 6339.0, 10862.0, 19018.0, 34540.0, 63644.0, 116296.0, 194703.0, 227364.0, 160084.0, 90650.0, 49290.0, 26208.0, 14921.0, 8748.0, 5227.0, 3234.0, 2094.0, 1320.0, 883.0, 603.0, 385.0, 276.0, 186.0, 130.0, 110.0, 57.0, 57.0, 23.0, 25.0, 16.0, 18.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-253.625, -246.005859375, -238.38671875, -230.767578125, -223.1484375, -215.529296875, -207.91015625, -200.291015625, -192.671875, -185.052734375, -177.43359375, -169.814453125, -162.1953125, -154.576171875, -146.95703125, -139.337890625, -131.71875, -124.099609375, -116.48046875, -108.861328125, -101.2421875, -93.623046875, -86.00390625, -78.384765625, -70.765625, -63.146484375, -55.52734375, -47.908203125, -40.2890625, -32.669921875, -25.05078125, -17.431640625, -9.8125, -2.193359375, 5.42578125, 13.044921875, 20.6640625, 28.283203125, 35.90234375, 43.521484375, 51.140625, 58.759765625, 66.37890625, 73.998046875, 81.6171875, 89.236328125, 96.85546875, 104.474609375, 112.09375, 119.712890625, 127.33203125, 134.951171875, 142.5703125, 150.189453125, 157.80859375, 165.427734375, 173.046875, 180.666015625, 188.28515625, 195.904296875, 203.5234375, 211.142578125, 218.76171875, 226.380859375, 234.0]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 0.0, 3.0, 3.0, 4.0, 10.0, 17.0, 11.0, 10.0, 17.0, 19.0, 25.0, 16.0, 32.0, 24.0, 33.0, 28.0, 24.0, 33.0, 37.0, 38.0, 42.0, 45.0, 41.0, 42.0, 39.0, 44.0, 38.0, 36.0, 34.0, 35.0, 33.0, 22.0, 19.0, 13.0, 13.0, 25.0, 15.0, 18.0, 13.0, 11.0, 7.0, 4.0, 6.0, 6.0, 3.0, 7.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.375, -44.8154296875, -43.255859375, -41.6962890625, -40.13671875, -38.5771484375, -37.017578125, -35.4580078125, -33.8984375, -32.3388671875, -30.779296875, -29.2197265625, -27.66015625, -26.1005859375, -24.541015625, -22.9814453125, -21.421875, -19.8623046875, -18.302734375, -16.7431640625, -15.18359375, -13.6240234375, -12.064453125, -10.5048828125, -8.9453125, -7.3857421875, -5.826171875, -4.2666015625, -2.70703125, -1.1474609375, 0.412109375, 1.9716796875, 3.53125, 5.0908203125, 6.650390625, 8.2099609375, 9.76953125, 11.3291015625, 12.888671875, 14.4482421875, 16.0078125, 17.5673828125, 19.126953125, 20.6865234375, 22.24609375, 23.8056640625, 25.365234375, 26.9248046875, 28.484375, 30.0439453125, 31.603515625, 33.1630859375, 34.72265625, 36.2822265625, 37.841796875, 39.4013671875, 40.9609375, 42.5205078125, 44.080078125, 45.6396484375, 47.19921875, 48.7587890625, 50.318359375, 51.8779296875, 53.4375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 3.0, 7.0, 11.0, 21.0, 31.0, 48.0, 66.0, 79.0, 110.0, 178.0, 247.0, 385.0, 568.0, 896.0, 1382.0, 2158.0, 3533.0, 5699.0, 10460.0, 21792.0, 58661.0, 205606.0, 466803.0, 174912.0, 50860.0, 19762.0, 9685.0, 5517.0, 3273.0, 2040.0, 1283.0, 846.0, 531.0, 340.0, 239.0, 151.0, 106.0, 80.0, 56.0, 36.0, 24.0, 23.0, 8.0, 7.0, 7.0, 4.0, 5.0, 0.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-245.25, -237.44921875, -229.6484375, -221.84765625, -214.046875, -206.24609375, -198.4453125, -190.64453125, -182.84375, -175.04296875, -167.2421875, -159.44140625, -151.640625, -143.83984375, -136.0390625, -128.23828125, -120.4375, -112.63671875, -104.8359375, -97.03515625, -89.234375, -81.43359375, -73.6328125, -65.83203125, -58.03125, -50.23046875, -42.4296875, -34.62890625, -26.828125, -19.02734375, -11.2265625, -3.42578125, 4.375, 12.17578125, 19.9765625, 27.77734375, 35.578125, 43.37890625, 51.1796875, 58.98046875, 66.78125, 74.58203125, 82.3828125, 90.18359375, 97.984375, 105.78515625, 113.5859375, 121.38671875, 129.1875, 136.98828125, 144.7890625, 152.58984375, 160.390625, 168.19140625, 175.9921875, 183.79296875, 191.59375, 199.39453125, 207.1953125, 214.99609375, 222.796875, 230.59765625, 238.3984375, 246.19921875, 254.0]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 6.0, 9.0, 10.0, 15.0, 11.0, 24.0, 31.0, 34.0, 56.0, 60.0, 94.0, 99.0, 100.0, 103.0, 98.0, 57.0, 50.0, 36.0, 32.0, 13.0, 12.0, 10.0, 4.0, 4.0, 7.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0230712890625, -0.02243518829345703, -0.021799087524414062, -0.021162986755371094, -0.020526885986328125, -0.019890785217285156, -0.019254684448242188, -0.01861858367919922, -0.01798248291015625, -0.01734638214111328, -0.016710281372070312, -0.016074180603027344, -0.015438079833984375, -0.014801979064941406, -0.014165878295898438, -0.013529777526855469, -0.0128936767578125, -0.012257575988769531, -0.011621475219726562, -0.010985374450683594, -0.010349273681640625, -0.009713172912597656, -0.009077072143554688, -0.008440971374511719, -0.00780487060546875, -0.007168769836425781, -0.0065326690673828125, -0.005896568298339844, -0.005260467529296875, -0.004624366760253906, -0.0039882659912109375, -0.0033521652221679688, -0.002716064453125, -0.0020799636840820312, -0.0014438629150390625, -0.0008077621459960938, -0.000171661376953125, 0.00046443939208984375, 0.0011005401611328125, 0.0017366409301757812, 0.00237274169921875, 0.0030088424682617188, 0.0036449432373046875, 0.004281044006347656, 0.004917144775390625, 0.005553245544433594, 0.0061893463134765625, 0.006825447082519531, 0.0074615478515625, 0.008097648620605469, 0.008733749389648438, 0.009369850158691406, 0.010005950927734375, 0.010642051696777344, 0.011278152465820312, 0.011914253234863281, 0.01255035400390625, 0.013186454772949219, 0.013822555541992188, 0.014458656311035156, 0.015094757080078125, 0.015730857849121094, 0.016366958618164062, 0.01700305938720703, 0.01763916015625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 9.0, 11.0, 18.0, 16.0, 35.0, 36.0, 69.0, 95.0, 127.0, 184.0, 259.0, 387.0, 544.0, 768.0, 1225.0, 1772.0, 2759.0, 4394.0, 7298.0, 13809.0, 30660.0, 79612.0, 211850.0, 344514.0, 206924.0, 78026.0, 29707.0, 13659.0, 7199.0, 4261.0, 2768.0, 1750.0, 1282.0, 758.0, 531.0, 385.0, 266.0, 174.0, 135.0, 84.0, 59.0, 42.0, 39.0, 19.0, 15.0, 6.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-147.75, -143.337890625, -138.92578125, -134.513671875, -130.1015625, -125.689453125, -121.27734375, -116.865234375, -112.453125, -108.041015625, -103.62890625, -99.216796875, -94.8046875, -90.392578125, -85.98046875, -81.568359375, -77.15625, -72.744140625, -68.33203125, -63.919921875, -59.5078125, -55.095703125, -50.68359375, -46.271484375, -41.859375, -37.447265625, -33.03515625, -28.623046875, -24.2109375, -19.798828125, -15.38671875, -10.974609375, -6.5625, -2.150390625, 2.26171875, 6.673828125, 11.0859375, 15.498046875, 19.91015625, 24.322265625, 28.734375, 33.146484375, 37.55859375, 41.970703125, 46.3828125, 50.794921875, 55.20703125, 59.619140625, 64.03125, 68.443359375, 72.85546875, 77.267578125, 81.6796875, 86.091796875, 90.50390625, 94.916015625, 99.328125, 103.740234375, 108.15234375, 112.564453125, 116.9765625, 121.388671875, 125.80078125, 130.212890625, 134.625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 3.0, 4.0, 3.0, 6.0, 8.0, 10.0, 6.0, 13.0, 28.0, 38.0, 66.0, 84.0, 116.0, 128.0, 126.0, 106.0, 67.0, 66.0, 35.0, 28.0, 18.0, 9.0, 11.0, 5.0, 3.0, 1.0, 2.0, 8.0, 1.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.53125, -60.6923828125, -58.853515625, -57.0146484375, -55.17578125, -53.3369140625, -51.498046875, -49.6591796875, -47.8203125, -45.9814453125, -44.142578125, -42.3037109375, -40.46484375, -38.6259765625, -36.787109375, -34.9482421875, -33.109375, -31.2705078125, -29.431640625, -27.5927734375, -25.75390625, -23.9150390625, -22.076171875, -20.2373046875, -18.3984375, -16.5595703125, -14.720703125, -12.8818359375, -11.04296875, -9.2041015625, -7.365234375, -5.5263671875, -3.6875, -1.8486328125, -0.009765625, 1.8291015625, 3.66796875, 5.5068359375, 7.345703125, 9.1845703125, 11.0234375, 12.8623046875, 14.701171875, 16.5400390625, 18.37890625, 20.2177734375, 22.056640625, 23.8955078125, 25.734375, 27.5732421875, 29.412109375, 31.2509765625, 33.08984375, 34.9287109375, 36.767578125, 38.6064453125, 40.4453125, 42.2841796875, 44.123046875, 45.9619140625, 47.80078125, 49.6396484375, 51.478515625, 53.3173828125, 55.15625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 3.0, 9.0, 8.0, 11.0, 13.0, 13.0, 15.0, 16.0, 20.0, 20.0, 31.0, 33.0, 27.0, 36.0, 57.0, 37.0, 51.0, 49.0, 46.0, 40.0, 50.0, 45.0, 55.0, 33.0, 43.0, 32.0, 30.0, 21.0, 26.0, 21.0, 20.0, 12.0, 14.0, 11.0, 5.0, 7.0, 14.0, 1.0, 3.0, 9.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-72.33639526367188, -70.1641845703125, -67.99197387695312, -65.81976318359375, -63.647552490234375, -61.475341796875, -59.30312728881836, -57.130916595458984, -54.95870590209961, -52.786495208740234, -50.61428451538086, -48.442073822021484, -46.269859313964844, -44.09764862060547, -41.925437927246094, -39.75322723388672, -37.581016540527344, -35.40880584716797, -33.236595153808594, -31.064382553100586, -28.89217185974121, -26.719961166381836, -24.547748565673828, -22.375537872314453, -20.203327178955078, -18.031116485595703, -15.858904838562012, -13.68669319152832, -11.514482498168945, -9.34227180480957, -7.170060157775879, -4.9978485107421875, -2.8256454467773438, -0.6534342765808105, 1.5187768936157227, 3.690988063812256, 5.863199234008789, 8.035409927368164, 10.207621574401855, 12.379833221435547, 14.552043914794922, 16.724254608154297, 18.896465301513672, 21.06867790222168, 23.240888595581055, 25.41309928894043, 27.585311889648438, 29.757522583007812, 31.929733276367188, 34.10194396972656, 36.27415466308594, 38.44636535644531, 40.61857604980469, 42.79078674316406, 44.9630012512207, 47.13521194458008, 49.30742263793945, 51.47963333129883, 53.6518440246582, 55.82405471801758, 57.99626922607422, 60.168479919433594, 62.34069061279297, 64.51290130615234, 66.68511199951172]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 7.0, 4.0, 6.0, 12.0, 13.0, 12.0, 14.0, 25.0, 20.0, 18.0, 24.0, 27.0, 31.0, 32.0, 27.0, 33.0, 42.0, 32.0, 41.0, 45.0, 48.0, 43.0, 40.0, 37.0, 33.0, 36.0, 26.0, 32.0, 34.0, 28.0, 19.0, 28.0, 21.0, 12.0, 16.0, 17.0, 22.0, 9.0, 8.0, 6.0, 8.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-74.7188720703125, -72.49765014648438, -70.27642822265625, -68.05520629882812, -65.833984375, -63.612762451171875, -61.391536712646484, -59.17031478881836, -56.949092864990234, -54.72787094116211, -52.506649017333984, -50.28542709350586, -48.06420135498047, -45.842979431152344, -43.62175750732422, -41.400535583496094, -39.17931365966797, -36.958091735839844, -34.73686981201172, -32.515647888183594, -30.294424057006836, -28.07320213317871, -25.851978302001953, -23.630756378173828, -21.409534454345703, -19.188312530517578, -16.967090606689453, -14.745866775512695, -12.52464485168457, -10.303422927856445, -8.082200050354004, -5.8609771728515625, -3.6397552490234375, -1.4185328483581543, 0.8026895523071289, 3.023911952972412, 5.245134353637695, 7.46635627746582, 9.687579154968262, 11.908802032470703, 14.130023956298828, 16.351245880126953, 18.572467803955078, 20.793691635131836, 23.01491355895996, 25.236135482788086, 27.457359313964844, 29.67858123779297, 31.899803161621094, 34.12102508544922, 36.342247009277344, 38.56346893310547, 40.784690856933594, 43.00591278076172, 45.22713851928711, 47.448360443115234, 49.66958236694336, 51.890804290771484, 54.11202621459961, 56.333248138427734, 58.554473876953125, 60.77569580078125, 62.996917724609375, 65.2181396484375, 67.43936157226562]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 12.0, 24.0, 38.0, 56.0, 78.0, 118.0, 186.0, 297.0, 453.0, 709.0, 1081.0, 1822.0, 3001.0, 4544.0, 7477.0, 11655.0, 18677.0, 28747.0, 43543.0, 63891.0, 89948.0, 116111.0, 133377.0, 133466.0, 115317.0, 89295.0, 63516.0, 43298.0, 28446.0, 18325.0, 11753.0, 7213.0, 4430.0, 2819.0, 1817.0, 1094.0, 727.0, 438.0, 253.0, 161.0, 121.0, 80.0, 61.0, 24.0, 22.0, 14.0, 6.0, 9.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-61.3125, -59.267578125, -57.22265625, -55.177734375, -53.1328125, -51.087890625, -49.04296875, -46.998046875, -44.953125, -42.908203125, -40.86328125, -38.818359375, -36.7734375, -34.728515625, -32.68359375, -30.638671875, -28.59375, -26.548828125, -24.50390625, -22.458984375, -20.4140625, -18.369140625, -16.32421875, -14.279296875, -12.234375, -10.189453125, -8.14453125, -6.099609375, -4.0546875, -2.009765625, 0.03515625, 2.080078125, 4.125, 6.169921875, 8.21484375, 10.259765625, 12.3046875, 14.349609375, 16.39453125, 18.439453125, 20.484375, 22.529296875, 24.57421875, 26.619140625, 28.6640625, 30.708984375, 32.75390625, 34.798828125, 36.84375, 38.888671875, 40.93359375, 42.978515625, 45.0234375, 47.068359375, 49.11328125, 51.158203125, 53.203125, 55.248046875, 57.29296875, 59.337890625, 61.3828125, 63.427734375, 65.47265625, 67.517578125, 69.5625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 7.0, 8.0, 6.0, 11.0, 6.0, 17.0, 15.0, 14.0, 22.0, 20.0, 18.0, 27.0, 30.0, 31.0, 31.0, 41.0, 48.0, 41.0, 44.0, 39.0, 43.0, 50.0, 42.0, 50.0, 36.0, 33.0, 39.0, 30.0, 26.0, 31.0, 24.0, 12.0, 18.0, 19.0, 15.0, 14.0, 14.0, 9.0, 9.0, 5.0, 5.0, 3.0, 1.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.625, -70.4365234375, -68.248046875, -66.0595703125, -63.87109375, -61.6826171875, -59.494140625, -57.3056640625, -55.1171875, -52.9287109375, -50.740234375, -48.5517578125, -46.36328125, -44.1748046875, -41.986328125, -39.7978515625, -37.609375, -35.4208984375, -33.232421875, -31.0439453125, -28.85546875, -26.6669921875, -24.478515625, -22.2900390625, -20.1015625, -17.9130859375, -15.724609375, -13.5361328125, -11.34765625, -9.1591796875, -6.970703125, -4.7822265625, -2.59375, -0.4052734375, 1.783203125, 3.9716796875, 6.16015625, 8.3486328125, 10.537109375, 12.7255859375, 14.9140625, 17.1025390625, 19.291015625, 21.4794921875, 23.66796875, 25.8564453125, 28.044921875, 30.2333984375, 32.421875, 34.6103515625, 36.798828125, 38.9873046875, 41.17578125, 43.3642578125, 45.552734375, 47.7412109375, 49.9296875, 52.1181640625, 54.306640625, 56.4951171875, 58.68359375, 60.8720703125, 63.060546875, 65.2490234375, 67.4375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 5.0, 6.0, 7.0, 11.0, 15.0, 20.0, 35.0, 37.0, 46.0, 96.0, 130.0, 186.0, 331.0, 433.0, 593.0, 969.0, 1316.0, 1964.0, 2848.0, 4191.0, 6259.0, 9320.0, 14155.0, 21104.0, 31531.0, 46057.0, 66168.0, 92208.0, 118402.0, 134560.0, 129536.0, 107743.0, 80742.0, 57574.0, 39456.0, 26401.0, 17748.0, 11854.0, 7807.0, 5331.0, 3657.0, 2418.0, 1649.0, 1176.0, 791.0, 508.0, 373.0, 267.0, 177.0, 128.0, 75.0, 49.0, 39.0, 28.0, 12.0, 6.0, 11.0, 3.0, 2.0, 2.0, 3.0], "bins": [-79.125, -76.7119140625, -74.298828125, -71.8857421875, -69.47265625, -67.0595703125, -64.646484375, -62.2333984375, -59.8203125, -57.4072265625, -54.994140625, -52.5810546875, -50.16796875, -47.7548828125, -45.341796875, -42.9287109375, -40.515625, -38.1025390625, -35.689453125, -33.2763671875, -30.86328125, -28.4501953125, -26.037109375, -23.6240234375, -21.2109375, -18.7978515625, -16.384765625, -13.9716796875, -11.55859375, -9.1455078125, -6.732421875, -4.3193359375, -1.90625, 0.5068359375, 2.919921875, 5.3330078125, 7.74609375, 10.1591796875, 12.572265625, 14.9853515625, 17.3984375, 19.8115234375, 22.224609375, 24.6376953125, 27.05078125, 29.4638671875, 31.876953125, 34.2900390625, 36.703125, 39.1162109375, 41.529296875, 43.9423828125, 46.35546875, 48.7685546875, 51.181640625, 53.5947265625, 56.0078125, 58.4208984375, 60.833984375, 63.2470703125, 65.66015625, 68.0732421875, 70.486328125, 72.8994140625, 75.3125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 9.0, 11.0, 10.0, 12.0, 18.0, 15.0, 15.0, 22.0, 24.0, 28.0, 29.0, 39.0, 30.0, 36.0, 32.0, 35.0, 38.0, 39.0, 41.0, 28.0, 41.0, 40.0, 56.0, 32.0, 30.0, 31.0, 33.0, 29.0, 26.0, 21.0, 22.0, 17.0, 17.0, 18.0, 8.0, 9.0, 9.0, 10.0, 3.0, 2.0, 11.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-57.59375, -55.91259765625, -54.2314453125, -52.55029296875, -50.869140625, -49.18798828125, -47.5068359375, -45.82568359375, -44.14453125, -42.46337890625, -40.7822265625, -39.10107421875, -37.419921875, -35.73876953125, -34.0576171875, -32.37646484375, -30.6953125, -29.01416015625, -27.3330078125, -25.65185546875, -23.970703125, -22.28955078125, -20.6083984375, -18.92724609375, -17.24609375, -15.56494140625, -13.8837890625, -12.20263671875, -10.521484375, -8.84033203125, -7.1591796875, -5.47802734375, -3.796875, -2.11572265625, -0.4345703125, 1.24658203125, 2.927734375, 4.60888671875, 6.2900390625, 7.97119140625, 9.65234375, 11.33349609375, 13.0146484375, 14.69580078125, 16.376953125, 18.05810546875, 19.7392578125, 21.42041015625, 23.1015625, 24.78271484375, 26.4638671875, 28.14501953125, 29.826171875, 31.50732421875, 33.1884765625, 34.86962890625, 36.55078125, 38.23193359375, 39.9130859375, 41.59423828125, 43.275390625, 44.95654296875, 46.6376953125, 48.31884765625, 50.0]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [4.0, 5.0, 4.0, 9.0, 7.0, 15.0, 28.0, 32.0, 49.0, 52.0, 88.0, 148.0, 197.0, 287.0, 406.0, 529.0, 843.0, 1275.0, 1832.0, 2737.0, 3984.0, 6319.0, 9915.0, 16671.0, 28621.0, 51787.0, 97416.0, 172311.0, 229689.0, 183586.0, 105237.0, 55843.0, 30232.0, 17689.0, 10731.0, 6636.0, 4281.0, 2955.0, 1965.0, 1332.0, 851.0, 606.0, 413.0, 271.0, 200.0, 145.0, 100.0, 69.0, 52.0, 33.0, 26.0, 26.0, 9.0, 9.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-71.9375, -69.4189453125, -66.900390625, -64.3818359375, -61.86328125, -59.3447265625, -56.826171875, -54.3076171875, -51.7890625, -49.2705078125, -46.751953125, -44.2333984375, -41.71484375, -39.1962890625, -36.677734375, -34.1591796875, -31.640625, -29.1220703125, -26.603515625, -24.0849609375, -21.56640625, -19.0478515625, -16.529296875, -14.0107421875, -11.4921875, -8.9736328125, -6.455078125, -3.9365234375, -1.41796875, 1.1005859375, 3.619140625, 6.1376953125, 8.65625, 11.1748046875, 13.693359375, 16.2119140625, 18.73046875, 21.2490234375, 23.767578125, 26.2861328125, 28.8046875, 31.3232421875, 33.841796875, 36.3603515625, 38.87890625, 41.3974609375, 43.916015625, 46.4345703125, 48.953125, 51.4716796875, 53.990234375, 56.5087890625, 59.02734375, 61.5458984375, 64.064453125, 66.5830078125, 69.1015625, 71.6201171875, 74.138671875, 76.6572265625, 79.17578125, 81.6943359375, 84.212890625, 86.7314453125, 89.25]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 6.0, 8.0, 10.0, 5.0, 14.0, 22.0, 32.0, 48.0, 59.0, 87.0, 96.0, 126.0, 113.0, 93.0, 77.0, 58.0, 38.0, 34.0, 17.0, 11.0, 7.0, 12.0, 10.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01236724853515625, -0.011964917182922363, -0.011562585830688477, -0.01116025447845459, -0.010757923126220703, -0.010355591773986816, -0.00995326042175293, -0.009550929069519043, -0.009148597717285156, -0.00874626636505127, -0.008343935012817383, -0.007941603660583496, -0.007539272308349609, -0.007136940956115723, -0.006734609603881836, -0.006332278251647949, -0.0059299468994140625, -0.005527615547180176, -0.005125284194946289, -0.004722952842712402, -0.004320621490478516, -0.003918290138244629, -0.003515958786010742, -0.0031136274337768555, -0.0027112960815429688, -0.002308964729309082, -0.0019066333770751953, -0.0015043020248413086, -0.0011019706726074219, -0.0006996393203735352, -0.00029730796813964844, 0.00010502338409423828, 0.000507354736328125, 0.0009096860885620117, 0.0013120174407958984, 0.0017143487930297852, 0.002116680145263672, 0.0025190114974975586, 0.0029213428497314453, 0.003323674201965332, 0.0037260055541992188, 0.0041283369064331055, 0.004530668258666992, 0.004932999610900879, 0.005335330963134766, 0.005737662315368652, 0.006139993667602539, 0.006542325019836426, 0.0069446563720703125, 0.007346987724304199, 0.007749319076538086, 0.008151650428771973, 0.00855398178100586, 0.008956313133239746, 0.009358644485473633, 0.00976097583770752, 0.010163307189941406, 0.010565638542175293, 0.01096796989440918, 0.011370301246643066, 0.011772632598876953, 0.01217496395111084, 0.012577295303344727, 0.012979626655578613, 0.0133819580078125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 7.0, 15.0, 8.0, 13.0, 19.0, 29.0, 40.0, 64.0, 83.0, 109.0, 187.0, 242.0, 371.0, 544.0, 843.0, 1214.0, 1889.0, 2840.0, 4486.0, 7143.0, 11606.0, 18710.0, 31895.0, 54584.0, 96629.0, 158445.0, 207203.0, 177132.0, 112300.0, 64831.0, 37063.0, 21812.0, 13054.0, 8234.0, 5100.0, 3349.0, 2167.0, 1425.0, 954.0, 659.0, 390.0, 260.0, 174.0, 137.0, 95.0, 73.0, 36.0, 31.0, 29.0, 13.0, 12.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-69.6875, -67.552734375, -65.41796875, -63.283203125, -61.1484375, -59.013671875, -56.87890625, -54.744140625, -52.609375, -50.474609375, -48.33984375, -46.205078125, -44.0703125, -41.935546875, -39.80078125, -37.666015625, -35.53125, -33.396484375, -31.26171875, -29.126953125, -26.9921875, -24.857421875, -22.72265625, -20.587890625, -18.453125, -16.318359375, -14.18359375, -12.048828125, -9.9140625, -7.779296875, -5.64453125, -3.509765625, -1.375, 0.759765625, 2.89453125, 5.029296875, 7.1640625, 9.298828125, 11.43359375, 13.568359375, 15.703125, 17.837890625, 19.97265625, 22.107421875, 24.2421875, 26.376953125, 28.51171875, 30.646484375, 32.78125, 34.916015625, 37.05078125, 39.185546875, 41.3203125, 43.455078125, 45.58984375, 47.724609375, 49.859375, 51.994140625, 54.12890625, 56.263671875, 58.3984375, 60.533203125, 62.66796875, 64.802734375, 66.9375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 1.0, 1.0, 6.0, 4.0, 16.0, 12.0, 10.0, 19.0, 16.0, 22.0, 24.0, 24.0, 38.0, 43.0, 49.0, 54.0, 63.0, 68.0, 64.0, 58.0, 59.0, 52.0, 45.0, 43.0, 48.0, 25.0, 26.0, 19.0, 25.0, 11.0, 11.0, 9.0, 9.0, 8.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.75, -22.947998046875, -22.14599609375, -21.343994140625, -20.5419921875, -19.739990234375, -18.93798828125, -18.135986328125, -17.333984375, -16.531982421875, -15.72998046875, -14.927978515625, -14.1259765625, -13.323974609375, -12.52197265625, -11.719970703125, -10.91796875, -10.115966796875, -9.31396484375, -8.511962890625, -7.7099609375, -6.907958984375, -6.10595703125, -5.303955078125, -4.501953125, -3.699951171875, -2.89794921875, -2.095947265625, -1.2939453125, -0.491943359375, 0.31005859375, 1.112060546875, 1.9140625, 2.716064453125, 3.51806640625, 4.320068359375, 5.1220703125, 5.924072265625, 6.72607421875, 7.528076171875, 8.330078125, 9.132080078125, 9.93408203125, 10.736083984375, 11.5380859375, 12.340087890625, 13.14208984375, 13.944091796875, 14.74609375, 15.548095703125, 16.35009765625, 17.152099609375, 17.9541015625, 18.756103515625, 19.55810546875, 20.360107421875, 21.162109375, 21.964111328125, 22.76611328125, 23.568115234375, 24.3701171875, 25.172119140625, 25.97412109375, 26.776123046875, 27.578125]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 7.0, 3.0, 7.0, 9.0, 11.0, 14.0, 14.0, 24.0, 23.0, 28.0, 24.0, 29.0, 28.0, 39.0, 37.0, 46.0, 41.0, 44.0, 45.0, 53.0, 50.0, 42.0, 40.0, 34.0, 36.0, 28.0, 33.0, 26.0, 30.0, 23.0, 28.0, 23.0, 15.0, 17.0, 7.0, 6.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-70.84236907958984, -68.74482727050781, -66.64729309082031, -64.54975128173828, -62.452213287353516, -60.35467529296875, -58.25713348388672, -56.15959548950195, -54.06205749511719, -51.96451950073242, -49.86697769165039, -47.769439697265625, -45.67190170288086, -43.574363708496094, -41.47682189941406, -39.3792839050293, -37.281742095947266, -35.1842041015625, -33.08666229248047, -30.989124298095703, -28.891586303710938, -26.79404640197754, -24.69650650024414, -22.598968505859375, -20.501428604125977, -18.403888702392578, -16.306350708007812, -14.208810806274414, -12.111271858215332, -10.01373291015625, -7.916193008422852, -5.8186540603637695, -3.7211151123046875, -1.6235759258270264, 0.47396326065063477, 2.571502685546875, 4.669041633605957, 6.766580581665039, 8.864120483398438, 10.96165943145752, 13.059198379516602, 15.156737327575684, 17.254276275634766, 19.351816177368164, 21.449356079101562, 23.546894073486328, 25.644433975219727, 27.741973876953125, 29.83951187133789, 31.93705177307129, 34.03459167480469, 36.13212966918945, 38.22966766357422, 40.32720947265625, 42.424747467041016, 44.52228546142578, 46.61982727050781, 48.71736526489258, 50.81490707397461, 52.912445068359375, 55.00998306274414, 57.107521057128906, 59.20506286621094, 61.3026008605957, 63.40013885498047]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 5.0, 6.0, 0.0, 3.0, 4.0, 8.0, 10.0, 14.0, 11.0, 15.0, 17.0, 18.0, 25.0, 31.0, 36.0, 21.0, 32.0, 36.0, 35.0, 38.0, 48.0, 35.0, 35.0, 48.0, 50.0, 40.0, 31.0, 41.0, 31.0, 35.0, 32.0, 24.0, 21.0, 37.0, 16.0, 22.0, 14.0, 15.0, 8.0, 13.0, 12.0, 6.0, 11.0, 9.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-82.25519561767578, -79.89909362792969, -77.5429916381836, -75.1868896484375, -72.83078002929688, -70.47467803955078, -68.11857604980469, -65.7624740600586, -63.4063720703125, -61.050270080566406, -58.69416427612305, -56.33806228637695, -53.98196029663086, -51.6258544921875, -49.269752502441406, -46.91365051269531, -44.55754470825195, -42.20144271850586, -39.8453369140625, -37.489234924316406, -35.13313293457031, -32.77703094482422, -30.42092514038086, -28.064823150634766, -25.70871925354004, -23.352615356445312, -20.99651336669922, -18.640409469604492, -16.284305572509766, -13.928203582763672, -11.572099685668945, -9.215997695922852, -6.859893798828125, -4.503790855407715, -2.1476874351501465, 0.20841598510742188, 2.564518928527832, 4.920621871948242, 7.276725769042969, 9.632827758789062, 11.988931655883789, 14.3450345993042, 16.70113754272461, 19.057241439819336, 21.413345336914062, 23.769447326660156, 26.125551223754883, 28.481653213500977, 30.837757110595703, 33.1938591003418, 35.549964904785156, 37.90606689453125, 40.262168884277344, 42.61827087402344, 44.9743766784668, 47.33047866821289, 49.68658447265625, 52.042686462402344, 54.3987922668457, 56.7548942565918, 59.11099624633789, 61.46710205078125, 63.823204040527344, 66.17930603027344, 68.53540802001953]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 8.0, 8.0, 9.0, 15.0, 28.0, 34.0, 55.0, 94.0, 144.0, 299.0, 537.0, 910.0, 1701.0, 3022.0, 5942.0, 11319.0, 22160.0, 44759.0, 92201.0, 196775.0, 425776.0, 817788.0, 1052723.0, 774938.0, 392618.0, 181550.0, 85167.0, 41000.0, 20661.0, 10382.0, 5406.0, 2776.0, 1512.0, 829.0, 459.0, 295.0, 143.0, 94.0, 50.0, 40.0, 26.0, 13.0, 14.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-86.6875, -84.1708984375, -81.654296875, -79.1376953125, -76.62109375, -74.1044921875, -71.587890625, -69.0712890625, -66.5546875, -64.0380859375, -61.521484375, -59.0048828125, -56.48828125, -53.9716796875, -51.455078125, -48.9384765625, -46.421875, -43.9052734375, -41.388671875, -38.8720703125, -36.35546875, -33.8388671875, -31.322265625, -28.8056640625, -26.2890625, -23.7724609375, -21.255859375, -18.7392578125, -16.22265625, -13.7060546875, -11.189453125, -8.6728515625, -6.15625, -3.6396484375, -1.123046875, 1.3935546875, 3.91015625, 6.4267578125, 8.943359375, 11.4599609375, 13.9765625, 16.4931640625, 19.009765625, 21.5263671875, 24.04296875, 26.5595703125, 29.076171875, 31.5927734375, 34.109375, 36.6259765625, 39.142578125, 41.6591796875, 44.17578125, 46.6923828125, 49.208984375, 51.7255859375, 54.2421875, 56.7587890625, 59.275390625, 61.7919921875, 64.30859375, 66.8251953125, 69.341796875, 71.8583984375, 74.375]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 10.0, 9.0, 16.0, 18.0, 21.0, 21.0, 22.0, 20.0, 28.0, 30.0, 35.0, 46.0, 47.0, 39.0, 32.0, 27.0, 47.0, 49.0, 47.0, 30.0, 39.0, 48.0, 35.0, 24.0, 28.0, 35.0, 26.0, 23.0, 25.0, 18.0, 21.0, 10.0, 11.0, 13.0, 10.0, 9.0, 8.0, 3.0, 7.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-65.0625, -63.27490234375, -61.4873046875, -59.69970703125, -57.912109375, -56.12451171875, -54.3369140625, -52.54931640625, -50.76171875, -48.97412109375, -47.1865234375, -45.39892578125, -43.611328125, -41.82373046875, -40.0361328125, -38.24853515625, -36.4609375, -34.67333984375, -32.8857421875, -31.09814453125, -29.310546875, -27.52294921875, -25.7353515625, -23.94775390625, -22.16015625, -20.37255859375, -18.5849609375, -16.79736328125, -15.009765625, -13.22216796875, -11.4345703125, -9.64697265625, -7.859375, -6.07177734375, -4.2841796875, -2.49658203125, -0.708984375, 1.07861328125, 2.8662109375, 4.65380859375, 6.44140625, 8.22900390625, 10.0166015625, 11.80419921875, 13.591796875, 15.37939453125, 17.1669921875, 18.95458984375, 20.7421875, 22.52978515625, 24.3173828125, 26.10498046875, 27.892578125, 29.68017578125, 31.4677734375, 33.25537109375, 35.04296875, 36.83056640625, 38.6181640625, 40.40576171875, 42.193359375, 43.98095703125, 45.7685546875, 47.55615234375, 49.34375]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 11.0, 14.0, 22.0, 45.0, 57.0, 128.0, 212.0, 392.0, 697.0, 1231.0, 2222.0, 4284.0, 7743.0, 14628.0, 27537.0, 52178.0, 98188.0, 182586.0, 330433.0, 552318.0, 778712.0, 792791.0, 579803.0, 350044.0, 195364.0, 104400.0, 55414.0, 29086.0, 15386.0, 8341.0, 4481.0, 2457.0, 1365.0, 729.0, 424.0, 230.0, 141.0, 85.0, 40.0, 22.0, 11.0, 11.0, 9.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-75.5625, -73.40673828125, -71.2509765625, -69.09521484375, -66.939453125, -64.78369140625, -62.6279296875, -60.47216796875, -58.31640625, -56.16064453125, -54.0048828125, -51.84912109375, -49.693359375, -47.53759765625, -45.3818359375, -43.22607421875, -41.0703125, -38.91455078125, -36.7587890625, -34.60302734375, -32.447265625, -30.29150390625, -28.1357421875, -25.97998046875, -23.82421875, -21.66845703125, -19.5126953125, -17.35693359375, -15.201171875, -13.04541015625, -10.8896484375, -8.73388671875, -6.578125, -4.42236328125, -2.2666015625, -0.11083984375, 2.044921875, 4.20068359375, 6.3564453125, 8.51220703125, 10.66796875, 12.82373046875, 14.9794921875, 17.13525390625, 19.291015625, 21.44677734375, 23.6025390625, 25.75830078125, 27.9140625, 30.06982421875, 32.2255859375, 34.38134765625, 36.537109375, 38.69287109375, 40.8486328125, 43.00439453125, 45.16015625, 47.31591796875, 49.4716796875, 51.62744140625, 53.783203125, 55.93896484375, 58.0947265625, 60.25048828125, 62.40625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 8.0, 13.0, 9.0, 31.0, 28.0, 30.0, 38.0, 50.0, 52.0, 68.0, 92.0, 111.0, 142.0, 154.0, 169.0, 194.0, 199.0, 239.0, 284.0, 257.0, 274.0, 237.0, 208.0, 193.0, 176.0, 174.0, 127.0, 123.0, 70.0, 70.0, 52.0, 48.0, 34.0, 29.0, 20.0, 13.0, 13.0, 11.0, 10.0, 5.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.140625, -27.32080078125, -26.5009765625, -25.68115234375, -24.861328125, -24.04150390625, -23.2216796875, -22.40185546875, -21.58203125, -20.76220703125, -19.9423828125, -19.12255859375, -18.302734375, -17.48291015625, -16.6630859375, -15.84326171875, -15.0234375, -14.20361328125, -13.3837890625, -12.56396484375, -11.744140625, -10.92431640625, -10.1044921875, -9.28466796875, -8.46484375, -7.64501953125, -6.8251953125, -6.00537109375, -5.185546875, -4.36572265625, -3.5458984375, -2.72607421875, -1.90625, -1.08642578125, -0.2666015625, 0.55322265625, 1.373046875, 2.19287109375, 3.0126953125, 3.83251953125, 4.65234375, 5.47216796875, 6.2919921875, 7.11181640625, 7.931640625, 8.75146484375, 9.5712890625, 10.39111328125, 11.2109375, 12.03076171875, 12.8505859375, 13.67041015625, 14.490234375, 15.31005859375, 16.1298828125, 16.94970703125, 17.76953125, 18.58935546875, 19.4091796875, 20.22900390625, 21.048828125, 21.86865234375, 22.6884765625, 23.50830078125, 24.328125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 9.0, 10.0, 11.0, 12.0, 18.0, 19.0, 26.0, 36.0, 31.0, 28.0, 37.0, 43.0, 35.0, 45.0, 48.0, 57.0, 49.0, 60.0, 43.0, 49.0, 45.0, 45.0, 36.0, 40.0, 32.0, 19.0, 28.0, 17.0, 12.0, 10.0, 13.0, 3.0, 13.0, 3.0, 2.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-61.50790023803711, -59.4245719909668, -57.341243743896484, -55.257911682128906, -53.174583435058594, -51.09125518798828, -49.00792694091797, -46.924598693847656, -44.841270446777344, -42.75794219970703, -40.67461395263672, -38.591285705566406, -36.50795364379883, -34.424625396728516, -32.3412971496582, -30.25796890258789, -28.174636840820312, -26.09130859375, -24.007978439331055, -21.924650192260742, -19.841320037841797, -17.757991790771484, -15.674663543701172, -13.591334342956543, -11.508005142211914, -9.424675941467285, -7.3413472175598145, -5.258018493652344, -3.174689292907715, -1.091360092163086, 0.9919681549072266, 3.0752973556518555, 5.158622741699219, 7.241951942443848, 9.325281143188477, 11.408609390258789, 13.491938591003418, 15.575267791748047, 17.65859603881836, 19.741924285888672, 21.825254440307617, 23.90858268737793, 25.991912841796875, 28.075241088867188, 30.1585693359375, 32.24189758300781, 34.325225830078125, 36.4085578918457, 38.491886138916016, 40.57521438598633, 42.65854263305664, 44.74187469482422, 46.82520294189453, 48.908531188964844, 50.991859436035156, 53.07518768310547, 55.15851593017578, 57.241844177246094, 59.325172424316406, 61.40850067138672, 63.4918327331543, 65.57516479492188, 67.65849304199219, 69.7418212890625, 71.82514953613281]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 9.0, 5.0, 7.0, 5.0, 7.0, 16.0, 11.0, 8.0, 15.0, 26.0, 29.0, 28.0, 24.0, 38.0, 38.0, 36.0, 34.0, 41.0, 38.0, 38.0, 35.0, 36.0, 41.0, 40.0, 29.0, 33.0, 39.0, 31.0, 37.0, 23.0, 38.0, 22.0, 13.0, 19.0, 19.0, 14.0, 6.0, 14.0, 12.0, 9.0, 6.0, 3.0, 9.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-71.58344268798828, -69.53543853759766, -67.48743438720703, -65.43943786621094, -63.39143371582031, -61.34342956542969, -59.29542541503906, -57.24742126464844, -55.19942092895508, -53.15141677856445, -51.103416442871094, -49.05541229248047, -47.007408142089844, -44.959407806396484, -42.91140365600586, -40.8634033203125, -38.815399169921875, -36.76739501953125, -34.71939468383789, -32.671390533447266, -30.623388290405273, -28.57538604736328, -26.527381896972656, -24.479379653930664, -22.431377410888672, -20.38337516784668, -18.335372924804688, -16.287368774414062, -14.23936653137207, -12.191364288330078, -10.14336109161377, -8.095357894897461, -6.047351837158203, -3.9993491172790527, -1.9513463973999023, 0.09665632247924805, 2.1446590423583984, 4.192661285400391, 6.240664482116699, 8.288667678833008, 10.336669921875, 12.384672164916992, 14.4326753616333, 16.48067855834961, 18.5286808013916, 20.576683044433594, 22.62468719482422, 24.67268943786621, 26.720691680908203, 28.768693923950195, 30.816696166992188, 32.86470031738281, 34.91270446777344, 36.9607048034668, 39.00870895385742, 41.05670928955078, 43.104713439941406, 45.15271759033203, 47.20071792602539, 49.248722076416016, 51.296722412109375, 53.3447265625, 55.392730712890625, 57.44073486328125, 59.48873519897461]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 8.0, 6.0, 14.0, 10.0, 18.0, 25.0, 35.0, 52.0, 75.0, 109.0, 149.0, 202.0, 326.0, 461.0, 686.0, 1141.0, 1852.0, 2952.0, 4841.0, 8641.0, 14481.0, 25283.0, 45857.0, 81637.0, 143225.0, 212320.0, 203014.0, 130139.0, 73959.0, 41175.0, 23126.0, 13162.0, 7566.0, 4505.0, 2699.0, 1664.0, 990.0, 693.0, 486.0, 307.0, 212.0, 143.0, 105.0, 56.0, 41.0, 43.0, 11.0, 16.0, 8.0, 9.0, 7.0, 7.0, 2.0, 3.0, 3.0, 1.0, 3.0], "bins": [-212.375, -205.921875, -199.46875, -193.015625, -186.5625, -180.109375, -173.65625, -167.203125, -160.75, -154.296875, -147.84375, -141.390625, -134.9375, -128.484375, -122.03125, -115.578125, -109.125, -102.671875, -96.21875, -89.765625, -83.3125, -76.859375, -70.40625, -63.953125, -57.5, -51.046875, -44.59375, -38.140625, -31.6875, -25.234375, -18.78125, -12.328125, -5.875, 0.578125, 7.03125, 13.484375, 19.9375, 26.390625, 32.84375, 39.296875, 45.75, 52.203125, 58.65625, 65.109375, 71.5625, 78.015625, 84.46875, 90.921875, 97.375, 103.828125, 110.28125, 116.734375, 123.1875, 129.640625, 136.09375, 142.546875, 149.0, 155.453125, 161.90625, 168.359375, 174.8125, 181.265625, 187.71875, 194.171875, 200.625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 5.0, 0.0, 4.0, 4.0, 4.0, 4.0, 10.0, 8.0, 8.0, 12.0, 16.0, 14.0, 14.0, 26.0, 23.0, 23.0, 27.0, 34.0, 44.0, 37.0, 35.0, 41.0, 37.0, 27.0, 46.0, 44.0, 33.0, 39.0, 42.0, 37.0, 29.0, 32.0, 21.0, 35.0, 30.0, 22.0, 21.0, 13.0, 22.0, 17.0, 10.0, 12.0, 6.0, 6.0, 8.0, 6.0, 8.0, 6.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0], "bins": [-59.28125, -57.58837890625, -55.8955078125, -54.20263671875, -52.509765625, -50.81689453125, -49.1240234375, -47.43115234375, -45.73828125, -44.04541015625, -42.3525390625, -40.65966796875, -38.966796875, -37.27392578125, -35.5810546875, -33.88818359375, -32.1953125, -30.50244140625, -28.8095703125, -27.11669921875, -25.423828125, -23.73095703125, -22.0380859375, -20.34521484375, -18.65234375, -16.95947265625, -15.2666015625, -13.57373046875, -11.880859375, -10.18798828125, -8.4951171875, -6.80224609375, -5.109375, -3.41650390625, -1.7236328125, -0.03076171875, 1.662109375, 3.35498046875, 5.0478515625, 6.74072265625, 8.43359375, 10.12646484375, 11.8193359375, 13.51220703125, 15.205078125, 16.89794921875, 18.5908203125, 20.28369140625, 21.9765625, 23.66943359375, 25.3623046875, 27.05517578125, 28.748046875, 30.44091796875, 32.1337890625, 33.82666015625, 35.51953125, 37.21240234375, 38.9052734375, 40.59814453125, 42.291015625, 43.98388671875, 45.6767578125, 47.36962890625, 49.0625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 0.0, 3.0, 6.0, 1.0, 11.0, 12.0, 18.0, 22.0, 38.0, 53.0, 91.0, 123.0, 159.0, 266.0, 379.0, 608.0, 980.0, 1598.0, 2556.0, 4200.0, 7067.0, 12334.0, 22326.0, 41958.0, 82661.0, 170457.0, 279383.0, 206331.0, 101843.0, 50639.0, 26649.0, 14676.0, 8306.0, 4893.0, 2781.0, 1814.0, 1109.0, 764.0, 479.0, 295.0, 213.0, 138.0, 100.0, 70.0, 38.0, 36.0, 27.0, 11.0, 15.0, 12.0, 2.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-225.125, -218.43359375, -211.7421875, -205.05078125, -198.359375, -191.66796875, -184.9765625, -178.28515625, -171.59375, -164.90234375, -158.2109375, -151.51953125, -144.828125, -138.13671875, -131.4453125, -124.75390625, -118.0625, -111.37109375, -104.6796875, -97.98828125, -91.296875, -84.60546875, -77.9140625, -71.22265625, -64.53125, -57.83984375, -51.1484375, -44.45703125, -37.765625, -31.07421875, -24.3828125, -17.69140625, -11.0, -4.30859375, 2.3828125, 9.07421875, 15.765625, 22.45703125, 29.1484375, 35.83984375, 42.53125, 49.22265625, 55.9140625, 62.60546875, 69.296875, 75.98828125, 82.6796875, 89.37109375, 96.0625, 102.75390625, 109.4453125, 116.13671875, 122.828125, 129.51953125, 136.2109375, 142.90234375, 149.59375, 156.28515625, 162.9765625, 169.66796875, 176.359375, 183.05078125, 189.7421875, 196.43359375, 203.125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 10.0, 9.0, 12.0, 13.0, 12.0, 21.0, 17.0, 32.0, 24.0, 27.0, 41.0, 38.0, 47.0, 39.0, 39.0, 48.0, 43.0, 46.0, 52.0, 46.0, 46.0, 35.0, 51.0, 44.0, 32.0, 27.0, 20.0, 20.0, 22.0, 17.0, 10.0, 11.0, 8.0, 8.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.75, -61.7626953125, -59.775390625, -57.7880859375, -55.80078125, -53.8134765625, -51.826171875, -49.8388671875, -47.8515625, -45.8642578125, -43.876953125, -41.8896484375, -39.90234375, -37.9150390625, -35.927734375, -33.9404296875, -31.953125, -29.9658203125, -27.978515625, -25.9912109375, -24.00390625, -22.0166015625, -20.029296875, -18.0419921875, -16.0546875, -14.0673828125, -12.080078125, -10.0927734375, -8.10546875, -6.1181640625, -4.130859375, -2.1435546875, -0.15625, 1.8310546875, 3.818359375, 5.8056640625, 7.79296875, 9.7802734375, 11.767578125, 13.7548828125, 15.7421875, 17.7294921875, 19.716796875, 21.7041015625, 23.69140625, 25.6787109375, 27.666015625, 29.6533203125, 31.640625, 33.6279296875, 35.615234375, 37.6025390625, 39.58984375, 41.5771484375, 43.564453125, 45.5517578125, 47.5390625, 49.5263671875, 51.513671875, 53.5009765625, 55.48828125, 57.4755859375, 59.462890625, 61.4501953125, 63.4375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 7.0, 8.0, 9.0, 12.0, 16.0, 27.0, 35.0, 44.0, 66.0, 85.0, 121.0, 173.0, 290.0, 415.0, 585.0, 963.0, 1503.0, 2504.0, 4149.0, 7397.0, 14005.0, 27936.0, 60832.0, 150946.0, 348750.0, 247563.0, 95088.0, 40846.0, 19754.0, 10286.0, 5613.0, 3126.0, 1888.0, 1164.0, 739.0, 501.0, 331.0, 236.0, 136.0, 124.0, 79.0, 57.0, 41.0, 29.0, 29.0, 14.0, 12.0, 12.0, 4.0, 6.0, 2.0, 2.0, 2.0, 3.0], "bins": [-150.25, -145.9267578125, -141.603515625, -137.2802734375, -132.95703125, -128.6337890625, -124.310546875, -119.9873046875, -115.6640625, -111.3408203125, -107.017578125, -102.6943359375, -98.37109375, -94.0478515625, -89.724609375, -85.4013671875, -81.078125, -76.7548828125, -72.431640625, -68.1083984375, -63.78515625, -59.4619140625, -55.138671875, -50.8154296875, -46.4921875, -42.1689453125, -37.845703125, -33.5224609375, -29.19921875, -24.8759765625, -20.552734375, -16.2294921875, -11.90625, -7.5830078125, -3.259765625, 1.0634765625, 5.38671875, 9.7099609375, 14.033203125, 18.3564453125, 22.6796875, 27.0029296875, 31.326171875, 35.6494140625, 39.97265625, 44.2958984375, 48.619140625, 52.9423828125, 57.265625, 61.5888671875, 65.912109375, 70.2353515625, 74.55859375, 78.8818359375, 83.205078125, 87.5283203125, 91.8515625, 96.1748046875, 100.498046875, 104.8212890625, 109.14453125, 113.4677734375, 117.791015625, 122.1142578125, 126.4375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 2.0, 7.0, 7.0, 8.0, 16.0, 22.0, 16.0, 31.0, 51.0, 59.0, 87.0, 127.0, 120.0, 121.0, 83.0, 64.0, 43.0, 28.0, 12.0, 22.0, 15.0, 6.0, 8.0, 5.0, 3.0, 2.0, 5.0, 5.0, 1.0, 0.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01058197021484375, -0.010209918022155762, -0.009837865829467773, -0.009465813636779785, -0.009093761444091797, -0.008721709251403809, -0.00834965705871582, -0.007977604866027832, -0.007605552673339844, -0.0072335004806518555, -0.006861448287963867, -0.006489396095275879, -0.006117343902587891, -0.005745291709899902, -0.005373239517211914, -0.005001187324523926, -0.0046291351318359375, -0.004257082939147949, -0.003885030746459961, -0.0035129785537719727, -0.0031409263610839844, -0.002768874168395996, -0.002396821975708008, -0.0020247697830200195, -0.0016527175903320312, -0.001280665397644043, -0.0009086132049560547, -0.0005365610122680664, -0.00016450881958007812, 0.00020754337310791016, 0.0005795955657958984, 0.0009516477584838867, 0.001323699951171875, 0.0016957521438598633, 0.0020678043365478516, 0.00243985652923584, 0.002811908721923828, 0.0031839609146118164, 0.0035560131072998047, 0.003928065299987793, 0.004300117492675781, 0.0046721696853637695, 0.005044221878051758, 0.005416274070739746, 0.005788326263427734, 0.006160378456115723, 0.006532430648803711, 0.006904482841491699, 0.0072765350341796875, 0.007648587226867676, 0.008020639419555664, 0.008392691612243652, 0.00876474380493164, 0.009136795997619629, 0.009508848190307617, 0.009880900382995605, 0.010252952575683594, 0.010625004768371582, 0.01099705696105957, 0.011369109153747559, 0.011741161346435547, 0.012113213539123535, 0.012485265731811523, 0.012857317924499512, 0.0132293701171875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 1.0, 10.0, 11.0, 13.0, 20.0, 29.0, 51.0, 56.0, 91.0, 114.0, 167.0, 241.0, 323.0, 499.0, 663.0, 926.0, 1420.0, 2112.0, 3354.0, 5621.0, 10124.0, 19827.0, 41169.0, 93400.0, 210790.0, 302237.0, 191986.0, 84172.0, 37122.0, 18013.0, 9376.0, 5170.0, 3052.0, 2000.0, 1354.0, 858.0, 626.0, 401.0, 326.0, 235.0, 166.0, 129.0, 75.0, 78.0, 46.0, 33.0, 29.0, 14.0, 14.0, 5.0, 3.0, 3.0, 1.0, 0.0, 3.0], "bins": [-115.375, -112.0244140625, -108.673828125, -105.3232421875, -101.97265625, -98.6220703125, -95.271484375, -91.9208984375, -88.5703125, -85.2197265625, -81.869140625, -78.5185546875, -75.16796875, -71.8173828125, -68.466796875, -65.1162109375, -61.765625, -58.4150390625, -55.064453125, -51.7138671875, -48.36328125, -45.0126953125, -41.662109375, -38.3115234375, -34.9609375, -31.6103515625, -28.259765625, -24.9091796875, -21.55859375, -18.2080078125, -14.857421875, -11.5068359375, -8.15625, -4.8056640625, -1.455078125, 1.8955078125, 5.24609375, 8.5966796875, 11.947265625, 15.2978515625, 18.6484375, 21.9990234375, 25.349609375, 28.7001953125, 32.05078125, 35.4013671875, 38.751953125, 42.1025390625, 45.453125, 48.8037109375, 52.154296875, 55.5048828125, 58.85546875, 62.2060546875, 65.556640625, 68.9072265625, 72.2578125, 75.6083984375, 78.958984375, 82.3095703125, 85.66015625, 89.0107421875, 92.361328125, 95.7119140625, 99.0625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 6.0, 3.0, 8.0, 7.0, 13.0, 15.0, 20.0, 19.0, 28.0, 32.0, 65.0, 52.0, 67.0, 98.0, 98.0, 94.0, 81.0, 53.0, 53.0, 44.0, 23.0, 26.0, 18.0, 16.0, 16.0, 6.0, 8.0, 8.0, 0.0, 5.0, 4.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-44.53125, -43.16845703125, -41.8056640625, -40.44287109375, -39.080078125, -37.71728515625, -36.3544921875, -34.99169921875, -33.62890625, -32.26611328125, -30.9033203125, -29.54052734375, -28.177734375, -26.81494140625, -25.4521484375, -24.08935546875, -22.7265625, -21.36376953125, -20.0009765625, -18.63818359375, -17.275390625, -15.91259765625, -14.5498046875, -13.18701171875, -11.82421875, -10.46142578125, -9.0986328125, -7.73583984375, -6.373046875, -5.01025390625, -3.6474609375, -2.28466796875, -0.921875, 0.44091796875, 1.8037109375, 3.16650390625, 4.529296875, 5.89208984375, 7.2548828125, 8.61767578125, 9.98046875, 11.34326171875, 12.7060546875, 14.06884765625, 15.431640625, 16.79443359375, 18.1572265625, 19.52001953125, 20.8828125, 22.24560546875, 23.6083984375, 24.97119140625, 26.333984375, 27.69677734375, 29.0595703125, 30.42236328125, 31.78515625, 33.14794921875, 34.5107421875, 35.87353515625, 37.236328125, 38.59912109375, 39.9619140625, 41.32470703125, 42.6875]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 1.0, 7.0, 5.0, 5.0, 14.0, 18.0, 16.0, 38.0, 33.0, 35.0, 48.0, 39.0, 64.0, 52.0, 58.0, 66.0, 53.0, 56.0, 54.0, 44.0, 48.0, 40.0, 46.0, 25.0, 27.0, 26.0, 13.0, 11.0, 9.0, 11.0, 9.0, 4.0, 6.0, 10.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.23002624511719, -67.13697814941406, -65.04393768310547, -62.95089340209961, -60.85784912109375, -58.76480484008789, -56.67176055908203, -54.57871627807617, -52.48567199707031, -50.39262771606445, -48.299583435058594, -46.206539154052734, -44.113494873046875, -42.020450592041016, -39.927406311035156, -37.8343620300293, -35.74131774902344, -33.64827346801758, -31.55522918701172, -29.46218490600586, -27.369140625, -25.27609634399414, -23.18305206298828, -21.090007781982422, -18.996963500976562, -16.903919219970703, -14.810874938964844, -12.717830657958984, -10.624786376953125, -8.531742095947266, -6.438697814941406, -4.345653533935547, -2.2526168823242188, -0.15957260131835938, 1.9334716796875, 4.026515960693359, 6.119560241699219, 8.212604522705078, 10.305648803710938, 12.398693084716797, 14.491737365722656, 16.584781646728516, 18.677825927734375, 20.770870208740234, 22.863914489746094, 24.956958770751953, 27.050003051757812, 29.143047332763672, 31.23609161376953, 33.32913589477539, 35.42218017578125, 37.51522445678711, 39.60826873779297, 41.70131301879883, 43.79435729980469, 45.88740158081055, 47.980445861816406, 50.073490142822266, 52.166534423828125, 54.259578704833984, 56.352622985839844, 58.4456672668457, 60.53871154785156, 62.63175582885742, 64.72480010986328]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 3.0, 5.0, 10.0, 8.0, 12.0, 16.0, 13.0, 16.0, 24.0, 17.0, 32.0, 32.0, 39.0, 39.0, 37.0, 35.0, 51.0, 45.0, 46.0, 56.0, 45.0, 44.0, 46.0, 52.0, 37.0, 33.0, 29.0, 31.0, 29.0, 18.0, 27.0, 16.0, 11.0, 15.0, 10.0, 6.0, 10.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-73.37081909179688, -71.34426879882812, -69.3177261352539, -67.29117584228516, -65.2646255493164, -63.23807907104492, -61.21153259277344, -59.18498229980469, -57.15843200683594, -55.13188552856445, -53.1053352355957, -51.07878875732422, -49.05223846435547, -47.025691986083984, -44.9991455078125, -42.97259521484375, -40.946048736572266, -38.91950225830078, -36.89295196533203, -34.86640548706055, -32.8398551940918, -30.813308715820312, -28.786760330200195, -26.760211944580078, -24.73366355895996, -22.707115173339844, -20.680566787719727, -18.65401840209961, -16.627471923828125, -14.600922584533691, -12.57437515258789, -10.547826766967773, -8.521278381347656, -6.494729995727539, -4.46818208694458, -2.441634178161621, -0.4150857925415039, 1.6114625930786133, 3.638010025024414, 5.664558410644531, 7.691106796264648, 9.717655181884766, 11.744203567504883, 13.770750999450684, 15.7972993850708, 17.823848724365234, 19.85039520263672, 21.876943588256836, 23.903491973876953, 25.93004035949707, 27.956588745117188, 29.983135223388672, 32.00968551635742, 34.036231994628906, 36.062782287597656, 38.08932876586914, 40.115875244140625, 42.14242172241211, 44.16897201538086, 46.195518493652344, 48.222068786621094, 50.24861526489258, 52.27516174316406, 54.30171203613281, 56.32826232910156]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 11.0, 14.0, 26.0, 35.0, 41.0, 66.0, 100.0, 157.0, 215.0, 340.0, 532.0, 671.0, 1036.0, 1562.0, 2443.0, 3686.0, 5468.0, 8493.0, 12559.0, 19438.0, 28922.0, 42544.0, 60025.0, 82178.0, 103700.0, 119772.0, 122973.0, 113078.0, 92472.0, 70804.0, 50452.0, 35098.0, 23602.0, 15647.0, 10376.0, 6709.0, 4525.0, 2933.0, 2003.0, 1223.0, 857.0, 559.0, 407.0, 257.0, 185.0, 112.0, 70.0, 68.0, 42.0, 29.0, 18.0, 9.0, 5.0, 5.0, 0.0, 4.0, 2.0], "bins": [-43.875, -42.55517578125, -41.2353515625, -39.91552734375, -38.595703125, -37.27587890625, -35.9560546875, -34.63623046875, -33.31640625, -31.99658203125, -30.6767578125, -29.35693359375, -28.037109375, -26.71728515625, -25.3974609375, -24.07763671875, -22.7578125, -21.43798828125, -20.1181640625, -18.79833984375, -17.478515625, -16.15869140625, -14.8388671875, -13.51904296875, -12.19921875, -10.87939453125, -9.5595703125, -8.23974609375, -6.919921875, -5.60009765625, -4.2802734375, -2.96044921875, -1.640625, -0.32080078125, 0.9990234375, 2.31884765625, 3.638671875, 4.95849609375, 6.2783203125, 7.59814453125, 8.91796875, 10.23779296875, 11.5576171875, 12.87744140625, 14.197265625, 15.51708984375, 16.8369140625, 18.15673828125, 19.4765625, 20.79638671875, 22.1162109375, 23.43603515625, 24.755859375, 26.07568359375, 27.3955078125, 28.71533203125, 30.03515625, 31.35498046875, 32.6748046875, 33.99462890625, 35.314453125, 36.63427734375, 37.9541015625, 39.27392578125, 40.59375]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 12.0, 5.0, 7.0, 11.0, 17.0, 13.0, 17.0, 22.0, 19.0, 33.0, 38.0, 46.0, 37.0, 44.0, 48.0, 43.0, 45.0, 50.0, 54.0, 40.0, 55.0, 45.0, 35.0, 41.0, 39.0, 28.0, 30.0, 24.0, 16.0, 20.0, 13.0, 17.0, 11.0, 5.0, 5.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-69.1875, -67.30078125, -65.4140625, -63.52734375, -61.640625, -59.75390625, -57.8671875, -55.98046875, -54.09375, -52.20703125, -50.3203125, -48.43359375, -46.546875, -44.66015625, -42.7734375, -40.88671875, -39.0, -37.11328125, -35.2265625, -33.33984375, -31.453125, -29.56640625, -27.6796875, -25.79296875, -23.90625, -22.01953125, -20.1328125, -18.24609375, -16.359375, -14.47265625, -12.5859375, -10.69921875, -8.8125, -6.92578125, -5.0390625, -3.15234375, -1.265625, 0.62109375, 2.5078125, 4.39453125, 6.28125, 8.16796875, 10.0546875, 11.94140625, 13.828125, 15.71484375, 17.6015625, 19.48828125, 21.375, 23.26171875, 25.1484375, 27.03515625, 28.921875, 30.80859375, 32.6953125, 34.58203125, 36.46875, 38.35546875, 40.2421875, 42.12890625, 44.015625, 45.90234375, 47.7890625, 49.67578125, 51.5625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 8.0, 7.0, 16.0, 25.0, 36.0, 68.0, 71.0, 116.0, 177.0, 246.0, 398.0, 637.0, 959.0, 1549.0, 2320.0, 3580.0, 5734.0, 9485.0, 15195.0, 24534.0, 40083.0, 64904.0, 101147.0, 142122.0, 165885.0, 153991.0, 115217.0, 75889.0, 47534.0, 28849.0, 17851.0, 10986.0, 6919.0, 4316.0, 2703.0, 1761.0, 1157.0, 723.0, 470.0, 267.0, 188.0, 145.0, 104.0, 67.0, 36.0, 31.0, 10.0, 15.0, 9.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-58.5625, -56.77001953125, -54.9775390625, -53.18505859375, -51.392578125, -49.60009765625, -47.8076171875, -46.01513671875, -44.22265625, -42.43017578125, -40.6376953125, -38.84521484375, -37.052734375, -35.26025390625, -33.4677734375, -31.67529296875, -29.8828125, -28.09033203125, -26.2978515625, -24.50537109375, -22.712890625, -20.92041015625, -19.1279296875, -17.33544921875, -15.54296875, -13.75048828125, -11.9580078125, -10.16552734375, -8.373046875, -6.58056640625, -4.7880859375, -2.99560546875, -1.203125, 0.58935546875, 2.3818359375, 4.17431640625, 5.966796875, 7.75927734375, 9.5517578125, 11.34423828125, 13.13671875, 14.92919921875, 16.7216796875, 18.51416015625, 20.306640625, 22.09912109375, 23.8916015625, 25.68408203125, 27.4765625, 29.26904296875, 31.0615234375, 32.85400390625, 34.646484375, 36.43896484375, 38.2314453125, 40.02392578125, 41.81640625, 43.60888671875, 45.4013671875, 47.19384765625, 48.986328125, 50.77880859375, 52.5712890625, 54.36376953125, 56.15625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 8.0, 0.0, 2.0, 9.0, 9.0, 13.0, 12.0, 19.0, 24.0, 15.0, 30.0, 27.0, 35.0, 30.0, 51.0, 40.0, 47.0, 48.0, 53.0, 63.0, 52.0, 41.0, 41.0, 53.0, 44.0, 43.0, 31.0, 31.0, 35.0, 13.0, 22.0, 15.0, 12.0, 11.0, 10.0, 6.0, 6.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.25, -53.6064453125, -51.962890625, -50.3193359375, -48.67578125, -47.0322265625, -45.388671875, -43.7451171875, -42.1015625, -40.4580078125, -38.814453125, -37.1708984375, -35.52734375, -33.8837890625, -32.240234375, -30.5966796875, -28.953125, -27.3095703125, -25.666015625, -24.0224609375, -22.37890625, -20.7353515625, -19.091796875, -17.4482421875, -15.8046875, -14.1611328125, -12.517578125, -10.8740234375, -9.23046875, -7.5869140625, -5.943359375, -4.2998046875, -2.65625, -1.0126953125, 0.630859375, 2.2744140625, 3.91796875, 5.5615234375, 7.205078125, 8.8486328125, 10.4921875, 12.1357421875, 13.779296875, 15.4228515625, 17.06640625, 18.7099609375, 20.353515625, 21.9970703125, 23.640625, 25.2841796875, 26.927734375, 28.5712890625, 30.21484375, 31.8583984375, 33.501953125, 35.1455078125, 36.7890625, 38.4326171875, 40.076171875, 41.7197265625, 43.36328125, 45.0068359375, 46.650390625, 48.2939453125, 49.9375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 5.0, 13.0, 12.0, 26.0, 32.0, 44.0, 71.0, 83.0, 144.0, 199.0, 274.0, 404.0, 624.0, 885.0, 1424.0, 2237.0, 3713.0, 6424.0, 11413.0, 21477.0, 42368.0, 86334.0, 176113.0, 269101.0, 208176.0, 106242.0, 51545.0, 26173.0, 13593.0, 7571.0, 4494.0, 2602.0, 1568.0, 1046.0, 698.0, 439.0, 313.0, 221.0, 137.0, 88.0, 68.0, 47.0, 38.0, 25.0, 18.0, 11.0, 10.0, 2.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-82.625, -80.09375, -77.5625, -75.03125, -72.5, -69.96875, -67.4375, -64.90625, -62.375, -59.84375, -57.3125, -54.78125, -52.25, -49.71875, -47.1875, -44.65625, -42.125, -39.59375, -37.0625, -34.53125, -32.0, -29.46875, -26.9375, -24.40625, -21.875, -19.34375, -16.8125, -14.28125, -11.75, -9.21875, -6.6875, -4.15625, -1.625, 0.90625, 3.4375, 5.96875, 8.5, 11.03125, 13.5625, 16.09375, 18.625, 21.15625, 23.6875, 26.21875, 28.75, 31.28125, 33.8125, 36.34375, 38.875, 41.40625, 43.9375, 46.46875, 49.0, 51.53125, 54.0625, 56.59375, 59.125, 61.65625, 64.1875, 66.71875, 69.25, 71.78125, 74.3125, 76.84375, 79.375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 7.0, 8.0, 8.0, 10.0, 8.0, 5.0, 12.0, 12.0, 22.0, 24.0, 20.0, 35.0, 42.0, 42.0, 54.0, 53.0, 49.0, 63.0, 65.0, 57.0, 53.0, 57.0, 41.0, 42.0, 34.0, 19.0, 25.0, 20.0, 21.0, 20.0, 12.0, 11.0, 9.0, 10.0, 1.0, 6.0, 4.0, 2.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00479888916015625, -0.0046347975730896, -0.004470705986022949, -0.004306614398956299, -0.0041425228118896484, -0.003978431224822998, -0.0038143396377563477, -0.0036502480506896973, -0.003486156463623047, -0.0033220648765563965, -0.003157973289489746, -0.0029938817024230957, -0.0028297901153564453, -0.002665698528289795, -0.0025016069412231445, -0.002337515354156494, -0.0021734237670898438, -0.0020093321800231934, -0.001845240592956543, -0.0016811490058898926, -0.0015170574188232422, -0.0013529658317565918, -0.0011888742446899414, -0.001024782657623291, -0.0008606910705566406, -0.0006965994834899902, -0.0005325078964233398, -0.00036841630935668945, -0.00020432472229003906, -4.023313522338867e-05, 0.00012385845184326172, 0.0002879500389099121, 0.0004520416259765625, 0.0006161332130432129, 0.0007802248001098633, 0.0009443163871765137, 0.001108407974243164, 0.0012724995613098145, 0.0014365911483764648, 0.0016006827354431152, 0.0017647743225097656, 0.001928865909576416, 0.0020929574966430664, 0.002257049083709717, 0.002421140670776367, 0.0025852322578430176, 0.002749323844909668, 0.0029134154319763184, 0.0030775070190429688, 0.003241598606109619, 0.0034056901931762695, 0.00356978178024292, 0.0037338733673095703, 0.0038979649543762207, 0.004062056541442871, 0.0042261481285095215, 0.004390239715576172, 0.004554331302642822, 0.004718422889709473, 0.004882514476776123, 0.0050466060638427734, 0.005210697650909424, 0.005374789237976074, 0.005538880825042725, 0.005702972412109375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 10.0, 6.0, 12.0, 23.0, 23.0, 59.0, 72.0, 114.0, 172.0, 241.0, 414.0, 661.0, 1092.0, 2008.0, 3642.0, 6591.0, 12860.0, 26916.0, 58426.0, 130060.0, 259502.0, 274922.0, 144786.0, 65647.0, 29621.0, 14242.0, 7247.0, 3930.0, 2085.0, 1222.0, 730.0, 416.0, 256.0, 179.0, 111.0, 88.0, 58.0, 32.0, 27.0, 8.0, 17.0, 7.0, 3.0, 3.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-87.8125, -85.07421875, -82.3359375, -79.59765625, -76.859375, -74.12109375, -71.3828125, -68.64453125, -65.90625, -63.16796875, -60.4296875, -57.69140625, -54.953125, -52.21484375, -49.4765625, -46.73828125, -44.0, -41.26171875, -38.5234375, -35.78515625, -33.046875, -30.30859375, -27.5703125, -24.83203125, -22.09375, -19.35546875, -16.6171875, -13.87890625, -11.140625, -8.40234375, -5.6640625, -2.92578125, -0.1875, 2.55078125, 5.2890625, 8.02734375, 10.765625, 13.50390625, 16.2421875, 18.98046875, 21.71875, 24.45703125, 27.1953125, 29.93359375, 32.671875, 35.41015625, 38.1484375, 40.88671875, 43.625, 46.36328125, 49.1015625, 51.83984375, 54.578125, 57.31640625, 60.0546875, 62.79296875, 65.53125, 68.26953125, 71.0078125, 73.74609375, 76.484375, 79.22265625, 81.9609375, 84.69921875, 87.4375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 7.0, 7.0, 20.0, 17.0, 10.0, 13.0, 17.0, 24.0, 30.0, 47.0, 46.0, 51.0, 67.0, 58.0, 66.0, 57.0, 48.0, 47.0, 52.0, 44.0, 44.0, 39.0, 30.0, 39.0, 19.0, 19.0, 12.0, 12.0, 12.0, 9.0, 12.0, 5.0, 2.0, 6.0, 6.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.40625, -20.74658203125, -20.0869140625, -19.42724609375, -18.767578125, -18.10791015625, -17.4482421875, -16.78857421875, -16.12890625, -15.46923828125, -14.8095703125, -14.14990234375, -13.490234375, -12.83056640625, -12.1708984375, -11.51123046875, -10.8515625, -10.19189453125, -9.5322265625, -8.87255859375, -8.212890625, -7.55322265625, -6.8935546875, -6.23388671875, -5.57421875, -4.91455078125, -4.2548828125, -3.59521484375, -2.935546875, -2.27587890625, -1.6162109375, -0.95654296875, -0.296875, 0.36279296875, 1.0224609375, 1.68212890625, 2.341796875, 3.00146484375, 3.6611328125, 4.32080078125, 4.98046875, 5.64013671875, 6.2998046875, 6.95947265625, 7.619140625, 8.27880859375, 8.9384765625, 9.59814453125, 10.2578125, 10.91748046875, 11.5771484375, 12.23681640625, 12.896484375, 13.55615234375, 14.2158203125, 14.87548828125, 15.53515625, 16.19482421875, 16.8544921875, 17.51416015625, 18.173828125, 18.83349609375, 19.4931640625, 20.15283203125, 20.8125]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 1.0, 3.0, 2.0, 11.0, 8.0, 10.0, 19.0, 11.0, 18.0, 19.0, 31.0, 32.0, 45.0, 45.0, 50.0, 53.0, 63.0, 57.0, 76.0, 51.0, 59.0, 45.0, 45.0, 59.0, 42.0, 31.0, 24.0, 19.0, 24.0, 15.0, 6.0, 6.0, 5.0, 6.0, 5.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-74.30104064941406, -72.1893310546875, -70.07762145996094, -67.96591186523438, -65.85420227050781, -63.742496490478516, -61.63079071044922, -59.519081115722656, -57.407371520996094, -55.29566192626953, -53.18395233154297, -51.07224655151367, -48.96053695678711, -46.84882736206055, -44.73712158203125, -42.62541198730469, -40.513702392578125, -38.40199279785156, -36.290283203125, -34.1785774230957, -32.06686782836914, -29.955158233642578, -27.84345054626465, -25.73174285888672, -23.620033264160156, -21.508323669433594, -19.396615982055664, -17.284908294677734, -15.173198699951172, -13.061490058898926, -10.94978141784668, -8.838072776794434, -6.726371765136719, -4.614663124084473, -2.5029544830322266, -0.39124584197998047, 1.7204627990722656, 3.8321714401245117, 5.943880081176758, 8.055588722229004, 10.16729736328125, 12.279006004333496, 14.390714645385742, 16.502422332763672, 18.614131927490234, 20.725841522216797, 22.837549209594727, 24.949256896972656, 27.06096649169922, 29.17267608642578, 31.28438377380371, 33.39609146118164, 35.5078010559082, 37.619510650634766, 39.73121643066406, 41.842926025390625, 43.95463562011719, 46.06634521484375, 48.17805480957031, 50.28976058959961, 52.40147018432617, 54.513179779052734, 56.62488555908203, 58.736595153808594, 60.848304748535156]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 0.0, 6.0, 4.0, 4.0, 7.0, 7.0, 7.0, 12.0, 18.0, 14.0, 23.0, 26.0, 30.0, 26.0, 31.0, 42.0, 34.0, 45.0, 32.0, 41.0, 52.0, 46.0, 48.0, 47.0, 41.0, 40.0, 47.0, 48.0, 32.0, 29.0, 19.0, 23.0, 26.0, 13.0, 17.0, 16.0, 11.0, 17.0, 8.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-70.2049560546875, -68.05781555175781, -65.91067504882812, -63.76353454589844, -61.61639404296875, -59.46925354003906, -57.32210922241211, -55.17496871948242, -53.027828216552734, -50.88068771362305, -48.73354721069336, -46.58640670776367, -44.43926239013672, -42.29212188720703, -40.144981384277344, -37.997840881347656, -35.85070037841797, -33.70355987548828, -31.556419372558594, -29.409276962280273, -27.262136459350586, -25.1149959564209, -22.967853546142578, -20.82071304321289, -18.673572540283203, -16.526432037353516, -14.379290580749512, -12.232149124145508, -10.08500862121582, -7.937868118286133, -5.790726661682129, -3.643585205078125, -1.4964370727539062, 0.6507039070129395, 2.797844886779785, 4.944985866546631, 7.092126846313477, 9.239267349243164, 11.386408805847168, 13.533550262451172, 15.68069076538086, 17.827831268310547, 19.974971771240234, 22.122114181518555, 24.269254684448242, 26.41639518737793, 28.56353759765625, 30.710678100585938, 32.857818603515625, 35.00495910644531, 37.152099609375, 39.29924011230469, 41.446380615234375, 43.59352111816406, 45.740665435791016, 47.8878059387207, 50.03494644165039, 52.18208694458008, 54.329227447509766, 56.47636795043945, 58.623512268066406, 60.770652770996094, 62.91779327392578, 65.06493377685547, 67.21207427978516]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 6.0, 8.0, 13.0, 26.0, 36.0, 52.0, 104.0, 144.0, 198.0, 332.0, 473.0, 806.0, 1353.0, 2379.0, 3962.0, 6753.0, 11954.0, 20958.0, 37621.0, 70564.0, 133206.0, 259327.0, 491185.0, 779244.0, 879261.0, 674995.0, 391103.0, 201879.0, 103449.0, 54656.0, 29454.0, 16266.0, 9317.0, 5266.0, 3075.0, 1837.0, 1105.0, 705.0, 440.0, 278.0, 203.0, 91.0, 82.0, 33.0, 34.0, 16.0, 17.0, 12.0, 2.0, 5.0, 2.0, 1.0, 0.0, 4.0], "bins": [-49.09375, -47.66259765625, -46.2314453125, -44.80029296875, -43.369140625, -41.93798828125, -40.5068359375, -39.07568359375, -37.64453125, -36.21337890625, -34.7822265625, -33.35107421875, -31.919921875, -30.48876953125, -29.0576171875, -27.62646484375, -26.1953125, -24.76416015625, -23.3330078125, -21.90185546875, -20.470703125, -19.03955078125, -17.6083984375, -16.17724609375, -14.74609375, -13.31494140625, -11.8837890625, -10.45263671875, -9.021484375, -7.59033203125, -6.1591796875, -4.72802734375, -3.296875, -1.86572265625, -0.4345703125, 0.99658203125, 2.427734375, 3.85888671875, 5.2900390625, 6.72119140625, 8.15234375, 9.58349609375, 11.0146484375, 12.44580078125, 13.876953125, 15.30810546875, 16.7392578125, 18.17041015625, 19.6015625, 21.03271484375, 22.4638671875, 23.89501953125, 25.326171875, 26.75732421875, 28.1884765625, 29.61962890625, 31.05078125, 32.48193359375, 33.9130859375, 35.34423828125, 36.775390625, 38.20654296875, 39.6376953125, 41.06884765625, 42.5]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 4.0, 4.0, 5.0, 2.0, 11.0, 10.0, 17.0, 21.0, 19.0, 27.0, 32.0, 31.0, 34.0, 20.0, 35.0, 41.0, 40.0, 35.0, 48.0, 56.0, 49.0, 40.0, 39.0, 41.0, 37.0, 45.0, 39.0, 31.0, 27.0, 26.0, 20.0, 17.0, 14.0, 28.0, 13.0, 12.0, 11.0, 10.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-50.0625, -48.55517578125, -47.0478515625, -45.54052734375, -44.033203125, -42.52587890625, -41.0185546875, -39.51123046875, -38.00390625, -36.49658203125, -34.9892578125, -33.48193359375, -31.974609375, -30.46728515625, -28.9599609375, -27.45263671875, -25.9453125, -24.43798828125, -22.9306640625, -21.42333984375, -19.916015625, -18.40869140625, -16.9013671875, -15.39404296875, -13.88671875, -12.37939453125, -10.8720703125, -9.36474609375, -7.857421875, -6.35009765625, -4.8427734375, -3.33544921875, -1.828125, -0.32080078125, 1.1865234375, 2.69384765625, 4.201171875, 5.70849609375, 7.2158203125, 8.72314453125, 10.23046875, 11.73779296875, 13.2451171875, 14.75244140625, 16.259765625, 17.76708984375, 19.2744140625, 20.78173828125, 22.2890625, 23.79638671875, 25.3037109375, 26.81103515625, 28.318359375, 29.82568359375, 31.3330078125, 32.84033203125, 34.34765625, 35.85498046875, 37.3623046875, 38.86962890625, 40.376953125, 41.88427734375, 43.3916015625, 44.89892578125, 46.40625]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 8.0, 5.0, 13.0, 9.0, 27.0, 42.0, 49.0, 75.0, 118.0, 172.0, 279.0, 415.0, 636.0, 1002.0, 1685.0, 2592.0, 4152.0, 6585.0, 11203.0, 18485.0, 30812.0, 51205.0, 86540.0, 146329.0, 241643.0, 382777.0, 565210.0, 698068.0, 654968.0, 486479.0, 317157.0, 194887.0, 116839.0, 69570.0, 41301.0, 24434.0, 14788.0, 8944.0, 5494.0, 3331.0, 2198.0, 1362.0, 850.0, 514.0, 376.0, 232.0, 137.0, 102.0, 69.0, 40.0, 33.0, 23.0, 13.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-39.4375, -38.19677734375, -36.9560546875, -35.71533203125, -34.474609375, -33.23388671875, -31.9931640625, -30.75244140625, -29.51171875, -28.27099609375, -27.0302734375, -25.78955078125, -24.548828125, -23.30810546875, -22.0673828125, -20.82666015625, -19.5859375, -18.34521484375, -17.1044921875, -15.86376953125, -14.623046875, -13.38232421875, -12.1416015625, -10.90087890625, -9.66015625, -8.41943359375, -7.1787109375, -5.93798828125, -4.697265625, -3.45654296875, -2.2158203125, -0.97509765625, 0.265625, 1.50634765625, 2.7470703125, 3.98779296875, 5.228515625, 6.46923828125, 7.7099609375, 8.95068359375, 10.19140625, 11.43212890625, 12.6728515625, 13.91357421875, 15.154296875, 16.39501953125, 17.6357421875, 18.87646484375, 20.1171875, 21.35791015625, 22.5986328125, 23.83935546875, 25.080078125, 26.32080078125, 27.5615234375, 28.80224609375, 30.04296875, 31.28369140625, 32.5244140625, 33.76513671875, 35.005859375, 36.24658203125, 37.4873046875, 38.72802734375, 39.96875]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 5.0, 1.0, 4.0, 5.0, 11.0, 18.0, 10.0, 19.0, 19.0, 24.0, 46.0, 52.0, 66.0, 58.0, 93.0, 120.0, 123.0, 138.0, 194.0, 198.0, 206.0, 243.0, 248.0, 246.0, 294.0, 228.0, 229.0, 221.0, 196.0, 164.0, 139.0, 105.0, 77.0, 72.0, 46.0, 36.0, 31.0, 22.0, 17.0, 16.0, 8.0, 7.0, 5.0, 7.0, 2.0, 7.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.65625, -16.050537109375, -15.44482421875, -14.839111328125, -14.2333984375, -13.627685546875, -13.02197265625, -12.416259765625, -11.810546875, -11.204833984375, -10.59912109375, -9.993408203125, -9.3876953125, -8.781982421875, -8.17626953125, -7.570556640625, -6.96484375, -6.359130859375, -5.75341796875, -5.147705078125, -4.5419921875, -3.936279296875, -3.33056640625, -2.724853515625, -2.119140625, -1.513427734375, -0.90771484375, -0.302001953125, 0.3037109375, 0.909423828125, 1.51513671875, 2.120849609375, 2.7265625, 3.332275390625, 3.93798828125, 4.543701171875, 5.1494140625, 5.755126953125, 6.36083984375, 6.966552734375, 7.572265625, 8.177978515625, 8.78369140625, 9.389404296875, 9.9951171875, 10.600830078125, 11.20654296875, 11.812255859375, 12.41796875, 13.023681640625, 13.62939453125, 14.235107421875, 14.8408203125, 15.446533203125, 16.05224609375, 16.657958984375, 17.263671875, 17.869384765625, 18.47509765625, 19.080810546875, 19.6865234375, 20.292236328125, 20.89794921875, 21.503662109375, 22.109375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 5.0, 5.0, 5.0, 8.0, 7.0, 9.0, 23.0, 17.0, 17.0, 29.0, 38.0, 43.0, 42.0, 43.0, 69.0, 72.0, 63.0, 88.0, 55.0, 56.0, 59.0, 45.0, 52.0, 38.0, 22.0, 20.0, 13.0, 11.0, 17.0, 7.0, 7.0, 10.0, 7.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0], "bins": [-70.68123626708984, -68.78840637207031, -66.89556884765625, -65.00273895263672, -63.10990905761719, -61.21707534790039, -59.324241638183594, -57.43141174316406, -55.538578033447266, -53.64574432373047, -51.75291442871094, -49.86008071899414, -47.967247009277344, -46.07441711425781, -44.181583404541016, -42.28874969482422, -40.39591979980469, -38.50308609008789, -36.61025619506836, -34.71742248535156, -32.82459259033203, -30.931758880615234, -29.038925170898438, -27.146093368530273, -25.25326156616211, -23.360429763793945, -21.46759796142578, -19.574764251708984, -17.68193244934082, -15.789100646972656, -13.896267890930176, -12.003435134887695, -10.110599517822266, -8.217767715454102, -6.324934959411621, -4.432102680206299, -2.5392704010009766, -0.6464385986328125, 1.246394157409668, 3.1392269134521484, 5.0320587158203125, 6.924890995025635, 8.817723274230957, 10.710556030273438, 12.603387832641602, 14.496219635009766, 16.389053344726562, 18.281885147094727, 20.17471694946289, 22.067548751831055, 23.96038055419922, 25.853214263916016, 27.74604606628418, 29.638877868652344, 31.53171157836914, 33.42454528808594, 35.31737518310547, 37.210208892822266, 39.1030387878418, 40.995872497558594, 42.888702392578125, 44.78153610229492, 46.67436981201172, 48.56719970703125, 50.46003341674805]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 6.0, 6.0, 13.0, 10.0, 15.0, 18.0, 35.0, 24.0, 24.0, 27.0, 23.0, 38.0, 31.0, 25.0, 29.0, 43.0, 48.0, 48.0, 44.0, 42.0, 40.0, 47.0, 36.0, 38.0, 48.0, 30.0, 27.0, 20.0, 27.0, 23.0, 23.0, 23.0, 14.0, 16.0, 7.0, 7.0, 7.0, 5.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.50748062133789, -51.859893798828125, -50.212310791015625, -48.56472396850586, -46.917137145996094, -45.269554138183594, -43.62196731567383, -41.97438049316406, -40.32679748535156, -38.6792106628418, -37.0316276550293, -35.38404083251953, -33.73645782470703, -32.088871002197266, -30.4412841796875, -28.793699264526367, -27.146114349365234, -25.4985294342041, -23.85094451904297, -22.203357696533203, -20.55577278137207, -18.908187866210938, -17.260601043701172, -15.613016128540039, -13.965431213378906, -12.317846298217773, -10.670260429382324, -9.022674560546875, -7.375089645385742, -5.727504730224609, -4.07991886138916, -2.432332992553711, -0.7847480773925781, 0.8628373146057129, 2.510422706604004, 4.158008098602295, 5.805593490600586, 7.453178405761719, 9.100764274597168, 10.748350143432617, 12.39593505859375, 14.043519973754883, 15.691105842590332, 17.33869171142578, 18.986276626586914, 20.633861541748047, 22.281448364257812, 23.929033279418945, 25.576618194580078, 27.22420310974121, 28.871788024902344, 30.51937484741211, 32.166961669921875, 33.814544677734375, 35.46213150024414, 37.109718322753906, 38.757301330566406, 40.40488815307617, 42.05247116088867, 43.70005798339844, 45.34764099121094, 46.9952278137207, 48.64281463623047, 50.29039764404297, 51.937984466552734]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 0.0, 6.0, 10.0, 12.0, 21.0, 26.0, 37.0, 56.0, 57.0, 101.0, 134.0, 181.0, 297.0, 412.0, 624.0, 960.0, 1478.0, 2340.0, 3902.0, 6608.0, 12109.0, 24410.0, 57485.0, 151646.0, 330137.0, 266277.0, 105670.0, 40949.0, 18672.0, 9676.0, 5321.0, 3162.0, 1935.0, 1280.0, 793.0, 565.0, 374.0, 271.0, 174.0, 123.0, 87.0, 59.0, 38.0, 21.0, 17.0, 16.0, 8.0, 5.0, 8.0, 1.0, 0.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-146.25, -141.50390625, -136.7578125, -132.01171875, -127.265625, -122.51953125, -117.7734375, -113.02734375, -108.28125, -103.53515625, -98.7890625, -94.04296875, -89.296875, -84.55078125, -79.8046875, -75.05859375, -70.3125, -65.56640625, -60.8203125, -56.07421875, -51.328125, -46.58203125, -41.8359375, -37.08984375, -32.34375, -27.59765625, -22.8515625, -18.10546875, -13.359375, -8.61328125, -3.8671875, 0.87890625, 5.625, 10.37109375, 15.1171875, 19.86328125, 24.609375, 29.35546875, 34.1015625, 38.84765625, 43.59375, 48.33984375, 53.0859375, 57.83203125, 62.578125, 67.32421875, 72.0703125, 76.81640625, 81.5625, 86.30859375, 91.0546875, 95.80078125, 100.546875, 105.29296875, 110.0390625, 114.78515625, 119.53125, 124.27734375, 129.0234375, 133.76953125, 138.515625, 143.26171875, 148.0078125, 152.75390625, 157.5]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 3.0, 4.0, 7.0, 4.0, 12.0, 15.0, 23.0, 16.0, 20.0, 23.0, 26.0, 28.0, 23.0, 33.0, 27.0, 34.0, 38.0, 46.0, 50.0, 41.0, 49.0, 40.0, 34.0, 49.0, 42.0, 38.0, 36.0, 31.0, 34.0, 23.0, 25.0, 23.0, 17.0, 16.0, 17.0, 12.0, 13.0, 7.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-48.8125, -47.3427734375, -45.873046875, -44.4033203125, -42.93359375, -41.4638671875, -39.994140625, -38.5244140625, -37.0546875, -35.5849609375, -34.115234375, -32.6455078125, -31.17578125, -29.7060546875, -28.236328125, -26.7666015625, -25.296875, -23.8271484375, -22.357421875, -20.8876953125, -19.41796875, -17.9482421875, -16.478515625, -15.0087890625, -13.5390625, -12.0693359375, -10.599609375, -9.1298828125, -7.66015625, -6.1904296875, -4.720703125, -3.2509765625, -1.78125, -0.3115234375, 1.158203125, 2.6279296875, 4.09765625, 5.5673828125, 7.037109375, 8.5068359375, 9.9765625, 11.4462890625, 12.916015625, 14.3857421875, 15.85546875, 17.3251953125, 18.794921875, 20.2646484375, 21.734375, 23.2041015625, 24.673828125, 26.1435546875, 27.61328125, 29.0830078125, 30.552734375, 32.0224609375, 33.4921875, 34.9619140625, 36.431640625, 37.9013671875, 39.37109375, 40.8408203125, 42.310546875, 43.7802734375, 45.25]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 7.0, 8.0, 10.0, 21.0, 16.0, 25.0, 24.0, 29.0, 38.0, 49.0, 70.0, 99.0, 148.0, 198.0, 275.0, 403.0, 745.0, 1094.0, 1820.0, 3082.0, 5800.0, 11212.0, 23412.0, 58049.0, 184377.0, 450701.0, 195368.0, 61147.0, 24677.0, 11510.0, 5791.0, 3235.0, 1812.0, 1107.0, 694.0, 436.0, 266.0, 193.0, 178.0, 95.0, 83.0, 64.0, 55.0, 27.0, 28.0, 19.0, 18.0, 13.0, 8.0, 9.0, 2.0, 8.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-177.5, -171.869140625, -166.23828125, -160.607421875, -154.9765625, -149.345703125, -143.71484375, -138.083984375, -132.453125, -126.822265625, -121.19140625, -115.560546875, -109.9296875, -104.298828125, -98.66796875, -93.037109375, -87.40625, -81.775390625, -76.14453125, -70.513671875, -64.8828125, -59.251953125, -53.62109375, -47.990234375, -42.359375, -36.728515625, -31.09765625, -25.466796875, -19.8359375, -14.205078125, -8.57421875, -2.943359375, 2.6875, 8.318359375, 13.94921875, 19.580078125, 25.2109375, 30.841796875, 36.47265625, 42.103515625, 47.734375, 53.365234375, 58.99609375, 64.626953125, 70.2578125, 75.888671875, 81.51953125, 87.150390625, 92.78125, 98.412109375, 104.04296875, 109.673828125, 115.3046875, 120.935546875, 126.56640625, 132.197265625, 137.828125, 143.458984375, 149.08984375, 154.720703125, 160.3515625, 165.982421875, 171.61328125, 177.244140625, 182.875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 1.0, 3.0, 5.0, 6.0, 2.0, 13.0, 14.0, 12.0, 23.0, 32.0, 34.0, 44.0, 50.0, 62.0, 66.0, 93.0, 89.0, 66.0, 61.0, 54.0, 63.0, 48.0, 42.0, 31.0, 21.0, 11.0, 18.0, 15.0, 7.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.5, -55.63623046875, -53.7724609375, -51.90869140625, -50.044921875, -48.18115234375, -46.3173828125, -44.45361328125, -42.58984375, -40.72607421875, -38.8623046875, -36.99853515625, -35.134765625, -33.27099609375, -31.4072265625, -29.54345703125, -27.6796875, -25.81591796875, -23.9521484375, -22.08837890625, -20.224609375, -18.36083984375, -16.4970703125, -14.63330078125, -12.76953125, -10.90576171875, -9.0419921875, -7.17822265625, -5.314453125, -3.45068359375, -1.5869140625, 0.27685546875, 2.140625, 4.00439453125, 5.8681640625, 7.73193359375, 9.595703125, 11.45947265625, 13.3232421875, 15.18701171875, 17.05078125, 18.91455078125, 20.7783203125, 22.64208984375, 24.505859375, 26.36962890625, 28.2333984375, 30.09716796875, 31.9609375, 33.82470703125, 35.6884765625, 37.55224609375, 39.416015625, 41.27978515625, 43.1435546875, 45.00732421875, 46.87109375, 48.73486328125, 50.5986328125, 52.46240234375, 54.326171875, 56.18994140625, 58.0537109375, 59.91748046875, 61.78125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 8.0, 8.0, 18.0, 12.0, 34.0, 54.0, 94.0, 160.0, 268.0, 476.0, 735.0, 1270.0, 2412.0, 4545.0, 9413.0, 22137.0, 62632.0, 240190.0, 470686.0, 156502.0, 44489.0, 16725.0, 7347.0, 3738.0, 1969.0, 1117.0, 592.0, 356.0, 206.0, 117.0, 80.0, 60.0, 36.0, 30.0, 18.0, 8.0, 7.0, 4.0, 2.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-88.625, -85.7978515625, -82.970703125, -80.1435546875, -77.31640625, -74.4892578125, -71.662109375, -68.8349609375, -66.0078125, -63.1806640625, -60.353515625, -57.5263671875, -54.69921875, -51.8720703125, -49.044921875, -46.2177734375, -43.390625, -40.5634765625, -37.736328125, -34.9091796875, -32.08203125, -29.2548828125, -26.427734375, -23.6005859375, -20.7734375, -17.9462890625, -15.119140625, -12.2919921875, -9.46484375, -6.6376953125, -3.810546875, -0.9833984375, 1.84375, 4.6708984375, 7.498046875, 10.3251953125, 13.15234375, 15.9794921875, 18.806640625, 21.6337890625, 24.4609375, 27.2880859375, 30.115234375, 32.9423828125, 35.76953125, 38.5966796875, 41.423828125, 44.2509765625, 47.078125, 49.9052734375, 52.732421875, 55.5595703125, 58.38671875, 61.2138671875, 64.041015625, 66.8681640625, 69.6953125, 72.5224609375, 75.349609375, 78.1767578125, 81.00390625, 83.8310546875, 86.658203125, 89.4853515625, 92.3125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 0.0, 9.0, 3.0, 6.0, 2.0, 4.0, 6.0, 14.0, 13.0, 20.0, 24.0, 42.0, 97.0, 141.0, 178.0, 148.0, 109.0, 58.0, 41.0, 21.0, 22.0, 7.0, 6.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0064239501953125, -0.00625300407409668, -0.006082057952880859, -0.005911111831665039, -0.005740165710449219, -0.0055692195892333984, -0.005398273468017578, -0.005227327346801758, -0.0050563812255859375, -0.004885435104370117, -0.004714488983154297, -0.0045435428619384766, -0.004372596740722656, -0.004201650619506836, -0.004030704498291016, -0.0038597583770751953, -0.003688812255859375, -0.0035178661346435547, -0.0033469200134277344, -0.003175973892211914, -0.0030050277709960938, -0.0028340816497802734, -0.002663135528564453, -0.002492189407348633, -0.0023212432861328125, -0.002150297164916992, -0.001979351043701172, -0.0018084049224853516, -0.0016374588012695312, -0.001466512680053711, -0.0012955665588378906, -0.0011246204376220703, -0.00095367431640625, -0.0007827281951904297, -0.0006117820739746094, -0.00044083595275878906, -0.00026988983154296875, -9.894371032714844e-05, 7.200241088867188e-05, 0.0002429485321044922, 0.0004138946533203125, 0.0005848407745361328, 0.0007557868957519531, 0.0009267330169677734, 0.0010976791381835938, 0.001268625259399414, 0.0014395713806152344, 0.0016105175018310547, 0.001781463623046875, 0.0019524097442626953, 0.0021233558654785156, 0.002294301986694336, 0.0024652481079101562, 0.0026361942291259766, 0.002807140350341797, 0.002978086471557617, 0.0031490325927734375, 0.003319978713989258, 0.003490924835205078, 0.0036618709564208984, 0.0038328170776367188, 0.004003763198852539, 0.004174709320068359, 0.00434565544128418, 0.0045166015625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 7.0, 9.0, 12.0, 18.0, 20.0, 31.0, 58.0, 82.0, 118.0, 151.0, 224.0, 349.0, 533.0, 819.0, 1255.0, 2040.0, 3329.0, 5468.0, 9783.0, 18869.0, 38845.0, 89453.0, 202259.0, 300046.0, 203097.0, 89200.0, 39088.0, 19007.0, 9854.0, 5610.0, 3155.0, 2026.0, 1263.0, 800.0, 552.0, 380.0, 253.0, 157.0, 99.0, 73.0, 47.0, 37.0, 26.0, 18.0, 12.0, 5.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0], "bins": [-59.59375, -57.81494140625, -56.0361328125, -54.25732421875, -52.478515625, -50.69970703125, -48.9208984375, -47.14208984375, -45.36328125, -43.58447265625, -41.8056640625, -40.02685546875, -38.248046875, -36.46923828125, -34.6904296875, -32.91162109375, -31.1328125, -29.35400390625, -27.5751953125, -25.79638671875, -24.017578125, -22.23876953125, -20.4599609375, -18.68115234375, -16.90234375, -15.12353515625, -13.3447265625, -11.56591796875, -9.787109375, -8.00830078125, -6.2294921875, -4.45068359375, -2.671875, -0.89306640625, 0.8857421875, 2.66455078125, 4.443359375, 6.22216796875, 8.0009765625, 9.77978515625, 11.55859375, 13.33740234375, 15.1162109375, 16.89501953125, 18.673828125, 20.45263671875, 22.2314453125, 24.01025390625, 25.7890625, 27.56787109375, 29.3466796875, 31.12548828125, 32.904296875, 34.68310546875, 36.4619140625, 38.24072265625, 40.01953125, 41.79833984375, 43.5771484375, 45.35595703125, 47.134765625, 48.91357421875, 50.6923828125, 52.47119140625, 54.25]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 1.0, 6.0, 7.0, 14.0, 11.0, 17.0, 23.0, 26.0, 41.0, 44.0, 61.0, 82.0, 82.0, 105.0, 85.0, 90.0, 71.0, 58.0, 41.0, 35.0, 23.0, 18.0, 12.0, 7.0, 4.0, 8.0, 4.0, 3.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.71875, -23.889404296875, -23.06005859375, -22.230712890625, -21.4013671875, -20.572021484375, -19.74267578125, -18.913330078125, -18.083984375, -17.254638671875, -16.42529296875, -15.595947265625, -14.7666015625, -13.937255859375, -13.10791015625, -12.278564453125, -11.44921875, -10.619873046875, -9.79052734375, -8.961181640625, -8.1318359375, -7.302490234375, -6.47314453125, -5.643798828125, -4.814453125, -3.985107421875, -3.15576171875, -2.326416015625, -1.4970703125, -0.667724609375, 0.16162109375, 0.990966796875, 1.8203125, 2.649658203125, 3.47900390625, 4.308349609375, 5.1376953125, 5.967041015625, 6.79638671875, 7.625732421875, 8.455078125, 9.284423828125, 10.11376953125, 10.943115234375, 11.7724609375, 12.601806640625, 13.43115234375, 14.260498046875, 15.08984375, 15.919189453125, 16.74853515625, 17.577880859375, 18.4072265625, 19.236572265625, 20.06591796875, 20.895263671875, 21.724609375, 22.553955078125, 23.38330078125, 24.212646484375, 25.0419921875, 25.871337890625, 26.70068359375, 27.530029296875, 28.359375]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 1.0, 5.0, 2.0, 0.0, 6.0, 9.0, 14.0, 14.0, 16.0, 30.0, 22.0, 32.0, 38.0, 57.0, 54.0, 39.0, 58.0, 54.0, 72.0, 64.0, 57.0, 53.0, 56.0, 49.0, 46.0, 34.0, 22.0, 30.0, 18.0, 9.0, 6.0, 13.0, 5.0, 8.0, 2.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.05623245239258, -48.432655334472656, -46.809078216552734, -45.18550109863281, -43.56192398071289, -41.93834686279297, -40.31477355957031, -38.69119644165039, -37.06761932373047, -35.44404220581055, -33.820465087890625, -32.1968879699707, -30.573312759399414, -28.949735641479492, -27.32615852355957, -25.70258331298828, -24.079004287719727, -22.455427169799805, -20.831850051879883, -19.208274841308594, -17.584697723388672, -15.96112060546875, -14.337543487548828, -12.713967323303223, -11.0903902053833, -9.466813087463379, -7.843236923217773, -6.219659805297852, -4.596083164215088, -2.972506523132324, -1.3489294052124023, 0.2746467590332031, 1.898223876953125, 3.5218005180358887, 5.145377159118652, 6.768954277038574, 8.39253044128418, 10.016107559204102, 11.639684677124023, 13.263260841369629, 14.88683795928955, 16.510414123535156, 18.133991241455078, 19.757568359375, 21.381145477294922, 23.004722595214844, 24.628299713134766, 26.251874923706055, 27.875452041625977, 29.4990291595459, 31.12260627746582, 32.74618148803711, 34.36975860595703, 35.99333572387695, 37.616912841796875, 39.2404899597168, 40.86406707763672, 42.48764419555664, 44.11122131347656, 45.734798431396484, 47.358375549316406, 48.98194885253906, 50.60552978515625, 52.229103088378906, 53.85268020629883]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 8.0, 10.0, 8.0, 11.0, 15.0, 12.0, 17.0, 22.0, 20.0, 32.0, 22.0, 27.0, 31.0, 24.0, 28.0, 41.0, 40.0, 50.0, 55.0, 27.0, 41.0, 41.0, 35.0, 28.0, 36.0, 36.0, 39.0, 23.0, 27.0, 29.0, 23.0, 21.0, 18.0, 15.0, 19.0, 13.0, 11.0, 10.0, 7.0, 3.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0], "bins": [-41.95718002319336, -40.70591735839844, -39.45465087890625, -38.20338821411133, -36.952125549316406, -35.700862884521484, -34.44960021972656, -33.198333740234375, -31.947071075439453, -30.69580841064453, -29.444543838500977, -28.193279266357422, -26.9420166015625, -25.690753936767578, -24.439489364624023, -23.18822479248047, -21.936962127685547, -20.685699462890625, -19.43443489074707, -18.183170318603516, -16.931907653808594, -15.680644035339355, -14.429380416870117, -13.178116798400879, -11.92685317993164, -10.675589561462402, -9.424325942993164, -8.173062324523926, -6.9217987060546875, -5.670535087585449, -4.419271469116211, -3.1680078506469727, -1.9167442321777344, -0.6654806137084961, 0.5857830047607422, 1.8370466232299805, 3.0883102416992188, 4.339573860168457, 5.590837478637695, 6.842101097106934, 8.093364715576172, 9.34462833404541, 10.595891952514648, 11.847155570983887, 13.098419189453125, 14.349682807922363, 15.600946426391602, 16.852210998535156, 18.103473663330078, 19.354736328125, 20.606000900268555, 21.85726547241211, 23.10852813720703, 24.359790802001953, 25.611055374145508, 26.862319946289062, 28.113582611083984, 29.364845275878906, 30.61610984802246, 31.867374420166016, 33.11863708496094, 34.36989974975586, 35.62116241455078, 36.87242889404297, 38.12369155883789]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 10.0, 18.0, 29.0, 32.0, 56.0, 89.0, 120.0, 229.0, 321.0, 508.0, 769.0, 1218.0, 1986.0, 3195.0, 5218.0, 7978.0, 13360.0, 21682.0, 34792.0, 54989.0, 82508.0, 117315.0, 147298.0, 152921.0, 130741.0, 95787.0, 64495.0, 41984.0, 25982.0, 16393.0, 9931.0, 6185.0, 3803.0, 2401.0, 1495.0, 992.0, 608.0, 398.0, 248.0, 162.0, 110.0, 59.0, 60.0, 33.0, 12.0, 18.0, 11.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-41.125, -39.88623046875, -38.6474609375, -37.40869140625, -36.169921875, -34.93115234375, -33.6923828125, -32.45361328125, -31.21484375, -29.97607421875, -28.7373046875, -27.49853515625, -26.259765625, -25.02099609375, -23.7822265625, -22.54345703125, -21.3046875, -20.06591796875, -18.8271484375, -17.58837890625, -16.349609375, -15.11083984375, -13.8720703125, -12.63330078125, -11.39453125, -10.15576171875, -8.9169921875, -7.67822265625, -6.439453125, -5.20068359375, -3.9619140625, -2.72314453125, -1.484375, -0.24560546875, 0.9931640625, 2.23193359375, 3.470703125, 4.70947265625, 5.9482421875, 7.18701171875, 8.42578125, 9.66455078125, 10.9033203125, 12.14208984375, 13.380859375, 14.61962890625, 15.8583984375, 17.09716796875, 18.3359375, 19.57470703125, 20.8134765625, 22.05224609375, 23.291015625, 24.52978515625, 25.7685546875, 27.00732421875, 28.24609375, 29.48486328125, 30.7236328125, 31.96240234375, 33.201171875, 34.43994140625, 35.6787109375, 36.91748046875, 38.15625]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 4.0, 7.0, 7.0, 11.0, 6.0, 8.0, 21.0, 19.0, 14.0, 17.0, 19.0, 31.0, 23.0, 27.0, 31.0, 27.0, 37.0, 39.0, 37.0, 38.0, 45.0, 49.0, 39.0, 33.0, 36.0, 32.0, 41.0, 32.0, 33.0, 33.0, 24.0, 25.0, 26.0, 27.0, 18.0, 19.0, 13.0, 10.0, 3.0, 10.0, 5.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-37.4375, -36.24951171875, -35.0615234375, -33.87353515625, -32.685546875, -31.49755859375, -30.3095703125, -29.12158203125, -27.93359375, -26.74560546875, -25.5576171875, -24.36962890625, -23.181640625, -21.99365234375, -20.8056640625, -19.61767578125, -18.4296875, -17.24169921875, -16.0537109375, -14.86572265625, -13.677734375, -12.48974609375, -11.3017578125, -10.11376953125, -8.92578125, -7.73779296875, -6.5498046875, -5.36181640625, -4.173828125, -2.98583984375, -1.7978515625, -0.60986328125, 0.578125, 1.76611328125, 2.9541015625, 4.14208984375, 5.330078125, 6.51806640625, 7.7060546875, 8.89404296875, 10.08203125, 11.27001953125, 12.4580078125, 13.64599609375, 14.833984375, 16.02197265625, 17.2099609375, 18.39794921875, 19.5859375, 20.77392578125, 21.9619140625, 23.14990234375, 24.337890625, 25.52587890625, 26.7138671875, 27.90185546875, 29.08984375, 30.27783203125, 31.4658203125, 32.65380859375, 33.841796875, 35.02978515625, 36.2177734375, 37.40576171875, 38.59375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 9.0, 12.0, 11.0, 19.0, 23.0, 32.0, 71.0, 109.0, 139.0, 238.0, 316.0, 511.0, 736.0, 1154.0, 1763.0, 2675.0, 4248.0, 6646.0, 10092.0, 15752.0, 24521.0, 37484.0, 56261.0, 81122.0, 109266.0, 131553.0, 137465.0, 123154.0, 97196.0, 69339.0, 47437.0, 31581.0, 20340.0, 13259.0, 8595.0, 5374.0, 3503.0, 2245.0, 1526.0, 925.0, 639.0, 434.0, 266.0, 163.0, 126.0, 81.0, 45.0, 42.0, 16.0, 17.0, 8.0, 7.0, 8.0, 4.0, 7.0, 1.0, 3.0, 2.0], "bins": [-32.40625, -31.402587890625, -30.39892578125, -29.395263671875, -28.3916015625, -27.387939453125, -26.38427734375, -25.380615234375, -24.376953125, -23.373291015625, -22.36962890625, -21.365966796875, -20.3623046875, -19.358642578125, -18.35498046875, -17.351318359375, -16.34765625, -15.343994140625, -14.34033203125, -13.336669921875, -12.3330078125, -11.329345703125, -10.32568359375, -9.322021484375, -8.318359375, -7.314697265625, -6.31103515625, -5.307373046875, -4.3037109375, -3.300048828125, -2.29638671875, -1.292724609375, -0.2890625, 0.714599609375, 1.71826171875, 2.721923828125, 3.7255859375, 4.729248046875, 5.73291015625, 6.736572265625, 7.740234375, 8.743896484375, 9.74755859375, 10.751220703125, 11.7548828125, 12.758544921875, 13.76220703125, 14.765869140625, 15.76953125, 16.773193359375, 17.77685546875, 18.780517578125, 19.7841796875, 20.787841796875, 21.79150390625, 22.795166015625, 23.798828125, 24.802490234375, 25.80615234375, 26.809814453125, 27.8134765625, 28.817138671875, 29.82080078125, 30.824462890625, 31.828125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 12.0, 6.0, 13.0, 7.0, 15.0, 16.0, 16.0, 13.0, 21.0, 18.0, 25.0, 26.0, 37.0, 23.0, 27.0, 31.0, 45.0, 38.0, 38.0, 42.0, 48.0, 31.0, 38.0, 46.0, 44.0, 34.0, 29.0, 31.0, 29.0, 24.0, 13.0, 25.0, 24.0, 14.0, 17.0, 12.0, 12.0, 12.0, 7.0, 7.0, 11.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.921875, -21.212646484375, -20.50341796875, -19.794189453125, -19.0849609375, -18.375732421875, -17.66650390625, -16.957275390625, -16.248046875, -15.538818359375, -14.82958984375, -14.120361328125, -13.4111328125, -12.701904296875, -11.99267578125, -11.283447265625, -10.57421875, -9.864990234375, -9.15576171875, -8.446533203125, -7.7373046875, -7.028076171875, -6.31884765625, -5.609619140625, -4.900390625, -4.191162109375, -3.48193359375, -2.772705078125, -2.0634765625, -1.354248046875, -0.64501953125, 0.064208984375, 0.7734375, 1.482666015625, 2.19189453125, 2.901123046875, 3.6103515625, 4.319580078125, 5.02880859375, 5.738037109375, 6.447265625, 7.156494140625, 7.86572265625, 8.574951171875, 9.2841796875, 9.993408203125, 10.70263671875, 11.411865234375, 12.12109375, 12.830322265625, 13.53955078125, 14.248779296875, 14.9580078125, 15.667236328125, 16.37646484375, 17.085693359375, 17.794921875, 18.504150390625, 19.21337890625, 19.922607421875, 20.6318359375, 21.341064453125, 22.05029296875, 22.759521484375, 23.46875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 2.0, 4.0, 5.0, 3.0, 8.0, 5.0, 12.0, 20.0, 17.0, 27.0, 43.0, 46.0, 80.0, 93.0, 139.0, 168.0, 248.0, 352.0, 498.0, 770.0, 1068.0, 1859.0, 3158.0, 6060.0, 12692.0, 31188.0, 84872.0, 233400.0, 360935.0, 193120.0, 68165.0, 25631.0, 10820.0, 5189.0, 2798.0, 1664.0, 1090.0, 699.0, 426.0, 338.0, 214.0, 181.0, 133.0, 77.0, 55.0, 44.0, 45.0, 36.0, 15.0, 19.0, 11.0, 7.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.5625, -47.98388671875, -46.4052734375, -44.82666015625, -43.248046875, -41.66943359375, -40.0908203125, -38.51220703125, -36.93359375, -35.35498046875, -33.7763671875, -32.19775390625, -30.619140625, -29.04052734375, -27.4619140625, -25.88330078125, -24.3046875, -22.72607421875, -21.1474609375, -19.56884765625, -17.990234375, -16.41162109375, -14.8330078125, -13.25439453125, -11.67578125, -10.09716796875, -8.5185546875, -6.93994140625, -5.361328125, -3.78271484375, -2.2041015625, -0.62548828125, 0.953125, 2.53173828125, 4.1103515625, 5.68896484375, 7.267578125, 8.84619140625, 10.4248046875, 12.00341796875, 13.58203125, 15.16064453125, 16.7392578125, 18.31787109375, 19.896484375, 21.47509765625, 23.0537109375, 24.63232421875, 26.2109375, 27.78955078125, 29.3681640625, 30.94677734375, 32.525390625, 34.10400390625, 35.6826171875, 37.26123046875, 38.83984375, 40.41845703125, 41.9970703125, 43.57568359375, 45.154296875, 46.73291015625, 48.3115234375, 49.89013671875, 51.46875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 1.0, 5.0, 7.0, 15.0, 26.0, 31.0, 60.0, 69.0, 90.0, 135.0, 138.0, 120.0, 93.0, 66.0, 40.0, 38.0, 19.0, 6.0, 14.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00440216064453125, -0.004246711730957031, -0.0040912628173828125, -0.003935813903808594, -0.003780364990234375, -0.0036249160766601562, -0.0034694671630859375, -0.0033140182495117188, -0.0031585693359375, -0.0030031204223632812, -0.0028476715087890625, -0.0026922225952148438, -0.002536773681640625, -0.0023813247680664062, -0.0022258758544921875, -0.0020704269409179688, -0.00191497802734375, -0.0017595291137695312, -0.0016040802001953125, -0.0014486312866210938, -0.001293182373046875, -0.0011377334594726562, -0.0009822845458984375, -0.0008268356323242188, -0.00067138671875, -0.0005159378051757812, -0.0003604888916015625, -0.00020503997802734375, -4.9591064453125e-05, 0.00010585784912109375, 0.0002613067626953125, 0.00041675567626953125, 0.00057220458984375, 0.0007276535034179688, 0.0008831024169921875, 0.0010385513305664062, 0.001194000244140625, 0.0013494491577148438, 0.0015048980712890625, 0.0016603469848632812, 0.0018157958984375, 0.0019712448120117188, 0.0021266937255859375, 0.0022821426391601562, 0.002437591552734375, 0.0025930404663085938, 0.0027484893798828125, 0.0029039382934570312, 0.00305938720703125, 0.0032148361206054688, 0.0033702850341796875, 0.0035257339477539062, 0.003681182861328125, 0.0038366317749023438, 0.0039920806884765625, 0.004147529602050781, 0.004302978515625, 0.004458427429199219, 0.0046138763427734375, 0.004769325256347656, 0.004924774169921875, 0.005080223083496094, 0.0052356719970703125, 0.005391120910644531, 0.00554656982421875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 9.0, 6.0, 13.0, 22.0, 32.0, 41.0, 58.0, 75.0, 116.0, 165.0, 279.0, 324.0, 506.0, 808.0, 1139.0, 1765.0, 2661.0, 4071.0, 6740.0, 11136.0, 18846.0, 32743.0, 57284.0, 97009.0, 149795.0, 188198.0, 172547.0, 122548.0, 74373.0, 43168.0, 24369.0, 14175.0, 8729.0, 5229.0, 3240.0, 2137.0, 1349.0, 951.0, 571.0, 418.0, 266.0, 204.0, 130.0, 109.0, 60.0, 52.0, 38.0, 14.0, 10.0, 19.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.9375, -23.183349609375, -22.42919921875, -21.675048828125, -20.9208984375, -20.166748046875, -19.41259765625, -18.658447265625, -17.904296875, -17.150146484375, -16.39599609375, -15.641845703125, -14.8876953125, -14.133544921875, -13.37939453125, -12.625244140625, -11.87109375, -11.116943359375, -10.36279296875, -9.608642578125, -8.8544921875, -8.100341796875, -7.34619140625, -6.592041015625, -5.837890625, -5.083740234375, -4.32958984375, -3.575439453125, -2.8212890625, -2.067138671875, -1.31298828125, -0.558837890625, 0.1953125, 0.949462890625, 1.70361328125, 2.457763671875, 3.2119140625, 3.966064453125, 4.72021484375, 5.474365234375, 6.228515625, 6.982666015625, 7.73681640625, 8.490966796875, 9.2451171875, 9.999267578125, 10.75341796875, 11.507568359375, 12.26171875, 13.015869140625, 13.77001953125, 14.524169921875, 15.2783203125, 16.032470703125, 16.78662109375, 17.540771484375, 18.294921875, 19.049072265625, 19.80322265625, 20.557373046875, 21.3115234375, 22.065673828125, 22.81982421875, 23.573974609375, 24.328125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 9.0, 6.0, 8.0, 9.0, 14.0, 11.0, 16.0, 28.0, 33.0, 33.0, 33.0, 47.0, 50.0, 72.0, 71.0, 62.0, 78.0, 58.0, 54.0, 49.0, 44.0, 43.0, 27.0, 31.0, 25.0, 13.0, 12.0, 16.0, 12.0, 9.0, 7.0, 6.0, 4.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.7421875, -10.4505615234375, -10.158935546875, -9.8673095703125, -9.57568359375, -9.2840576171875, -8.992431640625, -8.7008056640625, -8.4091796875, -8.1175537109375, -7.825927734375, -7.5343017578125, -7.24267578125, -6.9510498046875, -6.659423828125, -6.3677978515625, -6.076171875, -5.7845458984375, -5.492919921875, -5.2012939453125, -4.90966796875, -4.6180419921875, -4.326416015625, -4.0347900390625, -3.7431640625, -3.4515380859375, -3.159912109375, -2.8682861328125, -2.57666015625, -2.2850341796875, -1.993408203125, -1.7017822265625, -1.41015625, -1.1185302734375, -0.826904296875, -0.5352783203125, -0.24365234375, 0.0479736328125, 0.339599609375, 0.6312255859375, 0.9228515625, 1.2144775390625, 1.506103515625, 1.7977294921875, 2.08935546875, 2.3809814453125, 2.672607421875, 2.9642333984375, 3.255859375, 3.5474853515625, 3.839111328125, 4.1307373046875, 4.42236328125, 4.7139892578125, 5.005615234375, 5.2972412109375, 5.5888671875, 5.8804931640625, 6.172119140625, 6.4637451171875, 6.75537109375, 7.0469970703125, 7.338623046875, 7.6302490234375, 7.921875]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 1.0, 4.0, 4.0, 8.0, 6.0, 11.0, 13.0, 20.0, 23.0, 23.0, 30.0, 35.0, 39.0, 53.0, 57.0, 49.0, 57.0, 79.0, 57.0, 65.0, 70.0, 62.0, 58.0, 40.0, 27.0, 26.0, 20.0, 20.0, 15.0, 7.0, 2.0, 6.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.41061019897461, -48.828453063964844, -47.246299743652344, -45.66414260864258, -44.08198547363281, -42.49983215332031, -40.91767501831055, -39.33551788330078, -37.75336456298828, -36.171207427978516, -34.589054107666016, -33.00689697265625, -31.424741744995117, -29.842586517333984, -28.26042938232422, -26.678274154663086, -25.09611701965332, -23.513961791992188, -21.931804656982422, -20.34964942932129, -18.767494201660156, -17.18533706665039, -15.603181838989258, -14.021026611328125, -12.438870429992676, -10.856714248657227, -9.274559020996094, -7.6924028396606445, -6.1102471351623535, -4.5280914306640625, -2.9459352493286133, -1.3637800216674805, 0.21837615966796875, 1.8005319833755493, 3.38268780708313, 4.96484375, 6.546999454498291, 8.129155158996582, 9.711311340332031, 11.293466567993164, 12.875622749328613, 14.457778930664062, 16.039934158325195, 17.622089385986328, 19.204246520996094, 20.786401748657227, 22.36855697631836, 23.950714111328125, 25.532869338989258, 27.11502456665039, 28.697181701660156, 30.27933692932129, 31.861492156982422, 33.44364929199219, 35.02580261230469, 36.60795974731445, 38.19011688232422, 39.772274017333984, 41.354427337646484, 42.93658447265625, 44.518741607666016, 46.100894927978516, 47.68305206298828, 49.26520538330078, 50.84736251831055]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 5.0, 5.0, 4.0, 5.0, 12.0, 10.0, 9.0, 13.0, 20.0, 14.0, 25.0, 19.0, 20.0, 26.0, 36.0, 40.0, 30.0, 36.0, 47.0, 39.0, 39.0, 42.0, 26.0, 33.0, 41.0, 48.0, 37.0, 34.0, 32.0, 28.0, 39.0, 27.0, 22.0, 28.0, 20.0, 17.0, 15.0, 19.0, 12.0, 7.0, 4.0, 1.0, 4.0, 6.0, 7.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-40.945762634277344, -39.7737922668457, -38.60182189941406, -37.429847717285156, -36.257877349853516, -35.085906982421875, -33.913936614990234, -32.741966247558594, -31.56999397277832, -30.39802360534668, -29.226051330566406, -28.054080963134766, -26.882110595703125, -25.71013832092285, -24.53816795349121, -23.366195678710938, -22.194225311279297, -21.022254943847656, -19.850282669067383, -18.678312301635742, -17.50634002685547, -16.334369659423828, -15.162399291992188, -13.99042797088623, -12.818456649780273, -11.646485328674316, -10.47451400756836, -9.302543640136719, -8.130572319030762, -6.958600997924805, -5.786630153656006, -4.614659309387207, -3.44268798828125, -2.270716905593872, -1.0987458229064941, 0.07322525978088379, 1.2451963424682617, 2.4171676635742188, 3.5891385078430176, 4.761109352111816, 5.933080673217773, 7.1050519943237305, 8.277023315429688, 9.448993682861328, 10.620965003967285, 11.792936325073242, 12.964906692504883, 14.13687801361084, 15.308849334716797, 16.480819702148438, 17.65279197692871, 18.82476234436035, 19.996734619140625, 21.168704986572266, 22.340675354003906, 23.512645721435547, 24.68461799621582, 25.85658836364746, 27.028560638427734, 28.200531005859375, 29.372501373291016, 30.54447364807129, 31.71644401550293, 32.8884162902832, 34.060386657714844]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 5.0, 8.0, 13.0, 30.0, 52.0, 75.0, 94.0, 171.0, 263.0, 385.0, 645.0, 949.0, 1478.0, 2152.0, 3267.0, 5214.0, 8384.0, 12862.0, 21182.0, 34367.0, 57172.0, 96861.0, 166869.0, 286547.0, 470811.0, 664112.0, 733194.0, 611312.0, 409949.0, 245962.0, 142854.0, 84457.0, 49803.0, 30466.0, 19128.0, 11910.0, 7491.0, 4870.0, 3087.0, 2018.0, 1289.0, 861.0, 536.0, 376.0, 242.0, 176.0, 133.0, 67.0, 52.0, 32.0, 22.0, 10.0, 8.0, 9.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-26.28125, -25.41552734375, -24.5498046875, -23.68408203125, -22.818359375, -21.95263671875, -21.0869140625, -20.22119140625, -19.35546875, -18.48974609375, -17.6240234375, -16.75830078125, -15.892578125, -15.02685546875, -14.1611328125, -13.29541015625, -12.4296875, -11.56396484375, -10.6982421875, -9.83251953125, -8.966796875, -8.10107421875, -7.2353515625, -6.36962890625, -5.50390625, -4.63818359375, -3.7724609375, -2.90673828125, -2.041015625, -1.17529296875, -0.3095703125, 0.55615234375, 1.421875, 2.28759765625, 3.1533203125, 4.01904296875, 4.884765625, 5.75048828125, 6.6162109375, 7.48193359375, 8.34765625, 9.21337890625, 10.0791015625, 10.94482421875, 11.810546875, 12.67626953125, 13.5419921875, 14.40771484375, 15.2734375, 16.13916015625, 17.0048828125, 17.87060546875, 18.736328125, 19.60205078125, 20.4677734375, 21.33349609375, 22.19921875, 23.06494140625, 23.9306640625, 24.79638671875, 25.662109375, 26.52783203125, 27.3935546875, 28.25927734375, 29.125]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 6.0, 4.0, 4.0, 2.0, 3.0, 9.0, 9.0, 16.0, 15.0, 13.0, 15.0, 20.0, 18.0, 14.0, 23.0, 27.0, 25.0, 30.0, 32.0, 30.0, 35.0, 37.0, 37.0, 44.0, 32.0, 39.0, 35.0, 36.0, 23.0, 37.0, 29.0, 21.0, 34.0, 27.0, 44.0, 22.0, 24.0, 22.0, 19.0, 18.0, 17.0, 12.0, 12.0, 9.0, 5.0, 3.0, 3.0, 5.0, 5.0, 3.0, 2.0, 4.0, 1.0, 4.0], "bins": [-26.0, -25.259033203125, -24.51806640625, -23.777099609375, -23.0361328125, -22.295166015625, -21.55419921875, -20.813232421875, -20.072265625, -19.331298828125, -18.59033203125, -17.849365234375, -17.1083984375, -16.367431640625, -15.62646484375, -14.885498046875, -14.14453125, -13.403564453125, -12.66259765625, -11.921630859375, -11.1806640625, -10.439697265625, -9.69873046875, -8.957763671875, -8.216796875, -7.475830078125, -6.73486328125, -5.993896484375, -5.2529296875, -4.511962890625, -3.77099609375, -3.030029296875, -2.2890625, -1.548095703125, -0.80712890625, -0.066162109375, 0.6748046875, 1.415771484375, 2.15673828125, 2.897705078125, 3.638671875, 4.379638671875, 5.12060546875, 5.861572265625, 6.6025390625, 7.343505859375, 8.08447265625, 8.825439453125, 9.56640625, 10.307373046875, 11.04833984375, 11.789306640625, 12.5302734375, 13.271240234375, 14.01220703125, 14.753173828125, 15.494140625, 16.235107421875, 16.97607421875, 17.717041015625, 18.4580078125, 19.198974609375, 19.93994140625, 20.680908203125, 21.421875]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 6.0, 6.0, 9.0, 13.0, 28.0, 36.0, 47.0, 74.0, 94.0, 163.0, 272.0, 367.0, 608.0, 961.0, 1476.0, 2503.0, 3905.0, 6369.0, 10576.0, 17554.0, 30280.0, 51555.0, 88417.0, 152494.0, 259206.0, 422624.0, 626253.0, 749351.0, 650134.0, 447870.0, 276649.0, 163944.0, 95059.0, 55061.0, 32055.0, 18930.0, 11283.0, 7012.0, 4055.0, 2524.0, 1575.0, 1047.0, 629.0, 427.0, 254.0, 180.0, 118.0, 74.0, 53.0, 38.0, 26.0, 15.0, 11.0, 7.0, 8.0, 3.0, 8.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.4375, -27.507080078125, -26.57666015625, -25.646240234375, -24.7158203125, -23.785400390625, -22.85498046875, -21.924560546875, -20.994140625, -20.063720703125, -19.13330078125, -18.202880859375, -17.2724609375, -16.342041015625, -15.41162109375, -14.481201171875, -13.55078125, -12.620361328125, -11.68994140625, -10.759521484375, -9.8291015625, -8.898681640625, -7.96826171875, -7.037841796875, -6.107421875, -5.177001953125, -4.24658203125, -3.316162109375, -2.3857421875, -1.455322265625, -0.52490234375, 0.405517578125, 1.3359375, 2.266357421875, 3.19677734375, 4.127197265625, 5.0576171875, 5.988037109375, 6.91845703125, 7.848876953125, 8.779296875, 9.709716796875, 10.64013671875, 11.570556640625, 12.5009765625, 13.431396484375, 14.36181640625, 15.292236328125, 16.22265625, 17.153076171875, 18.08349609375, 19.013916015625, 19.9443359375, 20.874755859375, 21.80517578125, 22.735595703125, 23.666015625, 24.596435546875, 25.52685546875, 26.457275390625, 27.3876953125, 28.318115234375, 29.24853515625, 30.178955078125, 31.109375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 5.0, 1.0, 4.0, 2.0, 5.0, 10.0, 6.0, 14.0, 11.0, 20.0, 27.0, 27.0, 28.0, 50.0, 54.0, 65.0, 82.0, 94.0, 93.0, 133.0, 157.0, 140.0, 195.0, 211.0, 230.0, 229.0, 235.0, 260.0, 200.0, 209.0, 183.0, 178.0, 144.0, 124.0, 131.0, 107.0, 72.0, 77.0, 55.0, 48.0, 30.0, 35.0, 15.0, 16.0, 19.0, 11.0, 9.0, 11.0, 10.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-10.328125, -9.976806640625, -9.62548828125, -9.274169921875, -8.9228515625, -8.571533203125, -8.22021484375, -7.868896484375, -7.517578125, -7.166259765625, -6.81494140625, -6.463623046875, -6.1123046875, -5.760986328125, -5.40966796875, -5.058349609375, -4.70703125, -4.355712890625, -4.00439453125, -3.653076171875, -3.3017578125, -2.950439453125, -2.59912109375, -2.247802734375, -1.896484375, -1.545166015625, -1.19384765625, -0.842529296875, -0.4912109375, -0.139892578125, 0.21142578125, 0.562744140625, 0.9140625, 1.265380859375, 1.61669921875, 1.968017578125, 2.3193359375, 2.670654296875, 3.02197265625, 3.373291015625, 3.724609375, 4.075927734375, 4.42724609375, 4.778564453125, 5.1298828125, 5.481201171875, 5.83251953125, 6.183837890625, 6.53515625, 6.886474609375, 7.23779296875, 7.589111328125, 7.9404296875, 8.291748046875, 8.64306640625, 8.994384765625, 9.345703125, 9.697021484375, 10.04833984375, 10.399658203125, 10.7509765625, 11.102294921875, 11.45361328125, 11.804931640625, 12.15625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 6.0, 3.0, 4.0, 7.0, 6.0, 8.0, 9.0, 14.0, 24.0, 23.0, 20.0, 29.0, 25.0, 36.0, 37.0, 46.0, 43.0, 63.0, 45.0, 69.0, 46.0, 51.0, 40.0, 51.0, 53.0, 40.0, 33.0, 24.0, 20.0, 20.0, 12.0, 20.0, 13.0, 9.0, 15.0, 11.0, 7.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-35.933067321777344, -34.862876892089844, -33.792686462402344, -32.72249221801758, -31.652301788330078, -30.582111358642578, -29.511919021606445, -28.441726684570312, -27.371536254882812, -26.301345825195312, -25.23115348815918, -24.160961151123047, -23.090770721435547, -22.020580291748047, -20.950387954711914, -19.88019561767578, -18.81000518798828, -17.73981475830078, -16.66962242126465, -15.599431037902832, -14.529239654541016, -13.4590482711792, -12.388856887817383, -11.318665504455566, -10.24847412109375, -9.178282737731934, -8.108091354370117, -7.037899971008301, -5.967708587646484, -4.897517204284668, -3.8273258209228516, -2.757134437561035, -1.6869392395019531, -0.6167478561401367, 0.4534435272216797, 1.523634910583496, 2.5938262939453125, 3.664017677307129, 4.734209060668945, 5.804400444030762, 6.874591827392578, 7.9447832107543945, 9.014974594116211, 10.085165977478027, 11.155357360839844, 12.22554874420166, 13.295740127563477, 14.365931510925293, 15.43612289428711, 16.50631332397461, 17.576505661010742, 18.646697998046875, 19.716888427734375, 20.787078857421875, 21.857271194458008, 22.92746353149414, 23.99765396118164, 25.06784439086914, 26.138036727905273, 27.208229064941406, 28.278419494628906, 29.348609924316406, 30.41880226135254, 31.488994598388672, 32.55918502807617]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 3.0, 4.0, 8.0, 2.0, 10.0, 6.0, 8.0, 5.0, 16.0, 15.0, 27.0, 21.0, 24.0, 34.0, 29.0, 31.0, 36.0, 25.0, 34.0, 44.0, 46.0, 53.0, 31.0, 44.0, 50.0, 42.0, 38.0, 37.0, 40.0, 33.0, 29.0, 28.0, 25.0, 17.0, 13.0, 15.0, 17.0, 15.0, 10.0, 9.0, 10.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-29.264554977416992, -28.384599685668945, -27.5046443939209, -26.62468910217285, -25.744733810424805, -24.864778518676758, -23.984825134277344, -23.104869842529297, -22.22491455078125, -21.344959259033203, -20.465003967285156, -19.58504867553711, -18.705093383789062, -17.825138092041016, -16.94518280029297, -16.065227508544922, -15.185272216796875, -14.305316925048828, -13.425361633300781, -12.545406341552734, -11.665451049804688, -10.78549575805664, -9.90554141998291, -9.025586128234863, -8.145630836486816, -7.2656755447387695, -6.385720252990723, -5.505765438079834, -4.625810146331787, -3.7458548545837402, -2.8659000396728516, -1.9859447479248047, -1.1059894561767578, -0.2260342836380005, 0.6539208889007568, 1.5338759422302246, 2.4138312339782715, 3.2937865257263184, 4.173741340637207, 5.053696632385254, 5.933651924133301, 6.813607215881348, 7.6935625076293945, 8.573516845703125, 9.453472137451172, 10.333427429199219, 11.213382720947266, 12.093338012695312, 12.97329330444336, 13.853248596191406, 14.733203887939453, 15.6131591796875, 16.493114471435547, 17.373069763183594, 18.25302505493164, 19.132980346679688, 20.012935638427734, 20.89289093017578, 21.772846221923828, 22.652801513671875, 23.532756805419922, 24.41271209716797, 25.292667388916016, 26.172622680664062, 27.052576065063477]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 7.0, 14.0, 35.0, 33.0, 60.0, 78.0, 108.0, 174.0, 271.0, 424.0, 650.0, 1033.0, 1687.0, 2799.0, 4627.0, 7967.0, 13674.0, 24296.0, 43021.0, 78120.0, 132827.0, 193216.0, 200139.0, 144819.0, 86150.0, 48282.0, 26953.0, 15204.0, 8608.0, 5130.0, 3081.0, 1923.0, 1169.0, 674.0, 430.0, 291.0, 197.0, 123.0, 99.0, 57.0, 33.0, 27.0, 13.0, 9.0, 7.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-43.625, -42.306640625, -40.98828125, -39.669921875, -38.3515625, -37.033203125, -35.71484375, -34.396484375, -33.078125, -31.759765625, -30.44140625, -29.123046875, -27.8046875, -26.486328125, -25.16796875, -23.849609375, -22.53125, -21.212890625, -19.89453125, -18.576171875, -17.2578125, -15.939453125, -14.62109375, -13.302734375, -11.984375, -10.666015625, -9.34765625, -8.029296875, -6.7109375, -5.392578125, -4.07421875, -2.755859375, -1.4375, -0.119140625, 1.19921875, 2.517578125, 3.8359375, 5.154296875, 6.47265625, 7.791015625, 9.109375, 10.427734375, 11.74609375, 13.064453125, 14.3828125, 15.701171875, 17.01953125, 18.337890625, 19.65625, 20.974609375, 22.29296875, 23.611328125, 24.9296875, 26.248046875, 27.56640625, 28.884765625, 30.203125, 31.521484375, 32.83984375, 34.158203125, 35.4765625, 36.794921875, 38.11328125, 39.431640625, 40.75]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 3.0, 4.0, 8.0, 3.0, 5.0, 8.0, 11.0, 14.0, 13.0, 10.0, 26.0, 24.0, 19.0, 27.0, 19.0, 37.0, 32.0, 35.0, 32.0, 37.0, 43.0, 47.0, 49.0, 47.0, 42.0, 42.0, 42.0, 36.0, 35.0, 29.0, 19.0, 34.0, 20.0, 14.0, 33.0, 18.0, 14.0, 17.0, 8.0, 10.0, 8.0, 11.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-28.78125, -27.923095703125, -27.06494140625, -26.206787109375, -25.3486328125, -24.490478515625, -23.63232421875, -22.774169921875, -21.916015625, -21.057861328125, -20.19970703125, -19.341552734375, -18.4833984375, -17.625244140625, -16.76708984375, -15.908935546875, -15.05078125, -14.192626953125, -13.33447265625, -12.476318359375, -11.6181640625, -10.760009765625, -9.90185546875, -9.043701171875, -8.185546875, -7.327392578125, -6.46923828125, -5.611083984375, -4.7529296875, -3.894775390625, -3.03662109375, -2.178466796875, -1.3203125, -0.462158203125, 0.39599609375, 1.254150390625, 2.1123046875, 2.970458984375, 3.82861328125, 4.686767578125, 5.544921875, 6.403076171875, 7.26123046875, 8.119384765625, 8.9775390625, 9.835693359375, 10.69384765625, 11.552001953125, 12.41015625, 13.268310546875, 14.12646484375, 14.984619140625, 15.8427734375, 16.700927734375, 17.55908203125, 18.417236328125, 19.275390625, 20.133544921875, 20.99169921875, 21.849853515625, 22.7080078125, 23.566162109375, 24.42431640625, 25.282470703125, 26.140625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 6.0, 1.0, 2.0, 9.0, 7.0, 7.0, 19.0, 23.0, 30.0, 50.0, 64.0, 77.0, 118.0, 212.0, 289.0, 406.0, 665.0, 984.0, 1595.0, 2476.0, 4155.0, 7073.0, 12803.0, 26875.0, 64776.0, 179128.0, 371929.0, 224769.0, 81384.0, 32810.0, 15212.0, 8128.0, 4619.0, 2745.0, 1728.0, 1146.0, 760.0, 508.0, 330.0, 198.0, 140.0, 92.0, 54.0, 56.0, 41.0, 23.0, 19.0, 12.0, 4.0, 7.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.125, -71.6220703125, -69.119140625, -66.6162109375, -64.11328125, -61.6103515625, -59.107421875, -56.6044921875, -54.1015625, -51.5986328125, -49.095703125, -46.5927734375, -44.08984375, -41.5869140625, -39.083984375, -36.5810546875, -34.078125, -31.5751953125, -29.072265625, -26.5693359375, -24.06640625, -21.5634765625, -19.060546875, -16.5576171875, -14.0546875, -11.5517578125, -9.048828125, -6.5458984375, -4.04296875, -1.5400390625, 0.962890625, 3.4658203125, 5.96875, 8.4716796875, 10.974609375, 13.4775390625, 15.98046875, 18.4833984375, 20.986328125, 23.4892578125, 25.9921875, 28.4951171875, 30.998046875, 33.5009765625, 36.00390625, 38.5068359375, 41.009765625, 43.5126953125, 46.015625, 48.5185546875, 51.021484375, 53.5244140625, 56.02734375, 58.5302734375, 61.033203125, 63.5361328125, 66.0390625, 68.5419921875, 71.044921875, 73.5478515625, 76.05078125, 78.5537109375, 81.056640625, 83.5595703125, 86.0625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 8.0, 1.0, 6.0, 12.0, 6.0, 11.0, 19.0, 9.0, 17.0, 28.0, 14.0, 17.0, 22.0, 30.0, 23.0, 31.0, 34.0, 35.0, 52.0, 37.0, 43.0, 38.0, 50.0, 42.0, 31.0, 36.0, 35.0, 40.0, 34.0, 27.0, 26.0, 35.0, 16.0, 22.0, 21.0, 23.0, 12.0, 14.0, 9.0, 9.0, 12.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-16.296875, -15.7578125, -15.21875, -14.6796875, -14.140625, -13.6015625, -13.0625, -12.5234375, -11.984375, -11.4453125, -10.90625, -10.3671875, -9.828125, -9.2890625, -8.75, -8.2109375, -7.671875, -7.1328125, -6.59375, -6.0546875, -5.515625, -4.9765625, -4.4375, -3.8984375, -3.359375, -2.8203125, -2.28125, -1.7421875, -1.203125, -0.6640625, -0.125, 0.4140625, 0.953125, 1.4921875, 2.03125, 2.5703125, 3.109375, 3.6484375, 4.1875, 4.7265625, 5.265625, 5.8046875, 6.34375, 6.8828125, 7.421875, 7.9609375, 8.5, 9.0390625, 9.578125, 10.1171875, 10.65625, 11.1953125, 11.734375, 12.2734375, 12.8125, 13.3515625, 13.890625, 14.4296875, 14.96875, 15.5078125, 16.046875, 16.5859375, 17.125, 17.6640625, 18.203125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 6.0, 6.0, 14.0, 15.0, 19.0, 29.0, 43.0, 65.0, 85.0, 112.0, 203.0, 280.0, 502.0, 789.0, 1327.0, 2336.0, 4495.0, 8823.0, 17827.0, 38093.0, 86998.0, 192638.0, 301301.0, 211659.0, 97833.0, 42709.0, 19481.0, 9641.0, 4896.0, 2642.0, 1488.0, 812.0, 478.0, 300.0, 196.0, 127.0, 94.0, 66.0, 31.0, 30.0, 19.0, 15.0, 16.0, 6.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-30.65625, -29.76953125, -28.8828125, -27.99609375, -27.109375, -26.22265625, -25.3359375, -24.44921875, -23.5625, -22.67578125, -21.7890625, -20.90234375, -20.015625, -19.12890625, -18.2421875, -17.35546875, -16.46875, -15.58203125, -14.6953125, -13.80859375, -12.921875, -12.03515625, -11.1484375, -10.26171875, -9.375, -8.48828125, -7.6015625, -6.71484375, -5.828125, -4.94140625, -4.0546875, -3.16796875, -2.28125, -1.39453125, -0.5078125, 0.37890625, 1.265625, 2.15234375, 3.0390625, 3.92578125, 4.8125, 5.69921875, 6.5859375, 7.47265625, 8.359375, 9.24609375, 10.1328125, 11.01953125, 11.90625, 12.79296875, 13.6796875, 14.56640625, 15.453125, 16.33984375, 17.2265625, 18.11328125, 19.0, 19.88671875, 20.7734375, 21.66015625, 22.546875, 23.43359375, 24.3203125, 25.20703125, 26.09375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 2.0, 2.0, 4.0, 8.0, 10.0, 9.0, 14.0, 21.0, 30.0, 24.0, 34.0, 43.0, 66.0, 65.0, 73.0, 96.0, 94.0, 84.0, 54.0, 51.0, 39.0, 29.0, 23.0, 21.0, 19.0, 12.0, 11.0, 5.0, 10.0, 8.0, 5.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0012836456298828125, -0.0012420117855072021, -0.0012003779411315918, -0.0011587440967559814, -0.001117110252380371, -0.0010754764080047607, -0.0010338425636291504, -0.00099220871925354, -0.0009505748748779297, -0.0009089410305023193, -0.000867307186126709, -0.0008256733417510986, -0.0007840394973754883, -0.0007424056529998779, -0.0007007718086242676, -0.0006591379642486572, -0.0006175041198730469, -0.0005758702754974365, -0.0005342364311218262, -0.0004926025867462158, -0.00045096874237060547, -0.0004093348979949951, -0.00036770105361938477, -0.0003260672092437744, -0.00028443336486816406, -0.0002427995204925537, -0.00020116567611694336, -0.000159531831741333, -0.00011789798736572266, -7.62641429901123e-05, -3.463029861450195e-05, 7.0035457611083984e-06, 4.863739013671875e-05, 9.02712345123291e-05, 0.00013190507888793945, 0.0001735389232635498, 0.00021517276763916016, 0.0002568066120147705, 0.00029844045639038086, 0.0003400743007659912, 0.00038170814514160156, 0.0004233419895172119, 0.00046497583389282227, 0.0005066096782684326, 0.000548243522644043, 0.0005898773670196533, 0.0006315112113952637, 0.000673145055770874, 0.0007147789001464844, 0.0007564127445220947, 0.0007980465888977051, 0.0008396804332733154, 0.0008813142776489258, 0.0009229481220245361, 0.0009645819664001465, 0.0010062158107757568, 0.0010478496551513672, 0.0010894834995269775, 0.0011311173439025879, 0.0011727511882781982, 0.0012143850326538086, 0.001256018877029419, 0.0012976527214050293, 0.0013392865657806396, 0.00138092041015625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 5.0, 11.0, 7.0, 13.0, 27.0, 30.0, 48.0, 83.0, 102.0, 153.0, 256.0, 400.0, 646.0, 960.0, 1580.0, 2447.0, 3868.0, 5965.0, 9760.0, 15722.0, 25756.0, 41738.0, 66663.0, 100801.0, 138213.0, 159472.0, 148962.0, 114568.0, 78875.0, 50210.0, 30711.0, 18775.0, 11770.0, 7274.0, 4457.0, 2991.0, 1886.0, 1211.0, 788.0, 490.0, 298.0, 182.0, 139.0, 91.0, 48.0, 38.0, 33.0, 13.0, 13.0, 6.0, 7.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.625, -13.114501953125, -12.60400390625, -12.093505859375, -11.5830078125, -11.072509765625, -10.56201171875, -10.051513671875, -9.541015625, -9.030517578125, -8.52001953125, -8.009521484375, -7.4990234375, -6.988525390625, -6.47802734375, -5.967529296875, -5.45703125, -4.946533203125, -4.43603515625, -3.925537109375, -3.4150390625, -2.904541015625, -2.39404296875, -1.883544921875, -1.373046875, -0.862548828125, -0.35205078125, 0.158447265625, 0.6689453125, 1.179443359375, 1.68994140625, 2.200439453125, 2.7109375, 3.221435546875, 3.73193359375, 4.242431640625, 4.7529296875, 5.263427734375, 5.77392578125, 6.284423828125, 6.794921875, 7.305419921875, 7.81591796875, 8.326416015625, 8.8369140625, 9.347412109375, 9.85791015625, 10.368408203125, 10.87890625, 11.389404296875, 11.89990234375, 12.410400390625, 12.9208984375, 13.431396484375, 13.94189453125, 14.452392578125, 14.962890625, 15.473388671875, 15.98388671875, 16.494384765625, 17.0048828125, 17.515380859375, 18.02587890625, 18.536376953125, 19.046875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 5.0, 6.0, 10.0, 12.0, 13.0, 20.0, 26.0, 34.0, 20.0, 40.0, 29.0, 43.0, 55.0, 53.0, 48.0, 58.0, 49.0, 53.0, 46.0, 45.0, 54.0, 40.0, 29.0, 26.0, 27.0, 25.0, 19.0, 23.0, 17.0, 20.0, 14.0, 7.0, 3.0, 8.0, 4.0, 3.0, 2.0, 1.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.515625, -5.32623291015625, -5.1368408203125, -4.94744873046875, -4.758056640625, -4.56866455078125, -4.3792724609375, -4.18988037109375, -4.00048828125, -3.81109619140625, -3.6217041015625, -3.43231201171875, -3.242919921875, -3.05352783203125, -2.8641357421875, -2.67474365234375, -2.4853515625, -2.29595947265625, -2.1065673828125, -1.91717529296875, -1.727783203125, -1.53839111328125, -1.3489990234375, -1.15960693359375, -0.97021484375, -0.78082275390625, -0.5914306640625, -0.40203857421875, -0.212646484375, -0.02325439453125, 0.1661376953125, 0.35552978515625, 0.544921875, 0.73431396484375, 0.9237060546875, 1.11309814453125, 1.302490234375, 1.49188232421875, 1.6812744140625, 1.87066650390625, 2.06005859375, 2.24945068359375, 2.4388427734375, 2.62823486328125, 2.817626953125, 3.00701904296875, 3.1964111328125, 3.38580322265625, 3.5751953125, 3.76458740234375, 3.9539794921875, 4.14337158203125, 4.332763671875, 4.52215576171875, 4.7115478515625, 4.90093994140625, 5.09033203125, 5.27972412109375, 5.4691162109375, 5.65850830078125, 5.847900390625, 6.03729248046875, 6.2266845703125, 6.41607666015625, 6.60546875]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 3.0, 10.0, 4.0, 4.0, 9.0, 10.0, 12.0, 12.0, 19.0, 15.0, 21.0, 23.0, 35.0, 41.0, 45.0, 60.0, 55.0, 40.0, 53.0, 54.0, 56.0, 47.0, 48.0, 43.0, 44.0, 38.0, 26.0, 26.0, 31.0, 23.0, 13.0, 11.0, 10.0, 8.0, 13.0, 3.0, 8.0, 8.0, 7.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-35.86669921875, -34.82542419433594, -33.78415298461914, -32.74287796020508, -31.70160675048828, -30.66033172607422, -29.61905860900879, -28.57778549194336, -27.53651237487793, -26.4952392578125, -25.45396614074707, -24.41269302368164, -23.371417999267578, -22.33014678955078, -21.28887176513672, -20.24759864807129, -19.20632553100586, -18.16505241394043, -17.123779296875, -16.08250617980957, -15.041232109069824, -13.999958992004395, -12.958684921264648, -11.917411804199219, -10.876138687133789, -9.83486557006836, -8.79359245300293, -7.752318382263184, -6.711045265197754, -5.669772148132324, -4.628498554229736, -3.5872249603271484, -2.545949935913086, -1.5046765804290771, -0.46340322494506836, 0.5778701305389404, 1.6191434860229492, 2.660416603088379, 3.701690196990967, 4.742963790893555, 5.784236907958984, 6.825510025024414, 7.866783618927002, 8.90805721282959, 9.94933032989502, 10.99060344696045, 12.031877517700195, 13.073150634765625, 14.114423751831055, 15.155696868896484, 16.196969985961914, 17.238243103027344, 18.279518127441406, 19.320789337158203, 20.362064361572266, 21.403337478637695, 22.444610595703125, 23.485883712768555, 24.527156829833984, 25.568429946899414, 26.609703063964844, 27.650978088378906, 28.692251205444336, 29.733524322509766, 30.774797439575195]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 1.0, 3.0, 9.0, 5.0, 4.0, 9.0, 9.0, 9.0, 6.0, 7.0, 19.0, 16.0, 22.0, 24.0, 29.0, 31.0, 31.0, 33.0, 33.0, 36.0, 37.0, 41.0, 45.0, 43.0, 43.0, 41.0, 40.0, 37.0, 43.0, 34.0, 36.0, 35.0, 28.0, 26.0, 20.0, 15.0, 21.0, 15.0, 18.0, 10.0, 9.0, 6.0, 9.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-27.09512710571289, -26.266862869262695, -25.438600540161133, -24.610336303710938, -23.782072067260742, -22.953807830810547, -22.125545501708984, -21.29728126525879, -20.469017028808594, -19.6407527923584, -18.812490463256836, -17.98422622680664, -17.155961990356445, -16.32769775390625, -15.499435424804688, -14.671171188354492, -13.84290885925293, -13.01464557647705, -12.186381340026855, -11.358118057250977, -10.529853820800781, -9.701590538024902, -8.873327255249023, -8.045063018798828, -7.216799736022949, -6.388535976409912, -5.560272216796875, -4.732008934020996, -3.903745174407959, -3.075481414794922, -2.247218132019043, -1.4189543724060059, -0.5906925201416016, 0.237571120262146, 1.0658347606658936, 1.8940982818603516, 2.7223620414733887, 3.550625801086426, 4.378889083862305, 5.207152843475342, 6.035416603088379, 6.863680362701416, 7.691944122314453, 8.520207405090332, 9.348470687866211, 10.176734924316406, 11.004998207092285, 11.833261489868164, 12.66152572631836, 13.489789009094238, 14.318053245544434, 15.146316528320312, 15.974580764770508, 16.802845001220703, 17.631107330322266, 18.45937156677246, 19.287635803222656, 20.11590003967285, 20.944162368774414, 21.77242660522461, 22.600690841674805, 23.428955078125, 24.257217407226562, 25.085481643676758, 25.91374397277832]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 4.0, 5.0, 8.0, 17.0, 21.0, 38.0, 67.0, 90.0, 106.0, 174.0, 261.0, 401.0, 574.0, 933.0, 1476.0, 2143.0, 3122.0, 4869.0, 7706.0, 11536.0, 17682.0, 26467.0, 39236.0, 57273.0, 78022.0, 101954.0, 119871.0, 126162.0, 117114.0, 97191.0, 74099.0, 52769.0, 36335.0, 24328.0, 16440.0, 10522.0, 6805.0, 4385.0, 2908.0, 1838.0, 1214.0, 808.0, 499.0, 346.0, 255.0, 157.0, 93.0, 82.0, 52.0, 41.0, 24.0, 18.0, 5.0, 7.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0], "bins": [-24.65625, -23.844970703125, -23.03369140625, -22.222412109375, -21.4111328125, -20.599853515625, -19.78857421875, -18.977294921875, -18.166015625, -17.354736328125, -16.54345703125, -15.732177734375, -14.9208984375, -14.109619140625, -13.29833984375, -12.487060546875, -11.67578125, -10.864501953125, -10.05322265625, -9.241943359375, -8.4306640625, -7.619384765625, -6.80810546875, -5.996826171875, -5.185546875, -4.374267578125, -3.56298828125, -2.751708984375, -1.9404296875, -1.129150390625, -0.31787109375, 0.493408203125, 1.3046875, 2.115966796875, 2.92724609375, 3.738525390625, 4.5498046875, 5.361083984375, 6.17236328125, 6.983642578125, 7.794921875, 8.606201171875, 9.41748046875, 10.228759765625, 11.0400390625, 11.851318359375, 12.66259765625, 13.473876953125, 14.28515625, 15.096435546875, 15.90771484375, 16.718994140625, 17.5302734375, 18.341552734375, 19.15283203125, 19.964111328125, 20.775390625, 21.586669921875, 22.39794921875, 23.209228515625, 24.0205078125, 24.831787109375, 25.64306640625, 26.454345703125, 27.265625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 6.0, 5.0, 1.0, 7.0, 3.0, 9.0, 10.0, 11.0, 6.0, 10.0, 18.0, 20.0, 21.0, 17.0, 26.0, 31.0, 29.0, 36.0, 34.0, 32.0, 41.0, 43.0, 37.0, 38.0, 46.0, 49.0, 38.0, 40.0, 38.0, 46.0, 27.0, 33.0, 23.0, 24.0, 23.0, 16.0, 27.0, 10.0, 12.0, 16.0, 9.0, 7.0, 7.0, 5.0, 5.0, 3.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-26.53125, -25.72119140625, -24.9111328125, -24.10107421875, -23.291015625, -22.48095703125, -21.6708984375, -20.86083984375, -20.05078125, -19.24072265625, -18.4306640625, -17.62060546875, -16.810546875, -16.00048828125, -15.1904296875, -14.38037109375, -13.5703125, -12.76025390625, -11.9501953125, -11.14013671875, -10.330078125, -9.52001953125, -8.7099609375, -7.89990234375, -7.08984375, -6.27978515625, -5.4697265625, -4.65966796875, -3.849609375, -3.03955078125, -2.2294921875, -1.41943359375, -0.609375, 0.20068359375, 1.0107421875, 1.82080078125, 2.630859375, 3.44091796875, 4.2509765625, 5.06103515625, 5.87109375, 6.68115234375, 7.4912109375, 8.30126953125, 9.111328125, 9.92138671875, 10.7314453125, 11.54150390625, 12.3515625, 13.16162109375, 13.9716796875, 14.78173828125, 15.591796875, 16.40185546875, 17.2119140625, 18.02197265625, 18.83203125, 19.64208984375, 20.4521484375, 21.26220703125, 22.072265625, 22.88232421875, 23.6923828125, 24.50244140625, 25.3125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 7.0, 18.0, 29.0, 43.0, 78.0, 118.0, 165.0, 321.0, 520.0, 920.0, 1449.0, 2567.0, 4263.0, 7484.0, 12927.0, 22233.0, 37407.0, 61531.0, 94115.0, 131088.0, 156965.0, 154664.0, 127300.0, 89690.0, 57676.0, 35106.0, 20933.0, 11986.0, 7033.0, 4030.0, 2346.0, 1422.0, 811.0, 518.0, 324.0, 161.0, 115.0, 79.0, 42.0, 26.0, 14.0, 14.0, 5.0, 6.0, 2.0, 5.0, 3.0], "bins": [-35.4375, -34.50341796875, -33.5693359375, -32.63525390625, -31.701171875, -30.76708984375, -29.8330078125, -28.89892578125, -27.96484375, -27.03076171875, -26.0966796875, -25.16259765625, -24.228515625, -23.29443359375, -22.3603515625, -21.42626953125, -20.4921875, -19.55810546875, -18.6240234375, -17.68994140625, -16.755859375, -15.82177734375, -14.8876953125, -13.95361328125, -13.01953125, -12.08544921875, -11.1513671875, -10.21728515625, -9.283203125, -8.34912109375, -7.4150390625, -6.48095703125, -5.546875, -4.61279296875, -3.6787109375, -2.74462890625, -1.810546875, -0.87646484375, 0.0576171875, 0.99169921875, 1.92578125, 2.85986328125, 3.7939453125, 4.72802734375, 5.662109375, 6.59619140625, 7.5302734375, 8.46435546875, 9.3984375, 10.33251953125, 11.2666015625, 12.20068359375, 13.134765625, 14.06884765625, 15.0029296875, 15.93701171875, 16.87109375, 17.80517578125, 18.7392578125, 19.67333984375, 20.607421875, 21.54150390625, 22.4755859375, 23.40966796875, 24.34375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 2.0, 6.0, 8.0, 14.0, 9.0, 13.0, 11.0, 22.0, 16.0, 26.0, 32.0, 38.0, 38.0, 29.0, 33.0, 37.0, 54.0, 63.0, 52.0, 51.0, 43.0, 51.0, 33.0, 42.0, 43.0, 37.0, 22.0, 24.0, 29.0, 19.0, 19.0, 21.0, 11.0, 9.0, 11.0, 7.0, 4.0, 6.0, 7.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-20.921875, -20.335693359375, -19.74951171875, -19.163330078125, -18.5771484375, -17.990966796875, -17.40478515625, -16.818603515625, -16.232421875, -15.646240234375, -15.06005859375, -14.473876953125, -13.8876953125, -13.301513671875, -12.71533203125, -12.129150390625, -11.54296875, -10.956787109375, -10.37060546875, -9.784423828125, -9.1982421875, -8.612060546875, -8.02587890625, -7.439697265625, -6.853515625, -6.267333984375, -5.68115234375, -5.094970703125, -4.5087890625, -3.922607421875, -3.33642578125, -2.750244140625, -2.1640625, -1.577880859375, -0.99169921875, -0.405517578125, 0.1806640625, 0.766845703125, 1.35302734375, 1.939208984375, 2.525390625, 3.111572265625, 3.69775390625, 4.283935546875, 4.8701171875, 5.456298828125, 6.04248046875, 6.628662109375, 7.21484375, 7.801025390625, 8.38720703125, 8.973388671875, 9.5595703125, 10.145751953125, 10.73193359375, 11.318115234375, 11.904296875, 12.490478515625, 13.07666015625, 13.662841796875, 14.2490234375, 14.835205078125, 15.42138671875, 16.007568359375, 16.59375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 13.0, 34.0, 30.0, 49.0, 52.0, 110.0, 143.0, 206.0, 283.0, 451.0, 665.0, 994.0, 1597.0, 2408.0, 3944.0, 6167.0, 10044.0, 16480.0, 27047.0, 44638.0, 70786.0, 108537.0, 147490.0, 166036.0, 147302.0, 107754.0, 70824.0, 44164.0, 26742.0, 16426.0, 9979.0, 6229.0, 3885.0, 2461.0, 1559.0, 1039.0, 639.0, 427.0, 285.0, 205.0, 128.0, 117.0, 48.0, 47.0, 31.0, 15.0, 13.0, 5.0, 10.0, 2.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-18.03125, -17.43994140625, -16.8486328125, -16.25732421875, -15.666015625, -15.07470703125, -14.4833984375, -13.89208984375, -13.30078125, -12.70947265625, -12.1181640625, -11.52685546875, -10.935546875, -10.34423828125, -9.7529296875, -9.16162109375, -8.5703125, -7.97900390625, -7.3876953125, -6.79638671875, -6.205078125, -5.61376953125, -5.0224609375, -4.43115234375, -3.83984375, -3.24853515625, -2.6572265625, -2.06591796875, -1.474609375, -0.88330078125, -0.2919921875, 0.29931640625, 0.890625, 1.48193359375, 2.0732421875, 2.66455078125, 3.255859375, 3.84716796875, 4.4384765625, 5.02978515625, 5.62109375, 6.21240234375, 6.8037109375, 7.39501953125, 7.986328125, 8.57763671875, 9.1689453125, 9.76025390625, 10.3515625, 10.94287109375, 11.5341796875, 12.12548828125, 12.716796875, 13.30810546875, 13.8994140625, 14.49072265625, 15.08203125, 15.67333984375, 16.2646484375, 16.85595703125, 17.447265625, 18.03857421875, 18.6298828125, 19.22119140625, 19.8125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 5.0, 9.0, 12.0, 15.0, 16.0, 26.0, 28.0, 29.0, 34.0, 46.0, 47.0, 48.0, 60.0, 54.0, 55.0, 74.0, 69.0, 53.0, 41.0, 47.0, 42.0, 26.0, 20.0, 30.0, 19.0, 20.0, 11.0, 11.0, 11.0, 6.0, 6.0, 5.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001750946044921875, -0.0016855597496032715, -0.001620173454284668, -0.0015547871589660645, -0.001489400863647461, -0.0014240145683288574, -0.001358628273010254, -0.0012932419776916504, -0.0012278556823730469, -0.0011624693870544434, -0.0010970830917358398, -0.0010316967964172363, -0.0009663105010986328, -0.0009009242057800293, -0.0008355379104614258, -0.0007701516151428223, -0.0007047653198242188, -0.0006393790245056152, -0.0005739927291870117, -0.0005086064338684082, -0.0004432201385498047, -0.00037783384323120117, -0.00031244754791259766, -0.00024706125259399414, -0.00018167495727539062, -0.00011628866195678711, -5.0902366638183594e-05, 1.4483928680419922e-05, 7.987022399902344e-05, 0.00014525651931762695, 0.00021064281463623047, 0.000276029109954834, 0.0003414154052734375, 0.000406801700592041, 0.00047218799591064453, 0.000537574291229248, 0.0006029605865478516, 0.0006683468818664551, 0.0007337331771850586, 0.0007991194725036621, 0.0008645057678222656, 0.0009298920631408691, 0.0009952783584594727, 0.0010606646537780762, 0.0011260509490966797, 0.0011914372444152832, 0.0012568235397338867, 0.0013222098350524902, 0.0013875961303710938, 0.0014529824256896973, 0.0015183687210083008, 0.0015837550163269043, 0.0016491413116455078, 0.0017145276069641113, 0.0017799139022827148, 0.0018453001976013184, 0.0019106864929199219, 0.0019760727882385254, 0.002041459083557129, 0.0021068453788757324, 0.002172231674194336, 0.0022376179695129395, 0.002303004264831543, 0.0023683905601501465, 0.00243377685546875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 15.0, 16.0, 12.0, 26.0, 31.0, 53.0, 72.0, 103.0, 183.0, 242.0, 365.0, 590.0, 1011.0, 1546.0, 2629.0, 4405.0, 7418.0, 12127.0, 21011.0, 35351.0, 57625.0, 89821.0, 128291.0, 157968.0, 159453.0, 130251.0, 91224.0, 58536.0, 35638.0, 21352.0, 12477.0, 7357.0, 4421.0, 2571.0, 1614.0, 1011.0, 634.0, 384.0, 248.0, 156.0, 112.0, 64.0, 59.0, 23.0, 24.0, 13.0, 7.0, 8.0, 5.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.96875, -16.438720703125, -15.90869140625, -15.378662109375, -14.8486328125, -14.318603515625, -13.78857421875, -13.258544921875, -12.728515625, -12.198486328125, -11.66845703125, -11.138427734375, -10.6083984375, -10.078369140625, -9.54833984375, -9.018310546875, -8.48828125, -7.958251953125, -7.42822265625, -6.898193359375, -6.3681640625, -5.838134765625, -5.30810546875, -4.778076171875, -4.248046875, -3.718017578125, -3.18798828125, -2.657958984375, -2.1279296875, -1.597900390625, -1.06787109375, -0.537841796875, -0.0078125, 0.522216796875, 1.05224609375, 1.582275390625, 2.1123046875, 2.642333984375, 3.17236328125, 3.702392578125, 4.232421875, 4.762451171875, 5.29248046875, 5.822509765625, 6.3525390625, 6.882568359375, 7.41259765625, 7.942626953125, 8.47265625, 9.002685546875, 9.53271484375, 10.062744140625, 10.5927734375, 11.122802734375, 11.65283203125, 12.182861328125, 12.712890625, 13.242919921875, 13.77294921875, 14.302978515625, 14.8330078125, 15.363037109375, 15.89306640625, 16.423095703125, 16.953125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 8.0, 9.0, 13.0, 14.0, 16.0, 17.0, 14.0, 35.0, 28.0, 27.0, 35.0, 49.0, 33.0, 59.0, 47.0, 58.0, 66.0, 41.0, 45.0, 47.0, 33.0, 34.0, 35.0, 35.0, 28.0, 19.0, 27.0, 20.0, 15.0, 14.0, 8.0, 7.0, 12.0, 9.0, 5.0, 5.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.890625, -5.71954345703125, -5.5484619140625, -5.37738037109375, -5.206298828125, -5.03521728515625, -4.8641357421875, -4.69305419921875, -4.52197265625, -4.35089111328125, -4.1798095703125, -4.00872802734375, -3.837646484375, -3.66656494140625, -3.4954833984375, -3.32440185546875, -3.1533203125, -2.98223876953125, -2.8111572265625, -2.64007568359375, -2.468994140625, -2.29791259765625, -2.1268310546875, -1.95574951171875, -1.78466796875, -1.61358642578125, -1.4425048828125, -1.27142333984375, -1.100341796875, -0.92926025390625, -0.7581787109375, -0.58709716796875, -0.416015625, -0.24493408203125, -0.0738525390625, 0.09722900390625, 0.268310546875, 0.43939208984375, 0.6104736328125, 0.78155517578125, 0.95263671875, 1.12371826171875, 1.2947998046875, 1.46588134765625, 1.636962890625, 1.80804443359375, 1.9791259765625, 2.15020751953125, 2.3212890625, 2.49237060546875, 2.6634521484375, 2.83453369140625, 3.005615234375, 3.17669677734375, 3.3477783203125, 3.51885986328125, 3.68994140625, 3.86102294921875, 4.0321044921875, 4.20318603515625, 4.374267578125, 4.54534912109375, 4.7164306640625, 4.88751220703125, 5.05859375]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 9.0, 5.0, 7.0, 10.0, 12.0, 16.0, 25.0, 22.0, 29.0, 26.0, 41.0, 55.0, 45.0, 60.0, 39.0, 67.0, 62.0, 71.0, 53.0, 51.0, 40.0, 38.0, 54.0, 22.0, 25.0, 24.0, 17.0, 11.0, 13.0, 12.0, 8.0, 7.0, 7.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-38.23472595214844, -37.09128952026367, -35.94785690307617, -34.804420471191406, -33.66098403930664, -32.51755142211914, -31.374114990234375, -30.230680465698242, -29.08724594116211, -27.943811416625977, -26.80037498474121, -25.656940460205078, -24.513505935668945, -23.370071411132812, -22.226634979248047, -21.083200454711914, -19.93976402282715, -18.796329498291016, -17.65289306640625, -16.509458541870117, -15.366024017333984, -14.222588539123535, -13.079153060913086, -11.935718536376953, -10.792283058166504, -9.648847579956055, -8.505413055419922, -7.361977577209473, -6.218542575836182, -5.075107574462891, -3.9316720962524414, -2.7882375717163086, -1.6448020935058594, -0.5013669729232788, 0.6420681476593018, 1.7855033874511719, 2.928938388824463, 4.072373390197754, 5.215808868408203, 6.359243392944336, 7.502678871154785, 8.646114349365234, 9.789548873901367, 10.932984352111816, 12.076419830322266, 13.219854354858398, 14.363289833068848, 15.50672435760498, 16.65015983581543, 17.793594360351562, 18.937030792236328, 20.08046531677246, 21.223899841308594, 22.36733627319336, 23.510770797729492, 24.654205322265625, 25.79764175415039, 26.941076278686523, 28.08451271057129, 29.227947235107422, 30.371381759643555, 31.514816284179688, 32.65825271606445, 33.80168914794922, 34.94512176513672]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 6.0, 2.0, 9.0, 10.0, 13.0, 9.0, 9.0, 15.0, 16.0, 14.0, 22.0, 22.0, 26.0, 28.0, 35.0, 32.0, 33.0, 31.0, 37.0, 46.0, 40.0, 31.0, 32.0, 50.0, 51.0, 41.0, 35.0, 32.0, 36.0, 35.0, 31.0, 21.0, 20.0, 27.0, 17.0, 21.0, 10.0, 13.0, 7.0, 4.0, 9.0, 6.0, 7.0, 9.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-26.145259857177734, -25.346248626708984, -24.547239303588867, -23.748228073120117, -22.94921875, -22.15020751953125, -21.3511962890625, -20.552186965942383, -19.753177642822266, -18.954166412353516, -18.1551570892334, -17.35614585876465, -16.55713653564453, -15.758125305175781, -14.959115028381348, -14.160104751586914, -13.361093521118164, -12.56208324432373, -11.763072967529297, -10.964061737060547, -10.16505241394043, -9.36604118347168, -8.567030906677246, -7.7680206298828125, -6.969010353088379, -6.170000076293945, -5.370989799499512, -4.57197904586792, -3.7729687690734863, -2.9739584922790527, -2.174947738647461, -1.3759374618530273, -0.5769290924072266, 0.22208130359649658, 1.0210916996002197, 1.8201022148132324, 2.619112491607666, 3.4181227684020996, 4.217133522033691, 5.016143798828125, 5.815154075622559, 6.614164352416992, 7.413174629211426, 8.21218490600586, 9.01119613647461, 9.810205459594727, 10.609216690063477, 11.40822696685791, 12.207237243652344, 13.006247520446777, 13.805257797241211, 14.604269027709961, 15.403278350830078, 16.202289581298828, 17.001300811767578, 17.800310134887695, 18.599319458007812, 19.398330688476562, 20.19734001159668, 20.99635124206543, 21.795360565185547, 22.594371795654297, 23.393383026123047, 24.192392349243164, 24.991403579711914]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 9.0, 12.0, 14.0, 23.0, 31.0, 58.0, 107.0, 147.0, 231.0, 387.0, 638.0, 1073.0, 1740.0, 2824.0, 4738.0, 8422.0, 14605.0, 26498.0, 48500.0, 94013.0, 186193.0, 373862.0, 682533.0, 926404.0, 808754.0, 489696.0, 250258.0, 126039.0, 65270.0, 35146.0, 19319.0, 10936.0, 6399.0, 3828.0, 2213.0, 1330.0, 804.0, 462.0, 298.0, 195.0, 117.0, 79.0, 31.0, 22.0, 11.0, 9.0, 7.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.625, -27.75, -26.875, -26.0, -25.125, -24.25, -23.375, -22.5, -21.625, -20.75, -19.875, -19.0, -18.125, -17.25, -16.375, -15.5, -14.625, -13.75, -12.875, -12.0, -11.125, -10.25, -9.375, -8.5, -7.625, -6.75, -5.875, -5.0, -4.125, -3.25, -2.375, -1.5, -0.625, 0.25, 1.125, 2.0, 2.875, 3.75, 4.625, 5.5, 6.375, 7.25, 8.125, 9.0, 9.875, 10.75, 11.625, 12.5, 13.375, 14.25, 15.125, 16.0, 16.875, 17.75, 18.625, 19.5, 20.375, 21.25, 22.125, 23.0, 23.875, 24.75, 25.625, 26.5, 27.375]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 11.0, 5.0, 11.0, 9.0, 7.0, 20.0, 17.0, 15.0, 22.0, 23.0, 31.0, 27.0, 35.0, 46.0, 21.0, 38.0, 54.0, 36.0, 44.0, 42.0, 46.0, 46.0, 42.0, 32.0, 37.0, 34.0, 36.0, 28.0, 32.0, 21.0, 24.0, 14.0, 18.0, 16.0, 3.0, 10.0, 8.0, 13.0, 3.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-20.046875, -19.459228515625, -18.87158203125, -18.283935546875, -17.6962890625, -17.108642578125, -16.52099609375, -15.933349609375, -15.345703125, -14.758056640625, -14.17041015625, -13.582763671875, -12.9951171875, -12.407470703125, -11.81982421875, -11.232177734375, -10.64453125, -10.056884765625, -9.46923828125, -8.881591796875, -8.2939453125, -7.706298828125, -7.11865234375, -6.531005859375, -5.943359375, -5.355712890625, -4.76806640625, -4.180419921875, -3.5927734375, -3.005126953125, -2.41748046875, -1.829833984375, -1.2421875, -0.654541015625, -0.06689453125, 0.520751953125, 1.1083984375, 1.696044921875, 2.28369140625, 2.871337890625, 3.458984375, 4.046630859375, 4.63427734375, 5.221923828125, 5.8095703125, 6.397216796875, 6.98486328125, 7.572509765625, 8.16015625, 8.747802734375, 9.33544921875, 9.923095703125, 10.5107421875, 11.098388671875, 11.68603515625, 12.273681640625, 12.861328125, 13.448974609375, 14.03662109375, 14.624267578125, 15.2119140625, 15.799560546875, 16.38720703125, 16.974853515625, 17.5625]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 9.0, 15.0, 14.0, 30.0, 44.0, 68.0, 104.0, 136.0, 227.0, 380.0, 603.0, 928.0, 1490.0, 2511.0, 3920.0, 6602.0, 10990.0, 18038.0, 30446.0, 51085.0, 86409.0, 146994.0, 247335.0, 402288.0, 596026.0, 731272.0, 660557.0, 467094.0, 294986.0, 177286.0, 104770.0, 61044.0, 36241.0, 21470.0, 12802.0, 7831.0, 4640.0, 2825.0, 1767.0, 1088.0, 678.0, 450.0, 279.0, 177.0, 115.0, 81.0, 52.0, 32.0, 18.0, 15.0, 10.0, 5.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-23.5, -22.758056640625, -22.01611328125, -21.274169921875, -20.5322265625, -19.790283203125, -19.04833984375, -18.306396484375, -17.564453125, -16.822509765625, -16.08056640625, -15.338623046875, -14.5966796875, -13.854736328125, -13.11279296875, -12.370849609375, -11.62890625, -10.886962890625, -10.14501953125, -9.403076171875, -8.6611328125, -7.919189453125, -7.17724609375, -6.435302734375, -5.693359375, -4.951416015625, -4.20947265625, -3.467529296875, -2.7255859375, -1.983642578125, -1.24169921875, -0.499755859375, 0.2421875, 0.984130859375, 1.72607421875, 2.468017578125, 3.2099609375, 3.951904296875, 4.69384765625, 5.435791015625, 6.177734375, 6.919677734375, 7.66162109375, 8.403564453125, 9.1455078125, 9.887451171875, 10.62939453125, 11.371337890625, 12.11328125, 12.855224609375, 13.59716796875, 14.339111328125, 15.0810546875, 15.822998046875, 16.56494140625, 17.306884765625, 18.048828125, 18.790771484375, 19.53271484375, 20.274658203125, 21.0166015625, 21.758544921875, 22.50048828125, 23.242431640625, 23.984375]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 13.0, 6.0, 10.0, 15.0, 25.0, 34.0, 23.0, 37.0, 50.0, 50.0, 72.0, 83.0, 103.0, 100.0, 138.0, 155.0, 168.0, 192.0, 187.0, 223.0, 244.0, 222.0, 236.0, 248.0, 192.0, 173.0, 177.0, 143.0, 143.0, 126.0, 91.0, 75.0, 77.0, 55.0, 25.0, 33.0, 22.0, 24.0, 16.0, 7.0, 13.0, 9.0, 11.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 4.0], "bins": [-9.28125, -9.0115966796875, -8.741943359375, -8.4722900390625, -8.20263671875, -7.9329833984375, -7.663330078125, -7.3936767578125, -7.1240234375, -6.8543701171875, -6.584716796875, -6.3150634765625, -6.04541015625, -5.7757568359375, -5.506103515625, -5.2364501953125, -4.966796875, -4.6971435546875, -4.427490234375, -4.1578369140625, -3.88818359375, -3.6185302734375, -3.348876953125, -3.0792236328125, -2.8095703125, -2.5399169921875, -2.270263671875, -2.0006103515625, -1.73095703125, -1.4613037109375, -1.191650390625, -0.9219970703125, -0.65234375, -0.3826904296875, -0.113037109375, 0.1566162109375, 0.42626953125, 0.6959228515625, 0.965576171875, 1.2352294921875, 1.5048828125, 1.7745361328125, 2.044189453125, 2.3138427734375, 2.58349609375, 2.8531494140625, 3.122802734375, 3.3924560546875, 3.662109375, 3.9317626953125, 4.201416015625, 4.4710693359375, 4.74072265625, 5.0103759765625, 5.280029296875, 5.5496826171875, 5.8193359375, 6.0889892578125, 6.358642578125, 6.6282958984375, 6.89794921875, 7.1676025390625, 7.437255859375, 7.7069091796875, 7.9765625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 3.0, 5.0, 7.0, 12.0, 15.0, 8.0, 18.0, 29.0, 36.0, 49.0, 45.0, 39.0, 47.0, 50.0, 55.0, 56.0, 61.0, 57.0, 44.0, 60.0, 50.0, 47.0, 36.0, 37.0, 20.0, 19.0, 14.0, 16.0, 13.0, 16.0, 7.0, 5.0, 9.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0], "bins": [-40.7682991027832, -39.72697448730469, -38.685646057128906, -37.644317626953125, -36.60299301147461, -35.561668395996094, -34.52033996582031, -33.47901153564453, -32.437686920166016, -31.396360397338867, -30.35503387451172, -29.31370735168457, -28.272380828857422, -27.231054306030273, -26.189727783203125, -25.148401260375977, -24.107074737548828, -23.06574821472168, -22.02442169189453, -20.983095169067383, -19.941768646240234, -18.900442123413086, -17.859115600585938, -16.81778907775879, -15.77646255493164, -14.735136032104492, -13.693809509277344, -12.652482986450195, -11.611156463623047, -10.569829940795898, -9.52850341796875, -8.487176895141602, -7.445850372314453, -6.404523849487305, -5.363197326660156, -4.321870803833008, -3.2805442810058594, -2.239217758178711, -1.1978912353515625, -0.15656471252441406, 0.8847618103027344, 1.9260883331298828, 2.9674148559570312, 4.00874137878418, 5.050067901611328, 6.091394424438477, 7.132720947265625, 8.174047470092773, 9.215373992919922, 10.25670051574707, 11.298027038574219, 12.339353561401367, 13.380680084228516, 14.422006607055664, 15.463333129882812, 16.50465965270996, 17.54598617553711, 18.587312698364258, 19.628639221191406, 20.669965744018555, 21.711292266845703, 22.75261878967285, 23.7939453125, 24.83527183532715, 25.876598358154297]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 9.0, 7.0, 8.0, 12.0, 13.0, 10.0, 14.0, 14.0, 27.0, 23.0, 28.0, 29.0, 36.0, 43.0, 40.0, 35.0, 30.0, 48.0, 51.0, 41.0, 53.0, 55.0, 44.0, 48.0, 31.0, 30.0, 28.0, 29.0, 23.0, 28.0, 19.0, 24.0, 16.0, 13.0, 12.0, 5.0, 3.0, 10.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.79245376586914, -22.08443832397461, -21.376422882080078, -20.668407440185547, -19.960390090942383, -19.25237464904785, -18.54435920715332, -17.83634376525879, -17.128328323364258, -16.420312881469727, -15.712296485900879, -15.004281044006348, -14.296265602111816, -13.588249206542969, -12.880233764648438, -12.172218322753906, -11.464201927185059, -10.756186485290527, -10.04817008972168, -9.340154647827148, -8.632139205932617, -7.924123287200928, -7.216107368469238, -6.508091926574707, -5.800076007843018, -5.092060089111328, -4.384044647216797, -3.6760287284851074, -2.968013048171997, -2.2599973678588867, -1.5519814491271973, -0.843966007232666, -0.13595008850097656, 0.5720656514167786, 1.2800813913345337, 1.9880971908569336, 2.696112871170044, 3.4041285514831543, 4.112144470214844, 4.820159912109375, 5.5281758308410645, 6.236191749572754, 6.944207191467285, 7.652223110198975, 8.360239028930664, 9.068254470825195, 9.776269912719727, 10.484285354614258, 11.192301750183105, 11.900317192077637, 12.608333587646484, 13.316349029541016, 14.024364471435547, 14.732379913330078, 15.440396308898926, 16.14841079711914, 16.856428146362305, 17.564443588256836, 18.272459030151367, 18.98047637939453, 19.688491821289062, 20.396507263183594, 21.104522705078125, 21.812538146972656, 22.520553588867188]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 5.0, 7.0, 8.0, 5.0, 7.0, 9.0, 13.0, 29.0, 39.0, 43.0, 74.0, 111.0, 125.0, 165.0, 267.0, 374.0, 527.0, 760.0, 986.0, 1625.0, 2445.0, 4167.0, 7625.0, 15984.0, 36079.0, 87204.0, 191308.0, 285082.0, 220314.0, 106811.0, 44708.0, 19355.0, 9197.0, 4706.0, 2690.0, 1802.0, 1175.0, 781.0, 548.0, 411.0, 298.0, 218.0, 131.0, 85.0, 74.0, 56.0, 36.0, 28.0, 20.0, 13.0, 12.0, 7.0, 5.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.40625, -40.00830078125, -38.6103515625, -37.21240234375, -35.814453125, -34.41650390625, -33.0185546875, -31.62060546875, -30.22265625, -28.82470703125, -27.4267578125, -26.02880859375, -24.630859375, -23.23291015625, -21.8349609375, -20.43701171875, -19.0390625, -17.64111328125, -16.2431640625, -14.84521484375, -13.447265625, -12.04931640625, -10.6513671875, -9.25341796875, -7.85546875, -6.45751953125, -5.0595703125, -3.66162109375, -2.263671875, -0.86572265625, 0.5322265625, 1.93017578125, 3.328125, 4.72607421875, 6.1240234375, 7.52197265625, 8.919921875, 10.31787109375, 11.7158203125, 13.11376953125, 14.51171875, 15.90966796875, 17.3076171875, 18.70556640625, 20.103515625, 21.50146484375, 22.8994140625, 24.29736328125, 25.6953125, 27.09326171875, 28.4912109375, 29.88916015625, 31.287109375, 32.68505859375, 34.0830078125, 35.48095703125, 36.87890625, 38.27685546875, 39.6748046875, 41.07275390625, 42.470703125, 43.86865234375, 45.2666015625, 46.66455078125, 48.0625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 2.0, 5.0, 9.0, 13.0, 14.0, 8.0, 13.0, 13.0, 15.0, 18.0, 33.0, 18.0, 26.0, 32.0, 38.0, 38.0, 41.0, 54.0, 34.0, 38.0, 42.0, 49.0, 48.0, 44.0, 31.0, 42.0, 31.0, 32.0, 33.0, 28.0, 24.0, 22.0, 19.0, 18.0, 9.0, 8.0, 7.0, 14.0, 11.0, 3.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-21.234375, -20.55615234375, -19.8779296875, -19.19970703125, -18.521484375, -17.84326171875, -17.1650390625, -16.48681640625, -15.80859375, -15.13037109375, -14.4521484375, -13.77392578125, -13.095703125, -12.41748046875, -11.7392578125, -11.06103515625, -10.3828125, -9.70458984375, -9.0263671875, -8.34814453125, -7.669921875, -6.99169921875, -6.3134765625, -5.63525390625, -4.95703125, -4.27880859375, -3.6005859375, -2.92236328125, -2.244140625, -1.56591796875, -0.8876953125, -0.20947265625, 0.46875, 1.14697265625, 1.8251953125, 2.50341796875, 3.181640625, 3.85986328125, 4.5380859375, 5.21630859375, 5.89453125, 6.57275390625, 7.2509765625, 7.92919921875, 8.607421875, 9.28564453125, 9.9638671875, 10.64208984375, 11.3203125, 11.99853515625, 12.6767578125, 13.35498046875, 14.033203125, 14.71142578125, 15.3896484375, 16.06787109375, 16.74609375, 17.42431640625, 18.1025390625, 18.78076171875, 19.458984375, 20.13720703125, 20.8154296875, 21.49365234375, 22.171875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 6.0, 8.0, 10.0, 27.0, 31.0, 39.0, 62.0, 70.0, 109.0, 177.0, 237.0, 334.0, 482.0, 691.0, 1078.0, 1587.0, 2517.0, 3916.0, 6572.0, 12241.0, 24950.0, 57287.0, 142684.0, 302616.0, 273765.0, 120022.0, 48105.0, 21764.0, 10714.0, 6037.0, 3517.0, 2268.0, 1478.0, 1027.0, 632.0, 449.0, 293.0, 199.0, 175.0, 119.0, 75.0, 51.0, 35.0, 24.0, 20.0, 12.0, 20.0, 9.0, 1.0, 2.0, 3.0, 5.0, 4.0], "bins": [-54.65625, -53.09033203125, -51.5244140625, -49.95849609375, -48.392578125, -46.82666015625, -45.2607421875, -43.69482421875, -42.12890625, -40.56298828125, -38.9970703125, -37.43115234375, -35.865234375, -34.29931640625, -32.7333984375, -31.16748046875, -29.6015625, -28.03564453125, -26.4697265625, -24.90380859375, -23.337890625, -21.77197265625, -20.2060546875, -18.64013671875, -17.07421875, -15.50830078125, -13.9423828125, -12.37646484375, -10.810546875, -9.24462890625, -7.6787109375, -6.11279296875, -4.546875, -2.98095703125, -1.4150390625, 0.15087890625, 1.716796875, 3.28271484375, 4.8486328125, 6.41455078125, 7.98046875, 9.54638671875, 11.1123046875, 12.67822265625, 14.244140625, 15.81005859375, 17.3759765625, 18.94189453125, 20.5078125, 22.07373046875, 23.6396484375, 25.20556640625, 26.771484375, 28.33740234375, 29.9033203125, 31.46923828125, 33.03515625, 34.60107421875, 36.1669921875, 37.73291015625, 39.298828125, 40.86474609375, 42.4306640625, 43.99658203125, 45.5625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 7.0, 5.0, 5.0, 6.0, 9.0, 14.0, 13.0, 17.0, 18.0, 22.0, 22.0, 31.0, 25.0, 29.0, 29.0, 28.0, 29.0, 32.0, 45.0, 56.0, 39.0, 34.0, 32.0, 36.0, 31.0, 32.0, 34.0, 32.0, 29.0, 30.0, 25.0, 31.0, 19.0, 23.0, 14.0, 21.0, 8.0, 17.0, 12.0, 13.0, 11.0, 5.0, 6.0, 7.0, 10.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0], "bins": [-13.0546875, -12.6796875, -12.3046875, -11.9296875, -11.5546875, -11.1796875, -10.8046875, -10.4296875, -10.0546875, -9.6796875, -9.3046875, -8.9296875, -8.5546875, -8.1796875, -7.8046875, -7.4296875, -7.0546875, -6.6796875, -6.3046875, -5.9296875, -5.5546875, -5.1796875, -4.8046875, -4.4296875, -4.0546875, -3.6796875, -3.3046875, -2.9296875, -2.5546875, -2.1796875, -1.8046875, -1.4296875, -1.0546875, -0.6796875, -0.3046875, 0.0703125, 0.4453125, 0.8203125, 1.1953125, 1.5703125, 1.9453125, 2.3203125, 2.6953125, 3.0703125, 3.4453125, 3.8203125, 4.1953125, 4.5703125, 4.9453125, 5.3203125, 5.6953125, 6.0703125, 6.4453125, 6.8203125, 7.1953125, 7.5703125, 7.9453125, 8.3203125, 8.6953125, 9.0703125, 9.4453125, 9.8203125, 10.1953125, 10.5703125, 10.9453125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 7.0, 16.0, 31.0, 24.0, 39.0, 58.0, 78.0, 143.0, 205.0, 321.0, 432.0, 703.0, 1107.0, 1953.0, 3103.0, 5573.0, 9653.0, 17853.0, 34847.0, 70834.0, 149651.0, 262940.0, 238722.0, 125613.0, 59927.0, 29275.0, 15252.0, 8330.0, 4726.0, 2689.0, 1609.0, 1030.0, 634.0, 396.0, 252.0, 157.0, 105.0, 85.0, 48.0, 38.0, 22.0, 20.0, 13.0, 11.0, 11.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-21.0625, -20.421875, -19.78125, -19.140625, -18.5, -17.859375, -17.21875, -16.578125, -15.9375, -15.296875, -14.65625, -14.015625, -13.375, -12.734375, -12.09375, -11.453125, -10.8125, -10.171875, -9.53125, -8.890625, -8.25, -7.609375, -6.96875, -6.328125, -5.6875, -5.046875, -4.40625, -3.765625, -3.125, -2.484375, -1.84375, -1.203125, -0.5625, 0.078125, 0.71875, 1.359375, 2.0, 2.640625, 3.28125, 3.921875, 4.5625, 5.203125, 5.84375, 6.484375, 7.125, 7.765625, 8.40625, 9.046875, 9.6875, 10.328125, 10.96875, 11.609375, 12.25, 12.890625, 13.53125, 14.171875, 14.8125, 15.453125, 16.09375, 16.734375, 17.375, 18.015625, 18.65625, 19.296875, 19.9375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 2.0, 1.0, 7.0, 10.0, 10.0, 9.0, 16.0, 25.0, 50.0, 57.0, 82.0, 112.0, 121.0, 109.0, 125.0, 70.0, 52.0, 37.0, 32.0, 21.0, 10.0, 7.0, 9.0, 7.0, 3.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0014095306396484375, -0.0013667196035385132, -0.0013239085674285889, -0.0012810975313186646, -0.0012382864952087402, -0.001195475459098816, -0.0011526644229888916, -0.0011098533868789673, -0.001067042350769043, -0.0010242313146591187, -0.0009814202785491943, -0.00093860924243927, -0.0008957982063293457, -0.0008529871702194214, -0.0008101761341094971, -0.0007673650979995728, -0.0007245540618896484, -0.0006817430257797241, -0.0006389319896697998, -0.0005961209535598755, -0.0005533099174499512, -0.0005104988813400269, -0.00046768784523010254, -0.0004248768091201782, -0.0003820657730102539, -0.0003392547369003296, -0.0002964437007904053, -0.00025363266468048096, -0.00021082162857055664, -0.00016801059246063232, -0.000125199556350708, -8.238852024078369e-05, -3.9577484130859375e-05, 3.2335519790649414e-06, 4.604458808898926e-05, 8.885562419891357e-05, 0.0001316666603088379, 0.0001744776964187622, 0.00021728873252868652, 0.00026009976863861084, 0.00030291080474853516, 0.00034572184085845947, 0.0003885328769683838, 0.0004313439130783081, 0.0004741549491882324, 0.0005169659852981567, 0.0005597770214080811, 0.0006025880575180054, 0.0006453990936279297, 0.000688210129737854, 0.0007310211658477783, 0.0007738322019577026, 0.000816643238067627, 0.0008594542741775513, 0.0009022653102874756, 0.0009450763463973999, 0.0009878873825073242, 0.0010306984186172485, 0.0010735094547271729, 0.0011163204908370972, 0.0011591315269470215, 0.0012019425630569458, 0.0012447535991668701, 0.0012875646352767944, 0.0013303756713867188]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 8.0, 9.0, 13.0, 26.0, 21.0, 34.0, 60.0, 65.0, 121.0, 189.0, 244.0, 377.0, 521.0, 862.0, 1385.0, 2165.0, 3383.0, 5693.0, 9110.0, 15594.0, 26905.0, 46359.0, 79305.0, 128325.0, 176929.0, 184791.0, 143344.0, 91472.0, 53960.0, 31248.0, 18001.0, 10778.0, 6510.0, 3864.0, 2398.0, 1493.0, 1010.0, 623.0, 438.0, 314.0, 199.0, 132.0, 86.0, 57.0, 35.0, 37.0, 16.0, 12.0, 15.0, 9.0, 7.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0], "bins": [-14.3984375, -13.950439453125, -13.50244140625, -13.054443359375, -12.6064453125, -12.158447265625, -11.71044921875, -11.262451171875, -10.814453125, -10.366455078125, -9.91845703125, -9.470458984375, -9.0224609375, -8.574462890625, -8.12646484375, -7.678466796875, -7.23046875, -6.782470703125, -6.33447265625, -5.886474609375, -5.4384765625, -4.990478515625, -4.54248046875, -4.094482421875, -3.646484375, -3.198486328125, -2.75048828125, -2.302490234375, -1.8544921875, -1.406494140625, -0.95849609375, -0.510498046875, -0.0625, 0.385498046875, 0.83349609375, 1.281494140625, 1.7294921875, 2.177490234375, 2.62548828125, 3.073486328125, 3.521484375, 3.969482421875, 4.41748046875, 4.865478515625, 5.3134765625, 5.761474609375, 6.20947265625, 6.657470703125, 7.10546875, 7.553466796875, 8.00146484375, 8.449462890625, 8.8974609375, 9.345458984375, 9.79345703125, 10.241455078125, 10.689453125, 11.137451171875, 11.58544921875, 12.033447265625, 12.4814453125, 12.929443359375, 13.37744140625, 13.825439453125, 14.2734375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 3.0, 7.0, 8.0, 8.0, 11.0, 11.0, 15.0, 24.0, 26.0, 26.0, 31.0, 42.0, 41.0, 56.0, 57.0, 66.0, 64.0, 64.0, 56.0, 49.0, 52.0, 44.0, 46.0, 35.0, 26.0, 26.0, 20.0, 18.0, 8.0, 12.0, 7.0, 2.0, 5.0, 8.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.06640625, -4.90667724609375, -4.7469482421875, -4.58721923828125, -4.427490234375, -4.26776123046875, -4.1080322265625, -3.94830322265625, -3.78857421875, -3.62884521484375, -3.4691162109375, -3.30938720703125, -3.149658203125, -2.98992919921875, -2.8302001953125, -2.67047119140625, -2.5107421875, -2.35101318359375, -2.1912841796875, -2.03155517578125, -1.871826171875, -1.71209716796875, -1.5523681640625, -1.39263916015625, -1.23291015625, -1.07318115234375, -0.9134521484375, -0.75372314453125, -0.593994140625, -0.43426513671875, -0.2745361328125, -0.11480712890625, 0.044921875, 0.20465087890625, 0.3643798828125, 0.52410888671875, 0.683837890625, 0.84356689453125, 1.0032958984375, 1.16302490234375, 1.32275390625, 1.48248291015625, 1.6422119140625, 1.80194091796875, 1.961669921875, 2.12139892578125, 2.2811279296875, 2.44085693359375, 2.6005859375, 2.76031494140625, 2.9200439453125, 3.07977294921875, 3.239501953125, 3.39923095703125, 3.5589599609375, 3.71868896484375, 3.87841796875, 4.03814697265625, 4.1978759765625, 4.35760498046875, 4.517333984375, 4.67706298828125, 4.8367919921875, 4.99652099609375, 5.15625]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 12.0, 5.0, 8.0, 15.0, 15.0, 20.0, 29.0, 28.0, 37.0, 37.0, 50.0, 45.0, 53.0, 65.0, 50.0, 47.0, 53.0, 52.0, 52.0, 51.0, 34.0, 33.0, 40.0, 23.0, 25.0, 17.0, 14.0, 22.0, 16.0, 8.0, 7.0, 7.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-33.87684631347656, -32.922794342041016, -31.96874237060547, -31.014690399169922, -30.060638427734375, -29.106586456298828, -28.152536392211914, -27.198484420776367, -26.24443244934082, -25.290380477905273, -24.336328506469727, -23.38227653503418, -22.428226470947266, -21.47417449951172, -20.520122528076172, -19.566070556640625, -18.612018585205078, -17.65796661376953, -16.703914642333984, -15.749863624572754, -14.795811653137207, -13.84175968170166, -12.88770866394043, -11.933656692504883, -10.979604721069336, -10.025552749633789, -9.071500778198242, -8.117449760437012, -7.163397789001465, -6.209345817565918, -5.255294322967529, -4.301242828369141, -3.347188949584961, -2.393137216567993, -1.4390854835510254, -0.4850337505340576, 0.46901798248291016, 1.423069953918457, 2.3771214485168457, 3.3311729431152344, 4.285224914550781, 5.239276885986328, 6.193328380584717, 7.1473798751831055, 8.101431846618652, 9.0554838180542, 10.00953483581543, 10.963586807250977, 11.917638778686523, 12.87169075012207, 13.825742721557617, 14.779793739318848, 15.733845710754395, 16.687896728515625, 17.641948699951172, 18.59600067138672, 19.550052642822266, 20.504104614257812, 21.45815658569336, 22.412208557128906, 23.366260528564453, 24.3203125, 25.274362564086914, 26.22841453552246, 27.182466506958008]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 6.0, 2.0, 3.0, 5.0, 9.0, 10.0, 10.0, 16.0, 15.0, 10.0, 21.0, 24.0, 19.0, 35.0, 26.0, 35.0, 45.0, 42.0, 38.0, 40.0, 48.0, 50.0, 48.0, 50.0, 47.0, 47.0, 36.0, 34.0, 31.0, 41.0, 18.0, 29.0, 22.0, 22.0, 18.0, 15.0, 11.0, 8.0, 5.0, 11.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.00705337524414, -22.3016414642334, -21.596229553222656, -20.890817642211914, -20.185405731201172, -19.47999382019043, -18.774581909179688, -18.069169998168945, -17.363758087158203, -16.65834617614746, -15.952934265136719, -15.247522354125977, -14.542110443115234, -13.836698532104492, -13.13128662109375, -12.425874710083008, -11.720462799072266, -11.015050888061523, -10.309638977050781, -9.604227066040039, -8.898815155029297, -8.193403244018555, -7.4879913330078125, -6.78257942199707, -6.077167510986328, -5.371755599975586, -4.666343688964844, -3.9609317779541016, -3.2555198669433594, -2.550107955932617, -1.844696044921875, -1.1392841339111328, -0.4338722229003906, 0.27153968811035156, 0.9769515991210938, 1.682363510131836, 2.387775421142578, 3.0931873321533203, 3.7985992431640625, 4.504011154174805, 5.209423065185547, 5.914834976196289, 6.620246887207031, 7.325658798217773, 8.031070709228516, 8.736482620239258, 9.44189453125, 10.147306442260742, 10.852718353271484, 11.558130264282227, 12.263542175292969, 12.968954086303711, 13.674365997314453, 14.379777908325195, 15.085189819335938, 15.79060173034668, 16.496013641357422, 17.201425552368164, 17.906837463378906, 18.61224937438965, 19.31766128540039, 20.023073196411133, 20.728485107421875, 21.433897018432617, 22.13930892944336]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 8.0, 4.0, 9.0, 14.0, 28.0, 26.0, 41.0, 57.0, 94.0, 149.0, 246.0, 385.0, 562.0, 862.0, 1314.0, 2100.0, 3304.0, 5366.0, 8192.0, 13061.0, 20516.0, 32183.0, 48693.0, 71432.0, 98800.0, 123633.0, 137162.0, 130374.0, 108574.0, 81289.0, 56197.0, 37341.0, 24092.0, 15359.0, 9992.0, 6255.0, 3984.0, 2432.0, 1569.0, 1011.0, 665.0, 389.0, 295.0, 183.0, 119.0, 84.0, 59.0, 23.0, 9.0, 13.0, 7.0, 2.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-25.53125, -24.75, -23.96875, -23.1875, -22.40625, -21.625, -20.84375, -20.0625, -19.28125, -18.5, -17.71875, -16.9375, -16.15625, -15.375, -14.59375, -13.8125, -13.03125, -12.25, -11.46875, -10.6875, -9.90625, -9.125, -8.34375, -7.5625, -6.78125, -6.0, -5.21875, -4.4375, -3.65625, -2.875, -2.09375, -1.3125, -0.53125, 0.25, 1.03125, 1.8125, 2.59375, 3.375, 4.15625, 4.9375, 5.71875, 6.5, 7.28125, 8.0625, 8.84375, 9.625, 10.40625, 11.1875, 11.96875, 12.75, 13.53125, 14.3125, 15.09375, 15.875, 16.65625, 17.4375, 18.21875, 19.0, 19.78125, 20.5625, 21.34375, 22.125, 22.90625, 23.6875, 24.46875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 8.0, 5.0, 8.0, 11.0, 16.0, 8.0, 20.0, 19.0, 25.0, 14.0, 24.0, 25.0, 40.0, 26.0, 38.0, 40.0, 38.0, 35.0, 34.0, 39.0, 59.0, 36.0, 52.0, 21.0, 44.0, 57.0, 33.0, 31.0, 25.0, 31.0, 14.0, 23.0, 29.0, 7.0, 14.0, 10.0, 15.0, 5.0, 6.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.625, -21.9580078125, -21.291015625, -20.6240234375, -19.95703125, -19.2900390625, -18.623046875, -17.9560546875, -17.2890625, -16.6220703125, -15.955078125, -15.2880859375, -14.62109375, -13.9541015625, -13.287109375, -12.6201171875, -11.953125, -11.2861328125, -10.619140625, -9.9521484375, -9.28515625, -8.6181640625, -7.951171875, -7.2841796875, -6.6171875, -5.9501953125, -5.283203125, -4.6162109375, -3.94921875, -3.2822265625, -2.615234375, -1.9482421875, -1.28125, -0.6142578125, 0.052734375, 0.7197265625, 1.38671875, 2.0537109375, 2.720703125, 3.3876953125, 4.0546875, 4.7216796875, 5.388671875, 6.0556640625, 6.72265625, 7.3896484375, 8.056640625, 8.7236328125, 9.390625, 10.0576171875, 10.724609375, 11.3916015625, 12.05859375, 12.7255859375, 13.392578125, 14.0595703125, 14.7265625, 15.3935546875, 16.060546875, 16.7275390625, 17.39453125, 18.0615234375, 18.728515625, 19.3955078125, 20.0625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 4.0, 7.0, 7.0, 10.0, 10.0, 16.0, 28.0, 51.0, 67.0, 96.0, 145.0, 195.0, 292.0, 424.0, 648.0, 990.0, 1471.0, 2098.0, 3047.0, 4485.0, 6724.0, 9939.0, 14267.0, 21146.0, 30029.0, 42714.0, 58114.0, 77550.0, 96020.0, 110873.0, 115247.0, 107571.0, 91567.0, 72209.0, 54139.0, 38919.0, 27525.0, 19130.0, 13129.0, 8837.0, 6051.0, 4039.0, 2768.0, 1915.0, 1305.0, 860.0, 599.0, 414.0, 271.0, 197.0, 124.0, 94.0, 57.0, 42.0, 31.0, 26.0, 13.0, 13.0, 4.0, 4.0, 4.0, 3.0, 1.0], "bins": [-18.703125, -18.10693359375, -17.5107421875, -16.91455078125, -16.318359375, -15.72216796875, -15.1259765625, -14.52978515625, -13.93359375, -13.33740234375, -12.7412109375, -12.14501953125, -11.548828125, -10.95263671875, -10.3564453125, -9.76025390625, -9.1640625, -8.56787109375, -7.9716796875, -7.37548828125, -6.779296875, -6.18310546875, -5.5869140625, -4.99072265625, -4.39453125, -3.79833984375, -3.2021484375, -2.60595703125, -2.009765625, -1.41357421875, -0.8173828125, -0.22119140625, 0.375, 0.97119140625, 1.5673828125, 2.16357421875, 2.759765625, 3.35595703125, 3.9521484375, 4.54833984375, 5.14453125, 5.74072265625, 6.3369140625, 6.93310546875, 7.529296875, 8.12548828125, 8.7216796875, 9.31787109375, 9.9140625, 10.51025390625, 11.1064453125, 11.70263671875, 12.298828125, 12.89501953125, 13.4912109375, 14.08740234375, 14.68359375, 15.27978515625, 15.8759765625, 16.47216796875, 17.068359375, 17.66455078125, 18.2607421875, 18.85693359375, 19.453125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 9.0, 11.0, 8.0, 7.0, 15.0, 16.0, 15.0, 18.0, 23.0, 29.0, 23.0, 30.0, 39.0, 30.0, 38.0, 35.0, 49.0, 46.0, 32.0, 42.0, 36.0, 43.0, 39.0, 37.0, 41.0, 41.0, 29.0, 29.0, 29.0, 18.0, 20.0, 15.0, 22.0, 14.0, 12.0, 8.0, 10.0, 9.0, 4.0, 3.0, 2.0, 8.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.8671875, -14.431396484375, -13.99560546875, -13.559814453125, -13.1240234375, -12.688232421875, -12.25244140625, -11.816650390625, -11.380859375, -10.945068359375, -10.50927734375, -10.073486328125, -9.6376953125, -9.201904296875, -8.76611328125, -8.330322265625, -7.89453125, -7.458740234375, -7.02294921875, -6.587158203125, -6.1513671875, -5.715576171875, -5.27978515625, -4.843994140625, -4.408203125, -3.972412109375, -3.53662109375, -3.100830078125, -2.6650390625, -2.229248046875, -1.79345703125, -1.357666015625, -0.921875, -0.486083984375, -0.05029296875, 0.385498046875, 0.8212890625, 1.257080078125, 1.69287109375, 2.128662109375, 2.564453125, 3.000244140625, 3.43603515625, 3.871826171875, 4.3076171875, 4.743408203125, 5.17919921875, 5.614990234375, 6.05078125, 6.486572265625, 6.92236328125, 7.358154296875, 7.7939453125, 8.229736328125, 8.66552734375, 9.101318359375, 9.537109375, 9.972900390625, 10.40869140625, 10.844482421875, 11.2802734375, 11.716064453125, 12.15185546875, 12.587646484375, 13.0234375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 5.0, 10.0, 19.0, 14.0, 47.0, 55.0, 78.0, 154.0, 203.0, 347.0, 614.0, 959.0, 1581.0, 2669.0, 4686.0, 7927.0, 13739.0, 24533.0, 43465.0, 76888.0, 128276.0, 181770.0, 193883.0, 149005.0, 93865.0, 53679.0, 29865.0, 16946.0, 9617.0, 5550.0, 3213.0, 1887.0, 1133.0, 701.0, 401.0, 269.0, 174.0, 112.0, 75.0, 48.0, 24.0, 29.0, 12.0, 6.0, 8.0, 5.0, 2.0, 5.0, 3.0, 2.0, 0.0, 2.0], "bins": [-21.4375, -20.810302734375, -20.18310546875, -19.555908203125, -18.9287109375, -18.301513671875, -17.67431640625, -17.047119140625, -16.419921875, -15.792724609375, -15.16552734375, -14.538330078125, -13.9111328125, -13.283935546875, -12.65673828125, -12.029541015625, -11.40234375, -10.775146484375, -10.14794921875, -9.520751953125, -8.8935546875, -8.266357421875, -7.63916015625, -7.011962890625, -6.384765625, -5.757568359375, -5.13037109375, -4.503173828125, -3.8759765625, -3.248779296875, -2.62158203125, -1.994384765625, -1.3671875, -0.739990234375, -0.11279296875, 0.514404296875, 1.1416015625, 1.768798828125, 2.39599609375, 3.023193359375, 3.650390625, 4.277587890625, 4.90478515625, 5.531982421875, 6.1591796875, 6.786376953125, 7.41357421875, 8.040771484375, 8.66796875, 9.295166015625, 9.92236328125, 10.549560546875, 11.1767578125, 11.803955078125, 12.43115234375, 13.058349609375, 13.685546875, 14.312744140625, 14.93994140625, 15.567138671875, 16.1943359375, 16.821533203125, 17.44873046875, 18.075927734375, 18.703125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 8.0, 10.0, 8.0, 10.0, 14.0, 13.0, 23.0, 28.0, 41.0, 29.0, 31.0, 31.0, 42.0, 50.0, 40.0, 48.0, 62.0, 57.0, 53.0, 50.0, 49.0, 40.0, 44.0, 27.0, 35.0, 32.0, 13.0, 13.0, 12.0, 12.0, 11.0, 5.0, 6.0, 9.0, 6.0, 2.0, 5.0, 8.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0015411376953125, -0.0014872103929519653, -0.0014332830905914307, -0.001379355788230896, -0.0013254284858703613, -0.0012715011835098267, -0.001217573881149292, -0.0011636465787887573, -0.0011097192764282227, -0.001055791974067688, -0.0010018646717071533, -0.0009479373693466187, -0.000894010066986084, -0.0008400827646255493, -0.0007861554622650146, -0.00073222815990448, -0.0006783008575439453, -0.0006243735551834106, -0.000570446252822876, -0.0005165189504623413, -0.00046259164810180664, -0.00040866434574127197, -0.0003547370433807373, -0.00030080974102020264, -0.00024688243865966797, -0.0001929551362991333, -0.00013902783393859863, -8.510053157806396e-05, -3.11732292175293e-05, 2.275407314300537e-05, 7.668137550354004e-05, 0.0001306086778640747, 0.00018453598022460938, 0.00023846328258514404, 0.0002923905849456787, 0.0003463178873062134, 0.00040024518966674805, 0.0004541724920272827, 0.0005080997943878174, 0.000562027096748352, 0.0006159543991088867, 0.0006698817014694214, 0.0007238090038299561, 0.0007777363061904907, 0.0008316636085510254, 0.0008855909109115601, 0.0009395182132720947, 0.0009934455156326294, 0.001047372817993164, 0.0011013001203536987, 0.0011552274227142334, 0.001209154725074768, 0.0012630820274353027, 0.0013170093297958374, 0.001370936632156372, 0.0014248639345169067, 0.0014787912368774414, 0.001532718539237976, 0.0015866458415985107, 0.0016405731439590454, 0.00169450044631958, 0.0017484277486801147, 0.0018023550510406494, 0.001856282353401184, 0.0019102096557617188]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 5.0, 7.0, 6.0, 10.0, 24.0, 37.0, 49.0, 61.0, 110.0, 182.0, 319.0, 535.0, 925.0, 1705.0, 3200.0, 5877.0, 10967.0, 20489.0, 38682.0, 71508.0, 123413.0, 182991.0, 203440.0, 161573.0, 101239.0, 56396.0, 29923.0, 16158.0, 8376.0, 4583.0, 2599.0, 1336.0, 757.0, 468.0, 227.0, 126.0, 72.0, 45.0, 40.0, 26.0, 14.0, 17.0, 11.0, 5.0, 7.0, 4.0, 5.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-19.078125, -18.487548828125, -17.89697265625, -17.306396484375, -16.7158203125, -16.125244140625, -15.53466796875, -14.944091796875, -14.353515625, -13.762939453125, -13.17236328125, -12.581787109375, -11.9912109375, -11.400634765625, -10.81005859375, -10.219482421875, -9.62890625, -9.038330078125, -8.44775390625, -7.857177734375, -7.2666015625, -6.676025390625, -6.08544921875, -5.494873046875, -4.904296875, -4.313720703125, -3.72314453125, -3.132568359375, -2.5419921875, -1.951416015625, -1.36083984375, -0.770263671875, -0.1796875, 0.410888671875, 1.00146484375, 1.592041015625, 2.1826171875, 2.773193359375, 3.36376953125, 3.954345703125, 4.544921875, 5.135498046875, 5.72607421875, 6.316650390625, 6.9072265625, 7.497802734375, 8.08837890625, 8.678955078125, 9.26953125, 9.860107421875, 10.45068359375, 11.041259765625, 11.6318359375, 12.222412109375, 12.81298828125, 13.403564453125, 13.994140625, 14.584716796875, 15.17529296875, 15.765869140625, 16.3564453125, 16.947021484375, 17.53759765625, 18.128173828125, 18.71875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 2.0, 8.0, 3.0, 6.0, 10.0, 8.0, 16.0, 20.0, 32.0, 18.0, 20.0, 26.0, 43.0, 36.0, 50.0, 53.0, 57.0, 64.0, 66.0, 54.0, 59.0, 57.0, 49.0, 35.0, 42.0, 30.0, 24.0, 25.0, 20.0, 13.0, 12.0, 15.0, 7.0, 5.0, 4.0, 3.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.46875, -6.296875, -6.125, -5.953125, -5.78125, -5.609375, -5.4375, -5.265625, -5.09375, -4.921875, -4.75, -4.578125, -4.40625, -4.234375, -4.0625, -3.890625, -3.71875, -3.546875, -3.375, -3.203125, -3.03125, -2.859375, -2.6875, -2.515625, -2.34375, -2.171875, -2.0, -1.828125, -1.65625, -1.484375, -1.3125, -1.140625, -0.96875, -0.796875, -0.625, -0.453125, -0.28125, -0.109375, 0.0625, 0.234375, 0.40625, 0.578125, 0.75, 0.921875, 1.09375, 1.265625, 1.4375, 1.609375, 1.78125, 1.953125, 2.125, 2.296875, 2.46875, 2.640625, 2.8125, 2.984375, 3.15625, 3.328125, 3.5, 3.671875, 3.84375, 4.015625, 4.1875, 4.359375, 4.53125]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 4.0, 3.0, 6.0, 13.0, 8.0, 14.0, 17.0, 23.0, 35.0, 41.0, 35.0, 37.0, 60.0, 63.0, 52.0, 63.0, 61.0, 46.0, 71.0, 56.0, 49.0, 51.0, 39.0, 37.0, 19.0, 30.0, 12.0, 14.0, 6.0, 11.0, 5.0, 4.0, 7.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.52616882324219, -36.46769714355469, -35.40922546386719, -34.35075378417969, -33.29228210449219, -32.23381042480469, -31.175338745117188, -30.116867065429688, -29.058395385742188, -27.999923706054688, -26.941452026367188, -25.882980346679688, -24.824508666992188, -23.766036987304688, -22.707565307617188, -21.649093627929688, -20.590621948242188, -19.532150268554688, -18.473678588867188, -17.415206909179688, -16.356735229492188, -15.298263549804688, -14.239791870117188, -13.181320190429688, -12.122848510742188, -11.064376831054688, -10.005905151367188, -8.947433471679688, -7.8889617919921875, -6.8304901123046875, -5.7720184326171875, -4.7135467529296875, -3.655078887939453, -2.596607208251953, -1.5381355285644531, -0.4796638488769531, 0.5788078308105469, 1.6372795104980469, 2.695751190185547, 3.754222869873047, 4.812694549560547, 5.871166229248047, 6.929637908935547, 7.988109588623047, 9.046581268310547, 10.105052947998047, 11.163524627685547, 12.221996307373047, 13.280467987060547, 14.338939666748047, 15.397411346435547, 16.455883026123047, 17.514354705810547, 18.572826385498047, 19.631298065185547, 20.689769744873047, 21.748241424560547, 22.806713104248047, 23.865184783935547, 24.923656463623047, 25.982128143310547, 27.040599822998047, 28.099071502685547, 29.157543182373047, 30.216014862060547]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 4.0, 9.0, 6.0, 9.0, 11.0, 10.0, 12.0, 10.0, 12.0, 16.0, 18.0, 28.0, 25.0, 23.0, 30.0, 36.0, 35.0, 21.0, 32.0, 28.0, 41.0, 64.0, 38.0, 39.0, 36.0, 39.0, 39.0, 40.0, 36.0, 29.0, 33.0, 27.0, 31.0, 24.0, 21.0, 11.0, 17.0, 17.0, 13.0, 11.0, 10.0, 3.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.468870162963867, -19.79831886291504, -19.12776756286621, -18.457216262817383, -17.786663055419922, -17.116111755371094, -16.445560455322266, -15.775009155273438, -15.10445785522461, -14.433906555175781, -13.763355255126953, -13.092803001403809, -12.42225170135498, -11.751700401306152, -11.081148147583008, -10.41059684753418, -9.740045547485352, -9.069494247436523, -8.398942947387695, -7.728390693664551, -7.057839393615723, -6.3872880935668945, -5.716736316680908, -5.046184539794922, -4.375633239746094, -3.7050817012786865, -3.0345301628112793, -2.363978624343872, -1.6934270858764648, -1.0228755474090576, -0.3523240089416504, 0.31822776794433594, 0.9887771606445312, 1.6593286991119385, 2.3298802375793457, 3.000431776046753, 3.67098331451416, 4.341534614562988, 5.012086391448975, 5.682638168334961, 6.353189468383789, 7.023740768432617, 7.6942925453186035, 8.36484432220459, 9.035395622253418, 9.705946922302246, 10.37649917602539, 11.047050476074219, 11.717601776123047, 12.388153076171875, 13.058704376220703, 13.729256629943848, 14.399807929992676, 15.070359230041504, 15.740911483764648, 16.411462783813477, 17.082014083862305, 17.752565383911133, 18.42311668395996, 19.09366798400879, 19.76422119140625, 20.434772491455078, 21.105323791503906, 21.775875091552734, 22.446426391601562]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 3.0, 9.0, 8.0, 18.0, 32.0, 52.0, 73.0, 120.0, 154.0, 310.0, 503.0, 830.0, 1451.0, 2572.0, 4488.0, 8294.0, 15348.0, 29663.0, 59609.0, 127794.0, 284348.0, 631812.0, 1066958.0, 985485.0, 531654.0, 234427.0, 105595.0, 49829.0, 24729.0, 12691.0, 6735.0, 3591.0, 2138.0, 1192.0, 672.0, 426.0, 255.0, 157.0, 83.0, 65.0, 36.0, 22.0, 29.0, 12.0, 8.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-31.890625, -31.02587890625, -30.1611328125, -29.29638671875, -28.431640625, -27.56689453125, -26.7021484375, -25.83740234375, -24.97265625, -24.10791015625, -23.2431640625, -22.37841796875, -21.513671875, -20.64892578125, -19.7841796875, -18.91943359375, -18.0546875, -17.18994140625, -16.3251953125, -15.46044921875, -14.595703125, -13.73095703125, -12.8662109375, -12.00146484375, -11.13671875, -10.27197265625, -9.4072265625, -8.54248046875, -7.677734375, -6.81298828125, -5.9482421875, -5.08349609375, -4.21875, -3.35400390625, -2.4892578125, -1.62451171875, -0.759765625, 0.10498046875, 0.9697265625, 1.83447265625, 2.69921875, 3.56396484375, 4.4287109375, 5.29345703125, 6.158203125, 7.02294921875, 7.8876953125, 8.75244140625, 9.6171875, 10.48193359375, 11.3466796875, 12.21142578125, 13.076171875, 13.94091796875, 14.8056640625, 15.67041015625, 16.53515625, 17.39990234375, 18.2646484375, 19.12939453125, 19.994140625, 20.85888671875, 21.7236328125, 22.58837890625, 23.453125]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 9.0, 5.0, 8.0, 12.0, 8.0, 5.0, 16.0, 14.0, 10.0, 17.0, 10.0, 12.0, 18.0, 14.0, 23.0, 25.0, 17.0, 29.0, 30.0, 35.0, 28.0, 32.0, 28.0, 34.0, 29.0, 43.0, 33.0, 39.0, 36.0, 26.0, 35.0, 30.0, 28.0, 29.0, 33.0, 19.0, 34.0, 22.0, 19.0, 18.0, 20.0, 7.0, 17.0, 8.0, 5.0, 5.0, 5.0, 4.0, 10.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0], "bins": [-13.1015625, -12.6968994140625, -12.292236328125, -11.8875732421875, -11.48291015625, -11.0782470703125, -10.673583984375, -10.2689208984375, -9.8642578125, -9.4595947265625, -9.054931640625, -8.6502685546875, -8.24560546875, -7.8409423828125, -7.436279296875, -7.0316162109375, -6.626953125, -6.2222900390625, -5.817626953125, -5.4129638671875, -5.00830078125, -4.6036376953125, -4.198974609375, -3.7943115234375, -3.3896484375, -2.9849853515625, -2.580322265625, -2.1756591796875, -1.77099609375, -1.3663330078125, -0.961669921875, -0.5570068359375, -0.15234375, 0.2523193359375, 0.656982421875, 1.0616455078125, 1.46630859375, 1.8709716796875, 2.275634765625, 2.6802978515625, 3.0849609375, 3.4896240234375, 3.894287109375, 4.2989501953125, 4.70361328125, 5.1082763671875, 5.512939453125, 5.9176025390625, 6.322265625, 6.7269287109375, 7.131591796875, 7.5362548828125, 7.94091796875, 8.3455810546875, 8.750244140625, 9.1549072265625, 9.5595703125, 9.9642333984375, 10.368896484375, 10.7735595703125, 11.17822265625, 11.5828857421875, 11.987548828125, 12.3922119140625, 12.796875]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 8.0, 11.0, 20.0, 36.0, 43.0, 60.0, 87.0, 173.0, 260.0, 418.0, 722.0, 1056.0, 1704.0, 2847.0, 4682.0, 7793.0, 13422.0, 23310.0, 41282.0, 74234.0, 136741.0, 249543.0, 445873.0, 719056.0, 870437.0, 678937.0, 410138.0, 227983.0, 124342.0, 67820.0, 38299.0, 21771.0, 12446.0, 7230.0, 4457.0, 2623.0, 1608.0, 1035.0, 588.0, 412.0, 261.0, 180.0, 130.0, 59.0, 58.0, 29.0, 17.0, 9.0, 10.0, 9.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0], "bins": [-22.703125, -21.980712890625, -21.25830078125, -20.535888671875, -19.8134765625, -19.091064453125, -18.36865234375, -17.646240234375, -16.923828125, -16.201416015625, -15.47900390625, -14.756591796875, -14.0341796875, -13.311767578125, -12.58935546875, -11.866943359375, -11.14453125, -10.422119140625, -9.69970703125, -8.977294921875, -8.2548828125, -7.532470703125, -6.81005859375, -6.087646484375, -5.365234375, -4.642822265625, -3.92041015625, -3.197998046875, -2.4755859375, -1.753173828125, -1.03076171875, -0.308349609375, 0.4140625, 1.136474609375, 1.85888671875, 2.581298828125, 3.3037109375, 4.026123046875, 4.74853515625, 5.470947265625, 6.193359375, 6.915771484375, 7.63818359375, 8.360595703125, 9.0830078125, 9.805419921875, 10.52783203125, 11.250244140625, 11.97265625, 12.695068359375, 13.41748046875, 14.139892578125, 14.8623046875, 15.584716796875, 16.30712890625, 17.029541015625, 17.751953125, 18.474365234375, 19.19677734375, 19.919189453125, 20.6416015625, 21.364013671875, 22.08642578125, 22.808837890625, 23.53125]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 6.0, 4.0, 10.0, 8.0, 12.0, 22.0, 26.0, 37.0, 48.0, 72.0, 74.0, 102.0, 121.0, 141.0, 192.0, 214.0, 261.0, 253.0, 299.0, 294.0, 275.0, 269.0, 246.0, 226.0, 160.0, 151.0, 120.0, 81.0, 92.0, 50.0, 58.0, 43.0, 31.0, 25.0, 19.0, 7.0, 9.0, 10.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5078125, -8.228271484375, -7.94873046875, -7.669189453125, -7.3896484375, -7.110107421875, -6.83056640625, -6.551025390625, -6.271484375, -5.991943359375, -5.71240234375, -5.432861328125, -5.1533203125, -4.873779296875, -4.59423828125, -4.314697265625, -4.03515625, -3.755615234375, -3.47607421875, -3.196533203125, -2.9169921875, -2.637451171875, -2.35791015625, -2.078369140625, -1.798828125, -1.519287109375, -1.23974609375, -0.960205078125, -0.6806640625, -0.401123046875, -0.12158203125, 0.157958984375, 0.4375, 0.717041015625, 0.99658203125, 1.276123046875, 1.5556640625, 1.835205078125, 2.11474609375, 2.394287109375, 2.673828125, 2.953369140625, 3.23291015625, 3.512451171875, 3.7919921875, 4.071533203125, 4.35107421875, 4.630615234375, 4.91015625, 5.189697265625, 5.46923828125, 5.748779296875, 6.0283203125, 6.307861328125, 6.58740234375, 6.866943359375, 7.146484375, 7.426025390625, 7.70556640625, 7.985107421875, 8.2646484375, 8.544189453125, 8.82373046875, 9.103271484375, 9.3828125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 9.0, 9.0, 8.0, 6.0, 17.0, 12.0, 20.0, 26.0, 32.0, 42.0, 50.0, 60.0, 62.0, 51.0, 85.0, 54.0, 61.0, 63.0, 59.0, 55.0, 41.0, 35.0, 30.0, 22.0, 20.0, 17.0, 17.0, 11.0, 8.0, 5.0, 3.0, 3.0, 5.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.959232330322266, -32.002872467041016, -31.0465087890625, -30.090147018432617, -29.133785247802734, -28.17742347717285, -27.22106170654297, -26.26470184326172, -25.308338165283203, -24.35197639465332, -23.395614624023438, -22.439252853393555, -21.482891082763672, -20.52652931213379, -19.570167541503906, -18.613807678222656, -17.657445907592773, -16.70108413696289, -15.744722366333008, -14.788360595703125, -13.831998825073242, -12.87563705444336, -11.919276237487793, -10.96291446685791, -10.006552696228027, -9.050190925598145, -8.093829154968262, -7.137467861175537, -6.181106090545654, -5.2247443199157715, -4.268383026123047, -3.312021255493164, -2.3556575775146484, -1.3992959260940552, -0.4429342746734619, 0.5134272575378418, 1.4697890281677246, 2.4261507987976074, 3.382512092590332, 4.338873863220215, 5.295235633850098, 6.2515974044799805, 7.207959175109863, 8.16431999206543, 9.120681762695312, 10.077043533325195, 11.033405303955078, 11.989767074584961, 12.946128845214844, 13.902490615844727, 14.85885238647461, 15.815214157104492, 16.771575927734375, 17.727937698364258, 18.68429946899414, 19.64065933227539, 20.597023010253906, 21.55338478088379, 22.509746551513672, 23.466108322143555, 24.422470092773438, 25.37883186340332, 26.335193634033203, 27.291553497314453, 28.247915267944336]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 1.0, 4.0, 3.0, 7.0, 12.0, 9.0, 14.0, 18.0, 13.0, 15.0, 17.0, 33.0, 33.0, 27.0, 40.0, 36.0, 32.0, 33.0, 45.0, 32.0, 37.0, 41.0, 48.0, 42.0, 35.0, 44.0, 45.0, 40.0, 33.0, 35.0, 29.0, 20.0, 19.0, 19.0, 17.0, 16.0, 14.0, 11.0, 7.0, 8.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-19.292423248291016, -18.728939056396484, -18.16545295715332, -17.60196876525879, -17.038482666015625, -16.474998474121094, -15.911514282226562, -15.348029136657715, -14.784543991088867, -14.22105884552002, -13.657573699951172, -13.09408950805664, -12.530604362487793, -11.967119216918945, -11.403635025024414, -10.840149879455566, -10.276664733886719, -9.713179588317871, -9.149694442749023, -8.586210250854492, -8.022725105285645, -7.459239959716797, -6.895755290985107, -6.332270622253418, -5.76878547668457, -5.205300331115723, -4.641815662384033, -4.078330993652344, -3.514845848083496, -2.9513609409332275, -2.387876033782959, -1.8243911266326904, -1.2609062194824219, -0.6974213123321533, -0.13393640518188477, 0.4295485019683838, 0.9930334091186523, 1.556518316268921, 2.1200032234191895, 2.683488130569458, 3.2469730377197266, 3.810457944869995, 4.373942852020264, 4.937427520751953, 5.500912666320801, 6.064397811889648, 6.627882480621338, 7.191367149353027, 7.754852294921875, 8.318337440490723, 8.88182258605957, 9.445306777954102, 10.00879192352295, 10.572277069091797, 11.135761260986328, 11.699246406555176, 12.262731552124023, 12.826216697692871, 13.389701843261719, 13.95318603515625, 14.516671180725098, 15.080156326293945, 15.643640518188477, 16.20712661743164, 16.770610809326172]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 7.0, 10.0, 13.0, 21.0, 23.0, 38.0, 51.0, 87.0, 149.0, 198.0, 258.0, 416.0, 678.0, 1032.0, 1501.0, 2448.0, 3892.0, 6362.0, 10782.0, 18914.0, 33600.0, 61275.0, 109124.0, 172749.0, 208047.0, 170437.0, 107018.0, 59974.0, 33217.0, 18779.0, 10590.0, 6318.0, 3744.0, 2332.0, 1493.0, 1033.0, 675.0, 405.0, 267.0, 181.0, 144.0, 86.0, 68.0, 44.0, 26.0, 17.0, 12.0, 8.0, 13.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.390625, -22.623291015625, -21.85595703125, -21.088623046875, -20.3212890625, -19.553955078125, -18.78662109375, -18.019287109375, -17.251953125, -16.484619140625, -15.71728515625, -14.949951171875, -14.1826171875, -13.415283203125, -12.64794921875, -11.880615234375, -11.11328125, -10.345947265625, -9.57861328125, -8.811279296875, -8.0439453125, -7.276611328125, -6.50927734375, -5.741943359375, -4.974609375, -4.207275390625, -3.43994140625, -2.672607421875, -1.9052734375, -1.137939453125, -0.37060546875, 0.396728515625, 1.1640625, 1.931396484375, 2.69873046875, 3.466064453125, 4.2333984375, 5.000732421875, 5.76806640625, 6.535400390625, 7.302734375, 8.070068359375, 8.83740234375, 9.604736328125, 10.3720703125, 11.139404296875, 11.90673828125, 12.674072265625, 13.44140625, 14.208740234375, 14.97607421875, 15.743408203125, 16.5107421875, 17.278076171875, 18.04541015625, 18.812744140625, 19.580078125, 20.347412109375, 21.11474609375, 21.882080078125, 22.6494140625, 23.416748046875, 24.18408203125, 24.951416015625, 25.71875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 6.0, 3.0, 7.0, 4.0, 10.0, 5.0, 7.0, 10.0, 15.0, 16.0, 15.0, 20.0, 27.0, 26.0, 33.0, 37.0, 31.0, 31.0, 36.0, 44.0, 39.0, 55.0, 36.0, 50.0, 30.0, 46.0, 46.0, 31.0, 40.0, 30.0, 33.0, 28.0, 29.0, 29.0, 21.0, 10.0, 10.0, 11.0, 9.0, 12.0, 8.0, 8.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-20.75, -20.166259765625, -19.58251953125, -18.998779296875, -18.4150390625, -17.831298828125, -17.24755859375, -16.663818359375, -16.080078125, -15.496337890625, -14.91259765625, -14.328857421875, -13.7451171875, -13.161376953125, -12.57763671875, -11.993896484375, -11.41015625, -10.826416015625, -10.24267578125, -9.658935546875, -9.0751953125, -8.491455078125, -7.90771484375, -7.323974609375, -6.740234375, -6.156494140625, -5.57275390625, -4.989013671875, -4.4052734375, -3.821533203125, -3.23779296875, -2.654052734375, -2.0703125, -1.486572265625, -0.90283203125, -0.319091796875, 0.2646484375, 0.848388671875, 1.43212890625, 2.015869140625, 2.599609375, 3.183349609375, 3.76708984375, 4.350830078125, 4.9345703125, 5.518310546875, 6.10205078125, 6.685791015625, 7.26953125, 7.853271484375, 8.43701171875, 9.020751953125, 9.6044921875, 10.188232421875, 10.77197265625, 11.355712890625, 11.939453125, 12.523193359375, 13.10693359375, 13.690673828125, 14.2744140625, 14.858154296875, 15.44189453125, 16.025634765625, 16.609375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 9.0, 8.0, 8.0, 10.0, 22.0, 29.0, 44.0, 80.0, 112.0, 152.0, 214.0, 362.0, 569.0, 820.0, 1457.0, 2630.0, 5186.0, 11282.0, 29827.0, 101025.0, 365164.0, 371429.0, 103709.0, 30946.0, 11532.0, 5281.0, 2727.0, 1406.0, 932.0, 568.0, 356.0, 192.0, 141.0, 103.0, 64.0, 54.0, 32.0, 20.0, 14.0, 13.0, 7.0, 8.0, 7.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-68.0, -66.0576171875, -64.115234375, -62.1728515625, -60.23046875, -58.2880859375, -56.345703125, -54.4033203125, -52.4609375, -50.5185546875, -48.576171875, -46.6337890625, -44.69140625, -42.7490234375, -40.806640625, -38.8642578125, -36.921875, -34.9794921875, -33.037109375, -31.0947265625, -29.15234375, -27.2099609375, -25.267578125, -23.3251953125, -21.3828125, -19.4404296875, -17.498046875, -15.5556640625, -13.61328125, -11.6708984375, -9.728515625, -7.7861328125, -5.84375, -3.9013671875, -1.958984375, -0.0166015625, 1.92578125, 3.8681640625, 5.810546875, 7.7529296875, 9.6953125, 11.6376953125, 13.580078125, 15.5224609375, 17.46484375, 19.4072265625, 21.349609375, 23.2919921875, 25.234375, 27.1767578125, 29.119140625, 31.0615234375, 33.00390625, 34.9462890625, 36.888671875, 38.8310546875, 40.7734375, 42.7158203125, 44.658203125, 46.6005859375, 48.54296875, 50.4853515625, 52.427734375, 54.3701171875, 56.3125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 6.0, 4.0, 5.0, 8.0, 10.0, 12.0, 15.0, 12.0, 13.0, 17.0, 22.0, 22.0, 20.0, 35.0, 32.0, 44.0, 42.0, 34.0, 50.0, 45.0, 37.0, 46.0, 55.0, 44.0, 35.0, 39.0, 40.0, 41.0, 32.0, 29.0, 33.0, 16.0, 17.0, 23.0, 16.0, 9.0, 14.0, 6.0, 7.0, 7.0, 8.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.9140625, -11.522216796875, -11.13037109375, -10.738525390625, -10.3466796875, -9.954833984375, -9.56298828125, -9.171142578125, -8.779296875, -8.387451171875, -7.99560546875, -7.603759765625, -7.2119140625, -6.820068359375, -6.42822265625, -6.036376953125, -5.64453125, -5.252685546875, -4.86083984375, -4.468994140625, -4.0771484375, -3.685302734375, -3.29345703125, -2.901611328125, -2.509765625, -2.117919921875, -1.72607421875, -1.334228515625, -0.9423828125, -0.550537109375, -0.15869140625, 0.233154296875, 0.625, 1.016845703125, 1.40869140625, 1.800537109375, 2.1923828125, 2.584228515625, 2.97607421875, 3.367919921875, 3.759765625, 4.151611328125, 4.54345703125, 4.935302734375, 5.3271484375, 5.718994140625, 6.11083984375, 6.502685546875, 6.89453125, 7.286376953125, 7.67822265625, 8.070068359375, 8.4619140625, 8.853759765625, 9.24560546875, 9.637451171875, 10.029296875, 10.421142578125, 10.81298828125, 11.204833984375, 11.5966796875, 11.988525390625, 12.38037109375, 12.772216796875, 13.1640625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 5.0, 2.0, 6.0, 10.0, 10.0, 17.0, 24.0, 26.0, 42.0, 57.0, 57.0, 78.0, 114.0, 121.0, 166.0, 231.0, 343.0, 404.0, 679.0, 881.0, 1244.0, 1998.0, 3012.0, 5015.0, 8555.0, 15847.0, 32252.0, 73205.0, 173359.0, 318032.0, 225611.0, 97421.0, 42110.0, 20242.0, 10602.0, 5928.0, 3614.0, 2228.0, 1419.0, 961.0, 694.0, 486.0, 352.0, 272.0, 205.0, 134.0, 126.0, 90.0, 75.0, 46.0, 45.0, 39.0, 22.0, 17.0, 13.0, 13.0, 4.0, 7.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-19.21875, -18.592041015625, -17.96533203125, -17.338623046875, -16.7119140625, -16.085205078125, -15.45849609375, -14.831787109375, -14.205078125, -13.578369140625, -12.95166015625, -12.324951171875, -11.6982421875, -11.071533203125, -10.44482421875, -9.818115234375, -9.19140625, -8.564697265625, -7.93798828125, -7.311279296875, -6.6845703125, -6.057861328125, -5.43115234375, -4.804443359375, -4.177734375, -3.551025390625, -2.92431640625, -2.297607421875, -1.6708984375, -1.044189453125, -0.41748046875, 0.209228515625, 0.8359375, 1.462646484375, 2.08935546875, 2.716064453125, 3.3427734375, 3.969482421875, 4.59619140625, 5.222900390625, 5.849609375, 6.476318359375, 7.10302734375, 7.729736328125, 8.3564453125, 8.983154296875, 9.60986328125, 10.236572265625, 10.86328125, 11.489990234375, 12.11669921875, 12.743408203125, 13.3701171875, 13.996826171875, 14.62353515625, 15.250244140625, 15.876953125, 16.503662109375, 17.13037109375, 17.757080078125, 18.3837890625, 19.010498046875, 19.63720703125, 20.263916015625, 20.890625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 7.0, 7.0, 15.0, 21.0, 40.0, 74.0, 152.0, 154.0, 189.0, 129.0, 81.0, 50.0, 26.0, 16.0, 7.0, 5.0, 6.0, 4.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018215179443359375, -0.0017646849155426025, -0.0017078518867492676, -0.0016510188579559326, -0.0015941858291625977, -0.0015373528003692627, -0.0014805197715759277, -0.0014236867427825928, -0.0013668537139892578, -0.0013100206851959229, -0.0012531876564025879, -0.001196354627609253, -0.001139521598815918, -0.001082688570022583, -0.001025855541229248, -0.0009690225124359131, -0.0009121894836425781, -0.0008553564548492432, -0.0007985234260559082, -0.0007416903972625732, -0.0006848573684692383, -0.0006280243396759033, -0.0005711913108825684, -0.0005143582820892334, -0.00045752525329589844, -0.0004006922245025635, -0.0003438591957092285, -0.00028702616691589355, -0.0002301931381225586, -0.00017336010932922363, -0.00011652708053588867, -5.969405174255371e-05, -2.86102294921875e-06, 5.397200584411621e-05, 0.00011080503463745117, 0.00016763806343078613, 0.0002244710922241211, 0.00028130412101745605, 0.000338137149810791, 0.000394970178604126, 0.00045180320739746094, 0.0005086362361907959, 0.0005654692649841309, 0.0006223022937774658, 0.0006791353225708008, 0.0007359683513641357, 0.0007928013801574707, 0.0008496344089508057, 0.0009064674377441406, 0.0009633004665374756, 0.0010201334953308105, 0.0010769665241241455, 0.0011337995529174805, 0.0011906325817108154, 0.0012474656105041504, 0.0013042986392974854, 0.0013611316680908203, 0.0014179646968841553, 0.0014747977256774902, 0.0015316307544708252, 0.0015884637832641602, 0.0016452968120574951, 0.00170212984085083, 0.001758962869644165, 0.0018157958984375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 6.0, 6.0, 7.0, 7.0, 12.0, 17.0, 25.0, 35.0, 37.0, 55.0, 88.0, 108.0, 188.0, 273.0, 371.0, 556.0, 876.0, 1487.0, 2583.0, 4644.0, 9812.0, 22382.0, 58083.0, 158866.0, 315917.0, 275410.0, 118389.0, 43577.0, 17204.0, 7813.0, 3912.0, 2135.0, 1297.0, 801.0, 499.0, 329.0, 216.0, 167.0, 91.0, 77.0, 44.0, 37.0, 31.0, 18.0, 25.0, 14.0, 15.0, 6.0, 6.0, 2.0, 0.0, 3.0], "bins": [-23.859375, -23.2119140625, -22.564453125, -21.9169921875, -21.26953125, -20.6220703125, -19.974609375, -19.3271484375, -18.6796875, -18.0322265625, -17.384765625, -16.7373046875, -16.08984375, -15.4423828125, -14.794921875, -14.1474609375, -13.5, -12.8525390625, -12.205078125, -11.5576171875, -10.91015625, -10.2626953125, -9.615234375, -8.9677734375, -8.3203125, -7.6728515625, -7.025390625, -6.3779296875, -5.73046875, -5.0830078125, -4.435546875, -3.7880859375, -3.140625, -2.4931640625, -1.845703125, -1.1982421875, -0.55078125, 0.0966796875, 0.744140625, 1.3916015625, 2.0390625, 2.6865234375, 3.333984375, 3.9814453125, 4.62890625, 5.2763671875, 5.923828125, 6.5712890625, 7.21875, 7.8662109375, 8.513671875, 9.1611328125, 9.80859375, 10.4560546875, 11.103515625, 11.7509765625, 12.3984375, 13.0458984375, 13.693359375, 14.3408203125, 14.98828125, 15.6357421875, 16.283203125, 16.9306640625, 17.578125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 7.0, 8.0, 5.0, 7.0, 9.0, 8.0, 11.0, 11.0, 16.0, 32.0, 32.0, 41.0, 48.0, 58.0, 69.0, 82.0, 73.0, 68.0, 90.0, 67.0, 58.0, 39.0, 37.0, 22.0, 16.0, 18.0, 15.0, 9.0, 6.0, 8.0, 7.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.97265625, -4.828857421875, -4.68505859375, -4.541259765625, -4.3974609375, -4.253662109375, -4.10986328125, -3.966064453125, -3.822265625, -3.678466796875, -3.53466796875, -3.390869140625, -3.2470703125, -3.103271484375, -2.95947265625, -2.815673828125, -2.671875, -2.528076171875, -2.38427734375, -2.240478515625, -2.0966796875, -1.952880859375, -1.80908203125, -1.665283203125, -1.521484375, -1.377685546875, -1.23388671875, -1.090087890625, -0.9462890625, -0.802490234375, -0.65869140625, -0.514892578125, -0.37109375, -0.227294921875, -0.08349609375, 0.060302734375, 0.2041015625, 0.347900390625, 0.49169921875, 0.635498046875, 0.779296875, 0.923095703125, 1.06689453125, 1.210693359375, 1.3544921875, 1.498291015625, 1.64208984375, 1.785888671875, 1.9296875, 2.073486328125, 2.21728515625, 2.361083984375, 2.5048828125, 2.648681640625, 2.79248046875, 2.936279296875, 3.080078125, 3.223876953125, 3.36767578125, 3.511474609375, 3.6552734375, 3.799072265625, 3.94287109375, 4.086669921875, 4.23046875]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 8.0, 10.0, 9.0, 15.0, 24.0, 26.0, 25.0, 39.0, 29.0, 41.0, 45.0, 61.0, 66.0, 75.0, 61.0, 64.0, 65.0, 59.0, 45.0, 52.0, 27.0, 25.0, 27.0, 24.0, 11.0, 13.0, 14.0, 9.0, 6.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.970867156982422, -31.039974212646484, -30.109081268310547, -29.17818832397461, -28.247295379638672, -27.316402435302734, -26.385509490966797, -25.45461654663086, -24.523723602294922, -23.592830657958984, -22.661937713623047, -21.73104476928711, -20.800151824951172, -19.869258880615234, -18.938365936279297, -18.00747299194336, -17.076580047607422, -16.145687103271484, -15.214794158935547, -14.28390121459961, -13.353008270263672, -12.422115325927734, -11.491222381591797, -10.56032943725586, -9.629434585571289, -8.698541641235352, -7.767648696899414, -6.836755752563477, -5.905862808227539, -4.974969387054443, -4.044076442718506, -3.1131834983825684, -2.182291030883789, -1.2513980865478516, -0.3205050230026245, 0.6103880405426025, 1.54128098487854, 2.4721741676330566, 3.403067111968994, 4.333960056304932, 5.264853000640869, 6.195745944976807, 7.126638889312744, 8.05753231048584, 8.988425254821777, 9.919318199157715, 10.850211143493652, 11.78110408782959, 12.711997032165527, 13.642889976501465, 14.573782920837402, 15.50467586517334, 16.435569763183594, 17.36646270751953, 18.29735565185547, 19.228248596191406, 20.159141540527344, 21.09003448486328, 22.02092742919922, 22.951820373535156, 23.882713317871094, 24.81360626220703, 25.74449920654297, 26.675392150878906, 27.606285095214844]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 5.0, 6.0, 14.0, 11.0, 13.0, 10.0, 18.0, 11.0, 22.0, 26.0, 20.0, 45.0, 32.0, 39.0, 27.0, 42.0, 31.0, 41.0, 35.0, 35.0, 36.0, 46.0, 45.0, 36.0, 43.0, 49.0, 33.0, 38.0, 17.0, 25.0, 24.0, 25.0, 20.0, 16.0, 15.0, 14.0, 4.0, 5.0, 6.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-18.145809173583984, -17.60721206665039, -17.068614959716797, -16.530019760131836, -15.991422653198242, -15.452825546264648, -14.914229393005371, -14.375633239746094, -13.8370361328125, -13.298439025878906, -12.759842872619629, -12.221246719360352, -11.682649612426758, -11.144052505493164, -10.605456352233887, -10.06686019897461, -9.528263092041016, -8.989665985107422, -8.451069831848145, -7.912473201751709, -7.373876571655273, -6.835279941558838, -6.296683311462402, -5.758086681365967, -5.219490051269531, -4.680893421173096, -4.14229679107666, -3.6037001609802246, -3.065103530883789, -2.5265069007873535, -1.987910270690918, -1.4493136405944824, -0.9107189178466797, -0.37212228775024414, 0.1664743423461914, 0.705070972442627, 1.2436676025390625, 1.782264232635498, 2.3208608627319336, 2.859457492828369, 3.3980541229248047, 3.9366507530212402, 4.475247383117676, 5.013844013214111, 5.552440643310547, 6.091037273406982, 6.629633903503418, 7.1682305335998535, 7.706827163696289, 8.245424270629883, 8.78402042388916, 9.322616577148438, 9.861213684082031, 10.399810791015625, 10.938406944274902, 11.47700309753418, 12.015600204467773, 12.554197311401367, 13.092793464660645, 13.631389617919922, 14.169986724853516, 14.70858383178711, 15.247179985046387, 15.785776138305664, 16.324373245239258]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 14.0, 16.0, 16.0, 25.0, 45.0, 58.0, 79.0, 108.0, 172.0, 266.0, 396.0, 596.0, 998.0, 1451.0, 2503.0, 3734.0, 6284.0, 10698.0, 17478.0, 29304.0, 48740.0, 77279.0, 116948.0, 154322.0, 167137.0, 141915.0, 100627.0, 65354.0, 40144.0, 24464.0, 14424.0, 8743.0, 5369.0, 3277.0, 2002.0, 1253.0, 838.0, 498.0, 329.0, 196.0, 130.0, 101.0, 77.0, 58.0, 31.0, 20.0, 18.0, 11.0, 5.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-23.34375, -22.621337890625, -21.89892578125, -21.176513671875, -20.4541015625, -19.731689453125, -19.00927734375, -18.286865234375, -17.564453125, -16.842041015625, -16.11962890625, -15.397216796875, -14.6748046875, -13.952392578125, -13.22998046875, -12.507568359375, -11.78515625, -11.062744140625, -10.34033203125, -9.617919921875, -8.8955078125, -8.173095703125, -7.45068359375, -6.728271484375, -6.005859375, -5.283447265625, -4.56103515625, -3.838623046875, -3.1162109375, -2.393798828125, -1.67138671875, -0.948974609375, -0.2265625, 0.495849609375, 1.21826171875, 1.940673828125, 2.6630859375, 3.385498046875, 4.10791015625, 4.830322265625, 5.552734375, 6.275146484375, 6.99755859375, 7.719970703125, 8.4423828125, 9.164794921875, 9.88720703125, 10.609619140625, 11.33203125, 12.054443359375, 12.77685546875, 13.499267578125, 14.2216796875, 14.944091796875, 15.66650390625, 16.388916015625, 17.111328125, 17.833740234375, 18.55615234375, 19.278564453125, 20.0009765625, 20.723388671875, 21.44580078125, 22.168212890625, 22.890625]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 3.0, 3.0, 4.0, 8.0, 14.0, 14.0, 19.0, 18.0, 16.0, 25.0, 36.0, 40.0, 30.0, 37.0, 50.0, 51.0, 36.0, 45.0, 50.0, 60.0, 51.0, 37.0, 51.0, 45.0, 44.0, 28.0, 41.0, 31.0, 27.0, 26.0, 17.0, 9.0, 8.0, 7.0, 6.0, 3.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.609375, -18.951171875, -18.29296875, -17.634765625, -16.9765625, -16.318359375, -15.66015625, -15.001953125, -14.34375, -13.685546875, -13.02734375, -12.369140625, -11.7109375, -11.052734375, -10.39453125, -9.736328125, -9.078125, -8.419921875, -7.76171875, -7.103515625, -6.4453125, -5.787109375, -5.12890625, -4.470703125, -3.8125, -3.154296875, -2.49609375, -1.837890625, -1.1796875, -0.521484375, 0.13671875, 0.794921875, 1.453125, 2.111328125, 2.76953125, 3.427734375, 4.0859375, 4.744140625, 5.40234375, 6.060546875, 6.71875, 7.376953125, 8.03515625, 8.693359375, 9.3515625, 10.009765625, 10.66796875, 11.326171875, 11.984375, 12.642578125, 13.30078125, 13.958984375, 14.6171875, 15.275390625, 15.93359375, 16.591796875, 17.25, 17.908203125, 18.56640625, 19.224609375, 19.8828125, 20.541015625, 21.19921875, 21.857421875, 22.515625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 8.0, 6.0, 19.0, 35.0, 43.0, 55.0, 108.0, 156.0, 241.0, 374.0, 593.0, 1005.0, 1577.0, 2650.0, 4147.0, 6965.0, 11021.0, 18442.0, 28703.0, 45381.0, 69061.0, 99694.0, 130789.0, 147207.0, 139926.0, 112702.0, 80903.0, 54508.0, 34617.0, 22066.0, 13531.0, 8324.0, 5238.0, 3180.0, 1981.0, 1296.0, 761.0, 448.0, 300.0, 160.0, 135.0, 86.0, 52.0, 25.0, 19.0, 13.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.65625, -17.099365234375, -16.54248046875, -15.985595703125, -15.4287109375, -14.871826171875, -14.31494140625, -13.758056640625, -13.201171875, -12.644287109375, -12.08740234375, -11.530517578125, -10.9736328125, -10.416748046875, -9.85986328125, -9.302978515625, -8.74609375, -8.189208984375, -7.63232421875, -7.075439453125, -6.5185546875, -5.961669921875, -5.40478515625, -4.847900390625, -4.291015625, -3.734130859375, -3.17724609375, -2.620361328125, -2.0634765625, -1.506591796875, -0.94970703125, -0.392822265625, 0.1640625, 0.720947265625, 1.27783203125, 1.834716796875, 2.3916015625, 2.948486328125, 3.50537109375, 4.062255859375, 4.619140625, 5.176025390625, 5.73291015625, 6.289794921875, 6.8466796875, 7.403564453125, 7.96044921875, 8.517333984375, 9.07421875, 9.631103515625, 10.18798828125, 10.744873046875, 11.3017578125, 11.858642578125, 12.41552734375, 12.972412109375, 13.529296875, 14.086181640625, 14.64306640625, 15.199951171875, 15.7568359375, 16.313720703125, 16.87060546875, 17.427490234375, 17.984375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 5.0, 8.0, 7.0, 17.0, 13.0, 17.0, 25.0, 25.0, 34.0, 36.0, 24.0, 39.0, 34.0, 34.0, 40.0, 45.0, 55.0, 50.0, 40.0, 48.0, 33.0, 41.0, 37.0, 39.0, 28.0, 29.0, 31.0, 21.0, 24.0, 18.0, 23.0, 18.0, 9.0, 13.0, 7.0, 9.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.046875, -11.6805419921875, -11.314208984375, -10.9478759765625, -10.58154296875, -10.2152099609375, -9.848876953125, -9.4825439453125, -9.1162109375, -8.7498779296875, -8.383544921875, -8.0172119140625, -7.65087890625, -7.2845458984375, -6.918212890625, -6.5518798828125, -6.185546875, -5.8192138671875, -5.452880859375, -5.0865478515625, -4.72021484375, -4.3538818359375, -3.987548828125, -3.6212158203125, -3.2548828125, -2.8885498046875, -2.522216796875, -2.1558837890625, -1.78955078125, -1.4232177734375, -1.056884765625, -0.6905517578125, -0.32421875, 0.0421142578125, 0.408447265625, 0.7747802734375, 1.14111328125, 1.5074462890625, 1.873779296875, 2.2401123046875, 2.6064453125, 2.9727783203125, 3.339111328125, 3.7054443359375, 4.07177734375, 4.4381103515625, 4.804443359375, 5.1707763671875, 5.537109375, 5.9034423828125, 6.269775390625, 6.6361083984375, 7.00244140625, 7.3687744140625, 7.735107421875, 8.1014404296875, 8.4677734375, 8.8341064453125, 9.200439453125, 9.5667724609375, 9.93310546875, 10.2994384765625, 10.665771484375, 11.0321044921875, 11.3984375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 2.0, 3.0, 7.0, 8.0, 11.0, 14.0, 22.0, 31.0, 51.0, 66.0, 99.0, 113.0, 175.0, 275.0, 353.0, 531.0, 847.0, 1348.0, 2094.0, 3087.0, 4952.0, 7676.0, 12482.0, 19936.0, 32705.0, 54208.0, 88267.0, 135683.0, 177069.0, 171387.0, 125971.0, 80762.0, 49143.0, 29690.0, 18351.0, 11241.0, 7040.0, 4406.0, 2805.0, 1895.0, 1206.0, 795.0, 561.0, 364.0, 242.0, 158.0, 124.0, 95.0, 56.0, 48.0, 32.0, 16.0, 16.0, 14.0, 13.0, 7.0, 2.0, 7.0, 3.0, 2.0, 1.0], "bins": [-14.3359375, -13.8865966796875, -13.437255859375, -12.9879150390625, -12.53857421875, -12.0892333984375, -11.639892578125, -11.1905517578125, -10.7412109375, -10.2918701171875, -9.842529296875, -9.3931884765625, -8.94384765625, -8.4945068359375, -8.045166015625, -7.5958251953125, -7.146484375, -6.6971435546875, -6.247802734375, -5.7984619140625, -5.34912109375, -4.8997802734375, -4.450439453125, -4.0010986328125, -3.5517578125, -3.1024169921875, -2.653076171875, -2.2037353515625, -1.75439453125, -1.3050537109375, -0.855712890625, -0.4063720703125, 0.04296875, 0.4923095703125, 0.941650390625, 1.3909912109375, 1.84033203125, 2.2896728515625, 2.739013671875, 3.1883544921875, 3.6376953125, 4.0870361328125, 4.536376953125, 4.9857177734375, 5.43505859375, 5.8843994140625, 6.333740234375, 6.7830810546875, 7.232421875, 7.6817626953125, 8.131103515625, 8.5804443359375, 9.02978515625, 9.4791259765625, 9.928466796875, 10.3778076171875, 10.8271484375, 11.2764892578125, 11.725830078125, 12.1751708984375, 12.62451171875, 13.0738525390625, 13.523193359375, 13.9725341796875, 14.421875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 5.0, 7.0, 9.0, 5.0, 11.0, 20.0, 26.0, 39.0, 71.0, 85.0, 106.0, 122.0, 120.0, 75.0, 91.0, 69.0, 43.0, 26.0, 20.0, 10.0, 10.0, 12.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020427703857421875, -0.001950383186340332, -0.0018579959869384766, -0.001765608787536621, -0.0016732215881347656, -0.0015808343887329102, -0.0014884471893310547, -0.0013960599899291992, -0.0013036727905273438, -0.0012112855911254883, -0.0011188983917236328, -0.0010265111923217773, -0.0009341239929199219, -0.0008417367935180664, -0.0007493495941162109, -0.0006569623947143555, -0.0005645751953125, -0.00047218799591064453, -0.00037980079650878906, -0.0002874135971069336, -0.00019502639770507812, -0.00010263919830322266, -1.0251998901367188e-05, 8.213520050048828e-05, 0.00017452239990234375, 0.0002669095993041992, 0.0003592967987060547, 0.00045168399810791016, 0.0005440711975097656, 0.0006364583969116211, 0.0007288455963134766, 0.000821232795715332, 0.0009136199951171875, 0.001006007194519043, 0.0010983943939208984, 0.001190781593322754, 0.0012831687927246094, 0.0013755559921264648, 0.0014679431915283203, 0.0015603303909301758, 0.0016527175903320312, 0.0017451047897338867, 0.0018374919891357422, 0.0019298791885375977, 0.002022266387939453, 0.0021146535873413086, 0.002207040786743164, 0.0022994279861450195, 0.002391815185546875, 0.0024842023849487305, 0.002576589584350586, 0.0026689767837524414, 0.002761363983154297, 0.0028537511825561523, 0.002946138381958008, 0.0030385255813598633, 0.0031309127807617188, 0.0032232999801635742, 0.0033156871795654297, 0.003408074378967285, 0.0035004615783691406, 0.003592848777770996, 0.0036852359771728516, 0.003777623176574707, 0.0038700103759765625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 17.0, 13.0, 21.0, 26.0, 29.0, 47.0, 85.0, 99.0, 150.0, 202.0, 290.0, 428.0, 618.0, 843.0, 1318.0, 1760.0, 2532.0, 3865.0, 5603.0, 8622.0, 13282.0, 20747.0, 32771.0, 52461.0, 81896.0, 120894.0, 155094.0, 160105.0, 130547.0, 91537.0, 58735.0, 36745.0, 23081.0, 14776.0, 9434.0, 6273.0, 4285.0, 2869.0, 1903.0, 1338.0, 931.0, 687.0, 498.0, 338.0, 242.0, 162.0, 115.0, 89.0, 42.0, 35.0, 31.0, 12.0, 20.0, 7.0, 8.0, 1.0, 5.0, 0.0, 1.0], "bins": [-12.1484375, -11.770263671875, -11.39208984375, -11.013916015625, -10.6357421875, -10.257568359375, -9.87939453125, -9.501220703125, -9.123046875, -8.744873046875, -8.36669921875, -7.988525390625, -7.6103515625, -7.232177734375, -6.85400390625, -6.475830078125, -6.09765625, -5.719482421875, -5.34130859375, -4.963134765625, -4.5849609375, -4.206787109375, -3.82861328125, -3.450439453125, -3.072265625, -2.694091796875, -2.31591796875, -1.937744140625, -1.5595703125, -1.181396484375, -0.80322265625, -0.425048828125, -0.046875, 0.331298828125, 0.70947265625, 1.087646484375, 1.4658203125, 1.843994140625, 2.22216796875, 2.600341796875, 2.978515625, 3.356689453125, 3.73486328125, 4.113037109375, 4.4912109375, 4.869384765625, 5.24755859375, 5.625732421875, 6.00390625, 6.382080078125, 6.76025390625, 7.138427734375, 7.5166015625, 7.894775390625, 8.27294921875, 8.651123046875, 9.029296875, 9.407470703125, 9.78564453125, 10.163818359375, 10.5419921875, 10.920166015625, 11.29833984375, 11.676513671875, 12.0546875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 6.0, 3.0, 5.0, 2.0, 6.0, 6.0, 10.0, 14.0, 13.0, 20.0, 17.0, 26.0, 23.0, 34.0, 39.0, 44.0, 55.0, 63.0, 52.0, 59.0, 72.0, 41.0, 48.0, 47.0, 47.0, 32.0, 26.0, 43.0, 17.0, 29.0, 24.0, 14.0, 12.0, 15.0, 13.0, 8.0, 5.0, 2.0, 5.0, 5.0, 1.0, 4.0, 0.0, 3.0, 3.0], "bins": [-5.84765625, -5.699462890625, -5.55126953125, -5.403076171875, -5.2548828125, -5.106689453125, -4.95849609375, -4.810302734375, -4.662109375, -4.513916015625, -4.36572265625, -4.217529296875, -4.0693359375, -3.921142578125, -3.77294921875, -3.624755859375, -3.4765625, -3.328369140625, -3.18017578125, -3.031982421875, -2.8837890625, -2.735595703125, -2.58740234375, -2.439208984375, -2.291015625, -2.142822265625, -1.99462890625, -1.846435546875, -1.6982421875, -1.550048828125, -1.40185546875, -1.253662109375, -1.10546875, -0.957275390625, -0.80908203125, -0.660888671875, -0.5126953125, -0.364501953125, -0.21630859375, -0.068115234375, 0.080078125, 0.228271484375, 0.37646484375, 0.524658203125, 0.6728515625, 0.821044921875, 0.96923828125, 1.117431640625, 1.265625, 1.413818359375, 1.56201171875, 1.710205078125, 1.8583984375, 2.006591796875, 2.15478515625, 2.302978515625, 2.451171875, 2.599365234375, 2.74755859375, 2.895751953125, 3.0439453125, 3.192138671875, 3.34033203125, 3.488525390625, 3.63671875]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 12.0, 9.0, 18.0, 22.0, 21.0, 25.0, 21.0, 46.0, 45.0, 49.0, 49.0, 62.0, 58.0, 68.0, 76.0, 57.0, 59.0, 45.0, 63.0, 36.0, 34.0, 29.0, 29.0, 16.0, 8.0, 14.0, 8.0, 2.0, 6.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.97602081298828, -30.03790283203125, -29.09978485107422, -28.161666870117188, -27.223548889160156, -26.285430908203125, -25.347312927246094, -24.409194946289062, -23.47107696533203, -22.532958984375, -21.59484100341797, -20.656723022460938, -19.718605041503906, -18.780487060546875, -17.842369079589844, -16.904251098632812, -15.966133117675781, -15.02801513671875, -14.089897155761719, -13.151779174804688, -12.213661193847656, -11.275543212890625, -10.337425231933594, -9.399307250976562, -8.461189270019531, -7.5230712890625, -6.584953308105469, -5.6468353271484375, -4.708717346191406, -3.770599365234375, -2.8324813842773438, -1.8943634033203125, -0.9562473297119141, -0.018129348754882812, 0.9199886322021484, 1.8581066131591797, 2.796224594116211, 3.734342575073242, 4.672460556030273, 5.610578536987305, 6.548696517944336, 7.486814498901367, 8.424932479858398, 9.36305046081543, 10.301168441772461, 11.239286422729492, 12.177404403686523, 13.115522384643555, 14.053640365600586, 14.991758346557617, 15.929876327514648, 16.86799430847168, 17.80611228942871, 18.744230270385742, 19.682348251342773, 20.620466232299805, 21.558584213256836, 22.496702194213867, 23.4348201751709, 24.37293815612793, 25.31105613708496, 26.249174118041992, 27.187292098999023, 28.125410079956055, 29.063528060913086]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 5.0, 0.0, 4.0, 1.0, 4.0, 5.0, 7.0, 6.0, 7.0, 9.0, 10.0, 13.0, 14.0, 21.0, 24.0, 34.0, 20.0, 23.0, 31.0, 31.0, 45.0, 40.0, 33.0, 34.0, 45.0, 32.0, 37.0, 53.0, 50.0, 29.0, 44.0, 34.0, 33.0, 42.0, 18.0, 26.0, 27.0, 19.0, 20.0, 14.0, 13.0, 14.0, 2.0, 9.0, 9.0, 7.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-17.848920822143555, -17.321720123291016, -16.79452133178711, -16.26732063293457, -15.740120887756348, -15.212921142578125, -14.685720443725586, -14.158520698547363, -13.63132095336914, -13.104121208190918, -12.576921463012695, -12.049720764160156, -11.522521018981934, -10.995321273803711, -10.468120574951172, -9.94092082977295, -9.413721084594727, -8.886521339416504, -8.359321594238281, -7.832120895385742, -7.3049211502075195, -6.777721405029297, -6.250521183013916, -5.723320960998535, -5.1961212158203125, -4.66892147064209, -4.141721248626709, -3.6145212650299072, -3.0873212814331055, -2.5601212978363037, -2.032921314239502, -1.5057213306427002, -0.9785223007202148, -0.4513223171234131, 0.07587766647338867, 0.6030776500701904, 1.1302776336669922, 1.657477617263794, 2.1846776008605957, 2.7118775844573975, 3.239077568054199, 3.766277551651001, 4.293477535247803, 4.820677757263184, 5.347877502441406, 5.875077247619629, 6.40227746963501, 6.929477691650391, 7.456677436828613, 7.983877182006836, 8.511077880859375, 9.038277626037598, 9.56547737121582, 10.092677116394043, 10.619876861572266, 11.147077560424805, 11.674277305603027, 12.20147705078125, 12.728677749633789, 13.255877494812012, 13.783077239990234, 14.310276985168457, 14.83747673034668, 15.364677429199219, 15.891877174377441]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 8.0, 9.0, 22.0, 28.0, 38.0, 43.0, 98.0, 137.0, 217.0, 296.0, 468.0, 752.0, 1148.0, 1680.0, 2782.0, 4465.0, 7223.0, 11697.0, 20046.0, 34415.0, 61549.0, 111691.0, 211138.0, 403587.0, 699685.0, 898662.0, 747450.0, 447110.0, 237355.0, 125895.0, 68493.0, 38589.0, 22362.0, 13181.0, 8233.0, 5059.0, 3196.0, 1963.0, 1281.0, 795.0, 513.0, 335.0, 214.0, 131.0, 90.0, 62.0, 34.0, 24.0, 13.0, 10.0, 10.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0], "bins": [-19.390625, -18.795654296875, -18.20068359375, -17.605712890625, -17.0107421875, -16.415771484375, -15.82080078125, -15.225830078125, -14.630859375, -14.035888671875, -13.44091796875, -12.845947265625, -12.2509765625, -11.656005859375, -11.06103515625, -10.466064453125, -9.87109375, -9.276123046875, -8.68115234375, -8.086181640625, -7.4912109375, -6.896240234375, -6.30126953125, -5.706298828125, -5.111328125, -4.516357421875, -3.92138671875, -3.326416015625, -2.7314453125, -2.136474609375, -1.54150390625, -0.946533203125, -0.3515625, 0.243408203125, 0.83837890625, 1.433349609375, 2.0283203125, 2.623291015625, 3.21826171875, 3.813232421875, 4.408203125, 5.003173828125, 5.59814453125, 6.193115234375, 6.7880859375, 7.383056640625, 7.97802734375, 8.572998046875, 9.16796875, 9.762939453125, 10.35791015625, 10.952880859375, 11.5478515625, 12.142822265625, 12.73779296875, 13.332763671875, 13.927734375, 14.522705078125, 15.11767578125, 15.712646484375, 16.3076171875, 16.902587890625, 17.49755859375, 18.092529296875, 18.6875]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 1.0, 6.0, 8.0, 9.0, 7.0, 12.0, 12.0, 17.0, 18.0, 30.0, 22.0, 24.0, 31.0, 36.0, 40.0, 31.0, 40.0, 31.0, 43.0, 52.0, 34.0, 55.0, 41.0, 35.0, 35.0, 31.0, 38.0, 31.0, 33.0, 34.0, 29.0, 25.0, 19.0, 21.0, 14.0, 12.0, 11.0, 7.0, 4.0, 7.0, 4.0, 3.0, 2.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2890625, -10.9088134765625, -10.528564453125, -10.1483154296875, -9.76806640625, -9.3878173828125, -9.007568359375, -8.6273193359375, -8.2470703125, -7.8668212890625, -7.486572265625, -7.1063232421875, -6.72607421875, -6.3458251953125, -5.965576171875, -5.5853271484375, -5.205078125, -4.8248291015625, -4.444580078125, -4.0643310546875, -3.68408203125, -3.3038330078125, -2.923583984375, -2.5433349609375, -2.1630859375, -1.7828369140625, -1.402587890625, -1.0223388671875, -0.64208984375, -0.2618408203125, 0.118408203125, 0.4986572265625, 0.87890625, 1.2591552734375, 1.639404296875, 2.0196533203125, 2.39990234375, 2.7801513671875, 3.160400390625, 3.5406494140625, 3.9208984375, 4.3011474609375, 4.681396484375, 5.0616455078125, 5.44189453125, 5.8221435546875, 6.202392578125, 6.5826416015625, 6.962890625, 7.3431396484375, 7.723388671875, 8.1036376953125, 8.48388671875, 8.8641357421875, 9.244384765625, 9.6246337890625, 10.0048828125, 10.3851318359375, 10.765380859375, 11.1456298828125, 11.52587890625, 11.9061279296875, 12.286376953125, 12.6666259765625, 13.046875]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 11.0, 8.0, 25.0, 30.0, 42.0, 60.0, 101.0, 187.0, 292.0, 416.0, 651.0, 1018.0, 1564.0, 2576.0, 4263.0, 6923.0, 11905.0, 19841.0, 33560.0, 58908.0, 104026.0, 184420.0, 324443.0, 541175.0, 770886.0, 782593.0, 558549.0, 337277.0, 192609.0, 108068.0, 61466.0, 35211.0, 20470.0, 12014.0, 7128.0, 4374.0, 2712.0, 1628.0, 991.0, 682.0, 424.0, 270.0, 172.0, 100.0, 75.0, 53.0, 25.0, 25.0, 15.0, 16.0, 6.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.671875, -17.08349609375, -16.4951171875, -15.90673828125, -15.318359375, -14.72998046875, -14.1416015625, -13.55322265625, -12.96484375, -12.37646484375, -11.7880859375, -11.19970703125, -10.611328125, -10.02294921875, -9.4345703125, -8.84619140625, -8.2578125, -7.66943359375, -7.0810546875, -6.49267578125, -5.904296875, -5.31591796875, -4.7275390625, -4.13916015625, -3.55078125, -2.96240234375, -2.3740234375, -1.78564453125, -1.197265625, -0.60888671875, -0.0205078125, 0.56787109375, 1.15625, 1.74462890625, 2.3330078125, 2.92138671875, 3.509765625, 4.09814453125, 4.6865234375, 5.27490234375, 5.86328125, 6.45166015625, 7.0400390625, 7.62841796875, 8.216796875, 8.80517578125, 9.3935546875, 9.98193359375, 10.5703125, 11.15869140625, 11.7470703125, 12.33544921875, 12.923828125, 13.51220703125, 14.1005859375, 14.68896484375, 15.27734375, 15.86572265625, 16.4541015625, 17.04248046875, 17.630859375, 18.21923828125, 18.8076171875, 19.39599609375, 19.984375]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 9.0, 5.0, 11.0, 14.0, 13.0, 19.0, 20.0, 28.0, 44.0, 48.0, 42.0, 61.0, 82.0, 94.0, 95.0, 120.0, 153.0, 162.0, 204.0, 194.0, 225.0, 236.0, 257.0, 215.0, 227.0, 192.0, 205.0, 181.0, 137.0, 133.0, 95.0, 92.0, 91.0, 76.0, 55.0, 55.0, 38.0, 23.0, 26.0, 13.0, 16.0, 14.0, 17.0, 7.0, 3.0, 4.0, 6.0, 5.0, 5.0, 1.0, 1.0, 2.0, 4.0, 3.0], "bins": [-5.875, -5.6947021484375, -5.514404296875, -5.3341064453125, -5.15380859375, -4.9735107421875, -4.793212890625, -4.6129150390625, -4.4326171875, -4.2523193359375, -4.072021484375, -3.8917236328125, -3.71142578125, -3.5311279296875, -3.350830078125, -3.1705322265625, -2.990234375, -2.8099365234375, -2.629638671875, -2.4493408203125, -2.26904296875, -2.0887451171875, -1.908447265625, -1.7281494140625, -1.5478515625, -1.3675537109375, -1.187255859375, -1.0069580078125, -0.82666015625, -0.6463623046875, -0.466064453125, -0.2857666015625, -0.10546875, 0.0748291015625, 0.255126953125, 0.4354248046875, 0.61572265625, 0.7960205078125, 0.976318359375, 1.1566162109375, 1.3369140625, 1.5172119140625, 1.697509765625, 1.8778076171875, 2.05810546875, 2.2384033203125, 2.418701171875, 2.5989990234375, 2.779296875, 2.9595947265625, 3.139892578125, 3.3201904296875, 3.50048828125, 3.6807861328125, 3.861083984375, 4.0413818359375, 4.2216796875, 4.4019775390625, 4.582275390625, 4.7625732421875, 4.94287109375, 5.1231689453125, 5.303466796875, 5.4837646484375, 5.6640625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 2.0, 7.0, 7.0, 6.0, 13.0, 15.0, 26.0, 28.0, 36.0, 41.0, 53.0, 51.0, 75.0, 86.0, 73.0, 88.0, 52.0, 74.0, 50.0, 48.0, 33.0, 32.0, 21.0, 26.0, 4.0, 16.0, 12.0, 7.0, 7.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-29.978443145751953, -29.03729820251465, -28.09615135192871, -27.155006408691406, -26.2138614654541, -25.272716522216797, -24.33156967163086, -23.390424728393555, -22.44927978515625, -21.508134841918945, -20.566987991333008, -19.625843048095703, -18.6846981048584, -17.743553161621094, -16.802406311035156, -15.861261367797852, -14.920114517211914, -13.978968620300293, -13.037823677062988, -12.096677780151367, -11.155532836914062, -10.214386940002441, -9.27324104309082, -8.332096099853516, -7.3909502029418945, -6.449804782867432, -5.508659362792969, -4.567513465881348, -3.6263680458068848, -2.685222625732422, -1.7440767288208008, -0.8029313087463379, 0.1382160186767578, 1.0793615579605103, 2.0205070972442627, 2.9616527557373047, 3.9027981758117676, 4.8439435958862305, 5.785089492797852, 6.7262349128723145, 7.667380332946777, 8.608526229858398, 9.549671173095703, 10.490817070007324, 11.431962966918945, 12.37310791015625, 13.314253807067871, 14.255399703979492, 15.196544647216797, 16.1376895904541, 17.07883644104004, 18.019981384277344, 18.96112632751465, 19.902271270751953, 20.84341812133789, 21.784563064575195, 22.7257080078125, 23.666852951049805, 24.607999801635742, 25.549144744873047, 26.49028968811035, 27.431434631347656, 28.372581481933594, 29.3137264251709, 30.254873275756836]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 8.0, 5.0, 14.0, 9.0, 20.0, 17.0, 22.0, 16.0, 32.0, 18.0, 24.0, 36.0, 31.0, 42.0, 38.0, 40.0, 41.0, 47.0, 47.0, 52.0, 50.0, 40.0, 38.0, 32.0, 40.0, 32.0, 29.0, 24.0, 23.0, 24.0, 16.0, 15.0, 16.0, 9.0, 9.0, 12.0, 4.0, 6.0, 5.0, 2.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.447772026062012, -15.009613037109375, -14.571454048156738, -14.133295059204102, -13.695135116577148, -13.256977081298828, -12.818817138671875, -12.380658149719238, -11.942499160766602, -11.504340171813965, -11.066181182861328, -10.628022193908691, -10.189863204956055, -9.751703262329102, -9.313544273376465, -8.875385284423828, -8.437226295471191, -7.999067306518555, -7.560908317565918, -7.122748851776123, -6.684589862823486, -6.24643087387085, -5.808271408081055, -5.370112419128418, -4.931953430175781, -4.4937944412231445, -4.055635452270508, -3.617475986480713, -3.179316997528076, -2.7411580085754395, -2.3029987812042236, -1.8648395538330078, -1.426680564880371, -0.9885214567184448, -0.5503623485565186, -0.11220324039459229, 0.325955867767334, 0.7641148567199707, 1.2022740840911865, 1.6404333114624023, 2.078592300415039, 2.516751289367676, 2.9549105167388916, 3.3930697441101074, 3.831228733062744, 4.269387722015381, 4.707547187805176, 5.1457061767578125, 5.583865165710449, 6.022024154663086, 6.460183143615723, 6.898342609405518, 7.336501598358154, 7.774660587310791, 8.212820053100586, 8.650979042053223, 9.08913803100586, 9.527297019958496, 9.965456008911133, 10.40361499786377, 10.841773986816406, 11.27993392944336, 11.718092918395996, 12.156251907348633, 12.59441089630127]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 4.0, 5.0, 7.0, 9.0, 22.0, 30.0, 39.0, 68.0, 99.0, 138.0, 255.0, 418.0, 708.0, 1266.0, 2312.0, 4535.0, 9445.0, 19870.0, 42956.0, 88470.0, 161694.0, 228097.0, 212543.0, 137940.0, 71881.0, 34063.0, 15960.0, 7550.0, 3625.0, 2004.0, 1014.0, 584.0, 394.0, 186.0, 130.0, 71.0, 53.0, 25.0, 25.0, 23.0, 20.0, 6.0, 3.0, 7.0, 7.0, 3.0, 1.0], "bins": [-23.21875, -22.62109375, -22.0234375, -21.42578125, -20.828125, -20.23046875, -19.6328125, -19.03515625, -18.4375, -17.83984375, -17.2421875, -16.64453125, -16.046875, -15.44921875, -14.8515625, -14.25390625, -13.65625, -13.05859375, -12.4609375, -11.86328125, -11.265625, -10.66796875, -10.0703125, -9.47265625, -8.875, -8.27734375, -7.6796875, -7.08203125, -6.484375, -5.88671875, -5.2890625, -4.69140625, -4.09375, -3.49609375, -2.8984375, -2.30078125, -1.703125, -1.10546875, -0.5078125, 0.08984375, 0.6875, 1.28515625, 1.8828125, 2.48046875, 3.078125, 3.67578125, 4.2734375, 4.87109375, 5.46875, 6.06640625, 6.6640625, 7.26171875, 7.859375, 8.45703125, 9.0546875, 9.65234375, 10.25, 10.84765625, 11.4453125, 12.04296875, 12.640625, 13.23828125, 13.8359375, 14.43359375, 15.03125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 4.0, 2.0, 9.0, 7.0, 10.0, 14.0, 17.0, 13.0, 24.0, 27.0, 23.0, 30.0, 25.0, 33.0, 34.0, 44.0, 32.0, 38.0, 46.0, 45.0, 48.0, 46.0, 40.0, 38.0, 40.0, 33.0, 32.0, 39.0, 24.0, 18.0, 31.0, 29.0, 20.0, 17.0, 17.0, 10.0, 4.0, 10.0, 7.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 4.0, 2.0], "bins": [-16.59375, -16.1480712890625, -15.702392578125, -15.2567138671875, -14.81103515625, -14.3653564453125, -13.919677734375, -13.4739990234375, -13.0283203125, -12.5826416015625, -12.136962890625, -11.6912841796875, -11.24560546875, -10.7999267578125, -10.354248046875, -9.9085693359375, -9.462890625, -9.0172119140625, -8.571533203125, -8.1258544921875, -7.68017578125, -7.2344970703125, -6.788818359375, -6.3431396484375, -5.8974609375, -5.4517822265625, -5.006103515625, -4.5604248046875, -4.11474609375, -3.6690673828125, -3.223388671875, -2.7777099609375, -2.33203125, -1.8863525390625, -1.440673828125, -0.9949951171875, -0.54931640625, -0.1036376953125, 0.342041015625, 0.7877197265625, 1.2333984375, 1.6790771484375, 2.124755859375, 2.5704345703125, 3.01611328125, 3.4617919921875, 3.907470703125, 4.3531494140625, 4.798828125, 5.2445068359375, 5.690185546875, 6.1358642578125, 6.58154296875, 7.0272216796875, 7.472900390625, 7.9185791015625, 8.3642578125, 8.8099365234375, 9.255615234375, 9.7012939453125, 10.14697265625, 10.5926513671875, 11.038330078125, 11.4840087890625, 11.9296875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 7.0, 2.0, 12.0, 12.0, 11.0, 27.0, 34.0, 51.0, 70.0, 120.0, 200.0, 327.0, 526.0, 982.0, 1755.0, 3346.0, 6190.0, 13110.0, 27371.0, 60249.0, 127837.0, 236837.0, 266083.0, 159365.0, 75566.0, 35308.0, 16326.0, 7895.0, 4046.0, 2102.0, 1132.0, 619.0, 373.0, 242.0, 169.0, 88.0, 48.0, 49.0, 19.0, 14.0, 13.0, 8.0, 5.0, 6.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-23.296875, -22.59423828125, -21.8916015625, -21.18896484375, -20.486328125, -19.78369140625, -19.0810546875, -18.37841796875, -17.67578125, -16.97314453125, -16.2705078125, -15.56787109375, -14.865234375, -14.16259765625, -13.4599609375, -12.75732421875, -12.0546875, -11.35205078125, -10.6494140625, -9.94677734375, -9.244140625, -8.54150390625, -7.8388671875, -7.13623046875, -6.43359375, -5.73095703125, -5.0283203125, -4.32568359375, -3.623046875, -2.92041015625, -2.2177734375, -1.51513671875, -0.8125, -0.10986328125, 0.5927734375, 1.29541015625, 1.998046875, 2.70068359375, 3.4033203125, 4.10595703125, 4.80859375, 5.51123046875, 6.2138671875, 6.91650390625, 7.619140625, 8.32177734375, 9.0244140625, 9.72705078125, 10.4296875, 11.13232421875, 11.8349609375, 12.53759765625, 13.240234375, 13.94287109375, 14.6455078125, 15.34814453125, 16.05078125, 16.75341796875, 17.4560546875, 18.15869140625, 18.861328125, 19.56396484375, 20.2666015625, 20.96923828125, 21.671875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 6.0, 9.0, 8.0, 11.0, 12.0, 10.0, 19.0, 16.0, 17.0, 20.0, 20.0, 27.0, 27.0, 29.0, 29.0, 34.0, 32.0, 40.0, 38.0, 36.0, 42.0, 39.0, 32.0, 41.0, 34.0, 39.0, 37.0, 38.0, 37.0, 31.0, 27.0, 28.0, 20.0, 15.0, 14.0, 10.0, 8.0, 18.0, 8.0, 7.0, 3.0, 6.0, 9.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.3125, -7.0711669921875, -6.829833984375, -6.5885009765625, -6.34716796875, -6.1058349609375, -5.864501953125, -5.6231689453125, -5.3818359375, -5.1405029296875, -4.899169921875, -4.6578369140625, -4.41650390625, -4.1751708984375, -3.933837890625, -3.6925048828125, -3.451171875, -3.2098388671875, -2.968505859375, -2.7271728515625, -2.48583984375, -2.2445068359375, -2.003173828125, -1.7618408203125, -1.5205078125, -1.2791748046875, -1.037841796875, -0.7965087890625, -0.55517578125, -0.3138427734375, -0.072509765625, 0.1688232421875, 0.41015625, 0.6514892578125, 0.892822265625, 1.1341552734375, 1.37548828125, 1.6168212890625, 1.858154296875, 2.0994873046875, 2.3408203125, 2.5821533203125, 2.823486328125, 3.0648193359375, 3.30615234375, 3.5474853515625, 3.788818359375, 4.0301513671875, 4.271484375, 4.5128173828125, 4.754150390625, 4.9954833984375, 5.23681640625, 5.4781494140625, 5.719482421875, 5.9608154296875, 6.2021484375, 6.4434814453125, 6.684814453125, 6.9261474609375, 7.16748046875, 7.4088134765625, 7.650146484375, 7.8914794921875, 8.1328125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 6.0, 8.0, 14.0, 12.0, 26.0, 40.0, 70.0, 109.0, 170.0, 247.0, 388.0, 634.0, 1020.0, 1881.0, 3208.0, 5762.0, 10770.0, 21674.0, 45625.0, 100446.0, 214045.0, 293346.0, 185170.0, 84835.0, 38826.0, 18645.0, 9446.0, 5219.0, 2752.0, 1606.0, 964.0, 595.0, 354.0, 220.0, 155.0, 80.0, 60.0, 44.0, 23.0, 23.0, 7.0, 13.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7265625, -11.35302734375, -10.9794921875, -10.60595703125, -10.232421875, -9.85888671875, -9.4853515625, -9.11181640625, -8.73828125, -8.36474609375, -7.9912109375, -7.61767578125, -7.244140625, -6.87060546875, -6.4970703125, -6.12353515625, -5.75, -5.37646484375, -5.0029296875, -4.62939453125, -4.255859375, -3.88232421875, -3.5087890625, -3.13525390625, -2.76171875, -2.38818359375, -2.0146484375, -1.64111328125, -1.267578125, -0.89404296875, -0.5205078125, -0.14697265625, 0.2265625, 0.60009765625, 0.9736328125, 1.34716796875, 1.720703125, 2.09423828125, 2.4677734375, 2.84130859375, 3.21484375, 3.58837890625, 3.9619140625, 4.33544921875, 4.708984375, 5.08251953125, 5.4560546875, 5.82958984375, 6.203125, 6.57666015625, 6.9501953125, 7.32373046875, 7.697265625, 8.07080078125, 8.4443359375, 8.81787109375, 9.19140625, 9.56494140625, 9.9384765625, 10.31201171875, 10.685546875, 11.05908203125, 11.4326171875, 11.80615234375, 12.1796875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 6.0, 2.0, 3.0, 5.0, 8.0, 11.0, 7.0, 15.0, 8.0, 31.0, 33.0, 50.0, 46.0, 44.0, 64.0, 53.0, 73.0, 64.0, 66.0, 63.0, 52.0, 62.0, 54.0, 36.0, 25.0, 28.0, 22.0, 23.0, 14.0, 9.0, 5.0, 6.0, 3.0, 6.0, 5.0, 7.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0004525184631347656, -0.0004387795925140381, -0.00042504072189331055, -0.000411301851272583, -0.00039756298065185547, -0.00038382411003112793, -0.0003700852394104004, -0.00035634636878967285, -0.0003426074981689453, -0.0003288686275482178, -0.00031512975692749023, -0.0003013908863067627, -0.00028765201568603516, -0.0002739131450653076, -0.0002601742744445801, -0.00024643540382385254, -0.000232696533203125, -0.00021895766258239746, -0.00020521879196166992, -0.00019147992134094238, -0.00017774105072021484, -0.0001640021800994873, -0.00015026330947875977, -0.00013652443885803223, -0.0001227855682373047, -0.00010904669761657715, -9.530782699584961e-05, -8.156895637512207e-05, -6.783008575439453e-05, -5.409121513366699e-05, -4.035234451293945e-05, -2.6613473892211914e-05, -1.2874603271484375e-05, 8.642673492431641e-07, 1.4603137969970703e-05, 2.8342008590698242e-05, 4.208087921142578e-05, 5.581974983215332e-05, 6.955862045288086e-05, 8.32974910736084e-05, 9.703636169433594e-05, 0.00011077523231506348, 0.00012451410293579102, 0.00013825297355651855, 0.0001519918441772461, 0.00016573071479797363, 0.00017946958541870117, 0.0001932084560394287, 0.00020694732666015625, 0.0002206861972808838, 0.00023442506790161133, 0.00024816393852233887, 0.0002619028091430664, 0.00027564167976379395, 0.0002893805503845215, 0.000303119421005249, 0.00031685829162597656, 0.0003305971622467041, 0.00034433603286743164, 0.0003580749034881592, 0.0003718137741088867, 0.00038555264472961426, 0.0003992915153503418, 0.00041303038597106934, 0.0004267692565917969]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 7.0, 15.0, 17.0, 21.0, 32.0, 51.0, 68.0, 109.0, 175.0, 263.0, 444.0, 729.0, 1176.0, 1987.0, 3424.0, 5740.0, 10252.0, 18431.0, 33547.0, 59727.0, 101245.0, 153565.0, 188641.0, 172928.0, 123220.0, 75111.0, 42843.0, 23817.0, 13081.0, 7376.0, 4215.0, 2496.0, 1510.0, 816.0, 550.0, 356.0, 202.0, 123.0, 93.0, 45.0, 36.0, 24.0, 16.0, 12.0, 6.0, 10.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.2109375, -6.97613525390625, -6.7413330078125, -6.50653076171875, -6.271728515625, -6.03692626953125, -5.8021240234375, -5.56732177734375, -5.33251953125, -5.09771728515625, -4.8629150390625, -4.62811279296875, -4.393310546875, -4.15850830078125, -3.9237060546875, -3.68890380859375, -3.4541015625, -3.21929931640625, -2.9844970703125, -2.74969482421875, -2.514892578125, -2.28009033203125, -2.0452880859375, -1.81048583984375, -1.57568359375, -1.34088134765625, -1.1060791015625, -0.87127685546875, -0.636474609375, -0.40167236328125, -0.1668701171875, 0.06793212890625, 0.302734375, 0.53753662109375, 0.7723388671875, 1.00714111328125, 1.241943359375, 1.47674560546875, 1.7115478515625, 1.94635009765625, 2.18115234375, 2.41595458984375, 2.6507568359375, 2.88555908203125, 3.120361328125, 3.35516357421875, 3.5899658203125, 3.82476806640625, 4.0595703125, 4.29437255859375, 4.5291748046875, 4.76397705078125, 4.998779296875, 5.23358154296875, 5.4683837890625, 5.70318603515625, 5.93798828125, 6.17279052734375, 6.4075927734375, 6.64239501953125, 6.877197265625, 7.11199951171875, 7.3468017578125, 7.58160400390625, 7.81640625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 7.0, 12.0, 12.0, 12.0, 15.0, 18.0, 18.0, 25.0, 35.0, 43.0, 33.0, 38.0, 53.0, 47.0, 51.0, 59.0, 56.0, 54.0, 54.0, 54.0, 46.0, 33.0, 42.0, 29.0, 22.0, 22.0, 17.0, 16.0, 14.0, 11.0, 8.0, 8.0, 7.0, 4.0, 4.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.125, -2.058868408203125, -1.99273681640625, -1.926605224609375, -1.8604736328125, -1.794342041015625, -1.72821044921875, -1.662078857421875, -1.595947265625, -1.529815673828125, -1.46368408203125, -1.397552490234375, -1.3314208984375, -1.265289306640625, -1.19915771484375, -1.133026123046875, -1.06689453125, -1.000762939453125, -0.93463134765625, -0.868499755859375, -0.8023681640625, -0.736236572265625, -0.67010498046875, -0.603973388671875, -0.537841796875, -0.471710205078125, -0.40557861328125, -0.339447021484375, -0.2733154296875, -0.207183837890625, -0.14105224609375, -0.074920654296875, -0.0087890625, 0.057342529296875, 0.12347412109375, 0.189605712890625, 0.2557373046875, 0.321868896484375, 0.38800048828125, 0.454132080078125, 0.520263671875, 0.586395263671875, 0.65252685546875, 0.718658447265625, 0.7847900390625, 0.850921630859375, 0.91705322265625, 0.983184814453125, 1.04931640625, 1.115447998046875, 1.18157958984375, 1.247711181640625, 1.3138427734375, 1.379974365234375, 1.44610595703125, 1.512237548828125, 1.578369140625, 1.644500732421875, 1.71063232421875, 1.776763916015625, 1.8428955078125, 1.909027099609375, 1.97515869140625, 2.041290283203125, 2.107421875]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 7.0, 8.0, 10.0, 8.0, 21.0, 42.0, 39.0, 46.0, 51.0, 69.0, 77.0, 84.0, 83.0, 71.0, 71.0, 60.0, 55.0, 37.0, 38.0, 29.0, 19.0, 16.0, 14.0, 14.0, 7.0, 2.0, 4.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-29.729543685913086, -28.753942489624023, -27.778343200683594, -26.80274200439453, -25.82714080810547, -24.85154151916504, -23.875940322875977, -22.900341033935547, -21.924739837646484, -20.949138641357422, -19.973539352416992, -18.99793815612793, -18.0223388671875, -17.046737670898438, -16.071136474609375, -15.095536231994629, -14.119935989379883, -13.144335746765137, -12.16873550415039, -11.193134307861328, -10.217534065246582, -9.241933822631836, -8.266332626342773, -7.290732383728027, -6.315132141113281, -5.339531898498535, -4.363931179046631, -3.3883306980133057, -2.4127302169799805, -1.4371299743652344, -0.4615292549133301, 0.5140714645385742, 1.4896736145019531, 2.4652740955352783, 3.4408745765686035, 4.416475296020508, 5.392075538635254, 6.36767578125, 7.343276500701904, 8.318877220153809, 9.294477462768555, 10.2700777053833, 11.245677947998047, 12.22127914428711, 13.196879386901855, 14.172479629516602, 15.148080825805664, 16.123680114746094, 17.099281311035156, 18.07488250732422, 19.05048179626465, 20.02608299255371, 21.00168228149414, 21.977283477783203, 22.952884674072266, 23.928485870361328, 24.904085159301758, 25.87968635559082, 26.85528564453125, 27.830886840820312, 28.806488037109375, 29.782087326049805, 30.757688522338867, 31.733287811279297, 32.70888900756836]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 7.0, 6.0, 6.0, 6.0, 7.0, 18.0, 11.0, 22.0, 14.0, 25.0, 24.0, 26.0, 25.0, 34.0, 36.0, 38.0, 35.0, 51.0, 45.0, 55.0, 44.0, 42.0, 57.0, 49.0, 33.0, 33.0, 39.0, 37.0, 24.0, 21.0, 27.0, 20.0, 21.0, 11.0, 13.0, 6.0, 7.0, 10.0, 7.0, 5.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.315722465515137, -14.86660099029541, -14.417479515075684, -13.968358039855957, -13.51923656463623, -13.070115089416504, -12.620992660522461, -12.171871185302734, -11.722749710083008, -11.273628234863281, -10.824506759643555, -10.375385284423828, -9.926263809204102, -9.477142333984375, -9.028020858764648, -8.578899383544922, -8.129777908325195, -7.680656433105469, -7.231534957885742, -6.782413482666016, -6.333292007446289, -5.8841705322265625, -5.435048580169678, -4.985927104949951, -4.536805629730225, -4.087684154510498, -3.6385626792907715, -3.189440965652466, -2.7403194904327393, -2.2911980152130127, -1.842076301574707, -1.3929548263549805, -0.9438333511352539, -0.49471181631088257, -0.04559028148651123, 0.4035313129425049, 0.8526527881622314, 1.301774263381958, 1.7508959770202637, 2.2000174522399902, 2.649138927459717, 3.0982604026794434, 3.54738187789917, 3.9965035915374756, 4.445625305175781, 4.894746780395508, 5.343868255615234, 5.792989730834961, 6.2421112060546875, 6.691232681274414, 7.140354156494141, 7.589475631713867, 8.038597106933594, 8.48771858215332, 8.936840057373047, 9.385961532592773, 9.8350830078125, 10.284204483032227, 10.733325958251953, 11.18244743347168, 11.631568908691406, 12.080690383911133, 12.52981185913086, 12.978933334350586, 13.428055763244629]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 6.0, 9.0, 7.0, 10.0, 15.0, 26.0, 48.0, 51.0, 80.0, 124.0, 193.0, 292.0, 456.0, 691.0, 1115.0, 1617.0, 2578.0, 4171.0, 6560.0, 10701.0, 17148.0, 27464.0, 42696.0, 65214.0, 93633.0, 122722.0, 140931.0, 138732.0, 117389.0, 87851.0, 59754.0, 39667.0, 24731.0, 15712.0, 9706.0, 6121.0, 3695.0, 2378.0, 1527.0, 931.0, 652.0, 403.0, 253.0, 176.0, 113.0, 82.0, 44.0, 31.0, 14.0, 15.0, 8.0, 11.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.015625, -13.546875, -13.078125, -12.609375, -12.140625, -11.671875, -11.203125, -10.734375, -10.265625, -9.796875, -9.328125, -8.859375, -8.390625, -7.921875, -7.453125, -6.984375, -6.515625, -6.046875, -5.578125, -5.109375, -4.640625, -4.171875, -3.703125, -3.234375, -2.765625, -2.296875, -1.828125, -1.359375, -0.890625, -0.421875, 0.046875, 0.515625, 0.984375, 1.453125, 1.921875, 2.390625, 2.859375, 3.328125, 3.796875, 4.265625, 4.734375, 5.203125, 5.671875, 6.140625, 6.609375, 7.078125, 7.546875, 8.015625, 8.484375, 8.953125, 9.421875, 9.890625, 10.359375, 10.828125, 11.296875, 11.765625, 12.234375, 12.703125, 13.171875, 13.640625, 14.109375, 14.578125, 15.046875, 15.515625, 15.984375]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 6.0, 5.0, 4.0, 3.0, 12.0, 8.0, 11.0, 13.0, 10.0, 20.0, 18.0, 31.0, 35.0, 28.0, 33.0, 45.0, 46.0, 33.0, 44.0, 43.0, 46.0, 50.0, 44.0, 41.0, 45.0, 29.0, 53.0, 38.0, 29.0, 36.0, 23.0, 24.0, 20.0, 11.0, 9.0, 15.0, 9.0, 10.0, 11.0, 5.0, 7.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.7265625, -15.252685546875, -14.77880859375, -14.304931640625, -13.8310546875, -13.357177734375, -12.88330078125, -12.409423828125, -11.935546875, -11.461669921875, -10.98779296875, -10.513916015625, -10.0400390625, -9.566162109375, -9.09228515625, -8.618408203125, -8.14453125, -7.670654296875, -7.19677734375, -6.722900390625, -6.2490234375, -5.775146484375, -5.30126953125, -4.827392578125, -4.353515625, -3.879638671875, -3.40576171875, -2.931884765625, -2.4580078125, -1.984130859375, -1.51025390625, -1.036376953125, -0.5625, -0.088623046875, 0.38525390625, 0.859130859375, 1.3330078125, 1.806884765625, 2.28076171875, 2.754638671875, 3.228515625, 3.702392578125, 4.17626953125, 4.650146484375, 5.1240234375, 5.597900390625, 6.07177734375, 6.545654296875, 7.01953125, 7.493408203125, 7.96728515625, 8.441162109375, 8.9150390625, 9.388916015625, 9.86279296875, 10.336669921875, 10.810546875, 11.284423828125, 11.75830078125, 12.232177734375, 12.7060546875, 13.179931640625, 13.65380859375, 14.127685546875, 14.6015625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 14.0, 16.0, 23.0, 43.0, 52.0, 88.0, 123.0, 205.0, 302.0, 503.0, 800.0, 1264.0, 2087.0, 3510.0, 5626.0, 9451.0, 15523.0, 25340.0, 40597.0, 62940.0, 92275.0, 124003.0, 146159.0, 145156.0, 121007.0, 89633.0, 60298.0, 38837.0, 24407.0, 14975.0, 8894.0, 5638.0, 3381.0, 2025.0, 1204.0, 826.0, 498.0, 310.0, 187.0, 128.0, 79.0, 43.0, 33.0, 27.0, 7.0, 6.0, 9.0, 5.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.515625, -13.064453125, -12.61328125, -12.162109375, -11.7109375, -11.259765625, -10.80859375, -10.357421875, -9.90625, -9.455078125, -9.00390625, -8.552734375, -8.1015625, -7.650390625, -7.19921875, -6.748046875, -6.296875, -5.845703125, -5.39453125, -4.943359375, -4.4921875, -4.041015625, -3.58984375, -3.138671875, -2.6875, -2.236328125, -1.78515625, -1.333984375, -0.8828125, -0.431640625, 0.01953125, 0.470703125, 0.921875, 1.373046875, 1.82421875, 2.275390625, 2.7265625, 3.177734375, 3.62890625, 4.080078125, 4.53125, 4.982421875, 5.43359375, 5.884765625, 6.3359375, 6.787109375, 7.23828125, 7.689453125, 8.140625, 8.591796875, 9.04296875, 9.494140625, 9.9453125, 10.396484375, 10.84765625, 11.298828125, 11.75, 12.201171875, 12.65234375, 13.103515625, 13.5546875, 14.005859375, 14.45703125, 14.908203125, 15.359375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 7.0, 7.0, 7.0, 15.0, 10.0, 18.0, 16.0, 15.0, 18.0, 22.0, 29.0, 33.0, 16.0, 40.0, 41.0, 30.0, 34.0, 36.0, 37.0, 45.0, 41.0, 41.0, 39.0, 49.0, 39.0, 39.0, 39.0, 37.0, 29.0, 32.0, 20.0, 26.0, 18.0, 19.0, 9.0, 10.0, 7.0, 8.0, 8.0, 7.0, 4.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.109375, -8.8173828125, -8.525390625, -8.2333984375, -7.94140625, -7.6494140625, -7.357421875, -7.0654296875, -6.7734375, -6.4814453125, -6.189453125, -5.8974609375, -5.60546875, -5.3134765625, -5.021484375, -4.7294921875, -4.4375, -4.1455078125, -3.853515625, -3.5615234375, -3.26953125, -2.9775390625, -2.685546875, -2.3935546875, -2.1015625, -1.8095703125, -1.517578125, -1.2255859375, -0.93359375, -0.6416015625, -0.349609375, -0.0576171875, 0.234375, 0.5263671875, 0.818359375, 1.1103515625, 1.40234375, 1.6943359375, 1.986328125, 2.2783203125, 2.5703125, 2.8623046875, 3.154296875, 3.4462890625, 3.73828125, 4.0302734375, 4.322265625, 4.6142578125, 4.90625, 5.1982421875, 5.490234375, 5.7822265625, 6.07421875, 6.3662109375, 6.658203125, 6.9501953125, 7.2421875, 7.5341796875, 7.826171875, 8.1181640625, 8.41015625, 8.7021484375, 8.994140625, 9.2861328125, 9.578125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 12.0, 11.0, 19.0, 37.0, 54.0, 57.0, 109.0, 165.0, 291.0, 478.0, 902.0, 1643.0, 2913.0, 5765.0, 11628.0, 24338.0, 51876.0, 107984.0, 199469.0, 254920.0, 190259.0, 101953.0, 48566.0, 22503.0, 10823.0, 5396.0, 2775.0, 1572.0, 850.0, 466.0, 283.0, 172.0, 100.0, 54.0, 45.0, 27.0, 20.0, 11.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-15.1875, -14.7335205078125, -14.279541015625, -13.8255615234375, -13.37158203125, -12.9176025390625, -12.463623046875, -12.0096435546875, -11.5556640625, -11.1016845703125, -10.647705078125, -10.1937255859375, -9.73974609375, -9.2857666015625, -8.831787109375, -8.3778076171875, -7.923828125, -7.4698486328125, -7.015869140625, -6.5618896484375, -6.10791015625, -5.6539306640625, -5.199951171875, -4.7459716796875, -4.2919921875, -3.8380126953125, -3.384033203125, -2.9300537109375, -2.47607421875, -2.0220947265625, -1.568115234375, -1.1141357421875, -0.66015625, -0.2061767578125, 0.247802734375, 0.7017822265625, 1.15576171875, 1.6097412109375, 2.063720703125, 2.5177001953125, 2.9716796875, 3.4256591796875, 3.879638671875, 4.3336181640625, 4.78759765625, 5.2415771484375, 5.695556640625, 6.1495361328125, 6.603515625, 7.0574951171875, 7.511474609375, 7.9654541015625, 8.41943359375, 8.8734130859375, 9.327392578125, 9.7813720703125, 10.2353515625, 10.6893310546875, 11.143310546875, 11.5972900390625, 12.05126953125, 12.5052490234375, 12.959228515625, 13.4132080078125, 13.8671875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 6.0, 12.0, 7.0, 11.0, 25.0, 31.0, 37.0, 45.0, 40.0, 69.0, 69.0, 78.0, 82.0, 72.0, 83.0, 61.0, 57.0, 37.0, 32.0, 27.0, 27.0, 15.0, 10.0, 15.0, 8.0, 7.0, 7.0, 2.0, 5.0, 3.0, 0.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0015783309936523438, -0.0015366077423095703, -0.0014948844909667969, -0.0014531612396240234, -0.00141143798828125, -0.0013697147369384766, -0.0013279914855957031, -0.0012862682342529297, -0.0012445449829101562, -0.0012028217315673828, -0.0011610984802246094, -0.001119375228881836, -0.0010776519775390625, -0.001035928726196289, -0.0009942054748535156, -0.0009524822235107422, -0.0009107589721679688, -0.0008690357208251953, -0.0008273124694824219, -0.0007855892181396484, -0.000743865966796875, -0.0007021427154541016, -0.0006604194641113281, -0.0006186962127685547, -0.0005769729614257812, -0.0005352497100830078, -0.0004935264587402344, -0.00045180320739746094, -0.0004100799560546875, -0.00036835670471191406, -0.0003266334533691406, -0.0002849102020263672, -0.00024318695068359375, -0.0002014636993408203, -0.00015974044799804688, -0.00011801719665527344, -7.62939453125e-05, -3.457069396972656e-05, 7.152557373046875e-06, 4.887580871582031e-05, 9.059906005859375e-05, 0.0001323223114013672, 0.00017404556274414062, 0.00021576881408691406, 0.0002574920654296875, 0.00029921531677246094, 0.0003409385681152344, 0.0003826618194580078, 0.00042438507080078125, 0.0004661083221435547, 0.0005078315734863281, 0.0005495548248291016, 0.000591278076171875, 0.0006330013275146484, 0.0006747245788574219, 0.0007164478302001953, 0.0007581710815429688, 0.0007998943328857422, 0.0008416175842285156, 0.0008833408355712891, 0.0009250640869140625, 0.0009667873382568359, 0.0010085105895996094, 0.0010502338409423828, 0.0010919570922851562]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 8.0, 4.0, 9.0, 16.0, 17.0, 25.0, 33.0, 61.0, 85.0, 128.0, 211.0, 284.0, 430.0, 688.0, 1051.0, 1741.0, 2922.0, 4852.0, 8167.0, 13799.0, 23679.0, 39870.0, 65667.0, 102419.0, 142858.0, 167724.0, 156435.0, 118234.0, 78251.0, 47995.0, 28806.0, 16846.0, 10083.0, 5976.0, 3456.0, 2083.0, 1318.0, 800.0, 512.0, 342.0, 202.0, 158.0, 92.0, 78.0, 40.0, 33.0, 22.0, 7.0, 11.0, 8.0, 11.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1328125, -8.8446044921875, -8.556396484375, -8.2681884765625, -7.97998046875, -7.6917724609375, -7.403564453125, -7.1153564453125, -6.8271484375, -6.5389404296875, -6.250732421875, -5.9625244140625, -5.67431640625, -5.3861083984375, -5.097900390625, -4.8096923828125, -4.521484375, -4.2332763671875, -3.945068359375, -3.6568603515625, -3.36865234375, -3.0804443359375, -2.792236328125, -2.5040283203125, -2.2158203125, -1.9276123046875, -1.639404296875, -1.3511962890625, -1.06298828125, -0.7747802734375, -0.486572265625, -0.1983642578125, 0.08984375, 0.3780517578125, 0.666259765625, 0.9544677734375, 1.24267578125, 1.5308837890625, 1.819091796875, 2.1072998046875, 2.3955078125, 2.6837158203125, 2.971923828125, 3.2601318359375, 3.54833984375, 3.8365478515625, 4.124755859375, 4.4129638671875, 4.701171875, 4.9893798828125, 5.277587890625, 5.5657958984375, 5.85400390625, 6.1422119140625, 6.430419921875, 6.7186279296875, 7.0068359375, 7.2950439453125, 7.583251953125, 7.8714599609375, 8.15966796875, 8.4478759765625, 8.736083984375, 9.0242919921875, 9.3125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 5.0, 9.0, 14.0, 10.0, 24.0, 29.0, 41.0, 42.0, 53.0, 67.0, 78.0, 88.0, 76.0, 73.0, 78.0, 65.0, 62.0, 56.0, 37.0, 27.0, 17.0, 11.0, 10.0, 4.0, 5.0, 2.0, 2.0, 5.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.703125, -4.5491943359375, -4.395263671875, -4.2413330078125, -4.08740234375, -3.9334716796875, -3.779541015625, -3.6256103515625, -3.4716796875, -3.3177490234375, -3.163818359375, -3.0098876953125, -2.85595703125, -2.7020263671875, -2.548095703125, -2.3941650390625, -2.240234375, -2.0863037109375, -1.932373046875, -1.7784423828125, -1.62451171875, -1.4705810546875, -1.316650390625, -1.1627197265625, -1.0087890625, -0.8548583984375, -0.700927734375, -0.5469970703125, -0.39306640625, -0.2391357421875, -0.085205078125, 0.0687255859375, 0.22265625, 0.3765869140625, 0.530517578125, 0.6844482421875, 0.83837890625, 0.9923095703125, 1.146240234375, 1.3001708984375, 1.4541015625, 1.6080322265625, 1.761962890625, 1.9158935546875, 2.06982421875, 2.2237548828125, 2.377685546875, 2.5316162109375, 2.685546875, 2.8394775390625, 2.993408203125, 3.1473388671875, 3.30126953125, 3.4552001953125, 3.609130859375, 3.7630615234375, 3.9169921875, 4.0709228515625, 4.224853515625, 4.3787841796875, 4.53271484375, 4.6866455078125, 4.840576171875, 4.9945068359375, 5.1484375]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 6.0, 7.0, 10.0, 18.0, 23.0, 26.0, 40.0, 34.0, 41.0, 56.0, 60.0, 79.0, 94.0, 75.0, 80.0, 47.0, 49.0, 49.0, 49.0, 37.0, 21.0, 25.0, 18.0, 13.0, 11.0, 8.0, 8.0, 5.0, 2.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.850130081176758, -27.93405532836914, -27.017980575561523, -26.101905822753906, -25.18583106994629, -24.269756317138672, -23.353683471679688, -22.437606811523438, -21.521533966064453, -20.605459213256836, -19.68938446044922, -18.7733097076416, -17.857234954833984, -16.941160202026367, -16.02508544921875, -15.10901165008545, -14.192935943603516, -13.276861190795898, -12.360786437988281, -11.444711685180664, -10.528636932373047, -9.61256217956543, -8.696488380432129, -7.780413627624512, -6.8643388748168945, -5.948264122009277, -5.03218936920166, -4.116115093231201, -3.200040340423584, -2.283965587615967, -1.3678913116455078, -0.4518165588378906, 0.4642601013183594, 1.380334734916687, 2.2964093685150146, 3.2124838829040527, 4.12855863571167, 5.044633388519287, 5.960707664489746, 6.876782417297363, 7.7928571701049805, 8.708931922912598, 9.625006675720215, 10.541080474853516, 11.457155227661133, 12.37322998046875, 13.289304733276367, 14.205379486083984, 15.121454238891602, 16.03752899169922, 16.953603744506836, 17.869678497314453, 18.78575325012207, 19.701828002929688, 20.617900848388672, 21.533977508544922, 22.450050354003906, 23.366125106811523, 24.28219985961914, 25.198274612426758, 26.114349365234375, 27.030424118041992, 27.94649887084961, 28.862571716308594, 29.778648376464844]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 7.0, 6.0, 6.0, 8.0, 14.0, 11.0, 13.0, 25.0, 23.0, 25.0, 19.0, 35.0, 30.0, 29.0, 37.0, 40.0, 52.0, 42.0, 51.0, 45.0, 46.0, 38.0, 47.0, 34.0, 44.0, 49.0, 27.0, 31.0, 27.0, 26.0, 25.0, 11.0, 16.0, 15.0, 10.0, 9.0, 6.0, 9.0, 5.0, 5.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.063613891601562, -15.586197853088379, -15.108782768249512, -14.631366729736328, -14.153950691223145, -13.676534652709961, -13.199119567871094, -12.72170352935791, -12.244287490844727, -11.766871452331543, -11.289456367492676, -10.812040328979492, -10.334624290466309, -9.857208251953125, -9.379793167114258, -8.902377128601074, -8.42496109008789, -7.947545528411865, -7.470129489898682, -6.992713928222656, -6.515297889709473, -6.037882328033447, -5.560466766357422, -5.083050727844238, -4.605635643005371, -4.128220081329346, -3.650804042816162, -3.1733884811401367, -2.695972442626953, -2.2185568809509277, -1.7411410808563232, -1.2637252807617188, -0.7863092422485352, -0.30889347195625305, 0.16852229833602905, 0.6459380388259888, 1.1233538389205933, 1.6007695198059082, 2.0781853199005127, 2.555601119995117, 3.0330169200897217, 3.510432720184326, 3.9878485202789307, 4.465264320373535, 4.9426798820495605, 5.420095443725586, 5.8975114822387695, 6.374927520751953, 6.8523430824279785, 7.329758644104004, 7.8071746826171875, 8.284590721130371, 8.762005805969238, 9.239421844482422, 9.716837882995605, 10.194253921508789, 10.671669006347656, 11.14908504486084, 11.626500129699707, 12.10391616821289, 12.581332206726074, 13.058748245239258, 13.536163330078125, 14.013579368591309, 14.490995407104492]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 7.0, 4.0, 4.0, 10.0, 11.0, 22.0, 30.0, 41.0, 58.0, 84.0, 136.0, 178.0, 305.0, 460.0, 797.0, 1301.0, 2123.0, 3553.0, 6592.0, 12129.0, 22876.0, 45786.0, 96648.0, 215759.0, 501709.0, 1000826.0, 1121214.0, 640720.0, 278849.0, 122940.0, 57372.0, 28396.0, 14436.0, 7876.0, 4346.0, 2548.0, 1534.0, 897.0, 587.0, 373.0, 243.0, 185.0, 115.0, 64.0, 52.0, 31.0, 17.0, 20.0, 4.0, 10.0, 2.0, 6.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.75, -19.072509765625, -18.39501953125, -17.717529296875, -17.0400390625, -16.362548828125, -15.68505859375, -15.007568359375, -14.330078125, -13.652587890625, -12.97509765625, -12.297607421875, -11.6201171875, -10.942626953125, -10.26513671875, -9.587646484375, -8.91015625, -8.232666015625, -7.55517578125, -6.877685546875, -6.2001953125, -5.522705078125, -4.84521484375, -4.167724609375, -3.490234375, -2.812744140625, -2.13525390625, -1.457763671875, -0.7802734375, -0.102783203125, 0.57470703125, 1.252197265625, 1.9296875, 2.607177734375, 3.28466796875, 3.962158203125, 4.6396484375, 5.317138671875, 5.99462890625, 6.672119140625, 7.349609375, 8.027099609375, 8.70458984375, 9.382080078125, 10.0595703125, 10.737060546875, 11.41455078125, 12.092041015625, 12.76953125, 13.447021484375, 14.12451171875, 14.802001953125, 15.4794921875, 16.156982421875, 16.83447265625, 17.511962890625, 18.189453125, 18.866943359375, 19.54443359375, 20.221923828125, 20.8994140625, 21.576904296875, 22.25439453125, 22.931884765625, 23.609375]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 5.0, 8.0, 4.0, 9.0, 5.0, 7.0, 12.0, 15.0, 22.0, 20.0, 26.0, 24.0, 24.0, 30.0, 31.0, 28.0, 30.0, 45.0, 43.0, 41.0, 42.0, 40.0, 37.0, 44.0, 47.0, 39.0, 35.0, 29.0, 31.0, 30.0, 30.0, 31.0, 25.0, 16.0, 16.0, 16.0, 10.0, 11.0, 7.0, 10.0, 9.0, 3.0, 4.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0], "bins": [-11.3125, -11.003173828125, -10.69384765625, -10.384521484375, -10.0751953125, -9.765869140625, -9.45654296875, -9.147216796875, -8.837890625, -8.528564453125, -8.21923828125, -7.909912109375, -7.6005859375, -7.291259765625, -6.98193359375, -6.672607421875, -6.36328125, -6.053955078125, -5.74462890625, -5.435302734375, -5.1259765625, -4.816650390625, -4.50732421875, -4.197998046875, -3.888671875, -3.579345703125, -3.27001953125, -2.960693359375, -2.6513671875, -2.342041015625, -2.03271484375, -1.723388671875, -1.4140625, -1.104736328125, -0.79541015625, -0.486083984375, -0.1767578125, 0.132568359375, 0.44189453125, 0.751220703125, 1.060546875, 1.369873046875, 1.67919921875, 1.988525390625, 2.2978515625, 2.607177734375, 2.91650390625, 3.225830078125, 3.53515625, 3.844482421875, 4.15380859375, 4.463134765625, 4.7724609375, 5.081787109375, 5.39111328125, 5.700439453125, 6.009765625, 6.319091796875, 6.62841796875, 6.937744140625, 7.2470703125, 7.556396484375, 7.86572265625, 8.175048828125, 8.484375]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 5.0, 10.0, 7.0, 12.0, 37.0, 31.0, 63.0, 82.0, 129.0, 230.0, 305.0, 533.0, 819.0, 1419.0, 2346.0, 4012.0, 7208.0, 13144.0, 25066.0, 49075.0, 97280.0, 198694.0, 403904.0, 759442.0, 1038040.0, 770654.0, 412691.0, 202435.0, 99913.0, 49822.0, 25820.0, 13598.0, 7268.0, 4167.0, 2378.0, 1389.0, 887.0, 492.0, 309.0, 196.0, 126.0, 86.0, 59.0, 37.0, 29.0, 18.0, 7.0, 9.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-21.203125, -20.551025390625, -19.89892578125, -19.246826171875, -18.5947265625, -17.942626953125, -17.29052734375, -16.638427734375, -15.986328125, -15.334228515625, -14.68212890625, -14.030029296875, -13.3779296875, -12.725830078125, -12.07373046875, -11.421630859375, -10.76953125, -10.117431640625, -9.46533203125, -8.813232421875, -8.1611328125, -7.509033203125, -6.85693359375, -6.204833984375, -5.552734375, -4.900634765625, -4.24853515625, -3.596435546875, -2.9443359375, -2.292236328125, -1.64013671875, -0.988037109375, -0.3359375, 0.316162109375, 0.96826171875, 1.620361328125, 2.2724609375, 2.924560546875, 3.57666015625, 4.228759765625, 4.880859375, 5.532958984375, 6.18505859375, 6.837158203125, 7.4892578125, 8.141357421875, 8.79345703125, 9.445556640625, 10.09765625, 10.749755859375, 11.40185546875, 12.053955078125, 12.7060546875, 13.358154296875, 14.01025390625, 14.662353515625, 15.314453125, 15.966552734375, 16.61865234375, 17.270751953125, 17.9228515625, 18.574951171875, 19.22705078125, 19.879150390625, 20.53125]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 8.0, 4.0, 7.0, 9.0, 17.0, 24.0, 28.0, 31.0, 40.0, 62.0, 83.0, 110.0, 119.0, 157.0, 189.0, 231.0, 270.0, 283.0, 307.0, 290.0, 315.0, 272.0, 226.0, 188.0, 183.0, 127.0, 126.0, 76.0, 67.0, 56.0, 47.0, 30.0, 23.0, 23.0, 13.0, 22.0, 5.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.7421875, -6.53192138671875, -6.3216552734375, -6.11138916015625, -5.901123046875, -5.69085693359375, -5.4805908203125, -5.27032470703125, -5.06005859375, -4.84979248046875, -4.6395263671875, -4.42926025390625, -4.218994140625, -4.00872802734375, -3.7984619140625, -3.58819580078125, -3.3779296875, -3.16766357421875, -2.9573974609375, -2.74713134765625, -2.536865234375, -2.32659912109375, -2.1163330078125, -1.90606689453125, -1.69580078125, -1.48553466796875, -1.2752685546875, -1.06500244140625, -0.854736328125, -0.64447021484375, -0.4342041015625, -0.22393798828125, -0.013671875, 0.19659423828125, 0.4068603515625, 0.61712646484375, 0.827392578125, 1.03765869140625, 1.2479248046875, 1.45819091796875, 1.66845703125, 1.87872314453125, 2.0889892578125, 2.29925537109375, 2.509521484375, 2.71978759765625, 2.9300537109375, 3.14031982421875, 3.3505859375, 3.56085205078125, 3.7711181640625, 3.98138427734375, 4.191650390625, 4.40191650390625, 4.6121826171875, 4.82244873046875, 5.03271484375, 5.24298095703125, 5.4532470703125, 5.66351318359375, 5.873779296875, 6.08404541015625, 6.2943115234375, 6.50457763671875, 6.71484375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 11.0, 4.0, 7.0, 9.0, 6.0, 31.0, 25.0, 33.0, 33.0, 39.0, 45.0, 38.0, 45.0, 56.0, 72.0, 48.0, 56.0, 53.0, 54.0, 38.0, 47.0, 37.0, 42.0, 28.0, 31.0, 16.0, 16.0, 15.0, 12.0, 6.0, 11.0, 6.0, 4.0, 8.0, 5.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.8176326751709, -19.158353805541992, -18.499074935913086, -17.839797973632812, -17.180519104003906, -16.521240234375, -15.861961364746094, -15.202682495117188, -14.543403625488281, -13.884124755859375, -13.224846839904785, -12.565567970275879, -11.906289100646973, -11.247011184692383, -10.587732315063477, -9.92845344543457, -9.26917552947998, -8.609896659851074, -7.950618267059326, -7.291339874267578, -6.632061004638672, -5.972782611846924, -5.313504219055176, -4.6542253494262695, -3.9949469566345215, -3.3356683254241943, -2.676389694213867, -2.017111301422119, -1.357832670211792, -0.6985540390014648, -0.0392756462097168, 0.6200032234191895, 1.2792816162109375, 1.9385602474212646, 2.597838878631592, 3.25711727142334, 3.916395902633667, 4.575674533843994, 5.234952926635742, 5.894231796264648, 6.5535101890563965, 7.2127885818481445, 7.872067451477051, 8.53134536743164, 9.190624237060547, 9.849903106689453, 10.50918197631836, 11.168460845947266, 11.827738761901855, 12.487017631530762, 13.146295547485352, 13.805574417114258, 14.464853286743164, 15.12413215637207, 15.78341007232666, 16.44268798828125, 17.101966857910156, 17.761245727539062, 18.42052459716797, 19.079803466796875, 19.73908042907715, 20.398359298706055, 21.05763816833496, 21.716917037963867, 22.376195907592773]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 5.0, 10.0, 9.0, 9.0, 13.0, 24.0, 17.0, 25.0, 31.0, 27.0, 38.0, 39.0, 32.0, 40.0, 50.0, 44.0, 50.0, 53.0, 44.0, 47.0, 51.0, 39.0, 37.0, 46.0, 43.0, 37.0, 25.0, 22.0, 13.0, 19.0, 18.0, 10.0, 10.0, 5.0, 2.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-14.765066146850586, -14.335415840148926, -13.905765533447266, -13.476116180419922, -13.046465873718262, -12.616815567016602, -12.187166213989258, -11.757515907287598, -11.327865600585938, -10.898215293884277, -10.468564987182617, -10.038915634155273, -9.609265327453613, -9.179615020751953, -8.74996566772461, -8.32031536102295, -7.890665054321289, -7.461014747619629, -7.031364917755127, -6.601715087890625, -6.172064781188965, -5.742414474487305, -5.312764644622803, -4.883114814758301, -4.453464508056641, -4.0238142013549805, -3.5941643714904785, -3.1645143032073975, -2.7348642349243164, -2.3052141666412354, -1.8755640983581543, -1.4459140300750732, -1.0162630081176758, -0.5866129398345947, -0.15696287155151367, 0.2726871967315674, 0.7023372650146484, 1.1319873332977295, 1.5616374015808105, 1.9912874698638916, 2.4209375381469727, 2.8505876064300537, 3.2802376747131348, 3.709887742996216, 4.139537811279297, 4.569188117980957, 4.998837947845459, 5.428487777709961, 5.858138084411621, 6.287788391113281, 6.717438220977783, 7.147088050842285, 7.576738357543945, 8.006388664245605, 8.436038970947266, 8.86568832397461, 9.29533863067627, 9.72498893737793, 10.154638290405273, 10.584288597106934, 11.013938903808594, 11.443589210510254, 11.873239517211914, 12.302888870239258, 12.732539176940918]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 10.0, 10.0, 16.0, 10.0, 23.0, 43.0, 56.0, 80.0, 107.0, 202.0, 307.0, 489.0, 860.0, 1445.0, 2606.0, 4678.0, 8738.0, 16421.0, 31892.0, 59183.0, 106245.0, 167913.0, 205160.0, 179278.0, 118160.0, 67541.0, 35649.0, 18966.0, 9910.0, 5389.0, 2977.0, 1691.0, 946.0, 580.0, 358.0, 201.0, 140.0, 94.0, 58.0, 42.0, 29.0, 20.0, 13.0, 6.0, 5.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.6875, -13.240234375, -12.79296875, -12.345703125, -11.8984375, -11.451171875, -11.00390625, -10.556640625, -10.109375, -9.662109375, -9.21484375, -8.767578125, -8.3203125, -7.873046875, -7.42578125, -6.978515625, -6.53125, -6.083984375, -5.63671875, -5.189453125, -4.7421875, -4.294921875, -3.84765625, -3.400390625, -2.953125, -2.505859375, -2.05859375, -1.611328125, -1.1640625, -0.716796875, -0.26953125, 0.177734375, 0.625, 1.072265625, 1.51953125, 1.966796875, 2.4140625, 2.861328125, 3.30859375, 3.755859375, 4.203125, 4.650390625, 5.09765625, 5.544921875, 5.9921875, 6.439453125, 6.88671875, 7.333984375, 7.78125, 8.228515625, 8.67578125, 9.123046875, 9.5703125, 10.017578125, 10.46484375, 10.912109375, 11.359375, 11.806640625, 12.25390625, 12.701171875, 13.1484375, 13.595703125, 14.04296875, 14.490234375, 14.9375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 5.0, 9.0, 9.0, 9.0, 9.0, 10.0, 19.0, 19.0, 24.0, 29.0, 37.0, 26.0, 40.0, 41.0, 50.0, 36.0, 50.0, 61.0, 47.0, 56.0, 49.0, 51.0, 49.0, 43.0, 37.0, 43.0, 21.0, 32.0, 15.0, 20.0, 11.0, 11.0, 7.0, 6.0, 10.0, 5.0, 2.0, 2.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.3125, -15.835205078125, -15.35791015625, -14.880615234375, -14.4033203125, -13.926025390625, -13.44873046875, -12.971435546875, -12.494140625, -12.016845703125, -11.53955078125, -11.062255859375, -10.5849609375, -10.107666015625, -9.63037109375, -9.153076171875, -8.67578125, -8.198486328125, -7.72119140625, -7.243896484375, -6.7666015625, -6.289306640625, -5.81201171875, -5.334716796875, -4.857421875, -4.380126953125, -3.90283203125, -3.425537109375, -2.9482421875, -2.470947265625, -1.99365234375, -1.516357421875, -1.0390625, -0.561767578125, -0.08447265625, 0.392822265625, 0.8701171875, 1.347412109375, 1.82470703125, 2.302001953125, 2.779296875, 3.256591796875, 3.73388671875, 4.211181640625, 4.6884765625, 5.165771484375, 5.64306640625, 6.120361328125, 6.59765625, 7.074951171875, 7.55224609375, 8.029541015625, 8.5068359375, 8.984130859375, 9.46142578125, 9.938720703125, 10.416015625, 10.893310546875, 11.37060546875, 11.847900390625, 12.3251953125, 12.802490234375, 13.27978515625, 13.757080078125, 14.234375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 8.0, 2.0, 5.0, 10.0, 17.0, 17.0, 20.0, 28.0, 49.0, 70.0, 111.0, 120.0, 200.0, 309.0, 519.0, 837.0, 1475.0, 2773.0, 5725.0, 12010.0, 27608.0, 64747.0, 148930.0, 282196.0, 265796.0, 132195.0, 56813.0, 24288.0, 10680.0, 4986.0, 2560.0, 1391.0, 753.0, 462.0, 280.0, 175.0, 116.0, 87.0, 63.0, 45.0, 23.0, 14.0, 21.0, 12.0, 6.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-23.796875, -23.095458984375, -22.39404296875, -21.692626953125, -20.9912109375, -20.289794921875, -19.58837890625, -18.886962890625, -18.185546875, -17.484130859375, -16.78271484375, -16.081298828125, -15.3798828125, -14.678466796875, -13.97705078125, -13.275634765625, -12.57421875, -11.872802734375, -11.17138671875, -10.469970703125, -9.7685546875, -9.067138671875, -8.36572265625, -7.664306640625, -6.962890625, -6.261474609375, -5.56005859375, -4.858642578125, -4.1572265625, -3.455810546875, -2.75439453125, -2.052978515625, -1.3515625, -0.650146484375, 0.05126953125, 0.752685546875, 1.4541015625, 2.155517578125, 2.85693359375, 3.558349609375, 4.259765625, 4.961181640625, 5.66259765625, 6.364013671875, 7.0654296875, 7.766845703125, 8.46826171875, 9.169677734375, 9.87109375, 10.572509765625, 11.27392578125, 11.975341796875, 12.6767578125, 13.378173828125, 14.07958984375, 14.781005859375, 15.482421875, 16.183837890625, 16.88525390625, 17.586669921875, 18.2880859375, 18.989501953125, 19.69091796875, 20.392333984375, 21.09375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 3.0, 7.0, 6.0, 9.0, 16.0, 11.0, 12.0, 22.0, 20.0, 32.0, 31.0, 33.0, 34.0, 32.0, 43.0, 39.0, 43.0, 54.0, 37.0, 40.0, 29.0, 46.0, 39.0, 34.0, 47.0, 33.0, 39.0, 32.0, 32.0, 19.0, 23.0, 15.0, 13.0, 15.0, 14.0, 12.0, 5.0, 8.0, 7.0, 4.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.59375, -7.348388671875, -7.10302734375, -6.857666015625, -6.6123046875, -6.366943359375, -6.12158203125, -5.876220703125, -5.630859375, -5.385498046875, -5.14013671875, -4.894775390625, -4.6494140625, -4.404052734375, -4.15869140625, -3.913330078125, -3.66796875, -3.422607421875, -3.17724609375, -2.931884765625, -2.6865234375, -2.441162109375, -2.19580078125, -1.950439453125, -1.705078125, -1.459716796875, -1.21435546875, -0.968994140625, -0.7236328125, -0.478271484375, -0.23291015625, 0.012451171875, 0.2578125, 0.503173828125, 0.74853515625, 0.993896484375, 1.2392578125, 1.484619140625, 1.72998046875, 1.975341796875, 2.220703125, 2.466064453125, 2.71142578125, 2.956787109375, 3.2021484375, 3.447509765625, 3.69287109375, 3.938232421875, 4.18359375, 4.428955078125, 4.67431640625, 4.919677734375, 5.1650390625, 5.410400390625, 5.65576171875, 5.901123046875, 6.146484375, 6.391845703125, 6.63720703125, 6.882568359375, 7.1279296875, 7.373291015625, 7.61865234375, 7.864013671875, 8.109375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 9.0, 8.0, 22.0, 25.0, 32.0, 63.0, 103.0, 143.0, 214.0, 279.0, 469.0, 742.0, 1140.0, 1861.0, 3040.0, 5050.0, 8580.0, 14966.0, 27423.0, 50385.0, 94088.0, 166886.0, 233633.0, 190601.0, 111753.0, 60696.0, 32906.0, 17959.0, 10080.0, 5884.0, 3526.0, 2117.0, 1414.0, 862.0, 534.0, 368.0, 234.0, 154.0, 114.0, 59.0, 44.0, 26.0, 27.0, 8.0, 20.0, 2.0, 4.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.59765625, -7.34136962890625, -7.0850830078125, -6.82879638671875, -6.572509765625, -6.31622314453125, -6.0599365234375, -5.80364990234375, -5.54736328125, -5.29107666015625, -5.0347900390625, -4.77850341796875, -4.522216796875, -4.26593017578125, -4.0096435546875, -3.75335693359375, -3.4970703125, -3.24078369140625, -2.9844970703125, -2.72821044921875, -2.471923828125, -2.21563720703125, -1.9593505859375, -1.70306396484375, -1.44677734375, -1.19049072265625, -0.9342041015625, -0.67791748046875, -0.421630859375, -0.16534423828125, 0.0909423828125, 0.34722900390625, 0.603515625, 0.85980224609375, 1.1160888671875, 1.37237548828125, 1.628662109375, 1.88494873046875, 2.1412353515625, 2.39752197265625, 2.65380859375, 2.91009521484375, 3.1663818359375, 3.42266845703125, 3.678955078125, 3.93524169921875, 4.1915283203125, 4.44781494140625, 4.7041015625, 4.96038818359375, 5.2166748046875, 5.47296142578125, 5.729248046875, 5.98553466796875, 6.2418212890625, 6.49810791015625, 6.75439453125, 7.01068115234375, 7.2669677734375, 7.52325439453125, 7.779541015625, 8.03582763671875, 8.2921142578125, 8.54840087890625, 8.8046875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 2.0, 9.0, 5.0, 8.0, 10.0, 12.0, 12.0, 23.0, 22.0, 31.0, 41.0, 49.0, 62.0, 80.0, 91.0, 85.0, 96.0, 74.0, 65.0, 48.0, 41.0, 34.0, 20.0, 24.0, 13.0, 10.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 3.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00048279762268066406, -0.00046736374497413635, -0.00045192986726760864, -0.00043649598956108093, -0.0004210621118545532, -0.0004056282341480255, -0.0003901943564414978, -0.0003747604787349701, -0.0003593266010284424, -0.00034389272332191467, -0.00032845884561538696, -0.00031302496790885925, -0.00029759109020233154, -0.00028215721249580383, -0.0002667233347892761, -0.0002512894570827484, -0.0002358555793762207, -0.000220421701669693, -0.00020498782396316528, -0.00018955394625663757, -0.00017412006855010986, -0.00015868619084358215, -0.00014325231313705444, -0.00012781843543052673, -0.00011238455772399902, -9.695068001747131e-05, -8.15168023109436e-05, -6.60829246044159e-05, -5.0649046897888184e-05, -3.5215169191360474e-05, -1.9781291484832764e-05, -4.347413778305054e-06, 1.1086463928222656e-05, 2.6520341634750366e-05, 4.1954219341278076e-05, 5.7388097047805786e-05, 7.28219747543335e-05, 8.82558524608612e-05, 0.00010368973016738892, 0.00011912360787391663, 0.00013455748558044434, 0.00014999136328697205, 0.00016542524099349976, 0.00018085911870002747, 0.00019629299640655518, 0.00021172687411308289, 0.0002271607518196106, 0.0002425946295261383, 0.000258028507232666, 0.0002734623849391937, 0.00028889626264572144, 0.00030433014035224915, 0.00031976401805877686, 0.00033519789576530457, 0.0003506317734718323, 0.00036606565117836, 0.0003814995288848877, 0.0003969334065914154, 0.0004123672842979431, 0.0004278011620044708, 0.00044323503971099854, 0.00045866891741752625, 0.00047410279512405396, 0.0004895366728305817, 0.0005049705505371094]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 6.0, 10.0, 17.0, 22.0, 26.0, 24.0, 52.0, 78.0, 101.0, 143.0, 212.0, 326.0, 494.0, 795.0, 1240.0, 1974.0, 3337.0, 5595.0, 8871.0, 15128.0, 25301.0, 42102.0, 68101.0, 104243.0, 144099.0, 165275.0, 152108.0, 113730.0, 76015.0, 47455.0, 28386.0, 17089.0, 10076.0, 6109.0, 3594.0, 2316.0, 1395.0, 898.0, 599.0, 391.0, 240.0, 189.0, 120.0, 87.0, 50.0, 37.0, 24.0, 24.0, 15.0, 16.0, 10.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-5.671875, -5.49249267578125, -5.3131103515625, -5.13372802734375, -4.954345703125, -4.77496337890625, -4.5955810546875, -4.41619873046875, -4.23681640625, -4.05743408203125, -3.8780517578125, -3.69866943359375, -3.519287109375, -3.33990478515625, -3.1605224609375, -2.98114013671875, -2.8017578125, -2.62237548828125, -2.4429931640625, -2.26361083984375, -2.084228515625, -1.90484619140625, -1.7254638671875, -1.54608154296875, -1.36669921875, -1.18731689453125, -1.0079345703125, -0.82855224609375, -0.649169921875, -0.46978759765625, -0.2904052734375, -0.11102294921875, 0.068359375, 0.24774169921875, 0.4271240234375, 0.60650634765625, 0.785888671875, 0.96527099609375, 1.1446533203125, 1.32403564453125, 1.50341796875, 1.68280029296875, 1.8621826171875, 2.04156494140625, 2.220947265625, 2.40032958984375, 2.5797119140625, 2.75909423828125, 2.9384765625, 3.11785888671875, 3.2972412109375, 3.47662353515625, 3.656005859375, 3.83538818359375, 4.0147705078125, 4.19415283203125, 4.37353515625, 4.55291748046875, 4.7322998046875, 4.91168212890625, 5.091064453125, 5.27044677734375, 5.4498291015625, 5.62921142578125, 5.80859375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 1.0, 4.0, 1.0, 5.0, 8.0, 5.0, 6.0, 14.0, 6.0, 11.0, 25.0, 21.0, 19.0, 22.0, 35.0, 44.0, 30.0, 40.0, 45.0, 45.0, 41.0, 47.0, 51.0, 37.0, 54.0, 48.0, 45.0, 40.0, 39.0, 34.0, 30.0, 25.0, 21.0, 11.0, 23.0, 13.0, 8.0, 7.0, 7.0, 6.0, 8.0, 7.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.6396484375, -1.592010498046875, -1.54437255859375, -1.496734619140625, -1.4490966796875, -1.401458740234375, -1.35382080078125, -1.306182861328125, -1.258544921875, -1.210906982421875, -1.16326904296875, -1.115631103515625, -1.0679931640625, -1.020355224609375, -0.97271728515625, -0.925079345703125, -0.87744140625, -0.829803466796875, -0.78216552734375, -0.734527587890625, -0.6868896484375, -0.639251708984375, -0.59161376953125, -0.543975830078125, -0.496337890625, -0.448699951171875, -0.40106201171875, -0.353424072265625, -0.3057861328125, -0.258148193359375, -0.21051025390625, -0.162872314453125, -0.115234375, -0.067596435546875, -0.01995849609375, 0.027679443359375, 0.0753173828125, 0.122955322265625, 0.17059326171875, 0.218231201171875, 0.265869140625, 0.313507080078125, 0.36114501953125, 0.408782958984375, 0.4564208984375, 0.504058837890625, 0.55169677734375, 0.599334716796875, 0.64697265625, 0.694610595703125, 0.74224853515625, 0.789886474609375, 0.8375244140625, 0.885162353515625, 0.93280029296875, 0.980438232421875, 1.028076171875, 1.075714111328125, 1.12335205078125, 1.170989990234375, 1.2186279296875, 1.266265869140625, 1.31390380859375, 1.361541748046875, 1.4091796875]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 0.0, 7.0, 3.0, 4.0, 7.0, 12.0, 9.0, 12.0, 19.0, 21.0, 32.0, 34.0, 35.0, 39.0, 44.0, 62.0, 54.0, 54.0, 58.0, 58.0, 59.0, 43.0, 38.0, 46.0, 48.0, 30.0, 39.0, 21.0, 24.0, 17.0, 11.0, 14.0, 9.0, 6.0, 10.0, 6.0, 3.0, 5.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-19.617773056030273, -18.964508056640625, -18.311241149902344, -17.657976150512695, -17.004711151123047, -16.351444244384766, -15.698179244995117, -15.044913291931152, -14.391647338867188, -13.738381385803223, -13.085115432739258, -12.43185043334961, -11.778584480285645, -11.12531852722168, -10.472053527832031, -9.818787574768066, -9.165521621704102, -8.512255668640137, -7.85899019241333, -7.205724716186523, -6.552458763122559, -5.899192810058594, -5.245927333831787, -4.5926618576049805, -3.9393959045410156, -3.28613018989563, -2.632864475250244, -1.9795987606048584, -1.3263330459594727, -0.6730673313140869, -0.019801616668701172, 0.6334638595581055, 1.2867317199707031, 1.9399974346160889, 2.5932631492614746, 3.2465288639068604, 3.899794578552246, 4.553060531616211, 5.206326007843018, 5.859591484069824, 6.512857437133789, 7.166123390197754, 7.8193888664245605, 8.472654342651367, 9.125920295715332, 9.779186248779297, 10.432451248168945, 11.08571720123291, 11.738983154296875, 12.39224910736084, 13.045515060424805, 13.698780059814453, 14.352046012878418, 15.005311965942383, 15.658576965332031, 16.311843872070312, 16.96510887145996, 17.61837387084961, 18.27164077758789, 18.92490577697754, 19.578170776367188, 20.23143768310547, 20.884702682495117, 21.537967681884766, 22.191234588623047]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 7.0, 5.0, 10.0, 6.0, 12.0, 10.0, 12.0, 19.0, 29.0, 24.0, 27.0, 37.0, 42.0, 34.0, 37.0, 39.0, 49.0, 49.0, 50.0, 54.0, 51.0, 46.0, 40.0, 43.0, 40.0, 45.0, 39.0, 31.0, 25.0, 18.0, 13.0, 22.0, 8.0, 5.0, 14.0, 0.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-14.852544784545898, -14.425804138183594, -13.999063491821289, -13.572322845458984, -13.145581245422363, -12.718840599060059, -12.292099952697754, -11.86535930633545, -11.438618659973145, -11.01187801361084, -10.585137367248535, -10.158395767211914, -9.73165512084961, -9.304914474487305, -8.878173828125, -8.451433181762695, -8.02469253540039, -7.597951889038086, -7.171210765838623, -6.744470119476318, -6.317729473114014, -5.890988349914551, -5.464247703552246, -5.037507057189941, -4.61076545715332, -4.184024810791016, -3.757283926010132, -3.330543041229248, -2.9038023948669434, -2.4770615100860596, -2.050320625305176, -1.623579978942871, -1.1968393325805664, -0.7700985670089722, -0.34335774183273315, 0.08338308334350586, 0.5101238489151001, 0.9368646144866943, 1.3636054992675781, 1.7903461456298828, 2.2170870304107666, 2.6438279151916504, 3.070568561553955, 3.497309446334839, 3.9240503311157227, 4.350790977478027, 4.777531623840332, 5.204272270202637, 5.6310133934021, 6.057754039764404, 6.484495162963867, 6.911235809326172, 7.337976455688477, 7.764717102050781, 8.191457748413086, 8.61819839477539, 9.044939994812012, 9.471680641174316, 9.898421287536621, 10.325162887573242, 10.751903533935547, 11.178644180297852, 11.605384826660156, 12.032125473022461, 12.458866119384766]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 11.0, 6.0, 14.0, 21.0, 22.0, 42.0, 38.0, 61.0, 113.0, 123.0, 156.0, 248.0, 399.0, 626.0, 946.0, 1732.0, 2895.0, 5159.0, 9289.0, 17290.0, 31734.0, 56799.0, 96975.0, 147487.0, 182704.0, 175094.0, 131211.0, 82357.0, 46890.0, 25607.0, 14271.0, 7652.0, 4170.0, 2471.0, 1436.0, 862.0, 561.0, 352.0, 219.0, 146.0, 116.0, 73.0, 44.0, 33.0, 33.0, 17.0, 16.0, 11.0, 7.0, 5.0, 7.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.703125, -16.178466796875, -15.65380859375, -15.129150390625, -14.6044921875, -14.079833984375, -13.55517578125, -13.030517578125, -12.505859375, -11.981201171875, -11.45654296875, -10.931884765625, -10.4072265625, -9.882568359375, -9.35791015625, -8.833251953125, -8.30859375, -7.783935546875, -7.25927734375, -6.734619140625, -6.2099609375, -5.685302734375, -5.16064453125, -4.635986328125, -4.111328125, -3.586669921875, -3.06201171875, -2.537353515625, -2.0126953125, -1.488037109375, -0.96337890625, -0.438720703125, 0.0859375, 0.610595703125, 1.13525390625, 1.659912109375, 2.1845703125, 2.709228515625, 3.23388671875, 3.758544921875, 4.283203125, 4.807861328125, 5.33251953125, 5.857177734375, 6.3818359375, 6.906494140625, 7.43115234375, 7.955810546875, 8.48046875, 9.005126953125, 9.52978515625, 10.054443359375, 10.5791015625, 11.103759765625, 11.62841796875, 12.153076171875, 12.677734375, 13.202392578125, 13.72705078125, 14.251708984375, 14.7763671875, 15.301025390625, 15.82568359375, 16.350341796875, 16.875]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 5.0, 8.0, 8.0, 12.0, 9.0, 7.0, 13.0, 23.0, 23.0, 33.0, 35.0, 46.0, 64.0, 46.0, 40.0, 49.0, 49.0, 63.0, 48.0, 52.0, 60.0, 59.0, 37.0, 32.0, 36.0, 32.0, 28.0, 17.0, 12.0, 9.0, 13.0, 13.0, 4.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.296875, -14.80712890625, -14.3173828125, -13.82763671875, -13.337890625, -12.84814453125, -12.3583984375, -11.86865234375, -11.37890625, -10.88916015625, -10.3994140625, -9.90966796875, -9.419921875, -8.93017578125, -8.4404296875, -7.95068359375, -7.4609375, -6.97119140625, -6.4814453125, -5.99169921875, -5.501953125, -5.01220703125, -4.5224609375, -4.03271484375, -3.54296875, -3.05322265625, -2.5634765625, -2.07373046875, -1.583984375, -1.09423828125, -0.6044921875, -0.11474609375, 0.375, 0.86474609375, 1.3544921875, 1.84423828125, 2.333984375, 2.82373046875, 3.3134765625, 3.80322265625, 4.29296875, 4.78271484375, 5.2724609375, 5.76220703125, 6.251953125, 6.74169921875, 7.2314453125, 7.72119140625, 8.2109375, 8.70068359375, 9.1904296875, 9.68017578125, 10.169921875, 10.65966796875, 11.1494140625, 11.63916015625, 12.12890625, 12.61865234375, 13.1083984375, 13.59814453125, 14.087890625, 14.57763671875, 15.0673828125, 15.55712890625, 16.046875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 10.0, 16.0, 19.0, 36.0, 44.0, 78.0, 108.0, 142.0, 250.0, 398.0, 697.0, 1073.0, 1875.0, 3167.0, 5568.0, 9994.0, 17554.0, 30909.0, 53229.0, 85670.0, 126711.0, 159577.0, 165628.0, 138669.0, 98334.0, 62301.0, 37481.0, 21139.0, 11958.0, 6654.0, 3865.0, 2167.0, 1278.0, 756.0, 475.0, 269.0, 148.0, 113.0, 72.0, 50.0, 33.0, 16.0, 10.0, 10.0, 6.0, 6.0, 2.0, 1.0, 0.0, 4.0], "bins": [-15.5859375, -15.1549072265625, -14.723876953125, -14.2928466796875, -13.86181640625, -13.4307861328125, -12.999755859375, -12.5687255859375, -12.1376953125, -11.7066650390625, -11.275634765625, -10.8446044921875, -10.41357421875, -9.9825439453125, -9.551513671875, -9.1204833984375, -8.689453125, -8.2584228515625, -7.827392578125, -7.3963623046875, -6.96533203125, -6.5343017578125, -6.103271484375, -5.6722412109375, -5.2412109375, -4.8101806640625, -4.379150390625, -3.9481201171875, -3.51708984375, -3.0860595703125, -2.655029296875, -2.2239990234375, -1.79296875, -1.3619384765625, -0.930908203125, -0.4998779296875, -0.06884765625, 0.3621826171875, 0.793212890625, 1.2242431640625, 1.6552734375, 2.0863037109375, 2.517333984375, 2.9483642578125, 3.37939453125, 3.8104248046875, 4.241455078125, 4.6724853515625, 5.103515625, 5.5345458984375, 5.965576171875, 6.3966064453125, 6.82763671875, 7.2586669921875, 7.689697265625, 8.1207275390625, 8.5517578125, 8.9827880859375, 9.413818359375, 9.8448486328125, 10.27587890625, 10.7069091796875, 11.137939453125, 11.5689697265625, 12.0]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 0.0, 4.0, 6.0, 3.0, 6.0, 5.0, 8.0, 10.0, 12.0, 12.0, 14.0, 25.0, 24.0, 21.0, 27.0, 27.0, 34.0, 30.0, 33.0, 48.0, 38.0, 43.0, 40.0, 32.0, 36.0, 41.0, 31.0, 33.0, 32.0, 34.0, 31.0, 25.0, 36.0, 26.0, 27.0, 27.0, 22.0, 18.0, 11.0, 11.0, 13.0, 7.0, 8.0, 4.0, 7.0, 6.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-6.875, -6.6630859375, -6.451171875, -6.2392578125, -6.02734375, -5.8154296875, -5.603515625, -5.3916015625, -5.1796875, -4.9677734375, -4.755859375, -4.5439453125, -4.33203125, -4.1201171875, -3.908203125, -3.6962890625, -3.484375, -3.2724609375, -3.060546875, -2.8486328125, -2.63671875, -2.4248046875, -2.212890625, -2.0009765625, -1.7890625, -1.5771484375, -1.365234375, -1.1533203125, -0.94140625, -0.7294921875, -0.517578125, -0.3056640625, -0.09375, 0.1181640625, 0.330078125, 0.5419921875, 0.75390625, 0.9658203125, 1.177734375, 1.3896484375, 1.6015625, 1.8134765625, 2.025390625, 2.2373046875, 2.44921875, 2.6611328125, 2.873046875, 3.0849609375, 3.296875, 3.5087890625, 3.720703125, 3.9326171875, 4.14453125, 4.3564453125, 4.568359375, 4.7802734375, 4.9921875, 5.2041015625, 5.416015625, 5.6279296875, 5.83984375, 6.0517578125, 6.263671875, 6.4755859375, 6.6875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 1.0, 7.0, 6.0, 13.0, 13.0, 21.0, 37.0, 37.0, 72.0, 66.0, 98.0, 164.0, 223.0, 333.0, 512.0, 780.0, 1298.0, 2012.0, 3446.0, 6031.0, 10538.0, 19480.0, 35885.0, 65926.0, 113589.0, 171128.0, 199419.0, 167229.0, 109885.0, 62614.0, 34367.0, 18497.0, 10352.0, 5750.0, 3323.0, 1885.0, 1225.0, 738.0, 488.0, 319.0, 237.0, 159.0, 92.0, 84.0, 57.0, 29.0, 28.0, 16.0, 15.0, 14.0, 7.0, 5.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0], "bins": [-9.046875, -8.7681884765625, -8.489501953125, -8.2108154296875, -7.93212890625, -7.6534423828125, -7.374755859375, -7.0960693359375, -6.8173828125, -6.5386962890625, -6.260009765625, -5.9813232421875, -5.70263671875, -5.4239501953125, -5.145263671875, -4.8665771484375, -4.587890625, -4.3092041015625, -4.030517578125, -3.7518310546875, -3.47314453125, -3.1944580078125, -2.915771484375, -2.6370849609375, -2.3583984375, -2.0797119140625, -1.801025390625, -1.5223388671875, -1.24365234375, -0.9649658203125, -0.686279296875, -0.4075927734375, -0.12890625, 0.1497802734375, 0.428466796875, 0.7071533203125, 0.98583984375, 1.2645263671875, 1.543212890625, 1.8218994140625, 2.1005859375, 2.3792724609375, 2.657958984375, 2.9366455078125, 3.21533203125, 3.4940185546875, 3.772705078125, 4.0513916015625, 4.330078125, 4.6087646484375, 4.887451171875, 5.1661376953125, 5.44482421875, 5.7235107421875, 6.002197265625, 6.2808837890625, 6.5595703125, 6.8382568359375, 7.116943359375, 7.3956298828125, 7.67431640625, 7.9530029296875, 8.231689453125, 8.5103759765625, 8.7890625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 2.0, 8.0, 9.0, 16.0, 8.0, 15.0, 18.0, 19.0, 25.0, 40.0, 32.0, 42.0, 63.0, 39.0, 48.0, 53.0, 60.0, 56.0, 67.0, 51.0, 46.0, 50.0, 36.0, 33.0, 26.0, 23.0, 27.0, 18.0, 20.0, 12.0, 9.0, 9.0, 8.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008192062377929688, -0.0007928088307380676, -0.0007664114236831665, -0.0007400140166282654, -0.0007136166095733643, -0.0006872192025184631, -0.000660821795463562, -0.0006344243884086609, -0.0006080269813537598, -0.0005816295742988586, -0.0005552321672439575, -0.0005288347601890564, -0.0005024373531341553, -0.00047603994607925415, -0.00044964253902435303, -0.0004232451319694519, -0.0003968477249145508, -0.00037045031785964966, -0.00034405291080474854, -0.0003176555037498474, -0.0002912580966949463, -0.00026486068964004517, -0.00023846328258514404, -0.00021206587553024292, -0.0001856684684753418, -0.00015927106142044067, -0.00013287365436553955, -0.00010647624731063843, -8.00788402557373e-05, -5.368143320083618e-05, -2.728402614593506e-05, -8.866190910339355e-07, 2.5510787963867188e-05, 5.190819501876831e-05, 7.830560207366943e-05, 0.00010470300912857056, 0.00013110041618347168, 0.0001574978232383728, 0.00018389523029327393, 0.00021029263734817505, 0.00023669004440307617, 0.0002630874514579773, 0.0002894848585128784, 0.00031588226556777954, 0.00034227967262268066, 0.0003686770796775818, 0.0003950744867324829, 0.00042147189378738403, 0.00044786930084228516, 0.0004742667078971863, 0.0005006641149520874, 0.0005270615220069885, 0.0005534589290618896, 0.0005798563361167908, 0.0006062537431716919, 0.000632651150226593, 0.0006590485572814941, 0.0006854459643363953, 0.0007118433713912964, 0.0007382407784461975, 0.0007646381855010986, 0.0007910355925559998, 0.0008174329996109009, 0.000843830406665802, 0.0008702278137207031]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 3.0, 5.0, 8.0, 15.0, 24.0, 32.0, 34.0, 59.0, 95.0, 159.0, 231.0, 386.0, 602.0, 971.0, 1608.0, 2722.0, 4543.0, 7668.0, 13634.0, 23915.0, 41913.0, 72201.0, 117297.0, 164632.0, 182693.0, 154980.0, 106081.0, 64356.0, 37463.0, 21145.0, 12076.0, 6894.0, 3939.0, 2354.0, 1471.0, 842.0, 538.0, 342.0, 219.0, 143.0, 96.0, 62.0, 30.0, 26.0, 18.0, 8.0, 8.0, 6.0, 6.0, 1.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.03125, -7.775390625, -7.51953125, -7.263671875, -7.0078125, -6.751953125, -6.49609375, -6.240234375, -5.984375, -5.728515625, -5.47265625, -5.216796875, -4.9609375, -4.705078125, -4.44921875, -4.193359375, -3.9375, -3.681640625, -3.42578125, -3.169921875, -2.9140625, -2.658203125, -2.40234375, -2.146484375, -1.890625, -1.634765625, -1.37890625, -1.123046875, -0.8671875, -0.611328125, -0.35546875, -0.099609375, 0.15625, 0.412109375, 0.66796875, 0.923828125, 1.1796875, 1.435546875, 1.69140625, 1.947265625, 2.203125, 2.458984375, 2.71484375, 2.970703125, 3.2265625, 3.482421875, 3.73828125, 3.994140625, 4.25, 4.505859375, 4.76171875, 5.017578125, 5.2734375, 5.529296875, 5.78515625, 6.041015625, 6.296875, 6.552734375, 6.80859375, 7.064453125, 7.3203125, 7.576171875, 7.83203125, 8.087890625, 8.34375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 9.0, 6.0, 15.0, 11.0, 14.0, 12.0, 17.0, 22.0, 27.0, 47.0, 35.0, 45.0, 53.0, 54.0, 55.0, 61.0, 75.0, 66.0, 49.0, 49.0, 40.0, 48.0, 29.0, 27.0, 25.0, 21.0, 13.0, 16.0, 12.0, 11.0, 3.0, 8.0, 2.0, 2.0, 3.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.55859375, -2.47100830078125, -2.3834228515625, -2.29583740234375, -2.208251953125, -2.12066650390625, -2.0330810546875, -1.94549560546875, -1.85791015625, -1.77032470703125, -1.6827392578125, -1.59515380859375, -1.507568359375, -1.41998291015625, -1.3323974609375, -1.24481201171875, -1.1572265625, -1.06964111328125, -0.9820556640625, -0.89447021484375, -0.806884765625, -0.71929931640625, -0.6317138671875, -0.54412841796875, -0.45654296875, -0.36895751953125, -0.2813720703125, -0.19378662109375, -0.106201171875, -0.01861572265625, 0.0689697265625, 0.15655517578125, 0.244140625, 0.33172607421875, 0.4193115234375, 0.50689697265625, 0.594482421875, 0.68206787109375, 0.7696533203125, 0.85723876953125, 0.94482421875, 1.03240966796875, 1.1199951171875, 1.20758056640625, 1.295166015625, 1.38275146484375, 1.4703369140625, 1.55792236328125, 1.6455078125, 1.73309326171875, 1.8206787109375, 1.90826416015625, 1.995849609375, 2.08343505859375, 2.1710205078125, 2.25860595703125, 2.34619140625, 2.43377685546875, 2.5213623046875, 2.60894775390625, 2.696533203125, 2.78411865234375, 2.8717041015625, 2.95928955078125, 3.046875]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 3.0, 7.0, 6.0, 9.0, 9.0, 12.0, 18.0, 18.0, 22.0, 41.0, 37.0, 37.0, 54.0, 51.0, 82.0, 52.0, 77.0, 56.0, 68.0, 58.0, 50.0, 38.0, 37.0, 30.0, 27.0, 17.0, 19.0, 17.0, 11.0, 6.0, 8.0, 2.0, 12.0, 4.0, 0.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.460142135620117, -18.730737686157227, -18.001331329345703, -17.271926879882812, -16.542522430419922, -15.813116073608398, -15.083711624145508, -14.3543062210083, -13.624900817871094, -12.895495414733887, -12.16609001159668, -11.436685562133789, -10.707280158996582, -9.977874755859375, -9.248470306396484, -8.519064903259277, -7.78965950012207, -7.060254096984863, -6.3308491706848145, -5.601444244384766, -4.872038841247559, -4.142633438110352, -3.4132285118103027, -2.683823585510254, -1.9544181823730469, -1.225013017654419, -0.495607852935791, 0.23379731178283691, 0.9632024765014648, 1.6926076412200928, 2.4220128059387207, 3.1514177322387695, 3.8808231353759766, 4.610228538513184, 5.339633464813232, 6.069038391113281, 6.798443794250488, 7.527849197387695, 8.257253646850586, 8.986659049987793, 9.716064453125, 10.445469856262207, 11.174875259399414, 11.904279708862305, 12.633685111999512, 13.363090515136719, 14.09249496459961, 14.821900367736816, 15.551305770874023, 16.280710220336914, 17.010116577148438, 17.739521026611328, 18.46892547607422, 19.198331832885742, 19.927736282348633, 20.657142639160156, 21.386547088623047, 22.115951538085938, 22.84535789489746, 23.57476234436035, 24.304168701171875, 25.033573150634766, 25.762977600097656, 26.492382049560547, 27.22178840637207]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 3.0, 4.0, 4.0, 8.0, 7.0, 13.0, 13.0, 11.0, 15.0, 8.0, 14.0, 26.0, 26.0, 24.0, 34.0, 44.0, 29.0, 25.0, 52.0, 43.0, 42.0, 51.0, 42.0, 49.0, 41.0, 39.0, 52.0, 37.0, 16.0, 30.0, 29.0, 27.0, 21.0, 24.0, 20.0, 13.0, 14.0, 14.0, 9.0, 7.0, 7.0, 12.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.368841171264648, -10.982305526733398, -10.595768928527832, -10.209233283996582, -9.822696685791016, -9.436161041259766, -9.049625396728516, -8.66308879852295, -8.2765531539917, -7.890017032623291, -7.503480911254883, -7.116945266723633, -6.730409145355225, -6.343873023986816, -5.957336902618408, -5.57080078125, -5.184264659881592, -4.797728538513184, -4.411192417144775, -4.024656295776367, -3.638120651245117, -3.251584529876709, -2.865048408508301, -2.4785125255584717, -2.0919764041900635, -1.7054404020309448, -1.3189043998718262, -0.932368278503418, -0.5458322763442993, -0.15929627418518066, 0.22723984718322754, 0.6137757301330566, 1.0003118515014648, 1.3868478536605835, 1.7733838558197021, 2.1599199771881104, 2.5464558601379395, 2.9329919815063477, 3.319528102874756, 3.706063985824585, 4.092599868774414, 4.479135990142822, 4.8656721115112305, 5.2522077560424805, 5.638743877410889, 6.025279998779297, 6.411816120147705, 6.798352241516113, 7.1848883628845215, 7.57142448425293, 7.957960605621338, 8.344496726989746, 8.731032371520996, 9.117568969726562, 9.504104614257812, 9.890640258789062, 10.277176856994629, 10.663712501525879, 11.050249099731445, 11.436784744262695, 11.823321342468262, 12.209856986999512, 12.596393585205078, 12.982929229736328, 13.369464874267578]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 10.0, 13.0, 16.0, 26.0, 32.0, 51.0, 75.0, 89.0, 146.0, 202.0, 338.0, 479.0, 703.0, 1128.0, 1687.0, 2632.0, 4415.0, 7187.0, 12117.0, 21513.0, 37874.0, 69756.0, 133270.0, 262834.0, 522323.0, 881499.0, 946883.0, 620571.0, 317167.0, 159035.0, 83116.0, 44393.0, 24837.0, 14659.0, 8566.0, 5215.0, 3308.0, 1999.0, 1354.0, 933.0, 597.0, 387.0, 242.0, 192.0, 118.0, 100.0, 55.0, 39.0, 32.0, 17.0, 16.0, 9.0, 12.0, 7.0, 5.0, 3.0, 2.0], "bins": [-16.84375, -16.3355712890625, -15.827392578125, -15.3192138671875, -14.81103515625, -14.3028564453125, -13.794677734375, -13.2864990234375, -12.7783203125, -12.2701416015625, -11.761962890625, -11.2537841796875, -10.74560546875, -10.2374267578125, -9.729248046875, -9.2210693359375, -8.712890625, -8.2047119140625, -7.696533203125, -7.1883544921875, -6.68017578125, -6.1719970703125, -5.663818359375, -5.1556396484375, -4.6474609375, -4.1392822265625, -3.631103515625, -3.1229248046875, -2.61474609375, -2.1065673828125, -1.598388671875, -1.0902099609375, -0.58203125, -0.0738525390625, 0.434326171875, 0.9425048828125, 1.45068359375, 1.9588623046875, 2.467041015625, 2.9752197265625, 3.4833984375, 3.9915771484375, 4.499755859375, 5.0079345703125, 5.51611328125, 6.0242919921875, 6.532470703125, 7.0406494140625, 7.548828125, 8.0570068359375, 8.565185546875, 9.0733642578125, 9.58154296875, 10.0897216796875, 10.597900390625, 11.1060791015625, 11.6142578125, 12.1224365234375, 12.630615234375, 13.1387939453125, 13.64697265625, 14.1551513671875, 14.663330078125, 15.1715087890625, 15.6796875]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 5.0, 5.0, 2.0, 5.0, 11.0, 13.0, 13.0, 10.0, 10.0, 17.0, 15.0, 28.0, 25.0, 32.0, 33.0, 29.0, 32.0, 38.0, 39.0, 41.0, 42.0, 44.0, 35.0, 61.0, 50.0, 46.0, 42.0, 40.0, 38.0, 39.0, 27.0, 23.0, 21.0, 17.0, 17.0, 12.0, 6.0, 12.0, 11.0, 4.0, 3.0, 1.0, 5.0, 10.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.1640625, -8.87841796875, -8.5927734375, -8.30712890625, -8.021484375, -7.73583984375, -7.4501953125, -7.16455078125, -6.87890625, -6.59326171875, -6.3076171875, -6.02197265625, -5.736328125, -5.45068359375, -5.1650390625, -4.87939453125, -4.59375, -4.30810546875, -4.0224609375, -3.73681640625, -3.451171875, -3.16552734375, -2.8798828125, -2.59423828125, -2.30859375, -2.02294921875, -1.7373046875, -1.45166015625, -1.166015625, -0.88037109375, -0.5947265625, -0.30908203125, -0.0234375, 0.26220703125, 0.5478515625, 0.83349609375, 1.119140625, 1.40478515625, 1.6904296875, 1.97607421875, 2.26171875, 2.54736328125, 2.8330078125, 3.11865234375, 3.404296875, 3.68994140625, 3.9755859375, 4.26123046875, 4.546875, 4.83251953125, 5.1181640625, 5.40380859375, 5.689453125, 5.97509765625, 6.2607421875, 6.54638671875, 6.83203125, 7.11767578125, 7.4033203125, 7.68896484375, 7.974609375, 8.26025390625, 8.5458984375, 8.83154296875, 9.1171875]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 15.0, 23.0, 45.0, 51.0, 77.0, 131.0, 160.0, 273.0, 401.0, 673.0, 1060.0, 1697.0, 2688.0, 4383.0, 7276.0, 12377.0, 21725.0, 38595.0, 69415.0, 128998.0, 237706.0, 434658.0, 720980.0, 896821.0, 696263.0, 413971.0, 226675.0, 121935.0, 66786.0, 37166.0, 20911.0, 12091.0, 6993.0, 4306.0, 2563.0, 1576.0, 1036.0, 623.0, 373.0, 269.0, 178.0, 112.0, 69.0, 45.0, 39.0, 22.0, 14.0, 9.0, 10.0, 8.0, 3.0, 1.0, 2.0], "bins": [-17.78125, -17.2652587890625, -16.749267578125, -16.2332763671875, -15.71728515625, -15.2012939453125, -14.685302734375, -14.1693115234375, -13.6533203125, -13.1373291015625, -12.621337890625, -12.1053466796875, -11.58935546875, -11.0733642578125, -10.557373046875, -10.0413818359375, -9.525390625, -9.0093994140625, -8.493408203125, -7.9774169921875, -7.46142578125, -6.9454345703125, -6.429443359375, -5.9134521484375, -5.3974609375, -4.8814697265625, -4.365478515625, -3.8494873046875, -3.33349609375, -2.8175048828125, -2.301513671875, -1.7855224609375, -1.26953125, -0.7535400390625, -0.237548828125, 0.2784423828125, 0.79443359375, 1.3104248046875, 1.826416015625, 2.3424072265625, 2.8583984375, 3.3743896484375, 3.890380859375, 4.4063720703125, 4.92236328125, 5.4383544921875, 5.954345703125, 6.4703369140625, 6.986328125, 7.5023193359375, 8.018310546875, 8.5343017578125, 9.05029296875, 9.5662841796875, 10.082275390625, 10.5982666015625, 11.1142578125, 11.6302490234375, 12.146240234375, 12.6622314453125, 13.17822265625, 13.6942138671875, 14.210205078125, 14.7261962890625, 15.2421875]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 8.0, 9.0, 16.0, 30.0, 26.0, 35.0, 43.0, 60.0, 88.0, 117.0, 147.0, 176.0, 215.0, 262.0, 278.0, 303.0, 321.0, 310.0, 280.0, 275.0, 222.0, 159.0, 165.0, 128.0, 109.0, 65.0, 61.0, 38.0, 33.0, 32.0, 20.0, 11.0, 5.0, 11.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.19140625, -4.99627685546875, -4.8011474609375, -4.60601806640625, -4.410888671875, -4.21575927734375, -4.0206298828125, -3.82550048828125, -3.63037109375, -3.43524169921875, -3.2401123046875, -3.04498291015625, -2.849853515625, -2.65472412109375, -2.4595947265625, -2.26446533203125, -2.0693359375, -1.87420654296875, -1.6790771484375, -1.48394775390625, -1.288818359375, -1.09368896484375, -0.8985595703125, -0.70343017578125, -0.50830078125, -0.31317138671875, -0.1180419921875, 0.07708740234375, 0.272216796875, 0.46734619140625, 0.6624755859375, 0.85760498046875, 1.052734375, 1.24786376953125, 1.4429931640625, 1.63812255859375, 1.833251953125, 2.02838134765625, 2.2235107421875, 2.41864013671875, 2.61376953125, 2.80889892578125, 3.0040283203125, 3.19915771484375, 3.394287109375, 3.58941650390625, 3.7845458984375, 3.97967529296875, 4.1748046875, 4.36993408203125, 4.5650634765625, 4.76019287109375, 4.955322265625, 5.15045166015625, 5.3455810546875, 5.54071044921875, 5.73583984375, 5.93096923828125, 6.1260986328125, 6.32122802734375, 6.516357421875, 6.71148681640625, 6.9066162109375, 7.10174560546875, 7.296875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 6.0, 3.0, 4.0, 9.0, 9.0, 19.0, 15.0, 22.0, 23.0, 20.0, 45.0, 34.0, 48.0, 43.0, 66.0, 74.0, 67.0, 69.0, 62.0, 60.0, 46.0, 51.0, 34.0, 19.0, 18.0, 28.0, 16.0, 18.0, 12.0, 9.0, 7.0, 10.0, 6.0, 2.0, 2.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.273786544799805, -18.626934051513672, -17.98008155822754, -17.333229064941406, -16.686378479003906, -16.039525985717773, -15.39267349243164, -14.745820999145508, -14.098968505859375, -13.452116012573242, -12.80526351928711, -12.158411979675293, -11.51155948638916, -10.864706993103027, -10.217855453491211, -9.571002960205078, -8.924150466918945, -8.277297973632812, -7.630445957183838, -6.983593940734863, -6.3367414474487305, -5.689888954162598, -5.043036937713623, -4.396184921264648, -3.7493324279785156, -3.102480173110962, -2.455627918243408, -1.8087756633758545, -1.1619234085083008, -0.5150711536407471, 0.13178110122680664, 0.7786331176757812, 1.425485610961914, 2.0723378658294678, 2.7191901206970215, 3.366042375564575, 4.012894630432129, 4.659747123718262, 5.306599140167236, 5.953451156616211, 6.600303649902344, 7.247156143188477, 7.894008159637451, 8.540860176086426, 9.187712669372559, 9.834565162658691, 10.481416702270508, 11.12826919555664, 11.775121688842773, 12.421974182128906, 13.068826675415039, 13.715678215026855, 14.362530708312988, 15.009383201599121, 15.656234741210938, 16.30308723449707, 16.949939727783203, 17.596792221069336, 18.24364471435547, 18.8904972076416, 19.537349700927734, 20.184200286865234, 20.831052780151367, 21.4779052734375, 22.124757766723633]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 9.0, 6.0, 18.0, 12.0, 18.0, 12.0, 24.0, 24.0, 29.0, 25.0, 32.0, 33.0, 40.0, 43.0, 43.0, 49.0, 45.0, 41.0, 63.0, 44.0, 39.0, 37.0, 38.0, 42.0, 25.0, 25.0, 31.0, 30.0, 22.0, 19.0, 18.0, 14.0, 9.0, 13.0, 8.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.629175186157227, -10.27098560333252, -9.912796020507812, -9.554606437683105, -9.196416854858398, -8.838227272033691, -8.480037689208984, -8.121848106384277, -7.76365852355957, -7.405468940734863, -7.047279357910156, -6.689089775085449, -6.330900192260742, -5.972710609436035, -5.614521026611328, -5.256331443786621, -4.898141860961914, -4.539952278137207, -4.1817626953125, -3.823573112487793, -3.465383529663086, -3.107193946838379, -2.749004364013672, -2.390814781188965, -2.032625198364258, -1.6744356155395508, -1.3162460327148438, -0.9580564498901367, -0.5998668670654297, -0.24167728424072266, 0.11651229858398438, 0.4747018814086914, 0.832890510559082, 1.191080093383789, 1.549269676208496, 1.9074592590332031, 2.26564884185791, 2.623838424682617, 2.982028007507324, 3.3402175903320312, 3.6984071731567383, 4.056596755981445, 4.414786338806152, 4.772975921630859, 5.131165504455566, 5.489355087280273, 5.8475446701049805, 6.2057342529296875, 6.5639238357543945, 6.922113418579102, 7.280303001403809, 7.638492584228516, 7.996682167053223, 8.35487174987793, 8.713061332702637, 9.071250915527344, 9.42944049835205, 9.787630081176758, 10.145819664001465, 10.504009246826172, 10.862198829650879, 11.220388412475586, 11.578577995300293, 11.936767578125, 12.294957160949707]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 5.0, 6.0, 6.0, 10.0, 10.0, 12.0, 21.0, 34.0, 51.0, 65.0, 85.0, 112.0, 186.0, 279.0, 393.0, 526.0, 833.0, 1343.0, 2006.0, 3336.0, 5647.0, 9537.0, 16024.0, 28479.0, 49858.0, 87495.0, 140043.0, 185596.0, 183389.0, 135696.0, 83814.0, 48099.0, 27109.0, 15159.0, 9010.0, 5357.0, 3180.0, 1947.0, 1261.0, 834.0, 589.0, 333.0, 219.0, 172.0, 125.0, 67.0, 58.0, 46.0, 24.0, 34.0, 12.0, 5.0, 11.0, 8.0, 4.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-11.265625, -10.9017333984375, -10.537841796875, -10.1739501953125, -9.81005859375, -9.4461669921875, -9.082275390625, -8.7183837890625, -8.3544921875, -7.9906005859375, -7.626708984375, -7.2628173828125, -6.89892578125, -6.5350341796875, -6.171142578125, -5.8072509765625, -5.443359375, -5.0794677734375, -4.715576171875, -4.3516845703125, -3.98779296875, -3.6239013671875, -3.260009765625, -2.8961181640625, -2.5322265625, -2.1683349609375, -1.804443359375, -1.4405517578125, -1.07666015625, -0.7127685546875, -0.348876953125, 0.0150146484375, 0.37890625, 0.7427978515625, 1.106689453125, 1.4705810546875, 1.83447265625, 2.1983642578125, 2.562255859375, 2.9261474609375, 3.2900390625, 3.6539306640625, 4.017822265625, 4.3817138671875, 4.74560546875, 5.1094970703125, 5.473388671875, 5.8372802734375, 6.201171875, 6.5650634765625, 6.928955078125, 7.2928466796875, 7.65673828125, 8.0206298828125, 8.384521484375, 8.7484130859375, 9.1123046875, 9.4761962890625, 9.840087890625, 10.2039794921875, 10.56787109375, 10.9317626953125, 11.295654296875, 11.6595458984375, 12.0234375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 9.0, 6.0, 11.0, 7.0, 17.0, 10.0, 17.0, 17.0, 25.0, 22.0, 34.0, 37.0, 32.0, 21.0, 41.0, 50.0, 58.0, 43.0, 43.0, 60.0, 45.0, 47.0, 49.0, 34.0, 30.0, 27.0, 26.0, 36.0, 30.0, 20.0, 20.0, 13.0, 15.0, 12.0, 13.0, 10.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.1796875, -11.789306640625, -11.39892578125, -11.008544921875, -10.6181640625, -10.227783203125, -9.83740234375, -9.447021484375, -9.056640625, -8.666259765625, -8.27587890625, -7.885498046875, -7.4951171875, -7.104736328125, -6.71435546875, -6.323974609375, -5.93359375, -5.543212890625, -5.15283203125, -4.762451171875, -4.3720703125, -3.981689453125, -3.59130859375, -3.200927734375, -2.810546875, -2.420166015625, -2.02978515625, -1.639404296875, -1.2490234375, -0.858642578125, -0.46826171875, -0.077880859375, 0.3125, 0.702880859375, 1.09326171875, 1.483642578125, 1.8740234375, 2.264404296875, 2.65478515625, 3.045166015625, 3.435546875, 3.825927734375, 4.21630859375, 4.606689453125, 4.9970703125, 5.387451171875, 5.77783203125, 6.168212890625, 6.55859375, 6.948974609375, 7.33935546875, 7.729736328125, 8.1201171875, 8.510498046875, 8.90087890625, 9.291259765625, 9.681640625, 10.072021484375, 10.46240234375, 10.852783203125, 11.2431640625, 11.633544921875, 12.02392578125, 12.414306640625, 12.8046875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 8.0, 7.0, 13.0, 28.0, 35.0, 56.0, 80.0, 158.0, 203.0, 324.0, 658.0, 1134.0, 2046.0, 3939.0, 8433.0, 19049.0, 45334.0, 110973.0, 245685.0, 310000.0, 172985.0, 72177.0, 29856.0, 12864.0, 5904.0, 2912.0, 1556.0, 849.0, 499.0, 282.0, 159.0, 114.0, 83.0, 54.0, 23.0, 24.0, 20.0, 9.0, 3.0, 9.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.4375, -15.8115234375, -15.185546875, -14.5595703125, -13.93359375, -13.3076171875, -12.681640625, -12.0556640625, -11.4296875, -10.8037109375, -10.177734375, -9.5517578125, -8.92578125, -8.2998046875, -7.673828125, -7.0478515625, -6.421875, -5.7958984375, -5.169921875, -4.5439453125, -3.91796875, -3.2919921875, -2.666015625, -2.0400390625, -1.4140625, -0.7880859375, -0.162109375, 0.4638671875, 1.08984375, 1.7158203125, 2.341796875, 2.9677734375, 3.59375, 4.2197265625, 4.845703125, 5.4716796875, 6.09765625, 6.7236328125, 7.349609375, 7.9755859375, 8.6015625, 9.2275390625, 9.853515625, 10.4794921875, 11.10546875, 11.7314453125, 12.357421875, 12.9833984375, 13.609375, 14.2353515625, 14.861328125, 15.4873046875, 16.11328125, 16.7392578125, 17.365234375, 17.9912109375, 18.6171875, 19.2431640625, 19.869140625, 20.4951171875, 21.12109375, 21.7470703125, 22.373046875, 22.9990234375, 23.625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 2.0, 3.0, 5.0, 6.0, 10.0, 18.0, 22.0, 20.0, 32.0, 29.0, 22.0, 39.0, 46.0, 41.0, 42.0, 47.0, 41.0, 44.0, 47.0, 46.0, 39.0, 41.0, 36.0, 40.0, 36.0, 41.0, 39.0, 27.0, 25.0, 28.0, 20.0, 17.0, 7.0, 9.0, 13.0, 11.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.03125, -6.7958984375, -6.560546875, -6.3251953125, -6.08984375, -5.8544921875, -5.619140625, -5.3837890625, -5.1484375, -4.9130859375, -4.677734375, -4.4423828125, -4.20703125, -3.9716796875, -3.736328125, -3.5009765625, -3.265625, -3.0302734375, -2.794921875, -2.5595703125, -2.32421875, -2.0888671875, -1.853515625, -1.6181640625, -1.3828125, -1.1474609375, -0.912109375, -0.6767578125, -0.44140625, -0.2060546875, 0.029296875, 0.2646484375, 0.5, 0.7353515625, 0.970703125, 1.2060546875, 1.44140625, 1.6767578125, 1.912109375, 2.1474609375, 2.3828125, 2.6181640625, 2.853515625, 3.0888671875, 3.32421875, 3.5595703125, 3.794921875, 4.0302734375, 4.265625, 4.5009765625, 4.736328125, 4.9716796875, 5.20703125, 5.4423828125, 5.677734375, 5.9130859375, 6.1484375, 6.3837890625, 6.619140625, 6.8544921875, 7.08984375, 7.3251953125, 7.560546875, 7.7958984375, 8.03125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 3.0, 4.0, 11.0, 16.0, 13.0, 21.0, 44.0, 42.0, 60.0, 107.0, 180.0, 249.0, 393.0, 737.0, 1275.0, 2319.0, 4479.0, 9404.0, 20295.0, 45979.0, 109466.0, 240736.0, 309134.0, 171005.0, 73401.0, 31187.0, 13983.0, 6570.0, 3225.0, 1701.0, 964.0, 586.0, 319.0, 248.0, 119.0, 99.0, 55.0, 34.0, 29.0, 18.0, 17.0, 7.0, 12.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.1015625, -8.8280029296875, -8.554443359375, -8.2808837890625, -8.00732421875, -7.7337646484375, -7.460205078125, -7.1866455078125, -6.9130859375, -6.6395263671875, -6.365966796875, -6.0924072265625, -5.81884765625, -5.5452880859375, -5.271728515625, -4.9981689453125, -4.724609375, -4.4510498046875, -4.177490234375, -3.9039306640625, -3.63037109375, -3.3568115234375, -3.083251953125, -2.8096923828125, -2.5361328125, -2.2625732421875, -1.989013671875, -1.7154541015625, -1.44189453125, -1.1683349609375, -0.894775390625, -0.6212158203125, -0.34765625, -0.0740966796875, 0.199462890625, 0.4730224609375, 0.74658203125, 1.0201416015625, 1.293701171875, 1.5672607421875, 1.8408203125, 2.1143798828125, 2.387939453125, 2.6614990234375, 2.93505859375, 3.2086181640625, 3.482177734375, 3.7557373046875, 4.029296875, 4.3028564453125, 4.576416015625, 4.8499755859375, 5.12353515625, 5.3970947265625, 5.670654296875, 5.9442138671875, 6.2177734375, 6.4913330078125, 6.764892578125, 7.0384521484375, 7.31201171875, 7.5855712890625, 7.859130859375, 8.1326904296875, 8.40625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 7.0, 7.0, 6.0, 6.0, 17.0, 14.0, 17.0, 15.0, 20.0, 24.0, 38.0, 51.0, 54.0, 58.0, 79.0, 68.0, 64.0, 56.0, 79.0, 52.0, 62.0, 34.0, 40.0, 22.0, 20.0, 19.0, 12.0, 9.0, 17.0, 6.0, 4.0, 3.0, 4.0, 1.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002980232238769531, -0.0002882517874240875, -0.0002784803509712219, -0.0002687089145183563, -0.0002589374780654907, -0.0002491660416126251, -0.00023939460515975952, -0.00022962316870689392, -0.00021985173225402832, -0.00021008029580116272, -0.00020030885934829712, -0.00019053742289543152, -0.00018076598644256592, -0.00017099454998970032, -0.00016122311353683472, -0.00015145167708396912, -0.00014168024063110352, -0.00013190880417823792, -0.00012213736772537231, -0.00011236593127250671, -0.00010259449481964111, -9.282305836677551e-05, -8.305162191390991e-05, -7.328018546104431e-05, -6.350874900817871e-05, -5.373731255531311e-05, -4.396587610244751e-05, -3.419443964958191e-05, -2.442300319671631e-05, -1.4651566743850708e-05, -4.880130290985107e-06, 4.891306161880493e-06, 1.4662742614746094e-05, 2.4434179067611694e-05, 3.4205615520477295e-05, 4.3977051973342896e-05, 5.3748488426208496e-05, 6.35199248790741e-05, 7.32913613319397e-05, 8.30627977848053e-05, 9.28342342376709e-05, 0.0001026056706905365, 0.0001123771071434021, 0.0001221485435962677, 0.0001319199800491333, 0.0001416914165019989, 0.0001514628529548645, 0.0001612342894077301, 0.0001710057258605957, 0.0001807771623134613, 0.0001905485987663269, 0.0002003200352191925, 0.0002100914716720581, 0.0002198629081249237, 0.0002296343445777893, 0.0002394057810306549, 0.0002491772174835205, 0.0002589486539363861, 0.0002687200903892517, 0.0002784915268421173, 0.0002882629632949829, 0.0002980343997478485, 0.0003078058362007141, 0.0003175772726535797, 0.0003273487091064453]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 6.0, 3.0, 11.0, 18.0, 13.0, 29.0, 34.0, 57.0, 91.0, 128.0, 191.0, 319.0, 387.0, 600.0, 947.0, 1563.0, 2632.0, 4654.0, 8422.0, 15615.0, 31224.0, 60140.0, 112702.0, 182010.0, 216921.0, 177022.0, 109268.0, 58458.0, 30101.0, 15393.0, 8206.0, 4475.0, 2617.0, 1478.0, 960.0, 634.0, 388.0, 273.0, 187.0, 121.0, 81.0, 60.0, 44.0, 20.0, 19.0, 16.0, 4.0, 6.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.9296875, -5.735107421875, -5.54052734375, -5.345947265625, -5.1513671875, -4.956787109375, -4.76220703125, -4.567626953125, -4.373046875, -4.178466796875, -3.98388671875, -3.789306640625, -3.5947265625, -3.400146484375, -3.20556640625, -3.010986328125, -2.81640625, -2.621826171875, -2.42724609375, -2.232666015625, -2.0380859375, -1.843505859375, -1.64892578125, -1.454345703125, -1.259765625, -1.065185546875, -0.87060546875, -0.676025390625, -0.4814453125, -0.286865234375, -0.09228515625, 0.102294921875, 0.296875, 0.491455078125, 0.68603515625, 0.880615234375, 1.0751953125, 1.269775390625, 1.46435546875, 1.658935546875, 1.853515625, 2.048095703125, 2.24267578125, 2.437255859375, 2.6318359375, 2.826416015625, 3.02099609375, 3.215576171875, 3.41015625, 3.604736328125, 3.79931640625, 3.993896484375, 4.1884765625, 4.383056640625, 4.57763671875, 4.772216796875, 4.966796875, 5.161376953125, 5.35595703125, 5.550537109375, 5.7451171875, 5.939697265625, 6.13427734375, 6.328857421875, 6.5234375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 0.0, 2.0, 7.0, 2.0, 7.0, 3.0, 9.0, 15.0, 19.0, 16.0, 28.0, 32.0, 29.0, 32.0, 35.0, 45.0, 58.0, 53.0, 55.0, 54.0, 65.0, 57.0, 57.0, 59.0, 51.0, 51.0, 28.0, 30.0, 22.0, 19.0, 9.0, 7.0, 12.0, 9.0, 1.0, 9.0, 8.0, 3.0, 2.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.736328125, -1.67657470703125, -1.6168212890625, -1.55706787109375, -1.497314453125, -1.43756103515625, -1.3778076171875, -1.31805419921875, -1.25830078125, -1.19854736328125, -1.1387939453125, -1.07904052734375, -1.019287109375, -0.95953369140625, -0.8997802734375, -0.84002685546875, -0.7802734375, -0.72052001953125, -0.6607666015625, -0.60101318359375, -0.541259765625, -0.48150634765625, -0.4217529296875, -0.36199951171875, -0.30224609375, -0.24249267578125, -0.1827392578125, -0.12298583984375, -0.063232421875, -0.00347900390625, 0.0562744140625, 0.11602783203125, 0.17578125, 0.23553466796875, 0.2952880859375, 0.35504150390625, 0.414794921875, 0.47454833984375, 0.5343017578125, 0.59405517578125, 0.65380859375, 0.71356201171875, 0.7733154296875, 0.83306884765625, 0.892822265625, 0.95257568359375, 1.0123291015625, 1.07208251953125, 1.1318359375, 1.19158935546875, 1.2513427734375, 1.31109619140625, 1.370849609375, 1.43060302734375, 1.4903564453125, 1.55010986328125, 1.60986328125, 1.66961669921875, 1.7293701171875, 1.78912353515625, 1.848876953125, 1.90863037109375, 1.9683837890625, 2.02813720703125, 2.087890625]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 7.0, 4.0, 7.0, 3.0, 4.0, 11.0, 15.0, 11.0, 17.0, 22.0, 19.0, 43.0, 32.0, 35.0, 52.0, 63.0, 63.0, 72.0, 69.0, 71.0, 61.0, 57.0, 46.0, 50.0, 22.0, 18.0, 27.0, 23.0, 17.0, 8.0, 10.0, 11.0, 9.0, 6.0, 0.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.129344940185547, -19.466495513916016, -18.803647994995117, -18.140798568725586, -17.477951049804688, -16.815101623535156, -16.152254104614258, -15.489404678344727, -14.826556205749512, -14.163707733154297, -13.500859260559082, -12.838010787963867, -12.175161361694336, -11.512313842773438, -10.849464416503906, -10.186615943908691, -9.523767471313477, -8.860918998718262, -8.198070526123047, -7.535221576690674, -6.872373104095459, -6.209524631500244, -5.546675682067871, -4.883827209472656, -4.220978736877441, -3.5581302642822266, -2.8952815532684326, -2.2324328422546387, -1.5695843696594238, -0.906735897064209, -0.24388718605041504, 0.4189615249633789, 1.081808090209961, 1.7446566820144653, 2.4075052738189697, 3.0703539848327637, 3.7332024574279785, 4.396050930023193, 5.058899879455566, 5.721748352050781, 6.384596824645996, 7.047445297241211, 7.710293769836426, 8.37314224243164, 9.035991668701172, 9.69883918762207, 10.361688613891602, 11.024537086486816, 11.687385559082031, 12.350234031677246, 13.013082504272461, 13.675930976867676, 14.33877944946289, 15.001628875732422, 15.664477348327637, 16.32732582092285, 16.99017333984375, 17.65302276611328, 18.31587028503418, 18.97871971130371, 19.64156723022461, 20.30441665649414, 20.96726417541504, 21.63011360168457, 22.2929630279541]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 3.0, 6.0, 13.0, 14.0, 10.0, 15.0, 18.0, 25.0, 23.0, 25.0, 25.0, 26.0, 34.0, 38.0, 38.0, 34.0, 48.0, 40.0, 48.0, 48.0, 41.0, 37.0, 44.0, 37.0, 32.0, 38.0, 29.0, 25.0, 19.0, 33.0, 20.0, 25.0, 14.0, 14.0, 17.0, 8.0, 9.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.874702453613281, -9.548356056213379, -9.22200870513916, -8.895662307739258, -8.569314956665039, -8.242968559265137, -7.916621208190918, -7.590274810791016, -7.263927459716797, -6.937580585479736, -6.611233711242676, -6.284886837005615, -5.958539962768555, -5.632193088531494, -5.305846214294434, -4.979499816894531, -4.653152942657471, -4.32680606842041, -4.00045919418335, -3.674112319946289, -3.3477654457092285, -3.021418571472168, -2.6950719356536865, -2.368725061416626, -2.0423781871795654, -1.7160313129425049, -1.3896844387054443, -1.0633376836776733, -0.7369908094406128, -0.41064393520355225, -0.08429718017578125, 0.2420496940612793, 0.5683965682983398, 0.8947434425354004, 1.221090316772461, 1.547437071800232, 1.8737839460372925, 2.2001309394836426, 2.526477575302124, 2.8528244495391846, 3.179171323776245, 3.5055181980133057, 3.831865072250366, 4.158211708068848, 4.484558582305908, 4.810905456542969, 5.137252330780029, 5.46359920501709, 5.78994607925415, 6.116292953491211, 6.4426398277282715, 6.768986701965332, 7.095333576202393, 7.421680450439453, 7.7480268478393555, 8.074374198913574, 8.400720596313477, 8.727066993713379, 9.053414344787598, 9.3797607421875, 9.706108093261719, 10.032454490661621, 10.35880184173584, 10.685148239135742, 11.011495590209961]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 7.0, 16.0, 26.0, 30.0, 55.0, 87.0, 135.0, 208.0, 371.0, 628.0, 1163.0, 2228.0, 4489.0, 8944.0, 18498.0, 37723.0, 73628.0, 129921.0, 191645.0, 208267.0, 163324.0, 100287.0, 53934.0, 26745.0, 13099.0, 6321.0, 3101.0, 1570.0, 860.0, 517.0, 272.0, 150.0, 107.0, 63.0, 43.0, 27.0, 22.0, 13.0, 5.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.40625, -15.88134765625, -15.3564453125, -14.83154296875, -14.306640625, -13.78173828125, -13.2568359375, -12.73193359375, -12.20703125, -11.68212890625, -11.1572265625, -10.63232421875, -10.107421875, -9.58251953125, -9.0576171875, -8.53271484375, -8.0078125, -7.48291015625, -6.9580078125, -6.43310546875, -5.908203125, -5.38330078125, -4.8583984375, -4.33349609375, -3.80859375, -3.28369140625, -2.7587890625, -2.23388671875, -1.708984375, -1.18408203125, -0.6591796875, -0.13427734375, 0.390625, 0.91552734375, 1.4404296875, 1.96533203125, 2.490234375, 3.01513671875, 3.5400390625, 4.06494140625, 4.58984375, 5.11474609375, 5.6396484375, 6.16455078125, 6.689453125, 7.21435546875, 7.7392578125, 8.26416015625, 8.7890625, 9.31396484375, 9.8388671875, 10.36376953125, 10.888671875, 11.41357421875, 11.9384765625, 12.46337890625, 12.98828125, 13.51318359375, 14.0380859375, 14.56298828125, 15.087890625, 15.61279296875, 16.1376953125, 16.66259765625, 17.1875]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 5.0, 6.0, 5.0, 4.0, 8.0, 7.0, 10.0, 12.0, 16.0, 21.0, 19.0, 27.0, 29.0, 22.0, 19.0, 27.0, 33.0, 28.0, 39.0, 43.0, 42.0, 45.0, 50.0, 33.0, 34.0, 36.0, 40.0, 39.0, 27.0, 31.0, 28.0, 26.0, 27.0, 25.0, 24.0, 25.0, 18.0, 8.0, 19.0, 12.0, 7.0, 7.0, 4.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.953125, -9.6209716796875, -9.288818359375, -8.9566650390625, -8.62451171875, -8.2923583984375, -7.960205078125, -7.6280517578125, -7.2958984375, -6.9637451171875, -6.631591796875, -6.2994384765625, -5.96728515625, -5.6351318359375, -5.302978515625, -4.9708251953125, -4.638671875, -4.3065185546875, -3.974365234375, -3.6422119140625, -3.31005859375, -2.9779052734375, -2.645751953125, -2.3135986328125, -1.9814453125, -1.6492919921875, -1.317138671875, -0.9849853515625, -0.65283203125, -0.3206787109375, 0.011474609375, 0.3436279296875, 0.67578125, 1.0079345703125, 1.340087890625, 1.6722412109375, 2.00439453125, 2.3365478515625, 2.668701171875, 3.0008544921875, 3.3330078125, 3.6651611328125, 3.997314453125, 4.3294677734375, 4.66162109375, 4.9937744140625, 5.325927734375, 5.6580810546875, 5.990234375, 6.3223876953125, 6.654541015625, 6.9866943359375, 7.31884765625, 7.6510009765625, 7.983154296875, 8.3153076171875, 8.6474609375, 8.9796142578125, 9.311767578125, 9.6439208984375, 9.97607421875, 10.3082275390625, 10.640380859375, 10.9725341796875, 11.3046875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 11.0, 13.0, 26.0, 38.0, 48.0, 57.0, 69.0, 119.0, 165.0, 246.0, 446.0, 746.0, 1339.0, 2816.0, 6710.0, 17135.0, 44537.0, 109220.0, 216825.0, 278653.0, 203763.0, 98627.0, 39959.0, 15401.0, 5980.0, 2592.0, 1230.0, 678.0, 410.0, 239.0, 145.0, 105.0, 64.0, 41.0, 24.0, 17.0, 21.0, 14.0, 9.0, 4.0, 1.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.09375, -18.42236328125, -17.7509765625, -17.07958984375, -16.408203125, -15.73681640625, -15.0654296875, -14.39404296875, -13.72265625, -13.05126953125, -12.3798828125, -11.70849609375, -11.037109375, -10.36572265625, -9.6943359375, -9.02294921875, -8.3515625, -7.68017578125, -7.0087890625, -6.33740234375, -5.666015625, -4.99462890625, -4.3232421875, -3.65185546875, -2.98046875, -2.30908203125, -1.6376953125, -0.96630859375, -0.294921875, 0.37646484375, 1.0478515625, 1.71923828125, 2.390625, 3.06201171875, 3.7333984375, 4.40478515625, 5.076171875, 5.74755859375, 6.4189453125, 7.09033203125, 7.76171875, 8.43310546875, 9.1044921875, 9.77587890625, 10.447265625, 11.11865234375, 11.7900390625, 12.46142578125, 13.1328125, 13.80419921875, 14.4755859375, 15.14697265625, 15.818359375, 16.48974609375, 17.1611328125, 17.83251953125, 18.50390625, 19.17529296875, 19.8466796875, 20.51806640625, 21.189453125, 21.86083984375, 22.5322265625, 23.20361328125, 23.875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 4.0, 11.0, 6.0, 11.0, 9.0, 10.0, 29.0, 7.0, 14.0, 17.0, 29.0, 18.0, 28.0, 28.0, 32.0, 31.0, 34.0, 38.0, 31.0, 35.0, 31.0, 38.0, 40.0, 31.0, 41.0, 20.0, 29.0, 37.0, 31.0, 29.0, 23.0, 18.0, 33.0, 24.0, 26.0, 13.0, 19.0, 18.0, 17.0, 12.0, 4.0, 17.0, 3.0, 2.0, 5.0, 5.0, 7.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.84765625, -5.6590576171875, -5.470458984375, -5.2818603515625, -5.09326171875, -4.9046630859375, -4.716064453125, -4.5274658203125, -4.3388671875, -4.1502685546875, -3.961669921875, -3.7730712890625, -3.58447265625, -3.3958740234375, -3.207275390625, -3.0186767578125, -2.830078125, -2.6414794921875, -2.452880859375, -2.2642822265625, -2.07568359375, -1.8870849609375, -1.698486328125, -1.5098876953125, -1.3212890625, -1.1326904296875, -0.944091796875, -0.7554931640625, -0.56689453125, -0.3782958984375, -0.189697265625, -0.0010986328125, 0.1875, 0.3760986328125, 0.564697265625, 0.7532958984375, 0.94189453125, 1.1304931640625, 1.319091796875, 1.5076904296875, 1.6962890625, 1.8848876953125, 2.073486328125, 2.2620849609375, 2.45068359375, 2.6392822265625, 2.827880859375, 3.0164794921875, 3.205078125, 3.3936767578125, 3.582275390625, 3.7708740234375, 3.95947265625, 4.1480712890625, 4.336669921875, 4.5252685546875, 4.7138671875, 4.9024658203125, 5.091064453125, 5.2796630859375, 5.46826171875, 5.6568603515625, 5.845458984375, 6.0340576171875, 6.22265625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 9.0, 8.0, 11.0, 20.0, 34.0, 34.0, 72.0, 105.0, 162.0, 234.0, 380.0, 559.0, 812.0, 1227.0, 1916.0, 3071.0, 4616.0, 7441.0, 11793.0, 19078.0, 30929.0, 50086.0, 78853.0, 117520.0, 151793.0, 161875.0, 137070.0, 98691.0, 63892.0, 39782.0, 24915.0, 15192.0, 9467.0, 5995.0, 3804.0, 2477.0, 1651.0, 1011.0, 647.0, 462.0, 297.0, 198.0, 129.0, 82.0, 45.0, 37.0, 31.0, 16.0, 6.0, 7.0, 10.0, 1.0, 4.0, 4.0], "bins": [-6.22265625, -6.04620361328125, -5.8697509765625, -5.69329833984375, -5.516845703125, -5.34039306640625, -5.1639404296875, -4.98748779296875, -4.81103515625, -4.63458251953125, -4.4581298828125, -4.28167724609375, -4.105224609375, -3.92877197265625, -3.7523193359375, -3.57586669921875, -3.3994140625, -3.22296142578125, -3.0465087890625, -2.87005615234375, -2.693603515625, -2.51715087890625, -2.3406982421875, -2.16424560546875, -1.98779296875, -1.81134033203125, -1.6348876953125, -1.45843505859375, -1.281982421875, -1.10552978515625, -0.9290771484375, -0.75262451171875, -0.576171875, -0.39971923828125, -0.2232666015625, -0.04681396484375, 0.129638671875, 0.30609130859375, 0.4825439453125, 0.65899658203125, 0.83544921875, 1.01190185546875, 1.1883544921875, 1.36480712890625, 1.541259765625, 1.71771240234375, 1.8941650390625, 2.07061767578125, 2.2470703125, 2.42352294921875, 2.5999755859375, 2.77642822265625, 2.952880859375, 3.12933349609375, 3.3057861328125, 3.48223876953125, 3.65869140625, 3.83514404296875, 4.0115966796875, 4.18804931640625, 4.364501953125, 4.54095458984375, 4.7174072265625, 4.89385986328125, 5.0703125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 2.0, 6.0, 4.0, 8.0, 12.0, 15.0, 24.0, 21.0, 32.0, 53.0, 48.0, 62.0, 77.0, 78.0, 91.0, 81.0, 89.0, 65.0, 45.0, 41.0, 29.0, 30.0, 24.0, 11.0, 11.0, 11.0, 7.0, 6.0, 6.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006399154663085938, -0.0006174445152282715, -0.0005949735641479492, -0.000572502613067627, -0.0005500316619873047, -0.0005275607109069824, -0.0005050897598266602, -0.0004826188087463379, -0.0004601478576660156, -0.00043767690658569336, -0.0004152059555053711, -0.00039273500442504883, -0.00037026405334472656, -0.0003477931022644043, -0.00032532215118408203, -0.00030285120010375977, -0.0002803802490234375, -0.00025790929794311523, -0.00023543834686279297, -0.0002129673957824707, -0.00019049644470214844, -0.00016802549362182617, -0.0001455545425415039, -0.00012308359146118164, -0.00010061264038085938, -7.814168930053711e-05, -5.5670738220214844e-05, -3.319978713989258e-05, -1.0728836059570312e-05, 1.1742115020751953e-05, 3.421306610107422e-05, 5.6684017181396484e-05, 7.915496826171875e-05, 0.00010162591934204102, 0.00012409687042236328, 0.00014656782150268555, 0.0001690387725830078, 0.00019150972366333008, 0.00021398067474365234, 0.0002364516258239746, 0.0002589225769042969, 0.00028139352798461914, 0.0003038644790649414, 0.00032633543014526367, 0.00034880638122558594, 0.0003712773323059082, 0.00039374828338623047, 0.00041621923446655273, 0.000438690185546875, 0.00046116113662719727, 0.00048363208770751953, 0.0005061030387878418, 0.0005285739898681641, 0.0005510449409484863, 0.0005735158920288086, 0.0005959868431091309, 0.0006184577941894531, 0.0006409287452697754, 0.0006633996963500977, 0.0006858706474304199, 0.0007083415985107422, 0.0007308125495910645, 0.0007532835006713867, 0.000775754451751709, 0.0007982254028320312]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 9.0, 8.0, 5.0, 9.0, 15.0, 14.0, 23.0, 43.0, 40.0, 72.0, 103.0, 144.0, 214.0, 329.0, 519.0, 773.0, 1227.0, 1827.0, 2921.0, 4758.0, 7813.0, 12918.0, 21635.0, 36179.0, 59153.0, 92919.0, 134716.0, 163554.0, 159542.0, 125429.0, 85667.0, 53640.0, 32240.0, 19526.0, 11549.0, 7157.0, 4279.0, 2658.0, 1743.0, 1075.0, 728.0, 434.0, 325.0, 183.0, 144.0, 106.0, 57.0, 46.0, 40.0, 23.0, 11.0, 9.0, 3.0, 5.0, 5.0, 3.0, 0.0, 3.0, 1.0], "bins": [-5.80859375, -5.63201904296875, -5.4554443359375, -5.27886962890625, -5.102294921875, -4.92572021484375, -4.7491455078125, -4.57257080078125, -4.39599609375, -4.21942138671875, -4.0428466796875, -3.86627197265625, -3.689697265625, -3.51312255859375, -3.3365478515625, -3.15997314453125, -2.9833984375, -2.80682373046875, -2.6302490234375, -2.45367431640625, -2.277099609375, -2.10052490234375, -1.9239501953125, -1.74737548828125, -1.57080078125, -1.39422607421875, -1.2176513671875, -1.04107666015625, -0.864501953125, -0.68792724609375, -0.5113525390625, -0.33477783203125, -0.158203125, 0.01837158203125, 0.1949462890625, 0.37152099609375, 0.548095703125, 0.72467041015625, 0.9012451171875, 1.07781982421875, 1.25439453125, 1.43096923828125, 1.6075439453125, 1.78411865234375, 1.960693359375, 2.13726806640625, 2.3138427734375, 2.49041748046875, 2.6669921875, 2.84356689453125, 3.0201416015625, 3.19671630859375, 3.373291015625, 3.54986572265625, 3.7264404296875, 3.90301513671875, 4.07958984375, 4.25616455078125, 4.4327392578125, 4.60931396484375, 4.785888671875, 4.96246337890625, 5.1390380859375, 5.31561279296875, 5.4921875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 7.0, 18.0, 13.0, 11.0, 21.0, 23.0, 21.0, 23.0, 30.0, 49.0, 46.0, 46.0, 50.0, 69.0, 53.0, 56.0, 54.0, 35.0, 70.0, 45.0, 41.0, 29.0, 35.0, 14.0, 27.0, 21.0, 18.0, 21.0, 10.0, 10.0, 4.0, 9.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.876953125, -1.81781005859375, -1.7586669921875, -1.69952392578125, -1.640380859375, -1.58123779296875, -1.5220947265625, -1.46295166015625, -1.40380859375, -1.34466552734375, -1.2855224609375, -1.22637939453125, -1.167236328125, -1.10809326171875, -1.0489501953125, -0.98980712890625, -0.9306640625, -0.87152099609375, -0.8123779296875, -0.75323486328125, -0.694091796875, -0.63494873046875, -0.5758056640625, -0.51666259765625, -0.45751953125, -0.39837646484375, -0.3392333984375, -0.28009033203125, -0.220947265625, -0.16180419921875, -0.1026611328125, -0.04351806640625, 0.015625, 0.07476806640625, 0.1339111328125, 0.19305419921875, 0.252197265625, 0.31134033203125, 0.3704833984375, 0.42962646484375, 0.48876953125, 0.54791259765625, 0.6070556640625, 0.66619873046875, 0.725341796875, 0.78448486328125, 0.8436279296875, 0.90277099609375, 0.9619140625, 1.02105712890625, 1.0802001953125, 1.13934326171875, 1.198486328125, 1.25762939453125, 1.3167724609375, 1.37591552734375, 1.43505859375, 1.49420166015625, 1.5533447265625, 1.61248779296875, 1.671630859375, 1.73077392578125, 1.7899169921875, 1.84906005859375, 1.908203125]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 6.0, 3.0, 2.0, 7.0, 9.0, 10.0, 19.0, 18.0, 26.0, 30.0, 41.0, 50.0, 50.0, 61.0, 75.0, 57.0, 72.0, 81.0, 71.0, 59.0, 55.0, 46.0, 25.0, 18.0, 21.0, 15.0, 17.0, 12.0, 10.0, 9.0, 8.0, 3.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.58266830444336, -21.86414337158203, -21.145618438720703, -20.427093505859375, -19.708568572998047, -18.99004364013672, -18.27151870727539, -17.552993774414062, -16.834468841552734, -16.115943908691406, -15.397418975830078, -14.67889404296875, -13.960369110107422, -13.241844177246094, -12.523320198059082, -11.804795265197754, -11.086271286010742, -10.367746353149414, -9.649221420288086, -8.930696487426758, -8.21217155456543, -7.49364709854126, -6.77512264251709, -6.056597709655762, -5.338072776794434, -4.6195478439331055, -3.9010231494903564, -3.1824984550476074, -2.4639735221862793, -1.7454485893249512, -1.0269241333007812, -0.3083992004394531, 0.410125732421875, 1.1286505460739136, 1.8471753597259521, 2.565700054168701, 3.2842249870300293, 4.002749919891357, 4.721274375915527, 5.4397993087768555, 6.158324241638184, 6.876849174499512, 7.59537410736084, 8.313898086547852, 9.03242301940918, 9.750947952270508, 10.469472885131836, 11.187997817993164, 11.906522750854492, 12.62504768371582, 13.343572616577148, 14.062097549438477, 14.780622482299805, 15.499147415161133, 16.217670440673828, 16.936195373535156, 17.654720306396484, 18.373245239257812, 19.09177017211914, 19.81029510498047, 20.528820037841797, 21.247344970703125, 21.965869903564453, 22.68439483642578, 23.40291976928711]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 11.0, 7.0, 7.0, 4.0, 9.0, 11.0, 15.0, 18.0, 24.0, 23.0, 18.0, 26.0, 32.0, 29.0, 44.0, 46.0, 47.0, 37.0, 27.0, 45.0, 37.0, 38.0, 45.0, 45.0, 39.0, 28.0, 44.0, 27.0, 25.0, 23.0, 20.0, 18.0, 21.0, 21.0, 19.0, 13.0, 9.0, 11.0, 12.0, 4.0, 2.0, 4.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.802571296691895, -8.481050491333008, -8.159530639648438, -7.838009834289551, -7.516489505767822, -7.194969177246094, -6.873448371887207, -6.5519280433654785, -6.23040771484375, -5.9088873863220215, -5.587367057800293, -5.265846252441406, -4.944325923919678, -4.622805595397949, -4.3012847900390625, -3.979764461517334, -3.6582441329956055, -3.336723804473877, -3.0152032375335693, -2.6936826705932617, -2.372162342071533, -2.0506420135498047, -1.729121446609497, -1.4076008796691895, -1.086080551147461, -0.7645601034164429, -0.4430396556854248, -0.12151920795440674, 0.20000123977661133, 0.5215216875076294, 0.8430421352386475, 1.164562702178955, 1.4860830307006836, 1.8076034784317017, 2.1291239261627197, 2.4506444931030273, 2.772164821624756, 3.0936851501464844, 3.415205717086792, 3.7367262840270996, 4.058246612548828, 4.379766941070557, 4.701287269592285, 5.022808074951172, 5.3443284034729, 5.665848731994629, 5.987369537353516, 6.308889865875244, 6.630410194396973, 6.951930522918701, 7.27345085144043, 7.594971656799316, 7.916491985321045, 8.238012313842773, 8.55953311920166, 8.881053924560547, 9.202573776245117, 9.524094581604004, 9.845614433288574, 10.167135238647461, 10.488655090332031, 10.810175895690918, 11.131696701049805, 11.453216552734375, 11.774737358093262]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 7.0, 3.0, 11.0, 12.0, 16.0, 25.0, 23.0, 50.0, 72.0, 113.0, 171.0, 284.0, 417.0, 785.0, 1408.0, 2520.0, 5214.0, 10711.0, 22889.0, 51782.0, 124898.0, 331470.0, 902695.0, 1436223.0, 808525.0, 293911.0, 111810.0, 46490.0, 20726.0, 9949.0, 5024.0, 2524.0, 1424.0, 796.0, 474.0, 299.0, 169.0, 126.0, 78.0, 44.0, 37.0, 27.0, 14.0, 20.0, 6.0, 7.0, 1.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-23.953125, -23.23681640625, -22.5205078125, -21.80419921875, -21.087890625, -20.37158203125, -19.6552734375, -18.93896484375, -18.22265625, -17.50634765625, -16.7900390625, -16.07373046875, -15.357421875, -14.64111328125, -13.9248046875, -13.20849609375, -12.4921875, -11.77587890625, -11.0595703125, -10.34326171875, -9.626953125, -8.91064453125, -8.1943359375, -7.47802734375, -6.76171875, -6.04541015625, -5.3291015625, -4.61279296875, -3.896484375, -3.18017578125, -2.4638671875, -1.74755859375, -1.03125, -0.31494140625, 0.4013671875, 1.11767578125, 1.833984375, 2.55029296875, 3.2666015625, 3.98291015625, 4.69921875, 5.41552734375, 6.1318359375, 6.84814453125, 7.564453125, 8.28076171875, 8.9970703125, 9.71337890625, 10.4296875, 11.14599609375, 11.8623046875, 12.57861328125, 13.294921875, 14.01123046875, 14.7275390625, 15.44384765625, 16.16015625, 16.87646484375, 17.5927734375, 18.30908203125, 19.025390625, 19.74169921875, 20.4580078125, 21.17431640625, 21.890625]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 8.0, 5.0, 12.0, 18.0, 13.0, 23.0, 10.0, 27.0, 19.0, 33.0, 37.0, 39.0, 45.0, 37.0, 48.0, 55.0, 51.0, 59.0, 43.0, 47.0, 40.0, 46.0, 38.0, 39.0, 33.0, 30.0, 26.0, 22.0, 23.0, 15.0, 14.0, 8.0, 11.0, 8.0, 4.0, 5.0, 5.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6953125, -7.4146728515625, -7.134033203125, -6.8533935546875, -6.57275390625, -6.2921142578125, -6.011474609375, -5.7308349609375, -5.4501953125, -5.1695556640625, -4.888916015625, -4.6082763671875, -4.32763671875, -4.0469970703125, -3.766357421875, -3.4857177734375, -3.205078125, -2.9244384765625, -2.643798828125, -2.3631591796875, -2.08251953125, -1.8018798828125, -1.521240234375, -1.2406005859375, -0.9599609375, -0.6793212890625, -0.398681640625, -0.1180419921875, 0.16259765625, 0.4432373046875, 0.723876953125, 1.0045166015625, 1.28515625, 1.5657958984375, 1.846435546875, 2.1270751953125, 2.40771484375, 2.6883544921875, 2.968994140625, 3.2496337890625, 3.5302734375, 3.8109130859375, 4.091552734375, 4.3721923828125, 4.65283203125, 4.9334716796875, 5.214111328125, 5.4947509765625, 5.775390625, 6.0560302734375, 6.336669921875, 6.6173095703125, 6.89794921875, 7.1785888671875, 7.459228515625, 7.7398681640625, 8.0205078125, 8.3011474609375, 8.581787109375, 8.8624267578125, 9.14306640625, 9.4237060546875, 9.704345703125, 9.9849853515625, 10.265625]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 8.0, 15.0, 9.0, 11.0, 28.0, 37.0, 57.0, 84.0, 129.0, 183.0, 321.0, 526.0, 856.0, 1400.0, 2266.0, 4026.0, 6829.0, 12496.0, 22174.0, 41410.0, 78777.0, 152526.0, 294826.0, 557030.0, 893641.0, 906856.0, 575189.0, 306470.0, 156697.0, 82111.0, 43095.0, 23434.0, 12884.0, 7114.0, 4230.0, 2509.0, 1529.0, 923.0, 601.0, 339.0, 211.0, 120.0, 98.0, 63.0, 56.0, 30.0, 22.0, 14.0, 10.0, 2.0, 6.0, 2.0, 4.0, 4.0], "bins": [-18.609375, -18.078125, -17.546875, -17.015625, -16.484375, -15.953125, -15.421875, -14.890625, -14.359375, -13.828125, -13.296875, -12.765625, -12.234375, -11.703125, -11.171875, -10.640625, -10.109375, -9.578125, -9.046875, -8.515625, -7.984375, -7.453125, -6.921875, -6.390625, -5.859375, -5.328125, -4.796875, -4.265625, -3.734375, -3.203125, -2.671875, -2.140625, -1.609375, -1.078125, -0.546875, -0.015625, 0.515625, 1.046875, 1.578125, 2.109375, 2.640625, 3.171875, 3.703125, 4.234375, 4.765625, 5.296875, 5.828125, 6.359375, 6.890625, 7.421875, 7.953125, 8.484375, 9.015625, 9.546875, 10.078125, 10.609375, 11.140625, 11.671875, 12.203125, 12.734375, 13.265625, 13.796875, 14.328125, 14.859375, 15.390625]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 5.0, 18.0, 14.0, 16.0, 34.0, 35.0, 71.0, 64.0, 104.0, 150.0, 164.0, 195.0, 274.0, 272.0, 351.0, 322.0, 342.0, 308.0, 259.0, 253.0, 203.0, 177.0, 123.0, 91.0, 67.0, 51.0, 34.0, 20.0, 18.0, 13.0, 5.0, 4.0, 6.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.953125, -5.7525634765625, -5.552001953125, -5.3514404296875, -5.15087890625, -4.9503173828125, -4.749755859375, -4.5491943359375, -4.3486328125, -4.1480712890625, -3.947509765625, -3.7469482421875, -3.54638671875, -3.3458251953125, -3.145263671875, -2.9447021484375, -2.744140625, -2.5435791015625, -2.343017578125, -2.1424560546875, -1.94189453125, -1.7413330078125, -1.540771484375, -1.3402099609375, -1.1396484375, -0.9390869140625, -0.738525390625, -0.5379638671875, -0.33740234375, -0.1368408203125, 0.063720703125, 0.2642822265625, 0.46484375, 0.6654052734375, 0.865966796875, 1.0665283203125, 1.26708984375, 1.4676513671875, 1.668212890625, 1.8687744140625, 2.0693359375, 2.2698974609375, 2.470458984375, 2.6710205078125, 2.87158203125, 3.0721435546875, 3.272705078125, 3.4732666015625, 3.673828125, 3.8743896484375, 4.074951171875, 4.2755126953125, 4.47607421875, 4.6766357421875, 4.877197265625, 5.0777587890625, 5.2783203125, 5.4788818359375, 5.679443359375, 5.8800048828125, 6.08056640625, 6.2811279296875, 6.481689453125, 6.6822509765625, 6.8828125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 7.0, 16.0, 15.0, 14.0, 26.0, 34.0, 43.0, 52.0, 71.0, 57.0, 71.0, 90.0, 86.0, 78.0, 67.0, 59.0, 45.0, 35.0, 30.0, 26.0, 17.0, 15.0, 9.0, 9.0, 5.0, 7.0, 5.0, 3.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.007352828979492, -24.204038619995117, -23.400724411010742, -22.597408294677734, -21.79409408569336, -20.990779876708984, -20.18746566772461, -19.384151458740234, -18.58083724975586, -17.777523040771484, -16.97420883178711, -16.170894622802734, -15.367578506469727, -14.564264297485352, -13.760950088500977, -12.957635879516602, -12.154319763183594, -11.351005554199219, -10.547690391540527, -9.744376182556152, -8.941061019897461, -8.137746810913086, -7.334432601928711, -6.531117916107178, -5.7278032302856445, -4.924488544464111, -4.121173858642578, -3.317859649658203, -2.51454496383667, -1.7112302780151367, -0.9079160690307617, -0.10460138320922852, 0.6987133026123047, 1.5020278692245483, 2.305342435836792, 3.108656883239746, 3.9119715690612793, 4.7152862548828125, 5.5186004638671875, 6.321915149688721, 7.125229835510254, 7.928544521331787, 8.73185920715332, 9.535173416137695, 10.33848762512207, 11.141802787780762, 11.945116996765137, 12.748432159423828, 13.551746368408203, 14.355060577392578, 15.15837574005127, 15.961689949035645, 16.765005111694336, 17.56831932067871, 18.371633529663086, 19.17494773864746, 19.97826385498047, 20.781578063964844, 21.58489227294922, 22.388206481933594, 23.1915225982666, 23.994836807250977, 24.79815101623535, 25.601465225219727, 26.4047794342041]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 4.0, 5.0, 0.0, 2.0, 3.0, 5.0, 5.0, 10.0, 6.0, 12.0, 18.0, 11.0, 18.0, 21.0, 23.0, 17.0, 23.0, 27.0, 33.0, 29.0, 41.0, 36.0, 37.0, 38.0, 36.0, 47.0, 46.0, 40.0, 29.0, 34.0, 39.0, 34.0, 34.0, 33.0, 26.0, 28.0, 22.0, 24.0, 14.0, 21.0, 16.0, 13.0, 8.0, 6.0, 7.0, 5.0, 8.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.131150245666504, -7.8515729904174805, -7.571995258331299, -7.292417526245117, -7.012840270996094, -6.73326301574707, -6.453685283660889, -6.174107551574707, -5.894530296325684, -5.61495304107666, -5.3353753089904785, -5.055797576904297, -4.776220321655273, -4.49664306640625, -4.217065334320068, -3.937487840652466, -3.6579103469848633, -3.3783328533172607, -3.098755359649658, -2.8191778659820557, -2.539600372314453, -2.2600228786468506, -1.980445384979248, -1.7008678913116455, -1.421290397644043, -1.1417129039764404, -0.8621354103088379, -0.5825579166412354, -0.3029804229736328, -0.023402929306030273, 0.25617456436157227, 0.5357520580291748, 0.8153285980224609, 1.0949060916900635, 1.374483585357666, 1.6540610790252686, 1.933638572692871, 2.2132160663604736, 2.492793560028076, 2.7723710536956787, 3.0519485473632812, 3.331526041030884, 3.6111035346984863, 3.890681028366089, 4.170258522033691, 4.449835777282715, 4.7294135093688965, 5.008991241455078, 5.288568496704102, 5.568145751953125, 5.847723484039307, 6.127301216125488, 6.406878471374512, 6.686455726623535, 6.966033458709717, 7.245611190795898, 7.525188446044922, 7.804765701293945, 8.084342956542969, 8.363921165466309, 8.643498420715332, 8.923075675964355, 9.202653884887695, 9.482231140136719, 9.761808395385742]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 2.0, 8.0, 16.0, 15.0, 25.0, 37.0, 66.0, 85.0, 136.0, 185.0, 298.0, 443.0, 734.0, 1094.0, 1830.0, 2947.0, 5176.0, 8993.0, 16064.0, 28659.0, 51849.0, 91063.0, 146598.0, 193830.0, 183685.0, 132459.0, 79369.0, 44749.0, 24849.0, 13913.0, 7709.0, 4474.0, 2701.0, 1610.0, 1045.0, 631.0, 410.0, 273.0, 166.0, 129.0, 83.0, 50.0, 36.0, 20.0, 17.0, 7.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-11.4453125, -11.09716796875, -10.7490234375, -10.40087890625, -10.052734375, -9.70458984375, -9.3564453125, -9.00830078125, -8.66015625, -8.31201171875, -7.9638671875, -7.61572265625, -7.267578125, -6.91943359375, -6.5712890625, -6.22314453125, -5.875, -5.52685546875, -5.1787109375, -4.83056640625, -4.482421875, -4.13427734375, -3.7861328125, -3.43798828125, -3.08984375, -2.74169921875, -2.3935546875, -2.04541015625, -1.697265625, -1.34912109375, -1.0009765625, -0.65283203125, -0.3046875, 0.04345703125, 0.3916015625, 0.73974609375, 1.087890625, 1.43603515625, 1.7841796875, 2.13232421875, 2.48046875, 2.82861328125, 3.1767578125, 3.52490234375, 3.873046875, 4.22119140625, 4.5693359375, 4.91748046875, 5.265625, 5.61376953125, 5.9619140625, 6.31005859375, 6.658203125, 7.00634765625, 7.3544921875, 7.70263671875, 8.05078125, 8.39892578125, 8.7470703125, 9.09521484375, 9.443359375, 9.79150390625, 10.1396484375, 10.48779296875, 10.8359375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 7.0, 3.0, 4.0, 5.0, 5.0, 11.0, 17.0, 15.0, 17.0, 18.0, 20.0, 30.0, 28.0, 45.0, 36.0, 39.0, 52.0, 38.0, 48.0, 46.0, 53.0, 45.0, 33.0, 42.0, 51.0, 42.0, 34.0, 33.0, 29.0, 24.0, 27.0, 25.0, 16.0, 20.0, 15.0, 5.0, 4.0, 3.0, 8.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.109375, -10.74853515625, -10.3876953125, -10.02685546875, -9.666015625, -9.30517578125, -8.9443359375, -8.58349609375, -8.22265625, -7.86181640625, -7.5009765625, -7.14013671875, -6.779296875, -6.41845703125, -6.0576171875, -5.69677734375, -5.3359375, -4.97509765625, -4.6142578125, -4.25341796875, -3.892578125, -3.53173828125, -3.1708984375, -2.81005859375, -2.44921875, -2.08837890625, -1.7275390625, -1.36669921875, -1.005859375, -0.64501953125, -0.2841796875, 0.07666015625, 0.4375, 0.79833984375, 1.1591796875, 1.52001953125, 1.880859375, 2.24169921875, 2.6025390625, 2.96337890625, 3.32421875, 3.68505859375, 4.0458984375, 4.40673828125, 4.767578125, 5.12841796875, 5.4892578125, 5.85009765625, 6.2109375, 6.57177734375, 6.9326171875, 7.29345703125, 7.654296875, 8.01513671875, 8.3759765625, 8.73681640625, 9.09765625, 9.45849609375, 9.8193359375, 10.18017578125, 10.541015625, 10.90185546875, 11.2626953125, 11.62353515625, 11.984375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 11.0, 5.0, 13.0, 17.0, 22.0, 34.0, 40.0, 71.0, 98.0, 150.0, 233.0, 329.0, 523.0, 770.0, 1208.0, 2249.0, 3675.0, 6694.0, 12547.0, 24503.0, 49178.0, 99288.0, 189977.0, 259609.0, 192228.0, 101399.0, 49804.0, 24625.0, 12881.0, 6754.0, 3843.0, 2170.0, 1291.0, 820.0, 492.0, 330.0, 224.0, 147.0, 92.0, 67.0, 41.0, 35.0, 19.0, 19.0, 9.0, 6.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-15.4375, -14.976806640625, -14.51611328125, -14.055419921875, -13.5947265625, -13.134033203125, -12.67333984375, -12.212646484375, -11.751953125, -11.291259765625, -10.83056640625, -10.369873046875, -9.9091796875, -9.448486328125, -8.98779296875, -8.527099609375, -8.06640625, -7.605712890625, -7.14501953125, -6.684326171875, -6.2236328125, -5.762939453125, -5.30224609375, -4.841552734375, -4.380859375, -3.920166015625, -3.45947265625, -2.998779296875, -2.5380859375, -2.077392578125, -1.61669921875, -1.156005859375, -0.6953125, -0.234619140625, 0.22607421875, 0.686767578125, 1.1474609375, 1.608154296875, 2.06884765625, 2.529541015625, 2.990234375, 3.450927734375, 3.91162109375, 4.372314453125, 4.8330078125, 5.293701171875, 5.75439453125, 6.215087890625, 6.67578125, 7.136474609375, 7.59716796875, 8.057861328125, 8.5185546875, 8.979248046875, 9.43994140625, 9.900634765625, 10.361328125, 10.822021484375, 11.28271484375, 11.743408203125, 12.2041015625, 12.664794921875, 13.12548828125, 13.586181640625, 14.046875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 4.0, 3.0, 8.0, 11.0, 8.0, 14.0, 8.0, 15.0, 20.0, 28.0, 35.0, 22.0, 28.0, 29.0, 31.0, 37.0, 43.0, 47.0, 43.0, 52.0, 48.0, 53.0, 44.0, 33.0, 40.0, 43.0, 38.0, 32.0, 28.0, 29.0, 28.0, 17.0, 15.0, 14.0, 14.0, 11.0, 8.0, 10.0, 4.0, 6.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0], "bins": [-8.046875, -7.83538818359375, -7.6239013671875, -7.41241455078125, -7.200927734375, -6.98944091796875, -6.7779541015625, -6.56646728515625, -6.35498046875, -6.14349365234375, -5.9320068359375, -5.72052001953125, -5.509033203125, -5.29754638671875, -5.0860595703125, -4.87457275390625, -4.6630859375, -4.45159912109375, -4.2401123046875, -4.02862548828125, -3.817138671875, -3.60565185546875, -3.3941650390625, -3.18267822265625, -2.97119140625, -2.75970458984375, -2.5482177734375, -2.33673095703125, -2.125244140625, -1.91375732421875, -1.7022705078125, -1.49078369140625, -1.279296875, -1.06781005859375, -0.8563232421875, -0.64483642578125, -0.433349609375, -0.22186279296875, -0.0103759765625, 0.20111083984375, 0.41259765625, 0.62408447265625, 0.8355712890625, 1.04705810546875, 1.258544921875, 1.47003173828125, 1.6815185546875, 1.89300537109375, 2.1044921875, 2.31597900390625, 2.5274658203125, 2.73895263671875, 2.950439453125, 3.16192626953125, 3.3734130859375, 3.58489990234375, 3.79638671875, 4.00787353515625, 4.2193603515625, 4.43084716796875, 4.642333984375, 4.85382080078125, 5.0653076171875, 5.27679443359375, 5.48828125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 7.0, 7.0, 9.0, 16.0, 14.0, 19.0, 31.0, 39.0, 64.0, 72.0, 129.0, 167.0, 235.0, 389.0, 581.0, 937.0, 1626.0, 3160.0, 7230.0, 20510.0, 70277.0, 269987.0, 451755.0, 156382.0, 40970.0, 13134.0, 4986.0, 2328.0, 1243.0, 739.0, 457.0, 347.0, 223.0, 135.0, 105.0, 67.0, 59.0, 32.0, 26.0, 18.0, 13.0, 12.0, 7.0, 8.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.4375, -13.0213623046875, -12.605224609375, -12.1890869140625, -11.77294921875, -11.3568115234375, -10.940673828125, -10.5245361328125, -10.1083984375, -9.6922607421875, -9.276123046875, -8.8599853515625, -8.44384765625, -8.0277099609375, -7.611572265625, -7.1954345703125, -6.779296875, -6.3631591796875, -5.947021484375, -5.5308837890625, -5.11474609375, -4.6986083984375, -4.282470703125, -3.8663330078125, -3.4501953125, -3.0340576171875, -2.617919921875, -2.2017822265625, -1.78564453125, -1.3695068359375, -0.953369140625, -0.5372314453125, -0.12109375, 0.2950439453125, 0.711181640625, 1.1273193359375, 1.54345703125, 1.9595947265625, 2.375732421875, 2.7918701171875, 3.2080078125, 3.6241455078125, 4.040283203125, 4.4564208984375, 4.87255859375, 5.2886962890625, 5.704833984375, 6.1209716796875, 6.537109375, 6.9532470703125, 7.369384765625, 7.7855224609375, 8.20166015625, 8.6177978515625, 9.033935546875, 9.4500732421875, 9.8662109375, 10.2823486328125, 10.698486328125, 11.1146240234375, 11.53076171875, 11.9468994140625, 12.363037109375, 12.7791748046875, 13.1953125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 1.0, 3.0, 7.0, 16.0, 12.0, 16.0, 20.0, 27.0, 37.0, 54.0, 70.0, 75.0, 84.0, 74.0, 77.0, 77.0, 65.0, 69.0, 57.0, 39.0, 36.0, 22.0, 20.0, 5.0, 12.0, 8.0, 9.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0003781318664550781, -0.00036704540252685547, -0.0003559589385986328, -0.00034487247467041016, -0.0003337860107421875, -0.00032269954681396484, -0.0003116130828857422, -0.00030052661895751953, -0.0002894401550292969, -0.0002783536911010742, -0.00026726722717285156, -0.0002561807632446289, -0.00024509429931640625, -0.0002340078353881836, -0.00022292137145996094, -0.00021183490753173828, -0.00020074844360351562, -0.00018966197967529297, -0.0001785755157470703, -0.00016748905181884766, -0.000156402587890625, -0.00014531612396240234, -0.0001342296600341797, -0.00012314319610595703, -0.00011205673217773438, -0.00010097026824951172, -8.988380432128906e-05, -7.87973403930664e-05, -6.771087646484375e-05, -5.6624412536621094e-05, -4.553794860839844e-05, -3.445148468017578e-05, -2.3365020751953125e-05, -1.2278556823730469e-05, -1.1920928955078125e-06, 9.894371032714844e-06, 2.09808349609375e-05, 3.2067298889160156e-05, 4.315376281738281e-05, 5.424022674560547e-05, 6.532669067382812e-05, 7.641315460205078e-05, 8.749961853027344e-05, 9.85860824584961e-05, 0.00010967254638671875, 0.0001207590103149414, 0.00013184547424316406, 0.00014293193817138672, 0.00015401840209960938, 0.00016510486602783203, 0.0001761913299560547, 0.00018727779388427734, 0.0001983642578125, 0.00020945072174072266, 0.0002205371856689453, 0.00023162364959716797, 0.00024271011352539062, 0.0002537965774536133, 0.00026488304138183594, 0.0002759695053100586, 0.00028705596923828125, 0.0002981424331665039, 0.00030922889709472656, 0.0003203153610229492, 0.0003314018249511719]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 4.0, 17.0, 14.0, 18.0, 24.0, 41.0, 46.0, 74.0, 96.0, 142.0, 191.0, 241.0, 385.0, 494.0, 774.0, 1179.0, 1901.0, 3252.0, 6626.0, 16370.0, 50743.0, 168097.0, 367367.0, 281941.0, 96675.0, 29704.0, 10269.0, 4659.0, 2524.0, 1528.0, 987.0, 640.0, 452.0, 315.0, 217.0, 151.0, 98.0, 87.0, 53.0, 46.0, 39.0, 20.0, 13.0, 15.0, 8.0, 6.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-11.125, -10.7955322265625, -10.466064453125, -10.1365966796875, -9.80712890625, -9.4776611328125, -9.148193359375, -8.8187255859375, -8.4892578125, -8.1597900390625, -7.830322265625, -7.5008544921875, -7.17138671875, -6.8419189453125, -6.512451171875, -6.1829833984375, -5.853515625, -5.5240478515625, -5.194580078125, -4.8651123046875, -4.53564453125, -4.2061767578125, -3.876708984375, -3.5472412109375, -3.2177734375, -2.8883056640625, -2.558837890625, -2.2293701171875, -1.89990234375, -1.5704345703125, -1.240966796875, -0.9114990234375, -0.58203125, -0.2525634765625, 0.076904296875, 0.4063720703125, 0.73583984375, 1.0653076171875, 1.394775390625, 1.7242431640625, 2.0537109375, 2.3831787109375, 2.712646484375, 3.0421142578125, 3.37158203125, 3.7010498046875, 4.030517578125, 4.3599853515625, 4.689453125, 5.0189208984375, 5.348388671875, 5.6778564453125, 6.00732421875, 6.3367919921875, 6.666259765625, 6.9957275390625, 7.3251953125, 7.6546630859375, 7.984130859375, 8.3135986328125, 8.64306640625, 8.9725341796875, 9.302001953125, 9.6314697265625, 9.9609375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 9.0, 12.0, 19.0, 32.0, 31.0, 37.0, 52.0, 62.0, 62.0, 74.0, 85.0, 83.0, 83.0, 79.0, 59.0, 63.0, 69.0, 24.0, 21.0, 20.0, 7.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.171875, -2.101959228515625, -2.03204345703125, -1.962127685546875, -1.8922119140625, -1.822296142578125, -1.75238037109375, -1.682464599609375, -1.612548828125, -1.542633056640625, -1.47271728515625, -1.402801513671875, -1.3328857421875, -1.262969970703125, -1.19305419921875, -1.123138427734375, -1.05322265625, -0.983306884765625, -0.91339111328125, -0.843475341796875, -0.7735595703125, -0.703643798828125, -0.63372802734375, -0.563812255859375, -0.493896484375, -0.423980712890625, -0.35406494140625, -0.284149169921875, -0.2142333984375, -0.144317626953125, -0.07440185546875, -0.004486083984375, 0.0654296875, 0.135345458984375, 0.20526123046875, 0.275177001953125, 0.3450927734375, 0.415008544921875, 0.48492431640625, 0.554840087890625, 0.624755859375, 0.694671630859375, 0.76458740234375, 0.834503173828125, 0.9044189453125, 0.974334716796875, 1.04425048828125, 1.114166259765625, 1.18408203125, 1.253997802734375, 1.32391357421875, 1.393829345703125, 1.4637451171875, 1.533660888671875, 1.60357666015625, 1.673492431640625, 1.743408203125, 1.813323974609375, 1.88323974609375, 1.953155517578125, 2.0230712890625, 2.092987060546875, 2.16290283203125, 2.232818603515625, 2.302734375]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 1.0, 8.0, 7.0, 11.0, 18.0, 13.0, 24.0, 38.0, 52.0, 45.0, 65.0, 73.0, 74.0, 67.0, 95.0, 81.0, 66.0, 51.0, 50.0, 37.0, 29.0, 17.0, 20.0, 11.0, 10.0, 10.0, 8.0, 4.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.588699340820312, -22.803377151489258, -22.018054962158203, -21.23273468017578, -20.447412490844727, -19.662090301513672, -18.87677001953125, -18.091447830200195, -17.30612564086914, -16.520803451538086, -15.735482215881348, -14.95016098022461, -14.164838790893555, -13.3795166015625, -12.594195365905762, -11.808874130249023, -11.023551940917969, -10.238229751586914, -9.452908515930176, -8.667587280273438, -7.882265090942383, -7.096943378448486, -6.31162166595459, -5.526299953460693, -4.740978240966797, -3.9556565284729004, -3.170334815979004, -2.3850131034851074, -1.599691390991211, -0.8143696784973145, -0.02904796600341797, 0.7562737464904785, 1.5415935516357422, 2.3269152641296387, 3.112236976623535, 3.8975586891174316, 4.682880401611328, 5.468202114105225, 6.253523826599121, 7.038845539093018, 7.824167251586914, 8.609489440917969, 9.394810676574707, 10.180131912231445, 10.9654541015625, 11.750776290893555, 12.536097526550293, 13.321418762207031, 14.106740951538086, 14.89206314086914, 15.677384376525879, 16.462705612182617, 17.248027801513672, 18.033349990844727, 18.81867218017578, 19.603992462158203, 20.389314651489258, 21.174636840820312, 21.959957122802734, 22.74527931213379, 23.530601501464844, 24.3159236907959, 25.101245880126953, 25.886566162109375, 26.67188835144043]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 11.0, 11.0, 10.0, 15.0, 21.0, 16.0, 26.0, 22.0, 16.0, 21.0, 31.0, 39.0, 28.0, 32.0, 36.0, 42.0, 48.0, 44.0, 43.0, 35.0, 28.0, 35.0, 33.0, 45.0, 38.0, 28.0, 27.0, 26.0, 23.0, 28.0, 13.0, 25.0, 14.0, 10.0, 16.0, 7.0, 3.0, 7.0, 12.0, 4.0, 5.0, 5.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.110013008117676, -7.8352484703063965, -7.560483932495117, -7.285719394683838, -7.010954856872559, -6.736190319061279, -6.46142578125, -6.186661243438721, -5.911896705627441, -5.637132167816162, -5.362367630004883, -5.0876030921936035, -4.812838554382324, -4.538074016571045, -4.263309478759766, -3.9885449409484863, -3.713780403137207, -3.4390158653259277, -3.1642513275146484, -2.889486789703369, -2.61472225189209, -2.3399577140808105, -2.0651931762695312, -1.790428638458252, -1.5156641006469727, -1.2408995628356934, -0.9661350250244141, -0.6913704872131348, -0.41660594940185547, -0.14184141159057617, 0.13292312622070312, 0.4076876640319824, 0.6824531555175781, 0.9572176933288574, 1.2319822311401367, 1.506746768951416, 1.7815113067626953, 2.0562758445739746, 2.331040382385254, 2.605804920196533, 2.8805694580078125, 3.155333995819092, 3.430098533630371, 3.7048630714416504, 3.9796276092529297, 4.254392147064209, 4.529156684875488, 4.803921222686768, 5.078685760498047, 5.353450298309326, 5.6282148361206055, 5.902979373931885, 6.177743911743164, 6.452508449554443, 6.727272987365723, 7.002037525177002, 7.276802062988281, 7.5515666007995605, 7.82633113861084, 8.101095199584961, 8.375860214233398, 8.650625228881836, 8.925389289855957, 9.200153350830078, 9.474918365478516]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 15.0, 19.0, 33.0, 37.0, 73.0, 111.0, 131.0, 224.0, 384.0, 580.0, 983.0, 1653.0, 2765.0, 4598.0, 7844.0, 13847.0, 23744.0, 39975.0, 66761.0, 101297.0, 137819.0, 160017.0, 152763.0, 121325.0, 83439.0, 52792.0, 31319.0, 18258.0, 10496.0, 6038.0, 3546.0, 2153.0, 1324.0, 822.0, 523.0, 311.0, 179.0, 110.0, 85.0, 57.0, 26.0, 21.0, 20.0, 14.0, 4.0, 5.0, 5.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-12.4921875, -12.1221923828125, -11.752197265625, -11.3822021484375, -11.01220703125, -10.6422119140625, -10.272216796875, -9.9022216796875, -9.5322265625, -9.1622314453125, -8.792236328125, -8.4222412109375, -8.05224609375, -7.6822509765625, -7.312255859375, -6.9422607421875, -6.572265625, -6.2022705078125, -5.832275390625, -5.4622802734375, -5.09228515625, -4.7222900390625, -4.352294921875, -3.9822998046875, -3.6123046875, -3.2423095703125, -2.872314453125, -2.5023193359375, -2.13232421875, -1.7623291015625, -1.392333984375, -1.0223388671875, -0.65234375, -0.2823486328125, 0.087646484375, 0.4576416015625, 0.82763671875, 1.1976318359375, 1.567626953125, 1.9376220703125, 2.3076171875, 2.6776123046875, 3.047607421875, 3.4176025390625, 3.78759765625, 4.1575927734375, 4.527587890625, 4.8975830078125, 5.267578125, 5.6375732421875, 6.007568359375, 6.3775634765625, 6.74755859375, 7.1175537109375, 7.487548828125, 7.8575439453125, 8.2275390625, 8.5975341796875, 8.967529296875, 9.3375244140625, 9.70751953125, 10.0775146484375, 10.447509765625, 10.8175048828125, 11.1875]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 8.0, 2.0, 10.0, 10.0, 15.0, 28.0, 23.0, 25.0, 27.0, 40.0, 44.0, 48.0, 49.0, 57.0, 42.0, 58.0, 54.0, 49.0, 56.0, 37.0, 40.0, 32.0, 44.0, 36.0, 37.0, 29.0, 19.0, 21.0, 11.0, 13.0, 2.0, 7.0, 7.0, 5.0, 6.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.0234375, -12.6182861328125, -12.213134765625, -11.8079833984375, -11.40283203125, -10.9976806640625, -10.592529296875, -10.1873779296875, -9.7822265625, -9.3770751953125, -8.971923828125, -8.5667724609375, -8.16162109375, -7.7564697265625, -7.351318359375, -6.9461669921875, -6.541015625, -6.1358642578125, -5.730712890625, -5.3255615234375, -4.92041015625, -4.5152587890625, -4.110107421875, -3.7049560546875, -3.2998046875, -2.8946533203125, -2.489501953125, -2.0843505859375, -1.67919921875, -1.2740478515625, -0.868896484375, -0.4637451171875, -0.05859375, 0.3465576171875, 0.751708984375, 1.1568603515625, 1.56201171875, 1.9671630859375, 2.372314453125, 2.7774658203125, 3.1826171875, 3.5877685546875, 3.992919921875, 4.3980712890625, 4.80322265625, 5.2083740234375, 5.613525390625, 6.0186767578125, 6.423828125, 6.8289794921875, 7.234130859375, 7.6392822265625, 8.04443359375, 8.4495849609375, 8.854736328125, 9.2598876953125, 9.6650390625, 10.0701904296875, 10.475341796875, 10.8804931640625, 11.28564453125, 11.6907958984375, 12.095947265625, 12.5010986328125, 12.90625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 12.0, 24.0, 25.0, 38.0, 52.0, 77.0, 128.0, 181.0, 233.0, 386.0, 568.0, 888.0, 1432.0, 2244.0, 3577.0, 5687.0, 9287.0, 14842.0, 23793.0, 37284.0, 57228.0, 83603.0, 113339.0, 135869.0, 140900.0, 125851.0, 97651.0, 68953.0, 45581.0, 29354.0, 18476.0, 11506.0, 7128.0, 4450.0, 2873.0, 1736.0, 1082.0, 804.0, 473.0, 313.0, 203.0, 135.0, 93.0, 61.0, 48.0, 35.0, 15.0, 18.0, 6.0, 5.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.1953125, -9.868896484375, -9.54248046875, -9.216064453125, -8.8896484375, -8.563232421875, -8.23681640625, -7.910400390625, -7.583984375, -7.257568359375, -6.93115234375, -6.604736328125, -6.2783203125, -5.951904296875, -5.62548828125, -5.299072265625, -4.97265625, -4.646240234375, -4.31982421875, -3.993408203125, -3.6669921875, -3.340576171875, -3.01416015625, -2.687744140625, -2.361328125, -2.034912109375, -1.70849609375, -1.382080078125, -1.0556640625, -0.729248046875, -0.40283203125, -0.076416015625, 0.25, 0.576416015625, 0.90283203125, 1.229248046875, 1.5556640625, 1.882080078125, 2.20849609375, 2.534912109375, 2.861328125, 3.187744140625, 3.51416015625, 3.840576171875, 4.1669921875, 4.493408203125, 4.81982421875, 5.146240234375, 5.47265625, 5.799072265625, 6.12548828125, 6.451904296875, 6.7783203125, 7.104736328125, 7.43115234375, 7.757568359375, 8.083984375, 8.410400390625, 8.73681640625, 9.063232421875, 9.3896484375, 9.716064453125, 10.04248046875, 10.368896484375, 10.6953125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 8.0, 7.0, 9.0, 11.0, 17.0, 15.0, 15.0, 12.0, 25.0, 30.0, 25.0, 17.0, 41.0, 34.0, 34.0, 31.0, 44.0, 36.0, 37.0, 50.0, 52.0, 45.0, 35.0, 38.0, 35.0, 32.0, 32.0, 30.0, 23.0, 34.0, 27.0, 30.0, 19.0, 8.0, 7.0, 12.0, 9.0, 12.0, 4.0, 6.0, 4.0, 5.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.140625, -5.9434814453125, -5.746337890625, -5.5491943359375, -5.35205078125, -5.1549072265625, -4.957763671875, -4.7606201171875, -4.5634765625, -4.3663330078125, -4.169189453125, -3.9720458984375, -3.77490234375, -3.5777587890625, -3.380615234375, -3.1834716796875, -2.986328125, -2.7891845703125, -2.592041015625, -2.3948974609375, -2.19775390625, -2.0006103515625, -1.803466796875, -1.6063232421875, -1.4091796875, -1.2120361328125, -1.014892578125, -0.8177490234375, -0.62060546875, -0.4234619140625, -0.226318359375, -0.0291748046875, 0.16796875, 0.3651123046875, 0.562255859375, 0.7593994140625, 0.95654296875, 1.1536865234375, 1.350830078125, 1.5479736328125, 1.7451171875, 1.9422607421875, 2.139404296875, 2.3365478515625, 2.53369140625, 2.7308349609375, 2.927978515625, 3.1251220703125, 3.322265625, 3.5194091796875, 3.716552734375, 3.9136962890625, 4.11083984375, 4.3079833984375, 4.505126953125, 4.7022705078125, 4.8994140625, 5.0965576171875, 5.293701171875, 5.4908447265625, 5.68798828125, 5.8851318359375, 6.082275390625, 6.2794189453125, 6.4765625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 8.0, 9.0, 16.0, 22.0, 38.0, 67.0, 99.0, 114.0, 194.0, 298.0, 434.0, 687.0, 1191.0, 1947.0, 3256.0, 5255.0, 9074.0, 15267.0, 25542.0, 43012.0, 70742.0, 107777.0, 148180.0, 168641.0, 151307.0, 111548.0, 72578.0, 45162.0, 26746.0, 16000.0, 9287.0, 5417.0, 3335.0, 2074.0, 1172.0, 777.0, 470.0, 258.0, 177.0, 145.0, 69.0, 46.0, 32.0, 22.0, 25.0, 15.0, 12.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.3125, -5.14923095703125, -4.9859619140625, -4.82269287109375, -4.659423828125, -4.49615478515625, -4.3328857421875, -4.16961669921875, -4.00634765625, -3.84307861328125, -3.6798095703125, -3.51654052734375, -3.353271484375, -3.19000244140625, -3.0267333984375, -2.86346435546875, -2.7001953125, -2.53692626953125, -2.3736572265625, -2.21038818359375, -2.047119140625, -1.88385009765625, -1.7205810546875, -1.55731201171875, -1.39404296875, -1.23077392578125, -1.0675048828125, -0.90423583984375, -0.740966796875, -0.57769775390625, -0.4144287109375, -0.25115966796875, -0.087890625, 0.07537841796875, 0.2386474609375, 0.40191650390625, 0.565185546875, 0.72845458984375, 0.8917236328125, 1.05499267578125, 1.21826171875, 1.38153076171875, 1.5447998046875, 1.70806884765625, 1.871337890625, 2.03460693359375, 2.1978759765625, 2.36114501953125, 2.5244140625, 2.68768310546875, 2.8509521484375, 3.01422119140625, 3.177490234375, 3.34075927734375, 3.5040283203125, 3.66729736328125, 3.83056640625, 3.99383544921875, 4.1571044921875, 4.32037353515625, 4.483642578125, 4.64691162109375, 4.8101806640625, 4.97344970703125, 5.13671875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 6.0, 4.0, 9.0, 7.0, 4.0, 23.0, 21.0, 19.0, 30.0, 36.0, 44.0, 53.0, 56.0, 76.0, 57.0, 71.0, 97.0, 62.0, 60.0, 57.0, 43.0, 37.0, 34.0, 25.0, 14.0, 20.0, 9.0, 10.0, 7.0, 8.0, 1.0, 2.0, 2.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006604194641113281, -0.0006402879953384399, -0.0006201565265655518, -0.0006000250577926636, -0.0005798935890197754, -0.0005597621202468872, -0.000539630651473999, -0.0005194991827011108, -0.0004993677139282227, -0.00047923624515533447, -0.0004591047763824463, -0.0004389733076095581, -0.0004188418388366699, -0.00039871037006378174, -0.00037857890129089355, -0.00035844743251800537, -0.0003383159637451172, -0.000318184494972229, -0.0002980530261993408, -0.00027792155742645264, -0.00025779008865356445, -0.00023765861988067627, -0.00021752715110778809, -0.0001973956823348999, -0.00017726421356201172, -0.00015713274478912354, -0.00013700127601623535, -0.00011686980724334717, -9.673833847045898e-05, -7.66068696975708e-05, -5.647540092468262e-05, -3.6343932151794434e-05, -1.621246337890625e-05, 3.919005393981934e-06, 2.4050474166870117e-05, 4.41819429397583e-05, 6.431341171264648e-05, 8.444488048553467e-05, 0.00010457634925842285, 0.00012470781803131104, 0.00014483928680419922, 0.0001649707555770874, 0.00018510222434997559, 0.00020523369312286377, 0.00022536516189575195, 0.00024549663066864014, 0.0002656280994415283, 0.0002857595682144165, 0.0003058910369873047, 0.00032602250576019287, 0.00034615397453308105, 0.00036628544330596924, 0.0003864169120788574, 0.0004065483808517456, 0.0004266798496246338, 0.00044681131839752197, 0.00046694278717041016, 0.00048707425594329834, 0.0005072057247161865, 0.0005273371934890747, 0.0005474686622619629, 0.0005676001310348511, 0.0005877315998077393, 0.0006078630685806274, 0.0006279945373535156]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 7.0, 5.0, 12.0, 17.0, 23.0, 39.0, 65.0, 103.0, 146.0, 220.0, 291.0, 505.0, 752.0, 1237.0, 1900.0, 2871.0, 4689.0, 7381.0, 11864.0, 19064.0, 30574.0, 48749.0, 74657.0, 108463.0, 140144.0, 154320.0, 137424.0, 105297.0, 72148.0, 47053.0, 29239.0, 18348.0, 11282.0, 7231.0, 4439.0, 2866.0, 1821.0, 1135.0, 725.0, 505.0, 341.0, 211.0, 147.0, 77.0, 63.0, 36.0, 23.0, 17.0, 11.0, 6.0, 4.0, 6.0, 3.0, 0.0, 1.0, 2.0, 3.0], "bins": [-4.84375, -4.69451904296875, -4.5452880859375, -4.39605712890625, -4.246826171875, -4.09759521484375, -3.9483642578125, -3.79913330078125, -3.64990234375, -3.50067138671875, -3.3514404296875, -3.20220947265625, -3.052978515625, -2.90374755859375, -2.7545166015625, -2.60528564453125, -2.4560546875, -2.30682373046875, -2.1575927734375, -2.00836181640625, -1.859130859375, -1.70989990234375, -1.5606689453125, -1.41143798828125, -1.26220703125, -1.11297607421875, -0.9637451171875, -0.81451416015625, -0.665283203125, -0.51605224609375, -0.3668212890625, -0.21759033203125, -0.068359375, 0.08087158203125, 0.2301025390625, 0.37933349609375, 0.528564453125, 0.67779541015625, 0.8270263671875, 0.97625732421875, 1.12548828125, 1.27471923828125, 1.4239501953125, 1.57318115234375, 1.722412109375, 1.87164306640625, 2.0208740234375, 2.17010498046875, 2.3193359375, 2.46856689453125, 2.6177978515625, 2.76702880859375, 2.916259765625, 3.06549072265625, 3.2147216796875, 3.36395263671875, 3.51318359375, 3.66241455078125, 3.8116455078125, 3.96087646484375, 4.110107421875, 4.25933837890625, 4.4085693359375, 4.55780029296875, 4.70703125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 8.0, 9.0, 7.0, 12.0, 19.0, 24.0, 28.0, 34.0, 46.0, 64.0, 52.0, 62.0, 66.0, 75.0, 67.0, 56.0, 62.0, 48.0, 54.0, 55.0, 32.0, 20.0, 17.0, 19.0, 10.0, 10.0, 12.0, 5.0, 3.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7646484375, -1.7018890380859375, -1.639129638671875, -1.5763702392578125, -1.51361083984375, -1.4508514404296875, -1.388092041015625, -1.3253326416015625, -1.2625732421875, -1.1998138427734375, -1.137054443359375, -1.0742950439453125, -1.01153564453125, -0.9487762451171875, -0.886016845703125, -0.8232574462890625, -0.760498046875, -0.6977386474609375, -0.634979248046875, -0.5722198486328125, -0.50946044921875, -0.4467010498046875, -0.383941650390625, -0.3211822509765625, -0.2584228515625, -0.1956634521484375, -0.132904052734375, -0.0701446533203125, -0.00738525390625, 0.0553741455078125, 0.118133544921875, 0.1808929443359375, 0.24365234375, 0.3064117431640625, 0.369171142578125, 0.4319305419921875, 0.49468994140625, 0.5574493408203125, 0.620208740234375, 0.6829681396484375, 0.7457275390625, 0.8084869384765625, 0.871246337890625, 0.9340057373046875, 0.99676513671875, 1.0595245361328125, 1.122283935546875, 1.1850433349609375, 1.247802734375, 1.3105621337890625, 1.373321533203125, 1.4360809326171875, 1.49884033203125, 1.5615997314453125, 1.624359130859375, 1.6871185302734375, 1.7498779296875, 1.8126373291015625, 1.875396728515625, 1.9381561279296875, 2.00091552734375, 2.0636749267578125, 2.126434326171875, 2.1891937255859375, 2.251953125]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 8.0, 11.0, 11.0, 9.0, 27.0, 23.0, 41.0, 51.0, 62.0, 48.0, 68.0, 84.0, 70.0, 75.0, 73.0, 70.0, 57.0, 40.0, 35.0, 19.0, 28.0, 13.0, 18.0, 10.0, 6.0, 11.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.393449783325195, -21.668926239013672, -20.94440269470215, -20.219879150390625, -19.49535369873047, -18.770830154418945, -18.046306610107422, -17.3217830657959, -16.597259521484375, -15.872735977172852, -15.148212432861328, -14.423687934875488, -13.699164390563965, -12.974640846252441, -12.250116348266602, -11.525592803955078, -10.801069259643555, -10.076545715332031, -9.352022171020508, -8.627497673034668, -7.9029741287231445, -7.178450584411621, -6.4539265632629395, -5.729402542114258, -5.004878997802734, -4.280355453491211, -3.5558314323425293, -2.8313076496124268, -2.106783866882324, -1.3822600841522217, -0.6577363014221191, 0.0667877197265625, 0.7913093566894531, 1.5158331394195557, 2.240356922149658, 2.9648807048797607, 3.6894044876098633, 4.413928031921387, 5.138452053070068, 5.86297607421875, 6.587499618530273, 7.312023162841797, 8.03654670715332, 8.76107120513916, 9.485594749450684, 10.210118293762207, 10.934642791748047, 11.65916633605957, 12.383689880371094, 13.108213424682617, 13.83273696899414, 14.55726146697998, 15.281785011291504, 16.006309509277344, 16.730833053588867, 17.45535659790039, 18.179880142211914, 18.904403686523438, 19.62892723083496, 20.353450775146484, 21.07797622680664, 21.802499771118164, 22.527023315429688, 23.25154685974121, 23.976070404052734]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 2.0, 5.0, 5.0, 14.0, 17.0, 13.0, 14.0, 16.0, 20.0, 30.0, 24.0, 33.0, 31.0, 26.0, 43.0, 38.0, 38.0, 42.0, 52.0, 50.0, 44.0, 43.0, 54.0, 32.0, 40.0, 38.0, 34.0, 30.0, 20.0, 25.0, 24.0, 15.0, 23.0, 15.0, 9.0, 5.0, 13.0, 3.0, 8.0, 2.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.620841979980469, -9.307011604309082, -8.993182182312012, -8.679351806640625, -8.365522384643555, -8.051692008972168, -7.7378621101379395, -7.424032211303711, -7.110201835632324, -6.796371936798096, -6.482542037963867, -6.1687116622924805, -5.854881763458252, -5.541051864624023, -5.227221965789795, -4.913392066955566, -4.599562168121338, -4.285732269287109, -3.9719021320343018, -3.6580722332000732, -3.3442420959472656, -3.030412197113037, -2.7165822982788086, -2.402752161026001, -2.0889222621917725, -1.7750922441482544, -1.4612622261047363, -1.1474323272705078, -0.8336023092269897, -0.5197722911834717, -0.20594239234924316, 0.10788774490356445, 0.42171764373779297, 0.735547661781311, 1.049377679824829, 1.3632075786590576, 1.6770375967025757, 1.9908676147460938, 2.3046975135803223, 2.61852765083313, 2.9323575496673584, 3.246187448501587, 3.5600175857543945, 3.873847484588623, 4.187677383422852, 4.501507759094238, 4.815337181091309, 5.129167556762695, 5.442997455596924, 5.756827354431152, 6.070657253265381, 6.384487152099609, 6.698317527770996, 7.012147426605225, 7.325977325439453, 7.63980770111084, 7.95363712310791, 8.267467498779297, 8.581296920776367, 8.895127296447754, 9.208956718444824, 9.522787094116211, 9.836616516113281, 10.150446891784668, 10.464277267456055]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 12.0, 12.0, 16.0, 36.0, 41.0, 41.0, 82.0, 119.0, 181.0, 329.0, 454.0, 760.0, 1269.0, 2154.0, 3628.0, 6808.0, 12233.0, 23108.0, 44323.0, 89697.0, 193065.0, 433588.0, 920256.0, 1160130.0, 707608.0, 313208.0, 140803.0, 67147.0, 33407.0, 17384.0, 9324.0, 5243.0, 2997.0, 1785.0, 1110.0, 671.0, 403.0, 288.0, 180.0, 119.0, 89.0, 51.0, 38.0, 30.0, 22.0, 9.0, 8.0, 5.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-17.5, -16.958251953125, -16.41650390625, -15.874755859375, -15.3330078125, -14.791259765625, -14.24951171875, -13.707763671875, -13.166015625, -12.624267578125, -12.08251953125, -11.540771484375, -10.9990234375, -10.457275390625, -9.91552734375, -9.373779296875, -8.83203125, -8.290283203125, -7.74853515625, -7.206787109375, -6.6650390625, -6.123291015625, -5.58154296875, -5.039794921875, -4.498046875, -3.956298828125, -3.41455078125, -2.872802734375, -2.3310546875, -1.789306640625, -1.24755859375, -0.705810546875, -0.1640625, 0.377685546875, 0.91943359375, 1.461181640625, 2.0029296875, 2.544677734375, 3.08642578125, 3.628173828125, 4.169921875, 4.711669921875, 5.25341796875, 5.795166015625, 6.3369140625, 6.878662109375, 7.42041015625, 7.962158203125, 8.50390625, 9.045654296875, 9.58740234375, 10.129150390625, 10.6708984375, 11.212646484375, 11.75439453125, 12.296142578125, 12.837890625, 13.379638671875, 13.92138671875, 14.463134765625, 15.0048828125, 15.546630859375, 16.08837890625, 16.630126953125, 17.171875]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 8.0, 12.0, 15.0, 11.0, 20.0, 21.0, 16.0, 26.0, 37.0, 28.0, 34.0, 38.0, 45.0, 51.0, 39.0, 54.0, 41.0, 50.0, 49.0, 52.0, 50.0, 47.0, 28.0, 33.0, 26.0, 31.0, 17.0, 24.0, 18.0, 15.0, 23.0, 6.0, 9.0, 3.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5703125, -8.31622314453125, -8.0621337890625, -7.80804443359375, -7.553955078125, -7.29986572265625, -7.0457763671875, -6.79168701171875, -6.53759765625, -6.28350830078125, -6.0294189453125, -5.77532958984375, -5.521240234375, -5.26715087890625, -5.0130615234375, -4.75897216796875, -4.5048828125, -4.25079345703125, -3.9967041015625, -3.74261474609375, -3.488525390625, -3.23443603515625, -2.9803466796875, -2.72625732421875, -2.47216796875, -2.21807861328125, -1.9639892578125, -1.70989990234375, -1.455810546875, -1.20172119140625, -0.9476318359375, -0.69354248046875, -0.439453125, -0.18536376953125, 0.0687255859375, 0.32281494140625, 0.576904296875, 0.83099365234375, 1.0850830078125, 1.33917236328125, 1.59326171875, 1.84735107421875, 2.1014404296875, 2.35552978515625, 2.609619140625, 2.86370849609375, 3.1177978515625, 3.37188720703125, 3.6259765625, 3.88006591796875, 4.1341552734375, 4.38824462890625, 4.642333984375, 4.89642333984375, 5.1505126953125, 5.40460205078125, 5.65869140625, 5.91278076171875, 6.1668701171875, 6.42095947265625, 6.675048828125, 6.92913818359375, 7.1832275390625, 7.43731689453125, 7.69140625]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 7.0, 15.0, 10.0, 18.0, 30.0, 38.0, 59.0, 101.0, 151.0, 191.0, 324.0, 529.0, 782.0, 1214.0, 1908.0, 3068.0, 5120.0, 8803.0, 15161.0, 26720.0, 48072.0, 88251.0, 163854.0, 303449.0, 546089.0, 846154.0, 864364.0, 569016.0, 318537.0, 171116.0, 92318.0, 50896.0, 28279.0, 15863.0, 9467.0, 5469.0, 3299.0, 1935.0, 1324.0, 792.0, 520.0, 343.0, 216.0, 119.0, 107.0, 81.0, 32.0, 29.0, 14.0, 14.0, 8.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.453125, -14.9708251953125, -14.488525390625, -14.0062255859375, -13.52392578125, -13.0416259765625, -12.559326171875, -12.0770263671875, -11.5947265625, -11.1124267578125, -10.630126953125, -10.1478271484375, -9.66552734375, -9.1832275390625, -8.700927734375, -8.2186279296875, -7.736328125, -7.2540283203125, -6.771728515625, -6.2894287109375, -5.80712890625, -5.3248291015625, -4.842529296875, -4.3602294921875, -3.8779296875, -3.3956298828125, -2.913330078125, -2.4310302734375, -1.94873046875, -1.4664306640625, -0.984130859375, -0.5018310546875, -0.01953125, 0.4627685546875, 0.945068359375, 1.4273681640625, 1.90966796875, 2.3919677734375, 2.874267578125, 3.3565673828125, 3.8388671875, 4.3211669921875, 4.803466796875, 5.2857666015625, 5.76806640625, 6.2503662109375, 6.732666015625, 7.2149658203125, 7.697265625, 8.1795654296875, 8.661865234375, 9.1441650390625, 9.62646484375, 10.1087646484375, 10.591064453125, 11.0733642578125, 11.5556640625, 12.0379638671875, 12.520263671875, 13.0025634765625, 13.48486328125, 13.9671630859375, 14.449462890625, 14.9317626953125, 15.4140625]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 10.0, 11.0, 23.0, 22.0, 23.0, 26.0, 31.0, 40.0, 60.0, 101.0, 105.0, 125.0, 150.0, 203.0, 244.0, 260.0, 281.0, 287.0, 295.0, 267.0, 289.0, 233.0, 195.0, 156.0, 145.0, 112.0, 70.0, 75.0, 54.0, 53.0, 34.0, 23.0, 14.0, 13.0, 13.0, 8.0, 3.0, 4.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.875, -4.7135009765625, -4.552001953125, -4.3905029296875, -4.22900390625, -4.0675048828125, -3.906005859375, -3.7445068359375, -3.5830078125, -3.4215087890625, -3.260009765625, -3.0985107421875, -2.93701171875, -2.7755126953125, -2.614013671875, -2.4525146484375, -2.291015625, -2.1295166015625, -1.968017578125, -1.8065185546875, -1.64501953125, -1.4835205078125, -1.322021484375, -1.1605224609375, -0.9990234375, -0.8375244140625, -0.676025390625, -0.5145263671875, -0.35302734375, -0.1915283203125, -0.030029296875, 0.1314697265625, 0.29296875, 0.4544677734375, 0.615966796875, 0.7774658203125, 0.93896484375, 1.1004638671875, 1.261962890625, 1.4234619140625, 1.5849609375, 1.7464599609375, 1.907958984375, 2.0694580078125, 2.23095703125, 2.3924560546875, 2.553955078125, 2.7154541015625, 2.876953125, 3.0384521484375, 3.199951171875, 3.3614501953125, 3.52294921875, 3.6844482421875, 3.845947265625, 4.0074462890625, 4.1689453125, 4.3304443359375, 4.491943359375, 4.6534423828125, 4.81494140625, 4.9764404296875, 5.137939453125, 5.2994384765625, 5.4609375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 11.0, 5.0, 11.0, 15.0, 23.0, 22.0, 29.0, 39.0, 45.0, 60.0, 71.0, 75.0, 82.0, 71.0, 70.0, 70.0, 57.0, 53.0, 30.0, 26.0, 33.0, 21.0, 16.0, 12.0, 10.0, 8.0, 8.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.947229385375977, -22.237016677856445, -21.526803970336914, -20.816591262817383, -20.10637855529785, -19.39616584777832, -18.685951232910156, -17.975738525390625, -17.265525817871094, -16.555313110351562, -15.845100402832031, -15.1348876953125, -14.424674987792969, -13.714462280273438, -13.00424861907959, -12.294035911560059, -11.583824157714844, -10.873611450195312, -10.163398742675781, -9.45318603515625, -8.742973327636719, -8.032760620117188, -7.32254695892334, -6.612334251403809, -5.902121543884277, -5.191908836364746, -4.481696128845215, -3.7714829444885254, -3.061270236968994, -2.351057529449463, -1.6408443450927734, -0.9306316375732422, -0.22041893005371094, 0.48979389667510986, 1.2000067234039307, 1.910219669342041, 2.6204323768615723, 3.3306450843811035, 4.040858268737793, 4.751070976257324, 5.4612836837768555, 6.171496391296387, 6.881709098815918, 7.591922283172607, 8.302135467529297, 9.012348175048828, 9.72256088256836, 10.43277359008789, 11.142986297607422, 11.853199005126953, 12.563411712646484, 13.273624420166016, 13.983837127685547, 14.694049835205078, 15.404263496398926, 16.11447525024414, 16.824687957763672, 17.534900665283203, 18.245113372802734, 18.955326080322266, 19.665538787841797, 20.375751495361328, 21.08596420288086, 21.79617691040039, 22.506391525268555]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 8.0, 5.0, 16.0, 8.0, 14.0, 15.0, 17.0, 16.0, 28.0, 34.0, 37.0, 31.0, 47.0, 38.0, 35.0, 49.0, 43.0, 38.0, 50.0, 48.0, 56.0, 43.0, 36.0, 41.0, 30.0, 31.0, 27.0, 21.0, 21.0, 13.0, 17.0, 18.0, 16.0, 12.0, 7.0, 9.0, 5.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.6331353187561035, -7.344013214111328, -7.054891109466553, -6.765769004821777, -6.476646900177002, -6.187524795532227, -5.898402214050293, -5.609280586242676, -5.320158004760742, -5.031035900115967, -4.741913795471191, -4.452791690826416, -4.163669586181641, -3.8745474815368652, -3.5854251384735107, -3.2963030338287354, -3.007181167602539, -2.7180590629577637, -2.4289369583129883, -2.139814853668213, -1.850692629814148, -1.5615705251693726, -1.2724483013153076, -0.9833261966705322, -0.6942040920257568, -0.40508195757865906, -0.11595982313156128, 0.1731623411178589, 0.4622844457626343, 0.7514065504074097, 1.0405287742614746, 1.32965087890625, 1.6187725067138672, 1.9078946113586426, 2.197016716003418, 2.4861388206481934, 2.7752609252929688, 3.064383029937744, 3.3535053730010986, 3.642627477645874, 3.9317495822906494, 4.220871925354004, 4.509994029998779, 4.799116134643555, 5.08823823928833, 5.3773603439331055, 5.666482448577881, 5.955604553222656, 6.244726657867432, 6.533848762512207, 6.822970867156982, 7.112092971801758, 7.401215076446533, 7.690337181091309, 7.979459762573242, 8.26858139038086, 8.557703971862793, 8.846826553344727, 9.135948181152344, 9.425070762634277, 9.714192390441895, 10.003314971923828, 10.292436599731445, 10.581559181213379, 10.870680809020996]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 7.0, 7.0, 11.0, 7.0, 17.0, 28.0, 53.0, 84.0, 121.0, 193.0, 248.0, 485.0, 780.0, 1408.0, 2515.0, 4650.0, 8796.0, 18493.0, 40494.0, 90993.0, 192971.0, 280828.0, 211845.0, 104424.0, 46298.0, 21047.0, 10101.0, 5193.0, 2635.0, 1558.0, 855.0, 527.0, 328.0, 181.0, 127.0, 99.0, 41.0, 29.0, 29.0, 18.0, 12.0, 10.0, 1.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.15625, -15.6751708984375, -15.194091796875, -14.7130126953125, -14.23193359375, -13.7508544921875, -13.269775390625, -12.7886962890625, -12.3076171875, -11.8265380859375, -11.345458984375, -10.8643798828125, -10.38330078125, -9.9022216796875, -9.421142578125, -8.9400634765625, -8.458984375, -7.9779052734375, -7.496826171875, -7.0157470703125, -6.53466796875, -6.0535888671875, -5.572509765625, -5.0914306640625, -4.6103515625, -4.1292724609375, -3.648193359375, -3.1671142578125, -2.68603515625, -2.2049560546875, -1.723876953125, -1.2427978515625, -0.76171875, -0.2806396484375, 0.200439453125, 0.6815185546875, 1.16259765625, 1.6436767578125, 2.124755859375, 2.6058349609375, 3.0869140625, 3.5679931640625, 4.049072265625, 4.5301513671875, 5.01123046875, 5.4923095703125, 5.973388671875, 6.4544677734375, 6.935546875, 7.4166259765625, 7.897705078125, 8.3787841796875, 8.85986328125, 9.3409423828125, 9.822021484375, 10.3031005859375, 10.7841796875, 11.2652587890625, 11.746337890625, 12.2274169921875, 12.70849609375, 13.1895751953125, 13.670654296875, 14.1517333984375, 14.6328125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 6.0, 3.0, 10.0, 13.0, 12.0, 27.0, 19.0, 30.0, 28.0, 27.0, 38.0, 48.0, 49.0, 56.0, 50.0, 57.0, 44.0, 52.0, 47.0, 48.0, 42.0, 39.0, 40.0, 34.0, 28.0, 22.0, 28.0, 16.0, 22.0, 14.0, 14.0, 3.0, 8.0, 9.0, 2.0, 4.0, 2.0, 2.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8203125, -10.4588623046875, -10.097412109375, -9.7359619140625, -9.37451171875, -9.0130615234375, -8.651611328125, -8.2901611328125, -7.9287109375, -7.5672607421875, -7.205810546875, -6.8443603515625, -6.48291015625, -6.1214599609375, -5.760009765625, -5.3985595703125, -5.037109375, -4.6756591796875, -4.314208984375, -3.9527587890625, -3.59130859375, -3.2298583984375, -2.868408203125, -2.5069580078125, -2.1455078125, -1.7840576171875, -1.422607421875, -1.0611572265625, -0.69970703125, -0.3382568359375, 0.023193359375, 0.3846435546875, 0.74609375, 1.1075439453125, 1.468994140625, 1.8304443359375, 2.19189453125, 2.5533447265625, 2.914794921875, 3.2762451171875, 3.6376953125, 3.9991455078125, 4.360595703125, 4.7220458984375, 5.08349609375, 5.4449462890625, 5.806396484375, 6.1678466796875, 6.529296875, 6.8907470703125, 7.252197265625, 7.6136474609375, 7.97509765625, 8.3365478515625, 8.697998046875, 9.0594482421875, 9.4208984375, 9.7823486328125, 10.143798828125, 10.5052490234375, 10.86669921875, 11.2281494140625, 11.589599609375, 11.9510498046875, 12.3125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 11.0, 9.0, 17.0, 31.0, 31.0, 45.0, 71.0, 105.0, 174.0, 265.0, 446.0, 769.0, 1541.0, 3168.0, 7548.0, 19885.0, 61183.0, 204820.0, 430399.0, 217958.0, 64272.0, 21012.0, 7792.0, 3391.0, 1564.0, 811.0, 466.0, 269.0, 174.0, 100.0, 67.0, 37.0, 41.0, 25.0, 16.0, 6.0, 9.0, 10.0, 3.0, 7.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-27.703125, -26.92333984375, -26.1435546875, -25.36376953125, -24.583984375, -23.80419921875, -23.0244140625, -22.24462890625, -21.46484375, -20.68505859375, -19.9052734375, -19.12548828125, -18.345703125, -17.56591796875, -16.7861328125, -16.00634765625, -15.2265625, -14.44677734375, -13.6669921875, -12.88720703125, -12.107421875, -11.32763671875, -10.5478515625, -9.76806640625, -8.98828125, -8.20849609375, -7.4287109375, -6.64892578125, -5.869140625, -5.08935546875, -4.3095703125, -3.52978515625, -2.75, -1.97021484375, -1.1904296875, -0.41064453125, 0.369140625, 1.14892578125, 1.9287109375, 2.70849609375, 3.48828125, 4.26806640625, 5.0478515625, 5.82763671875, 6.607421875, 7.38720703125, 8.1669921875, 8.94677734375, 9.7265625, 10.50634765625, 11.2861328125, 12.06591796875, 12.845703125, 13.62548828125, 14.4052734375, 15.18505859375, 15.96484375, 16.74462890625, 17.5244140625, 18.30419921875, 19.083984375, 19.86376953125, 20.6435546875, 21.42333984375, 22.203125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 5.0, 4.0, 10.0, 13.0, 12.0, 21.0, 22.0, 16.0, 15.0, 28.0, 24.0, 35.0, 29.0, 35.0, 43.0, 34.0, 52.0, 38.0, 45.0, 37.0, 44.0, 41.0, 45.0, 49.0, 45.0, 28.0, 27.0, 29.0, 22.0, 14.0, 19.0, 18.0, 19.0, 11.0, 12.0, 11.0, 8.0, 9.0, 6.0, 7.0, 4.0, 0.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.98046875, -5.79559326171875, -5.6107177734375, -5.42584228515625, -5.240966796875, -5.05609130859375, -4.8712158203125, -4.68634033203125, -4.50146484375, -4.31658935546875, -4.1317138671875, -3.94683837890625, -3.761962890625, -3.57708740234375, -3.3922119140625, -3.20733642578125, -3.0224609375, -2.83758544921875, -2.6527099609375, -2.46783447265625, -2.282958984375, -2.09808349609375, -1.9132080078125, -1.72833251953125, -1.54345703125, -1.35858154296875, -1.1737060546875, -0.98883056640625, -0.803955078125, -0.61907958984375, -0.4342041015625, -0.24932861328125, -0.064453125, 0.12042236328125, 0.3052978515625, 0.49017333984375, 0.675048828125, 0.85992431640625, 1.0447998046875, 1.22967529296875, 1.41455078125, 1.59942626953125, 1.7843017578125, 1.96917724609375, 2.154052734375, 2.33892822265625, 2.5238037109375, 2.70867919921875, 2.8935546875, 3.07843017578125, 3.2633056640625, 3.44818115234375, 3.633056640625, 3.81793212890625, 4.0028076171875, 4.18768310546875, 4.37255859375, 4.55743408203125, 4.7423095703125, 4.92718505859375, 5.112060546875, 5.29693603515625, 5.4818115234375, 5.66668701171875, 5.8515625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 8.0, 3.0, 2.0, 4.0, 3.0, 12.0, 11.0, 13.0, 24.0, 21.0, 44.0, 57.0, 76.0, 111.0, 129.0, 212.0, 254.0, 399.0, 614.0, 900.0, 1261.0, 1837.0, 2755.0, 4360.0, 6861.0, 11031.0, 19325.0, 35062.0, 67905.0, 134879.0, 240356.0, 237161.0, 132465.0, 66318.0, 34541.0, 19108.0, 10954.0, 6591.0, 4291.0, 2729.0, 1797.0, 1224.0, 841.0, 583.0, 387.0, 277.0, 218.0, 165.0, 121.0, 66.0, 60.0, 39.0, 32.0, 18.0, 17.0, 14.0, 10.0, 9.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-6.671875, -6.4632568359375, -6.254638671875, -6.0460205078125, -5.83740234375, -5.6287841796875, -5.420166015625, -5.2115478515625, -5.0029296875, -4.7943115234375, -4.585693359375, -4.3770751953125, -4.16845703125, -3.9598388671875, -3.751220703125, -3.5426025390625, -3.333984375, -3.1253662109375, -2.916748046875, -2.7081298828125, -2.49951171875, -2.2908935546875, -2.082275390625, -1.8736572265625, -1.6650390625, -1.4564208984375, -1.247802734375, -1.0391845703125, -0.83056640625, -0.6219482421875, -0.413330078125, -0.2047119140625, 0.00390625, 0.2125244140625, 0.421142578125, 0.6297607421875, 0.83837890625, 1.0469970703125, 1.255615234375, 1.4642333984375, 1.6728515625, 1.8814697265625, 2.090087890625, 2.2987060546875, 2.50732421875, 2.7159423828125, 2.924560546875, 3.1331787109375, 3.341796875, 3.5504150390625, 3.759033203125, 3.9676513671875, 4.17626953125, 4.3848876953125, 4.593505859375, 4.8021240234375, 5.0107421875, 5.2193603515625, 5.427978515625, 5.6365966796875, 5.84521484375, 6.0538330078125, 6.262451171875, 6.4710693359375, 6.6796875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 10.0, 6.0, 8.0, 11.0, 14.0, 20.0, 22.0, 30.0, 43.0, 75.0, 92.0, 93.0, 98.0, 115.0, 71.0, 69.0, 55.0, 47.0, 33.0, 19.0, 13.0, 13.0, 9.0, 6.0, 10.0, 4.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00044727325439453125, -0.00043395906686782837, -0.0004206448793411255, -0.0004073306918144226, -0.0003940165042877197, -0.00038070231676101685, -0.00036738812923431396, -0.0003540739417076111, -0.0003407597541809082, -0.0003274455666542053, -0.00031413137912750244, -0.00030081719160079956, -0.0002875030040740967, -0.0002741888165473938, -0.0002608746290206909, -0.00024756044149398804, -0.00023424625396728516, -0.00022093206644058228, -0.0002076178789138794, -0.00019430369138717651, -0.00018098950386047363, -0.00016767531633377075, -0.00015436112880706787, -0.000141046941280365, -0.0001277327537536621, -0.00011441856622695923, -0.00010110437870025635, -8.779019117355347e-05, -7.447600364685059e-05, -6.11618161201477e-05, -4.7847628593444824e-05, -3.453344106674194e-05, -2.1219253540039062e-05, -7.905066013336182e-06, 5.409121513366699e-06, 1.872330904006958e-05, 3.203749656677246e-05, 4.535168409347534e-05, 5.866587162017822e-05, 7.19800591468811e-05, 8.529424667358398e-05, 9.860843420028687e-05, 0.00011192262172698975, 0.00012523680925369263, 0.0001385509967803955, 0.0001518651843070984, 0.00016517937183380127, 0.00017849355936050415, 0.00019180774688720703, 0.0002051219344139099, 0.0002184361219406128, 0.00023175030946731567, 0.00024506449699401855, 0.00025837868452072144, 0.0002716928720474243, 0.0002850070595741272, 0.0002983212471008301, 0.00031163543462753296, 0.00032494962215423584, 0.0003382638096809387, 0.0003515779972076416, 0.0003648921847343445, 0.00037820637226104736, 0.00039152055978775024, 0.0004048347473144531]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 19.0, 10.0, 21.0, 37.0, 48.0, 68.0, 98.0, 138.0, 249.0, 422.0, 649.0, 1106.0, 1869.0, 3178.0, 5576.0, 10281.0, 19984.0, 40492.0, 85818.0, 173048.0, 260451.0, 217306.0, 116015.0, 54510.0, 26711.0, 13590.0, 7106.0, 3923.0, 2201.0, 1383.0, 847.0, 505.0, 340.0, 194.0, 123.0, 80.0, 49.0, 38.0, 22.0, 16.0, 6.0, 6.0, 5.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9296875, -6.71112060546875, -6.4925537109375, -6.27398681640625, -6.055419921875, -5.83685302734375, -5.6182861328125, -5.39971923828125, -5.18115234375, -4.96258544921875, -4.7440185546875, -4.52545166015625, -4.306884765625, -4.08831787109375, -3.8697509765625, -3.65118408203125, -3.4326171875, -3.21405029296875, -2.9954833984375, -2.77691650390625, -2.558349609375, -2.33978271484375, -2.1212158203125, -1.90264892578125, -1.68408203125, -1.46551513671875, -1.2469482421875, -1.02838134765625, -0.809814453125, -0.59124755859375, -0.3726806640625, -0.15411376953125, 0.064453125, 0.28302001953125, 0.5015869140625, 0.72015380859375, 0.938720703125, 1.15728759765625, 1.3758544921875, 1.59442138671875, 1.81298828125, 2.03155517578125, 2.2501220703125, 2.46868896484375, 2.687255859375, 2.90582275390625, 3.1243896484375, 3.34295654296875, 3.5615234375, 3.78009033203125, 3.9986572265625, 4.21722412109375, 4.435791015625, 4.65435791015625, 4.8729248046875, 5.09149169921875, 5.31005859375, 5.52862548828125, 5.7471923828125, 5.96575927734375, 6.184326171875, 6.40289306640625, 6.6214599609375, 6.84002685546875, 7.05859375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 6.0, 4.0, 6.0, 13.0, 4.0, 8.0, 5.0, 18.0, 19.0, 22.0, 21.0, 31.0, 38.0, 34.0, 67.0, 66.0, 62.0, 46.0, 64.0, 52.0, 47.0, 56.0, 42.0, 48.0, 32.0, 45.0, 27.0, 20.0, 10.0, 17.0, 16.0, 11.0, 9.0, 4.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-1.384765625, -1.3418731689453125, -1.298980712890625, -1.2560882568359375, -1.21319580078125, -1.1703033447265625, -1.127410888671875, -1.0845184326171875, -1.0416259765625, -0.9987335205078125, -0.955841064453125, -0.9129486083984375, -0.87005615234375, -0.8271636962890625, -0.784271240234375, -0.7413787841796875, -0.698486328125, -0.6555938720703125, -0.612701416015625, -0.5698089599609375, -0.52691650390625, -0.4840240478515625, -0.441131591796875, -0.3982391357421875, -0.3553466796875, -0.3124542236328125, -0.269561767578125, -0.2266693115234375, -0.18377685546875, -0.1408843994140625, -0.097991943359375, -0.0550994873046875, -0.01220703125, 0.0306854248046875, 0.073577880859375, 0.1164703369140625, 0.15936279296875, 0.2022552490234375, 0.245147705078125, 0.2880401611328125, 0.3309326171875, 0.3738250732421875, 0.416717529296875, 0.4596099853515625, 0.50250244140625, 0.5453948974609375, 0.588287353515625, 0.6311798095703125, 0.674072265625, 0.7169647216796875, 0.759857177734375, 0.8027496337890625, 0.84564208984375, 0.8885345458984375, 0.931427001953125, 0.9743194580078125, 1.0172119140625, 1.0601043701171875, 1.102996826171875, 1.1458892822265625, 1.18878173828125, 1.2316741943359375, 1.274566650390625, 1.3174591064453125, 1.3603515625]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 7.0, 3.0, 13.0, 8.0, 10.0, 14.0, 21.0, 29.0, 37.0, 45.0, 51.0, 58.0, 81.0, 83.0, 77.0, 62.0, 71.0, 69.0, 53.0, 49.0, 36.0, 22.0, 23.0, 14.0, 11.0, 14.0, 11.0, 6.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0], "bins": [-25.621694564819336, -24.904603958129883, -24.18751335144043, -23.470422744750977, -22.753334045410156, -22.036243438720703, -21.31915283203125, -20.602062225341797, -19.884971618652344, -19.16788101196289, -18.450790405273438, -17.733699798583984, -17.01660919189453, -16.29952049255371, -15.582429885864258, -14.865339279174805, -14.148248672485352, -13.431158065795898, -12.714067459106445, -11.996977806091309, -11.279887199401855, -10.562796592712402, -9.845706939697266, -9.128616333007812, -8.41152572631836, -7.694435119628906, -6.977344989776611, -6.260254859924316, -5.543164253234863, -4.82607364654541, -4.108983516693115, -3.3918933868408203, -2.6748046875, -1.957714319229126, -1.240623950958252, -0.5235335826873779, 0.1935567855834961, 0.9106471538543701, 1.6277375221252441, 2.344827651977539, 3.061918258666992, 3.779008626937866, 4.49609899520874, 5.213189125061035, 5.930279731750488, 6.647370338439941, 7.364460468292236, 8.081550598144531, 8.798641204833984, 9.515731811523438, 10.23282241821289, 10.949912071228027, 11.66700267791748, 12.384093284606934, 13.10118293762207, 13.818273544311523, 14.535364151000977, 15.25245475769043, 15.969545364379883, 16.686635971069336, 17.403724670410156, 18.12081527709961, 18.837905883789062, 19.554996490478516, 20.27208709716797]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 4.0, 2.0, 6.0, 10.0, 8.0, 7.0, 12.0, 7.0, 24.0, 13.0, 13.0, 27.0, 31.0, 37.0, 38.0, 33.0, 36.0, 48.0, 36.0, 32.0, 40.0, 53.0, 46.0, 46.0, 46.0, 47.0, 36.0, 36.0, 31.0, 28.0, 25.0, 16.0, 22.0, 9.0, 20.0, 16.0, 18.0, 10.0, 9.0, 10.0, 3.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.047958850860596, -6.774683952331543, -6.501409530639648, -6.228134632110596, -5.954859733581543, -5.68158483505249, -5.4083099365234375, -5.135035514831543, -4.86176061630249, -4.5884857177734375, -4.315211296081543, -4.04193639755249, -3.7686614990234375, -3.4953866004943848, -3.222111940383911, -2.9488372802734375, -2.6755623817443848, -2.402287483215332, -2.1290128231048584, -1.8557380437850952, -1.582463264465332, -1.3091884851455688, -1.0359137058258057, -0.7626389265060425, -0.4893641471862793, -0.2160893678665161, 0.05718541145324707, 0.33046019077301025, 0.6037349700927734, 0.8770097494125366, 1.1502845287322998, 1.423559308052063, 1.6968345642089844, 1.9701093435287476, 2.2433841228485107, 2.5166587829589844, 2.789933681488037, 3.06320858001709, 3.3364832401275635, 3.609757900238037, 3.88303279876709, 4.156307697296143, 4.429582595825195, 4.70285701751709, 4.976131916046143, 5.249406814575195, 5.52268123626709, 5.795956134796143, 6.069231033325195, 6.342505931854248, 6.615780830383301, 6.889055252075195, 7.162330150604248, 7.435605049133301, 7.708879470825195, 7.982154369354248, 8.2554292678833, 8.528703689575195, 8.801979064941406, 9.0752534866333, 9.348527908325195, 9.621803283691406, 9.8950777053833, 10.168353080749512, 10.441627502441406]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 12.0, 18.0, 22.0, 23.0, 42.0, 61.0, 94.0, 154.0, 230.0, 380.0, 624.0, 896.0, 1578.0, 2601.0, 4664.0, 7887.0, 14002.0, 24700.0, 43223.0, 72982.0, 115304.0, 158621.0, 175972.0, 153260.0, 109188.0, 68729.0, 39911.0, 22630.0, 12879.0, 7380.0, 4261.0, 2460.0, 1419.0, 868.0, 546.0, 321.0, 186.0, 123.0, 113.0, 54.0, 34.0, 27.0, 25.0, 12.0, 10.0, 8.0, 8.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.890625, -12.48046875, -12.0703125, -11.66015625, -11.25, -10.83984375, -10.4296875, -10.01953125, -9.609375, -9.19921875, -8.7890625, -8.37890625, -7.96875, -7.55859375, -7.1484375, -6.73828125, -6.328125, -5.91796875, -5.5078125, -5.09765625, -4.6875, -4.27734375, -3.8671875, -3.45703125, -3.046875, -2.63671875, -2.2265625, -1.81640625, -1.40625, -0.99609375, -0.5859375, -0.17578125, 0.234375, 0.64453125, 1.0546875, 1.46484375, 1.875, 2.28515625, 2.6953125, 3.10546875, 3.515625, 3.92578125, 4.3359375, 4.74609375, 5.15625, 5.56640625, 5.9765625, 6.38671875, 6.796875, 7.20703125, 7.6171875, 8.02734375, 8.4375, 8.84765625, 9.2578125, 9.66796875, 10.078125, 10.48828125, 10.8984375, 11.30859375, 11.71875, 12.12890625, 12.5390625, 12.94921875, 13.359375]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 4.0, 1.0, 9.0, 10.0, 9.0, 7.0, 14.0, 16.0, 23.0, 25.0, 17.0, 36.0, 44.0, 40.0, 35.0, 36.0, 52.0, 39.0, 47.0, 49.0, 39.0, 39.0, 45.0, 47.0, 34.0, 43.0, 27.0, 34.0, 20.0, 25.0, 18.0, 16.0, 19.0, 13.0, 11.0, 13.0, 6.0, 9.0, 7.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.0859375, -9.7691650390625, -9.452392578125, -9.1356201171875, -8.81884765625, -8.5020751953125, -8.185302734375, -7.8685302734375, -7.5517578125, -7.2349853515625, -6.918212890625, -6.6014404296875, -6.28466796875, -5.9678955078125, -5.651123046875, -5.3343505859375, -5.017578125, -4.7008056640625, -4.384033203125, -4.0672607421875, -3.75048828125, -3.4337158203125, -3.116943359375, -2.8001708984375, -2.4833984375, -2.1666259765625, -1.849853515625, -1.5330810546875, -1.21630859375, -0.8995361328125, -0.582763671875, -0.2659912109375, 0.05078125, 0.3675537109375, 0.684326171875, 1.0010986328125, 1.31787109375, 1.6346435546875, 1.951416015625, 2.2681884765625, 2.5849609375, 2.9017333984375, 3.218505859375, 3.5352783203125, 3.85205078125, 4.1688232421875, 4.485595703125, 4.8023681640625, 5.119140625, 5.4359130859375, 5.752685546875, 6.0694580078125, 6.38623046875, 6.7030029296875, 7.019775390625, 7.3365478515625, 7.6533203125, 7.9700927734375, 8.286865234375, 8.6036376953125, 8.92041015625, 9.2371826171875, 9.553955078125, 9.8707275390625, 10.1875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 3.0, 9.0, 12.0, 13.0, 36.0, 36.0, 62.0, 89.0, 152.0, 237.0, 419.0, 803.0, 1493.0, 2840.0, 5695.0, 11663.0, 24566.0, 49306.0, 95149.0, 159970.0, 210294.0, 197395.0, 135392.0, 76441.0, 39094.0, 18982.0, 8997.0, 4539.0, 2218.0, 1095.0, 614.0, 350.0, 199.0, 123.0, 99.0, 46.0, 36.0, 22.0, 25.0, 9.0, 14.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.6640625, -15.1558837890625, -14.647705078125, -14.1395263671875, -13.63134765625, -13.1231689453125, -12.614990234375, -12.1068115234375, -11.5986328125, -11.0904541015625, -10.582275390625, -10.0740966796875, -9.56591796875, -9.0577392578125, -8.549560546875, -8.0413818359375, -7.533203125, -7.0250244140625, -6.516845703125, -6.0086669921875, -5.50048828125, -4.9923095703125, -4.484130859375, -3.9759521484375, -3.4677734375, -2.9595947265625, -2.451416015625, -1.9432373046875, -1.43505859375, -0.9268798828125, -0.418701171875, 0.0894775390625, 0.59765625, 1.1058349609375, 1.614013671875, 2.1221923828125, 2.63037109375, 3.1385498046875, 3.646728515625, 4.1549072265625, 4.6630859375, 5.1712646484375, 5.679443359375, 6.1876220703125, 6.69580078125, 7.2039794921875, 7.712158203125, 8.2203369140625, 8.728515625, 9.2366943359375, 9.744873046875, 10.2530517578125, 10.76123046875, 11.2694091796875, 11.777587890625, 12.2857666015625, 12.7939453125, 13.3021240234375, 13.810302734375, 14.3184814453125, 14.82666015625, 15.3348388671875, 15.843017578125, 16.3511962890625, 16.859375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 5.0, 7.0, 14.0, 12.0, 6.0, 23.0, 17.0, 24.0, 13.0, 20.0, 31.0, 35.0, 31.0, 33.0, 25.0, 38.0, 28.0, 39.0, 40.0, 38.0, 36.0, 41.0, 38.0, 40.0, 45.0, 44.0, 37.0, 28.0, 35.0, 31.0, 19.0, 21.0, 12.0, 14.0, 13.0, 9.0, 6.0, 15.0, 7.0, 6.0, 9.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.65625, -4.4765625, -4.296875, -4.1171875, -3.9375, -3.7578125, -3.578125, -3.3984375, -3.21875, -3.0390625, -2.859375, -2.6796875, -2.5, -2.3203125, -2.140625, -1.9609375, -1.78125, -1.6015625, -1.421875, -1.2421875, -1.0625, -0.8828125, -0.703125, -0.5234375, -0.34375, -0.1640625, 0.015625, 0.1953125, 0.375, 0.5546875, 0.734375, 0.9140625, 1.09375, 1.2734375, 1.453125, 1.6328125, 1.8125, 1.9921875, 2.171875, 2.3515625, 2.53125, 2.7109375, 2.890625, 3.0703125, 3.25, 3.4296875, 3.609375, 3.7890625, 3.96875, 4.1484375, 4.328125, 4.5078125, 4.6875, 4.8671875, 5.046875, 5.2265625, 5.40625, 5.5859375, 5.765625, 5.9453125, 6.125, 6.3046875, 6.484375, 6.6640625, 6.84375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 4.0, 6.0, 8.0, 10.0, 9.0, 23.0, 16.0, 26.0, 53.0, 58.0, 81.0, 95.0, 165.0, 220.0, 318.0, 510.0, 890.0, 1581.0, 2897.0, 5876.0, 13263.0, 31685.0, 80812.0, 186615.0, 295145.0, 236329.0, 112411.0, 44919.0, 18025.0, 7713.0, 3820.0, 2031.0, 1094.0, 626.0, 373.0, 273.0, 151.0, 129.0, 88.0, 61.0, 39.0, 27.0, 21.0, 14.0, 13.0, 14.0, 4.0, 6.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-10.15625, -9.854736328125, -9.55322265625, -9.251708984375, -8.9501953125, -8.648681640625, -8.34716796875, -8.045654296875, -7.744140625, -7.442626953125, -7.14111328125, -6.839599609375, -6.5380859375, -6.236572265625, -5.93505859375, -5.633544921875, -5.33203125, -5.030517578125, -4.72900390625, -4.427490234375, -4.1259765625, -3.824462890625, -3.52294921875, -3.221435546875, -2.919921875, -2.618408203125, -2.31689453125, -2.015380859375, -1.7138671875, -1.412353515625, -1.11083984375, -0.809326171875, -0.5078125, -0.206298828125, 0.09521484375, 0.396728515625, 0.6982421875, 0.999755859375, 1.30126953125, 1.602783203125, 1.904296875, 2.205810546875, 2.50732421875, 2.808837890625, 3.1103515625, 3.411865234375, 3.71337890625, 4.014892578125, 4.31640625, 4.617919921875, 4.91943359375, 5.220947265625, 5.5224609375, 5.823974609375, 6.12548828125, 6.427001953125, 6.728515625, 7.030029296875, 7.33154296875, 7.633056640625, 7.9345703125, 8.236083984375, 8.53759765625, 8.839111328125, 9.140625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 5.0, 5.0, 7.0, 7.0, 12.0, 12.0, 29.0, 23.0, 29.0, 29.0, 36.0, 37.0, 45.0, 54.0, 60.0, 57.0, 62.0, 49.0, 55.0, 52.0, 56.0, 44.0, 43.0, 31.0, 33.0, 22.0, 20.0, 16.0, 10.0, 15.0, 14.0, 8.0, 5.0, 4.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004963874816894531, -0.00047941505908966064, -0.00046244263648986816, -0.0004454702138900757, -0.0004284977912902832, -0.0004115253686904907, -0.00039455294609069824, -0.00037758052349090576, -0.0003606081008911133, -0.0003436356782913208, -0.0003266632556915283, -0.00030969083309173584, -0.00029271841049194336, -0.0002757459878921509, -0.0002587735652923584, -0.00024180114269256592, -0.00022482872009277344, -0.00020785629749298096, -0.00019088387489318848, -0.000173911452293396, -0.00015693902969360352, -0.00013996660709381104, -0.00012299418449401855, -0.00010602176189422607, -8.90493392944336e-05, -7.207691669464111e-05, -5.510449409484863e-05, -3.813207149505615e-05, -2.1159648895263672e-05, -4.187226295471191e-06, 1.2785196304321289e-05, 2.975761890411377e-05, 4.673004150390625e-05, 6.370246410369873e-05, 8.067488670349121e-05, 9.764730930328369e-05, 0.00011461973190307617, 0.00013159215450286865, 0.00014856457710266113, 0.0001655369997024536, 0.0001825094223022461, 0.00019948184490203857, 0.00021645426750183105, 0.00023342669010162354, 0.000250399112701416, 0.0002673715353012085, 0.000284343957901001, 0.00030131638050079346, 0.00031828880310058594, 0.0003352612257003784, 0.0003522336483001709, 0.0003692060708999634, 0.00038617849349975586, 0.00040315091609954834, 0.0004201233386993408, 0.0004370957612991333, 0.0004540681838989258, 0.00047104060649871826, 0.00048801302909851074, 0.0005049854516983032, 0.0005219578742980957, 0.0005389302968978882, 0.0005559027194976807, 0.0005728751420974731, 0.0005898475646972656]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 9.0, 2.0, 7.0, 8.0, 9.0, 16.0, 13.0, 18.0, 38.0, 49.0, 75.0, 107.0, 140.0, 211.0, 309.0, 510.0, 748.0, 1178.0, 1964.0, 3369.0, 6126.0, 10828.0, 20216.0, 37614.0, 67563.0, 114816.0, 168142.0, 193541.0, 165033.0, 110730.0, 65062.0, 35953.0, 19425.0, 10432.0, 5773.0, 3281.0, 1995.0, 1130.0, 725.0, 448.0, 294.0, 199.0, 139.0, 92.0, 66.0, 40.0, 29.0, 31.0, 18.0, 11.0, 13.0, 8.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-5.734375, -5.5521240234375, -5.369873046875, -5.1876220703125, -5.00537109375, -4.8231201171875, -4.640869140625, -4.4586181640625, -4.2763671875, -4.0941162109375, -3.911865234375, -3.7296142578125, -3.54736328125, -3.3651123046875, -3.182861328125, -3.0006103515625, -2.818359375, -2.6361083984375, -2.453857421875, -2.2716064453125, -2.08935546875, -1.9071044921875, -1.724853515625, -1.5426025390625, -1.3603515625, -1.1781005859375, -0.995849609375, -0.8135986328125, -0.63134765625, -0.4490966796875, -0.266845703125, -0.0845947265625, 0.09765625, 0.2799072265625, 0.462158203125, 0.6444091796875, 0.82666015625, 1.0089111328125, 1.191162109375, 1.3734130859375, 1.5556640625, 1.7379150390625, 1.920166015625, 2.1024169921875, 2.28466796875, 2.4669189453125, 2.649169921875, 2.8314208984375, 3.013671875, 3.1959228515625, 3.378173828125, 3.5604248046875, 3.74267578125, 3.9249267578125, 4.107177734375, 4.2894287109375, 4.4716796875, 4.6539306640625, 4.836181640625, 5.0184326171875, 5.20068359375, 5.3829345703125, 5.565185546875, 5.7474365234375, 5.9296875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 7.0, 14.0, 9.0, 19.0, 20.0, 23.0, 33.0, 42.0, 40.0, 56.0, 69.0, 60.0, 79.0, 70.0, 76.0, 55.0, 46.0, 57.0, 43.0, 43.0, 37.0, 21.0, 18.0, 5.0, 15.0, 10.0, 3.0, 6.0, 6.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9248046875, -1.8626861572265625, -1.800567626953125, -1.7384490966796875, -1.67633056640625, -1.6142120361328125, -1.552093505859375, -1.4899749755859375, -1.4278564453125, -1.3657379150390625, -1.303619384765625, -1.2415008544921875, -1.17938232421875, -1.1172637939453125, -1.055145263671875, -0.9930267333984375, -0.930908203125, -0.8687896728515625, -0.806671142578125, -0.7445526123046875, -0.68243408203125, -0.6203155517578125, -0.558197021484375, -0.4960784912109375, -0.4339599609375, -0.3718414306640625, -0.309722900390625, -0.2476043701171875, -0.18548583984375, -0.1233673095703125, -0.061248779296875, 0.0008697509765625, 0.06298828125, 0.1251068115234375, 0.187225341796875, 0.2493438720703125, 0.31146240234375, 0.3735809326171875, 0.435699462890625, 0.4978179931640625, 0.5599365234375, 0.6220550537109375, 0.684173583984375, 0.7462921142578125, 0.80841064453125, 0.8705291748046875, 0.932647705078125, 0.9947662353515625, 1.056884765625, 1.1190032958984375, 1.181121826171875, 1.2432403564453125, 1.30535888671875, 1.3674774169921875, 1.429595947265625, 1.4917144775390625, 1.5538330078125, 1.6159515380859375, 1.678070068359375, 1.7401885986328125, 1.80230712890625, 1.8644256591796875, 1.926544189453125, 1.9886627197265625, 2.05078125]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 9.0, 3.0, 10.0, 10.0, 16.0, 16.0, 21.0, 28.0, 46.0, 50.0, 63.0, 74.0, 93.0, 79.0, 96.0, 64.0, 71.0, 66.0, 31.0, 36.0, 31.0, 27.0, 9.0, 12.0, 13.0, 5.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.34234046936035, -26.557292938232422, -25.772245407104492, -24.987197875976562, -24.202150344848633, -23.417102813720703, -22.63205337524414, -21.847007751464844, -21.06195831298828, -20.27691078186035, -19.491863250732422, -18.706815719604492, -17.921768188476562, -17.136720657348633, -16.351673126220703, -15.566624641418457, -14.781578063964844, -13.996530532836914, -13.211483001708984, -12.426435470581055, -11.641387939453125, -10.856340408325195, -10.07129192352295, -9.28624439239502, -8.50119686126709, -7.71614933013916, -6.9311017990112305, -6.146053791046143, -5.361006259918213, -4.575958728790283, -3.7909107208251953, -3.0058631896972656, -2.220815658569336, -1.4357680082321167, -0.6507203578948975, 0.13432741165161133, 0.919374942779541, 1.7044224739074707, 2.4894704818725586, 3.2745180130004883, 4.059565544128418, 4.844613075256348, 5.629660606384277, 6.414708614349365, 7.199756145477295, 7.984803676605225, 8.769851684570312, 9.554899215698242, 10.339946746826172, 11.124994277954102, 11.910041809082031, 12.695089340209961, 13.48013687133789, 14.26518440246582, 15.050232887268066, 15.835280418395996, 16.62032699584961, 17.40537452697754, 18.19042205810547, 18.9754695892334, 19.760517120361328, 20.545564651489258, 21.330612182617188, 22.11566162109375, 22.90070915222168]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 8.0, 6.0, 11.0, 12.0, 13.0, 13.0, 8.0, 23.0, 20.0, 20.0, 25.0, 23.0, 29.0, 40.0, 32.0, 52.0, 43.0, 38.0, 32.0, 46.0, 63.0, 42.0, 36.0, 40.0, 41.0, 46.0, 32.0, 34.0, 26.0, 28.0, 18.0, 22.0, 10.0, 6.0, 14.0, 15.0, 14.0, 7.0, 2.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.717850208282471, -7.419209957122803, -7.120569705963135, -6.821929454803467, -6.523289203643799, -6.224648952484131, -5.926008701324463, -5.627368450164795, -5.328728199005127, -5.030087947845459, -4.731447696685791, -4.432807445526123, -4.134167194366455, -3.835526943206787, -3.536886692047119, -3.238246440887451, -2.939606189727783, -2.6409659385681152, -2.3423256874084473, -2.0436854362487793, -1.7450451850891113, -1.4464049339294434, -1.1477646827697754, -0.8491244316101074, -0.5504841804504395, -0.2518439292907715, 0.046796321868896484, 0.34543657302856445, 0.6440768241882324, 0.9427170753479004, 1.2413573265075684, 1.5399975776672363, 1.838637351989746, 2.137277603149414, 2.435917854309082, 2.73455810546875, 3.033198356628418, 3.331838607788086, 3.630478858947754, 3.929119110107422, 4.22775936126709, 4.526399612426758, 4.825039863586426, 5.123680114746094, 5.422320365905762, 5.72096061706543, 6.019600868225098, 6.318241119384766, 6.616881370544434, 6.915521621704102, 7.2141618728637695, 7.5128021240234375, 7.8114423751831055, 8.110082626342773, 8.408722877502441, 8.70736312866211, 9.006003379821777, 9.304643630981445, 9.603283882141113, 9.901924133300781, 10.20056438446045, 10.499204635620117, 10.797844886779785, 11.096485137939453, 11.395125389099121]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 6.0, 10.0, 10.0, 19.0, 26.0, 40.0, 60.0, 95.0, 155.0, 223.0, 413.0, 637.0, 1182.0, 1927.0, 3337.0, 6259.0, 12609.0, 25167.0, 52574.0, 117310.0, 278734.0, 690717.0, 1276717.0, 981621.0, 420102.0, 173308.0, 77183.0, 35898.0, 17722.0, 9130.0, 4725.0, 2657.0, 1511.0, 859.0, 499.0, 319.0, 184.0, 131.0, 69.0, 50.0, 30.0, 19.0, 13.0, 8.0, 4.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.671875, -18.064208984375, -17.45654296875, -16.848876953125, -16.2412109375, -15.633544921875, -15.02587890625, -14.418212890625, -13.810546875, -13.202880859375, -12.59521484375, -11.987548828125, -11.3798828125, -10.772216796875, -10.16455078125, -9.556884765625, -8.94921875, -8.341552734375, -7.73388671875, -7.126220703125, -6.5185546875, -5.910888671875, -5.30322265625, -4.695556640625, -4.087890625, -3.480224609375, -2.87255859375, -2.264892578125, -1.6572265625, -1.049560546875, -0.44189453125, 0.165771484375, 0.7734375, 1.381103515625, 1.98876953125, 2.596435546875, 3.2041015625, 3.811767578125, 4.41943359375, 5.027099609375, 5.634765625, 6.242431640625, 6.85009765625, 7.457763671875, 8.0654296875, 8.673095703125, 9.28076171875, 9.888427734375, 10.49609375, 11.103759765625, 11.71142578125, 12.319091796875, 12.9267578125, 13.534423828125, 14.14208984375, 14.749755859375, 15.357421875, 15.965087890625, 16.57275390625, 17.180419921875, 17.7880859375, 18.395751953125, 19.00341796875, 19.611083984375, 20.21875]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 5.0, 7.0, 12.0, 7.0, 13.0, 7.0, 13.0, 20.0, 17.0, 21.0, 27.0, 30.0, 24.0, 27.0, 37.0, 29.0, 41.0, 44.0, 48.0, 50.0, 41.0, 35.0, 52.0, 46.0, 33.0, 43.0, 48.0, 32.0, 33.0, 25.0, 20.0, 21.0, 21.0, 12.0, 13.0, 16.0, 11.0, 9.0, 5.0, 5.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.125, -5.9002685546875, -5.675537109375, -5.4508056640625, -5.22607421875, -5.0013427734375, -4.776611328125, -4.5518798828125, -4.3271484375, -4.1024169921875, -3.877685546875, -3.6529541015625, -3.42822265625, -3.2034912109375, -2.978759765625, -2.7540283203125, -2.529296875, -2.3045654296875, -2.079833984375, -1.8551025390625, -1.63037109375, -1.4056396484375, -1.180908203125, -0.9561767578125, -0.7314453125, -0.5067138671875, -0.281982421875, -0.0572509765625, 0.16748046875, 0.3922119140625, 0.616943359375, 0.8416748046875, 1.06640625, 1.2911376953125, 1.515869140625, 1.7406005859375, 1.96533203125, 2.1900634765625, 2.414794921875, 2.6395263671875, 2.8642578125, 3.0889892578125, 3.313720703125, 3.5384521484375, 3.76318359375, 3.9879150390625, 4.212646484375, 4.4373779296875, 4.662109375, 4.8868408203125, 5.111572265625, 5.3363037109375, 5.56103515625, 5.7857666015625, 6.010498046875, 6.2352294921875, 6.4599609375, 6.6846923828125, 6.909423828125, 7.1341552734375, 7.35888671875, 7.5836181640625, 7.808349609375, 8.0330810546875, 8.2578125]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 5.0, 6.0, 14.0, 16.0, 19.0, 50.0, 73.0, 98.0, 178.0, 226.0, 390.0, 611.0, 1036.0, 1723.0, 2951.0, 5233.0, 9068.0, 15928.0, 28858.0, 53743.0, 102391.0, 197687.0, 382617.0, 694030.0, 959245.0, 785904.0, 453863.0, 235495.0, 121026.0, 63869.0, 33960.0, 18675.0, 10674.0, 6126.0, 3440.0, 1995.0, 1168.0, 722.0, 428.0, 270.0, 188.0, 100.0, 66.0, 43.0, 29.0, 13.0, 14.0, 9.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.53125, -16.024658203125, -15.51806640625, -15.011474609375, -14.5048828125, -13.998291015625, -13.49169921875, -12.985107421875, -12.478515625, -11.971923828125, -11.46533203125, -10.958740234375, -10.4521484375, -9.945556640625, -9.43896484375, -8.932373046875, -8.42578125, -7.919189453125, -7.41259765625, -6.906005859375, -6.3994140625, -5.892822265625, -5.38623046875, -4.879638671875, -4.373046875, -3.866455078125, -3.35986328125, -2.853271484375, -2.3466796875, -1.840087890625, -1.33349609375, -0.826904296875, -0.3203125, 0.186279296875, 0.69287109375, 1.199462890625, 1.7060546875, 2.212646484375, 2.71923828125, 3.225830078125, 3.732421875, 4.239013671875, 4.74560546875, 5.252197265625, 5.7587890625, 6.265380859375, 6.77197265625, 7.278564453125, 7.78515625, 8.291748046875, 8.79833984375, 9.304931640625, 9.8115234375, 10.318115234375, 10.82470703125, 11.331298828125, 11.837890625, 12.344482421875, 12.85107421875, 13.357666015625, 13.8642578125, 14.370849609375, 14.87744140625, 15.384033203125, 15.890625]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 3.0, 7.0, 10.0, 8.0, 23.0, 25.0, 33.0, 52.0, 62.0, 62.0, 87.0, 112.0, 127.0, 186.0, 206.0, 241.0, 265.0, 297.0, 274.0, 304.0, 276.0, 242.0, 215.0, 196.0, 161.0, 137.0, 127.0, 75.0, 69.0, 55.0, 31.0, 25.0, 21.0, 21.0, 10.0, 13.0, 7.0, 4.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.98046875, -4.82391357421875, -4.6673583984375, -4.51080322265625, -4.354248046875, -4.19769287109375, -4.0411376953125, -3.88458251953125, -3.72802734375, -3.57147216796875, -3.4149169921875, -3.25836181640625, -3.101806640625, -2.94525146484375, -2.7886962890625, -2.63214111328125, -2.4755859375, -2.31903076171875, -2.1624755859375, -2.00592041015625, -1.849365234375, -1.69281005859375, -1.5362548828125, -1.37969970703125, -1.22314453125, -1.06658935546875, -0.9100341796875, -0.75347900390625, -0.596923828125, -0.44036865234375, -0.2838134765625, -0.12725830078125, 0.029296875, 0.18585205078125, 0.3424072265625, 0.49896240234375, 0.655517578125, 0.81207275390625, 0.9686279296875, 1.12518310546875, 1.28173828125, 1.43829345703125, 1.5948486328125, 1.75140380859375, 1.907958984375, 2.06451416015625, 2.2210693359375, 2.37762451171875, 2.5341796875, 2.69073486328125, 2.8472900390625, 3.00384521484375, 3.160400390625, 3.31695556640625, 3.4735107421875, 3.63006591796875, 3.78662109375, 3.94317626953125, 4.0997314453125, 4.25628662109375, 4.412841796875, 4.56939697265625, 4.7259521484375, 4.88250732421875, 5.0390625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 12.0, 13.0, 12.0, 23.0, 42.0, 46.0, 49.0, 63.0, 70.0, 68.0, 75.0, 87.0, 92.0, 64.0, 46.0, 46.0, 46.0, 34.0, 18.0, 20.0, 12.0, 15.0, 10.0, 6.0, 5.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.599149703979492, -23.857467651367188, -23.11578369140625, -22.374101638793945, -21.63241958618164, -20.890735626220703, -20.1490535736084, -19.407371520996094, -18.665687561035156, -17.92400550842285, -17.182321548461914, -16.44063949584961, -15.698956489562988, -14.957273483276367, -14.215591430664062, -13.473908424377441, -12.73222541809082, -11.9905424118042, -11.248859405517578, -10.507177352905273, -9.765494346618652, -9.023811340332031, -8.282129287719727, -7.5404462814331055, -6.798763275146484, -6.057080268859863, -5.3153977394104, -4.5737152099609375, -3.8320322036743164, -3.0903494358062744, -2.3486666679382324, -1.6069841384887695, -0.8652992248535156, -0.12361645698547363, 0.6180663108825684, 1.3597490787506104, 2.1014318466186523, 2.8431146144866943, 3.5847973823547363, 4.326479911804199, 5.06816291809082, 5.809845924377441, 6.551528453826904, 7.293210983276367, 8.034893989562988, 8.77657699584961, 9.518259048461914, 10.259942054748535, 11.001625061035156, 11.743308067321777, 12.484991073608398, 13.226673126220703, 13.968356132507324, 14.710039138793945, 15.45172119140625, 16.193405151367188, 16.935087203979492, 17.676769256591797, 18.418453216552734, 19.16013526916504, 19.901817321777344, 20.64350128173828, 21.385183334350586, 22.12686538696289, 22.868549346923828]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 12.0, 12.0, 14.0, 11.0, 23.0, 19.0, 24.0, 31.0, 33.0, 30.0, 36.0, 32.0, 36.0, 45.0, 43.0, 49.0, 41.0, 38.0, 43.0, 38.0, 35.0, 46.0, 35.0, 25.0, 39.0, 28.0, 29.0, 28.0, 13.0, 14.0, 12.0, 15.0, 14.0, 10.0, 7.0, 6.0, 9.0, 3.0, 6.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.250918388366699, -6.986877918243408, -6.722837924957275, -6.458797454833984, -6.194757461547852, -5.9307169914245605, -5.6666765213012695, -5.402636528015137, -5.138596057891846, -4.874555587768555, -4.610515594482422, -4.346475124359131, -4.08243465423584, -3.818394660949707, -3.554354190826416, -3.290313959121704, -3.026273727416992, -2.7622334957122803, -2.4981932640075684, -2.2341527938842773, -1.9701125621795654, -1.7060723304748535, -1.442031979560852, -1.1779916286468506, -0.9139513969421387, -0.649911105632782, -0.3858708143234253, -0.1218305230140686, 0.14220976829528809, 0.40625, 0.6702903509140015, 0.9343307018280029, 1.1983709335327148, 1.4624111652374268, 1.7264515161514282, 1.9904918670654297, 2.2545320987701416, 2.5185723304748535, 2.7826128005981445, 3.0466530323028564, 3.3106932640075684, 3.5747334957122803, 3.838773727416992, 4.102814197540283, 4.366854667663574, 4.630894660949707, 4.894935131072998, 5.158975601196289, 5.423015594482422, 5.687056064605713, 5.951096057891846, 6.215136528015137, 6.4791765213012695, 6.7432169914245605, 7.007257461547852, 7.271297454833984, 7.535337924957275, 7.799378395080566, 8.0634183883667, 8.327458381652832, 8.591499328613281, 8.855539321899414, 9.119579315185547, 9.383620262145996, 9.647660255432129]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 4.0, 5.0, 8.0, 12.0, 23.0, 35.0, 33.0, 71.0, 100.0, 156.0, 265.0, 398.0, 658.0, 1006.0, 1662.0, 2859.0, 4652.0, 7814.0, 13232.0, 22623.0, 38257.0, 63084.0, 99364.0, 138930.0, 164313.0, 156854.0, 122564.0, 82549.0, 51940.0, 30649.0, 18110.0, 10438.0, 6334.0, 3639.0, 2228.0, 1350.0, 845.0, 539.0, 308.0, 216.0, 159.0, 85.0, 69.0, 46.0, 26.0, 32.0, 5.0, 9.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.796875, -6.560791015625, -6.32470703125, -6.088623046875, -5.8525390625, -5.616455078125, -5.38037109375, -5.144287109375, -4.908203125, -4.672119140625, -4.43603515625, -4.199951171875, -3.9638671875, -3.727783203125, -3.49169921875, -3.255615234375, -3.01953125, -2.783447265625, -2.54736328125, -2.311279296875, -2.0751953125, -1.839111328125, -1.60302734375, -1.366943359375, -1.130859375, -0.894775390625, -0.65869140625, -0.422607421875, -0.1865234375, 0.049560546875, 0.28564453125, 0.521728515625, 0.7578125, 0.993896484375, 1.22998046875, 1.466064453125, 1.7021484375, 1.938232421875, 2.17431640625, 2.410400390625, 2.646484375, 2.882568359375, 3.11865234375, 3.354736328125, 3.5908203125, 3.826904296875, 4.06298828125, 4.299072265625, 4.53515625, 4.771240234375, 5.00732421875, 5.243408203125, 5.4794921875, 5.715576171875, 5.95166015625, 6.187744140625, 6.423828125, 6.659912109375, 6.89599609375, 7.132080078125, 7.3681640625, 7.604248046875, 7.84033203125, 8.076416015625, 8.3125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 8.0, 13.0, 11.0, 14.0, 21.0, 26.0, 22.0, 26.0, 28.0, 32.0, 49.0, 34.0, 44.0, 48.0, 48.0, 47.0, 34.0, 58.0, 57.0, 46.0, 46.0, 39.0, 34.0, 34.0, 22.0, 28.0, 21.0, 17.0, 17.0, 20.0, 11.0, 5.0, 6.0, 11.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3046875, -8.9765625, -8.6484375, -8.3203125, -7.9921875, -7.6640625, -7.3359375, -7.0078125, -6.6796875, -6.3515625, -6.0234375, -5.6953125, -5.3671875, -5.0390625, -4.7109375, -4.3828125, -4.0546875, -3.7265625, -3.3984375, -3.0703125, -2.7421875, -2.4140625, -2.0859375, -1.7578125, -1.4296875, -1.1015625, -0.7734375, -0.4453125, -0.1171875, 0.2109375, 0.5390625, 0.8671875, 1.1953125, 1.5234375, 1.8515625, 2.1796875, 2.5078125, 2.8359375, 3.1640625, 3.4921875, 3.8203125, 4.1484375, 4.4765625, 4.8046875, 5.1328125, 5.4609375, 5.7890625, 6.1171875, 6.4453125, 6.7734375, 7.1015625, 7.4296875, 7.7578125, 8.0859375, 8.4140625, 8.7421875, 9.0703125, 9.3984375, 9.7265625, 10.0546875, 10.3828125, 10.7109375, 11.0390625, 11.3671875, 11.6953125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 4.0, 7.0, 9.0, 22.0, 18.0, 30.0, 58.0, 79.0, 116.0, 172.0, 261.0, 363.0, 522.0, 853.0, 1271.0, 2013.0, 3348.0, 5513.0, 9028.0, 15156.0, 25262.0, 43311.0, 72413.0, 116794.0, 168501.0, 187242.0, 149228.0, 98188.0, 60020.0, 35883.0, 20650.0, 12379.0, 7545.0, 4644.0, 2745.0, 1803.0, 1110.0, 663.0, 412.0, 285.0, 215.0, 120.0, 92.0, 69.0, 41.0, 32.0, 22.0, 13.0, 15.0, 6.0, 7.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0], "bins": [-8.9140625, -8.63818359375, -8.3623046875, -8.08642578125, -7.810546875, -7.53466796875, -7.2587890625, -6.98291015625, -6.70703125, -6.43115234375, -6.1552734375, -5.87939453125, -5.603515625, -5.32763671875, -5.0517578125, -4.77587890625, -4.5, -4.22412109375, -3.9482421875, -3.67236328125, -3.396484375, -3.12060546875, -2.8447265625, -2.56884765625, -2.29296875, -2.01708984375, -1.7412109375, -1.46533203125, -1.189453125, -0.91357421875, -0.6376953125, -0.36181640625, -0.0859375, 0.18994140625, 0.4658203125, 0.74169921875, 1.017578125, 1.29345703125, 1.5693359375, 1.84521484375, 2.12109375, 2.39697265625, 2.6728515625, 2.94873046875, 3.224609375, 3.50048828125, 3.7763671875, 4.05224609375, 4.328125, 4.60400390625, 4.8798828125, 5.15576171875, 5.431640625, 5.70751953125, 5.9833984375, 6.25927734375, 6.53515625, 6.81103515625, 7.0869140625, 7.36279296875, 7.638671875, 7.91455078125, 8.1904296875, 8.46630859375, 8.7421875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 4.0, 4.0, 10.0, 4.0, 11.0, 14.0, 14.0, 15.0, 18.0, 20.0, 21.0, 27.0, 29.0, 28.0, 41.0, 26.0, 38.0, 45.0, 45.0, 38.0, 38.0, 49.0, 44.0, 41.0, 39.0, 46.0, 42.0, 32.0, 35.0, 24.0, 25.0, 21.0, 25.0, 17.0, 12.0, 12.0, 13.0, 9.0, 5.0, 7.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.921875, -4.74652099609375, -4.5711669921875, -4.39581298828125, -4.220458984375, -4.04510498046875, -3.8697509765625, -3.69439697265625, -3.51904296875, -3.34368896484375, -3.1683349609375, -2.99298095703125, -2.817626953125, -2.64227294921875, -2.4669189453125, -2.29156494140625, -2.1162109375, -1.94085693359375, -1.7655029296875, -1.59014892578125, -1.414794921875, -1.23944091796875, -1.0640869140625, -0.88873291015625, -0.71337890625, -0.53802490234375, -0.3626708984375, -0.18731689453125, -0.011962890625, 0.16339111328125, 0.3387451171875, 0.51409912109375, 0.689453125, 0.86480712890625, 1.0401611328125, 1.21551513671875, 1.390869140625, 1.56622314453125, 1.7415771484375, 1.91693115234375, 2.09228515625, 2.26763916015625, 2.4429931640625, 2.61834716796875, 2.793701171875, 2.96905517578125, 3.1444091796875, 3.31976318359375, 3.4951171875, 3.67047119140625, 3.8458251953125, 4.02117919921875, 4.196533203125, 4.37188720703125, 4.5472412109375, 4.72259521484375, 4.89794921875, 5.07330322265625, 5.2486572265625, 5.42401123046875, 5.599365234375, 5.77471923828125, 5.9500732421875, 6.12542724609375, 6.30078125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 9.0, 16.0, 15.0, 22.0, 39.0, 77.0, 113.0, 161.0, 275.0, 406.0, 678.0, 1121.0, 1847.0, 2928.0, 4989.0, 8315.0, 14539.0, 25520.0, 45036.0, 79193.0, 137057.0, 202794.0, 202844.0, 136084.0, 79425.0, 44611.0, 25176.0, 14539.0, 8236.0, 4978.0, 2923.0, 1711.0, 1126.0, 629.0, 408.0, 253.0, 153.0, 100.0, 82.0, 46.0, 29.0, 25.0, 18.0, 6.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.9140625, -4.76513671875, -4.6162109375, -4.46728515625, -4.318359375, -4.16943359375, -4.0205078125, -3.87158203125, -3.72265625, -3.57373046875, -3.4248046875, -3.27587890625, -3.126953125, -2.97802734375, -2.8291015625, -2.68017578125, -2.53125, -2.38232421875, -2.2333984375, -2.08447265625, -1.935546875, -1.78662109375, -1.6376953125, -1.48876953125, -1.33984375, -1.19091796875, -1.0419921875, -0.89306640625, -0.744140625, -0.59521484375, -0.4462890625, -0.29736328125, -0.1484375, 0.00048828125, 0.1494140625, 0.29833984375, 0.447265625, 0.59619140625, 0.7451171875, 0.89404296875, 1.04296875, 1.19189453125, 1.3408203125, 1.48974609375, 1.638671875, 1.78759765625, 1.9365234375, 2.08544921875, 2.234375, 2.38330078125, 2.5322265625, 2.68115234375, 2.830078125, 2.97900390625, 3.1279296875, 3.27685546875, 3.42578125, 3.57470703125, 3.7236328125, 3.87255859375, 4.021484375, 4.17041015625, 4.3193359375, 4.46826171875, 4.6171875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 3.0, 11.0, 5.0, 16.0, 11.0, 25.0, 25.0, 31.0, 41.0, 42.0, 53.0, 58.0, 64.0, 54.0, 65.0, 70.0, 50.0, 68.0, 54.0, 36.0, 37.0, 45.0, 21.0, 22.0, 15.0, 23.0, 14.0, 7.0, 10.0, 5.0, 3.0, 2.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0002429485321044922, -0.00023453310132026672, -0.00022611767053604126, -0.0002177022397518158, -0.00020928680896759033, -0.00020087137818336487, -0.0001924559473991394, -0.00018404051661491394, -0.00017562508583068848, -0.000167209655046463, -0.00015879422426223755, -0.00015037879347801208, -0.00014196336269378662, -0.00013354793190956116, -0.0001251325011253357, -0.00011671707034111023, -0.00010830163955688477, -9.98862087726593e-05, -9.147077798843384e-05, -8.305534720420837e-05, -7.463991641998291e-05, -6.622448563575745e-05, -5.780905485153198e-05, -4.939362406730652e-05, -4.0978193283081055e-05, -3.256276249885559e-05, -2.4147331714630127e-05, -1.5731900930404663e-05, -7.316470146179199e-06, 1.0989606380462646e-06, 9.514391422271729e-06, 1.7929822206497192e-05, 2.6345252990722656e-05, 3.476068377494812e-05, 4.3176114559173584e-05, 5.159154534339905e-05, 6.000697612762451e-05, 6.842240691184998e-05, 7.683783769607544e-05, 8.52532684803009e-05, 9.366869926452637e-05, 0.00010208413004875183, 0.0001104995608329773, 0.00011891499161720276, 0.00012733042240142822, 0.0001357458531856537, 0.00014416128396987915, 0.00015257671475410461, 0.00016099214553833008, 0.00016940757632255554, 0.000177823007106781, 0.00018623843789100647, 0.00019465386867523193, 0.0002030692994594574, 0.00021148473024368286, 0.00021990016102790833, 0.0002283155918121338, 0.00023673102259635925, 0.0002451464533805847, 0.0002535618841648102, 0.00026197731494903564, 0.0002703927457332611, 0.00027880817651748657, 0.00028722360730171204, 0.0002956390380859375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 2.0, 6.0, 4.0, 5.0, 8.0, 16.0, 24.0, 40.0, 53.0, 75.0, 110.0, 159.0, 231.0, 354.0, 624.0, 865.0, 1396.0, 2068.0, 3336.0, 5329.0, 8479.0, 13566.0, 20736.0, 32973.0, 51534.0, 77120.0, 107484.0, 136071.0, 146233.0, 131985.0, 102713.0, 72381.0, 48189.0, 30708.0, 19558.0, 12439.0, 7856.0, 4987.0, 3111.0, 2002.0, 1314.0, 851.0, 510.0, 361.0, 265.0, 135.0, 98.0, 65.0, 41.0, 20.0, 23.0, 16.0, 16.0, 6.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0], "bins": [-3.458984375, -3.352294921875, -3.24560546875, -3.138916015625, -3.0322265625, -2.925537109375, -2.81884765625, -2.712158203125, -2.60546875, -2.498779296875, -2.39208984375, -2.285400390625, -2.1787109375, -2.072021484375, -1.96533203125, -1.858642578125, -1.751953125, -1.645263671875, -1.53857421875, -1.431884765625, -1.3251953125, -1.218505859375, -1.11181640625, -1.005126953125, -0.8984375, -0.791748046875, -0.68505859375, -0.578369140625, -0.4716796875, -0.364990234375, -0.25830078125, -0.151611328125, -0.044921875, 0.061767578125, 0.16845703125, 0.275146484375, 0.3818359375, 0.488525390625, 0.59521484375, 0.701904296875, 0.80859375, 0.915283203125, 1.02197265625, 1.128662109375, 1.2353515625, 1.342041015625, 1.44873046875, 1.555419921875, 1.662109375, 1.768798828125, 1.87548828125, 1.982177734375, 2.0888671875, 2.195556640625, 2.30224609375, 2.408935546875, 2.515625, 2.622314453125, 2.72900390625, 2.835693359375, 2.9423828125, 3.049072265625, 3.15576171875, 3.262451171875, 3.369140625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 10.0, 5.0, 12.0, 19.0, 10.0, 16.0, 26.0, 20.0, 27.0, 27.0, 34.0, 29.0, 55.0, 37.0, 34.0, 46.0, 48.0, 49.0, 46.0, 42.0, 37.0, 41.0, 46.0, 32.0, 33.0, 29.0, 34.0, 22.0, 20.0, 13.0, 12.0, 11.0, 16.0, 13.0, 7.0, 8.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.96728515625, -0.93695068359375, -0.9066162109375, -0.87628173828125, -0.845947265625, -0.81561279296875, -0.7852783203125, -0.75494384765625, -0.724609375, -0.69427490234375, -0.6639404296875, -0.63360595703125, -0.603271484375, -0.57293701171875, -0.5426025390625, -0.51226806640625, -0.48193359375, -0.45159912109375, -0.4212646484375, -0.39093017578125, -0.360595703125, -0.33026123046875, -0.2999267578125, -0.26959228515625, -0.2392578125, -0.20892333984375, -0.1785888671875, -0.14825439453125, -0.117919921875, -0.08758544921875, -0.0572509765625, -0.02691650390625, 0.00341796875, 0.03375244140625, 0.0640869140625, 0.09442138671875, 0.124755859375, 0.15509033203125, 0.1854248046875, 0.21575927734375, 0.24609375, 0.27642822265625, 0.3067626953125, 0.33709716796875, 0.367431640625, 0.39776611328125, 0.4281005859375, 0.45843505859375, 0.48876953125, 0.51910400390625, 0.5494384765625, 0.57977294921875, 0.610107421875, 0.64044189453125, 0.6707763671875, 0.70111083984375, 0.7314453125, 0.76177978515625, 0.7921142578125, 0.82244873046875, 0.852783203125, 0.88311767578125, 0.9134521484375, 0.94378662109375, 0.97412109375]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 6.0, 6.0, 11.0, 10.0, 23.0, 16.0, 39.0, 46.0, 48.0, 59.0, 80.0, 50.0, 85.0, 87.0, 92.0, 64.0, 48.0, 43.0, 43.0, 30.0, 25.0, 19.0, 14.0, 12.0, 15.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.877593994140625, -23.158777236938477, -22.439960479736328, -21.721141815185547, -21.0023250579834, -20.28350830078125, -19.5646915435791, -18.845874786376953, -18.127058029174805, -17.408241271972656, -16.689424514770508, -15.970606803894043, -15.251790046691895, -14.53297233581543, -13.814155578613281, -13.095338821411133, -12.376521110534668, -11.65770435333252, -10.938886642456055, -10.220069885253906, -9.501253128051758, -8.78243637084961, -8.063618659973145, -7.344801902770996, -6.6259846687316895, -5.907167434692383, -5.188350677490234, -4.469533443450928, -3.7507164478302, -3.0318994522094727, -2.313082218170166, -1.5942654609680176, -0.8754482269287109, -0.15663117170333862, 0.5621858835220337, 1.2810029983520508, 1.9998199939727783, 2.718636989593506, 3.4374542236328125, 4.156270980834961, 4.875088214874268, 5.593905448913574, 6.312722206115723, 7.031539440155029, 7.750356674194336, 8.469173431396484, 9.187990188598633, 9.906806945800781, 10.625624656677246, 11.344441413879395, 12.06325912475586, 12.782075881958008, 13.500892639160156, 14.219709396362305, 14.93852710723877, 15.657343864440918, 16.376161575317383, 17.09497833251953, 17.81379508972168, 18.532611846923828, 19.25143051147461, 19.970247268676758, 20.689064025878906, 21.407880783081055, 22.126697540283203]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 3.0, 1.0, 5.0, 14.0, 13.0, 12.0, 14.0, 20.0, 25.0, 24.0, 23.0, 41.0, 26.0, 40.0, 30.0, 39.0, 43.0, 54.0, 48.0, 45.0, 37.0, 34.0, 55.0, 29.0, 38.0, 31.0, 33.0, 23.0, 42.0, 26.0, 19.0, 17.0, 16.0, 11.0, 17.0, 12.0, 10.0, 9.0, 3.0, 7.0, 3.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.34538459777832, -7.082252025604248, -6.819119453430176, -6.555986404418945, -6.292853832244873, -6.029721260070801, -5.76658821105957, -5.503455638885498, -5.240323066711426, -4.9771904945373535, -4.714057922363281, -4.450924873352051, -4.1877923011779785, -3.9246597290039062, -3.661526918411255, -3.3983941078186035, -3.1352615356445312, -2.872128963470459, -2.6089961528778076, -2.3458633422851562, -2.082730770111084, -1.8195980787277222, -1.5564653873443604, -1.2933326959609985, -1.0302000045776367, -0.7670673131942749, -0.5039346218109131, -0.24080193042755127, 0.022330760955810547, 0.28546345233917236, 0.5485961437225342, 0.811728835105896, 1.0748615264892578, 1.3379942178726196, 1.6011269092559814, 1.8642596006393433, 2.127392292022705, 2.3905248641967773, 2.6536576747894287, 2.91679048538208, 3.1799230575561523, 3.4430556297302246, 3.706188440322876, 3.9693212509155273, 4.2324538230896, 4.495586395263672, 4.758719444274902, 5.021852016448975, 5.284984588623047, 5.548117160797119, 5.811249732971191, 6.074382781982422, 6.337515354156494, 6.600647926330566, 6.863780975341797, 7.126913547515869, 7.390046119689941, 7.653178691864014, 7.916311264038086, 8.179444313049316, 8.442577362060547, 8.705709457397461, 8.968842506408691, 9.231974601745605, 9.495107650756836]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 5.0, 8.0, 5.0, 5.0, 10.0, 22.0, 30.0, 54.0, 74.0, 112.0, 199.0, 247.0, 409.0, 625.0, 994.0, 1522.0, 2279.0, 3680.0, 5735.0, 9338.0, 14549.0, 22630.0, 34685.0, 51624.0, 73368.0, 98198.0, 119614.0, 129898.0, 123666.0, 105216.0, 80975.0, 57704.0, 39409.0, 25789.0, 16776.0, 10669.0, 6813.0, 4224.0, 2660.0, 1695.0, 1038.0, 703.0, 438.0, 289.0, 198.0, 123.0, 82.0, 61.0, 38.0, 18.0, 21.0, 16.0, 7.0, 13.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.4921875, -8.223876953125, -7.95556640625, -7.687255859375, -7.4189453125, -7.150634765625, -6.88232421875, -6.614013671875, -6.345703125, -6.077392578125, -5.80908203125, -5.540771484375, -5.2724609375, -5.004150390625, -4.73583984375, -4.467529296875, -4.19921875, -3.930908203125, -3.66259765625, -3.394287109375, -3.1259765625, -2.857666015625, -2.58935546875, -2.321044921875, -2.052734375, -1.784423828125, -1.51611328125, -1.247802734375, -0.9794921875, -0.711181640625, -0.44287109375, -0.174560546875, 0.09375, 0.362060546875, 0.63037109375, 0.898681640625, 1.1669921875, 1.435302734375, 1.70361328125, 1.971923828125, 2.240234375, 2.508544921875, 2.77685546875, 3.045166015625, 3.3134765625, 3.581787109375, 3.85009765625, 4.118408203125, 4.38671875, 4.655029296875, 4.92333984375, 5.191650390625, 5.4599609375, 5.728271484375, 5.99658203125, 6.264892578125, 6.533203125, 6.801513671875, 7.06982421875, 7.338134765625, 7.6064453125, 7.874755859375, 8.14306640625, 8.411376953125, 8.6796875]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 9.0, 3.0, 6.0, 6.0, 6.0, 13.0, 17.0, 18.0, 19.0, 26.0, 25.0, 19.0, 30.0, 29.0, 37.0, 34.0, 42.0, 45.0, 38.0, 51.0, 48.0, 42.0, 37.0, 41.0, 40.0, 38.0, 32.0, 32.0, 26.0, 30.0, 26.0, 19.0, 20.0, 18.0, 22.0, 9.0, 17.0, 8.0, 8.0, 4.0, 5.0, 6.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.2734375, -8.98095703125, -8.6884765625, -8.39599609375, -8.103515625, -7.81103515625, -7.5185546875, -7.22607421875, -6.93359375, -6.64111328125, -6.3486328125, -6.05615234375, -5.763671875, -5.47119140625, -5.1787109375, -4.88623046875, -4.59375, -4.30126953125, -4.0087890625, -3.71630859375, -3.423828125, -3.13134765625, -2.8388671875, -2.54638671875, -2.25390625, -1.96142578125, -1.6689453125, -1.37646484375, -1.083984375, -0.79150390625, -0.4990234375, -0.20654296875, 0.0859375, 0.37841796875, 0.6708984375, 0.96337890625, 1.255859375, 1.54833984375, 1.8408203125, 2.13330078125, 2.42578125, 2.71826171875, 3.0107421875, 3.30322265625, 3.595703125, 3.88818359375, 4.1806640625, 4.47314453125, 4.765625, 5.05810546875, 5.3505859375, 5.64306640625, 5.935546875, 6.22802734375, 6.5205078125, 6.81298828125, 7.10546875, 7.39794921875, 7.6904296875, 7.98291015625, 8.275390625, 8.56787109375, 8.8603515625, 9.15283203125, 9.4453125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 7.0, 8.0, 20.0, 28.0, 40.0, 42.0, 77.0, 152.0, 240.0, 330.0, 626.0, 1063.0, 1812.0, 3182.0, 5370.0, 9127.0, 15484.0, 25758.0, 41363.0, 64579.0, 94519.0, 125005.0, 146018.0, 142799.0, 121592.0, 90267.0, 60896.0, 39372.0, 23786.0, 14295.0, 8634.0, 4927.0, 2900.0, 1739.0, 977.0, 571.0, 347.0, 201.0, 142.0, 98.0, 54.0, 32.0, 19.0, 17.0, 5.0, 16.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 3.0], "bins": [-10.703125, -10.3876953125, -10.072265625, -9.7568359375, -9.44140625, -9.1259765625, -8.810546875, -8.4951171875, -8.1796875, -7.8642578125, -7.548828125, -7.2333984375, -6.91796875, -6.6025390625, -6.287109375, -5.9716796875, -5.65625, -5.3408203125, -5.025390625, -4.7099609375, -4.39453125, -4.0791015625, -3.763671875, -3.4482421875, -3.1328125, -2.8173828125, -2.501953125, -2.1865234375, -1.87109375, -1.5556640625, -1.240234375, -0.9248046875, -0.609375, -0.2939453125, 0.021484375, 0.3369140625, 0.65234375, 0.9677734375, 1.283203125, 1.5986328125, 1.9140625, 2.2294921875, 2.544921875, 2.8603515625, 3.17578125, 3.4912109375, 3.806640625, 4.1220703125, 4.4375, 4.7529296875, 5.068359375, 5.3837890625, 5.69921875, 6.0146484375, 6.330078125, 6.6455078125, 6.9609375, 7.2763671875, 7.591796875, 7.9072265625, 8.22265625, 8.5380859375, 8.853515625, 9.1689453125, 9.484375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 6.0, 5.0, 0.0, 8.0, 9.0, 7.0, 12.0, 12.0, 21.0, 21.0, 18.0, 25.0, 29.0, 31.0, 25.0, 36.0, 37.0, 38.0, 37.0, 44.0, 47.0, 42.0, 47.0, 45.0, 60.0, 37.0, 29.0, 41.0, 33.0, 35.0, 27.0, 25.0, 15.0, 19.0, 19.0, 11.0, 8.0, 13.0, 11.0, 8.0, 7.0, 4.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.15234375, -5.9656982421875, -5.779052734375, -5.5924072265625, -5.40576171875, -5.2191162109375, -5.032470703125, -4.8458251953125, -4.6591796875, -4.4725341796875, -4.285888671875, -4.0992431640625, -3.91259765625, -3.7259521484375, -3.539306640625, -3.3526611328125, -3.166015625, -2.9793701171875, -2.792724609375, -2.6060791015625, -2.41943359375, -2.2327880859375, -2.046142578125, -1.8594970703125, -1.6728515625, -1.4862060546875, -1.299560546875, -1.1129150390625, -0.92626953125, -0.7396240234375, -0.552978515625, -0.3663330078125, -0.1796875, 0.0069580078125, 0.193603515625, 0.3802490234375, 0.56689453125, 0.7535400390625, 0.940185546875, 1.1268310546875, 1.3134765625, 1.5001220703125, 1.686767578125, 1.8734130859375, 2.06005859375, 2.2467041015625, 2.433349609375, 2.6199951171875, 2.806640625, 2.9932861328125, 3.179931640625, 3.3665771484375, 3.55322265625, 3.7398681640625, 3.926513671875, 4.1131591796875, 4.2998046875, 4.4864501953125, 4.673095703125, 4.8597412109375, 5.04638671875, 5.2330322265625, 5.419677734375, 5.6063232421875, 5.79296875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 8.0, 11.0, 16.0, 26.0, 36.0, 85.0, 101.0, 176.0, 256.0, 407.0, 671.0, 1035.0, 1745.0, 2885.0, 4683.0, 7473.0, 12163.0, 19602.0, 31126.0, 48066.0, 71451.0, 99613.0, 127535.0, 141185.0, 134357.0, 110737.0, 80653.0, 55881.0, 36157.0, 22990.0, 14427.0, 8830.0, 5346.0, 3220.0, 2142.0, 1302.0, 844.0, 493.0, 303.0, 184.0, 128.0, 83.0, 40.0, 31.0, 12.0, 15.0, 11.0, 9.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-4.02734375, -3.904083251953125, -3.78082275390625, -3.657562255859375, -3.5343017578125, -3.411041259765625, -3.28778076171875, -3.164520263671875, -3.041259765625, -2.917999267578125, -2.79473876953125, -2.671478271484375, -2.5482177734375, -2.424957275390625, -2.30169677734375, -2.178436279296875, -2.05517578125, -1.931915283203125, -1.80865478515625, -1.685394287109375, -1.5621337890625, -1.438873291015625, -1.31561279296875, -1.192352294921875, -1.069091796875, -0.945831298828125, -0.82257080078125, -0.699310302734375, -0.5760498046875, -0.452789306640625, -0.32952880859375, -0.206268310546875, -0.0830078125, 0.040252685546875, 0.16351318359375, 0.286773681640625, 0.4100341796875, 0.533294677734375, 0.65655517578125, 0.779815673828125, 0.903076171875, 1.026336669921875, 1.14959716796875, 1.272857666015625, 1.3961181640625, 1.519378662109375, 1.64263916015625, 1.765899658203125, 1.88916015625, 2.012420654296875, 2.13568115234375, 2.258941650390625, 2.3822021484375, 2.505462646484375, 2.62872314453125, 2.751983642578125, 2.875244140625, 2.998504638671875, 3.12176513671875, 3.245025634765625, 3.3682861328125, 3.491546630859375, 3.61480712890625, 3.738067626953125, 3.861328125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 9.0, 10.0, 6.0, 11.0, 18.0, 32.0, 36.0, 37.0, 53.0, 60.0, 59.0, 81.0, 87.0, 69.0, 66.0, 70.0, 51.0, 47.0, 36.0, 36.0, 33.0, 27.0, 19.0, 11.0, 11.0, 7.0, 8.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005793571472167969, -0.0005607008934020996, -0.0005420446395874023, -0.0005233883857727051, -0.0005047321319580078, -0.00048607587814331055, -0.0004674196243286133, -0.000448763370513916, -0.00043010711669921875, -0.0004114508628845215, -0.0003927946090698242, -0.00037413835525512695, -0.0003554821014404297, -0.0003368258476257324, -0.00031816959381103516, -0.0002995133399963379, -0.0002808570861816406, -0.00026220083236694336, -0.0002435445785522461, -0.00022488832473754883, -0.00020623207092285156, -0.0001875758171081543, -0.00016891956329345703, -0.00015026330947875977, -0.0001316070556640625, -0.00011295080184936523, -9.429454803466797e-05, -7.56382942199707e-05, -5.698204040527344e-05, -3.832578659057617e-05, -1.9669532775878906e-05, -1.0132789611816406e-06, 1.7642974853515625e-05, 3.629922866821289e-05, 5.4955482482910156e-05, 7.361173629760742e-05, 9.226799011230469e-05, 0.00011092424392700195, 0.00012958049774169922, 0.00014823675155639648, 0.00016689300537109375, 0.00018554925918579102, 0.00020420551300048828, 0.00022286176681518555, 0.0002415180206298828, 0.0002601742744445801, 0.00027883052825927734, 0.0002974867820739746, 0.0003161430358886719, 0.00033479928970336914, 0.0003534555435180664, 0.00037211179733276367, 0.00039076805114746094, 0.0004094243049621582, 0.00042808055877685547, 0.00044673681259155273, 0.00046539306640625, 0.00048404932022094727, 0.0005027055740356445, 0.0005213618278503418, 0.0005400180816650391, 0.0005586743354797363, 0.0005773305892944336, 0.0005959868431091309, 0.0006146430969238281]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 7.0, 8.0, 13.0, 21.0, 33.0, 49.0, 69.0, 119.0, 161.0, 248.0, 386.0, 572.0, 892.0, 1328.0, 2153.0, 3243.0, 5030.0, 7392.0, 11436.0, 17523.0, 25975.0, 38533.0, 55562.0, 74980.0, 97310.0, 115445.0, 124092.0, 116973.0, 98997.0, 76793.0, 55767.0, 39222.0, 26252.0, 17850.0, 11809.0, 7772.0, 4915.0, 3418.0, 2237.0, 1398.0, 916.0, 547.0, 338.0, 274.0, 169.0, 112.0, 76.0, 57.0, 25.0, 17.0, 21.0, 13.0, 6.0, 4.0, 1.0, 3.0, 1.0], "bins": [-3.5390625, -3.433502197265625, -3.32794189453125, -3.222381591796875, -3.1168212890625, -3.011260986328125, -2.90570068359375, -2.800140380859375, -2.694580078125, -2.589019775390625, -2.48345947265625, -2.377899169921875, -2.2723388671875, -2.166778564453125, -2.06121826171875, -1.955657958984375, -1.85009765625, -1.744537353515625, -1.63897705078125, -1.533416748046875, -1.4278564453125, -1.322296142578125, -1.21673583984375, -1.111175537109375, -1.005615234375, -0.900054931640625, -0.79449462890625, -0.688934326171875, -0.5833740234375, -0.477813720703125, -0.37225341796875, -0.266693115234375, -0.1611328125, -0.055572509765625, 0.04998779296875, 0.155548095703125, 0.2611083984375, 0.366668701171875, 0.47222900390625, 0.577789306640625, 0.683349609375, 0.788909912109375, 0.89447021484375, 1.000030517578125, 1.1055908203125, 1.211151123046875, 1.31671142578125, 1.422271728515625, 1.52783203125, 1.633392333984375, 1.73895263671875, 1.844512939453125, 1.9500732421875, 2.055633544921875, 2.16119384765625, 2.266754150390625, 2.372314453125, 2.477874755859375, 2.58343505859375, 2.688995361328125, 2.7945556640625, 2.900115966796875, 3.00567626953125, 3.111236572265625, 3.216796875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 3.0, 5.0, 6.0, 8.0, 11.0, 13.0, 11.0, 15.0, 13.0, 32.0, 24.0, 20.0, 27.0, 26.0, 34.0, 45.0, 38.0, 39.0, 35.0, 47.0, 44.0, 50.0, 40.0, 47.0, 36.0, 34.0, 33.0, 27.0, 38.0, 27.0, 24.0, 21.0, 18.0, 13.0, 12.0, 13.0, 12.0, 10.0, 13.0, 3.0, 5.0, 5.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.1240234375, -1.089202880859375, -1.05438232421875, -1.019561767578125, -0.9847412109375, -0.949920654296875, -0.91510009765625, -0.880279541015625, -0.845458984375, -0.810638427734375, -0.77581787109375, -0.740997314453125, -0.7061767578125, -0.671356201171875, -0.63653564453125, -0.601715087890625, -0.56689453125, -0.532073974609375, -0.49725341796875, -0.462432861328125, -0.4276123046875, -0.392791748046875, -0.35797119140625, -0.323150634765625, -0.288330078125, -0.253509521484375, -0.21868896484375, -0.183868408203125, -0.1490478515625, -0.114227294921875, -0.07940673828125, -0.044586181640625, -0.009765625, 0.025054931640625, 0.05987548828125, 0.094696044921875, 0.1295166015625, 0.164337158203125, 0.19915771484375, 0.233978271484375, 0.268798828125, 0.303619384765625, 0.33843994140625, 0.373260498046875, 0.4080810546875, 0.442901611328125, 0.47772216796875, 0.512542724609375, 0.54736328125, 0.582183837890625, 0.61700439453125, 0.651824951171875, 0.6866455078125, 0.721466064453125, 0.75628662109375, 0.791107177734375, 0.825927734375, 0.860748291015625, 0.89556884765625, 0.930389404296875, 0.9652099609375, 1.000030517578125, 1.03485107421875, 1.069671630859375, 1.1044921875]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 7.0, 3.0, 5.0, 10.0, 15.0, 21.0, 27.0, 31.0, 43.0, 41.0, 66.0, 74.0, 83.0, 78.0, 77.0, 81.0, 65.0, 52.0, 51.0, 40.0, 32.0, 22.0, 12.0, 16.0, 15.0, 10.0, 7.0, 2.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-25.025188446044922, -24.291629791259766, -23.558069229125977, -22.82451057434082, -22.09095001220703, -21.357391357421875, -20.62383270263672, -19.89027214050293, -19.15671157836914, -18.423152923583984, -17.689592361450195, -16.95603370666504, -16.22247314453125, -15.488914489746094, -14.755354881286621, -14.021795272827148, -13.288236618041992, -12.55467700958252, -11.821117401123047, -11.08755874633789, -10.353998184204102, -9.620439529418945, -8.886879920959473, -8.1533203125, -7.419760704040527, -6.686201095581055, -5.952641487121582, -5.219082355499268, -4.485522747039795, -3.7519631385803223, -3.018404006958008, -2.284844398498535, -1.5512828826904297, -0.8177233934402466, -0.08416390419006348, 0.6493954658508301, 1.3829550743103027, 2.1165146827697754, 2.85007381439209, 3.5836334228515625, 4.317193031311035, 5.050752639770508, 5.7843122482299805, 6.517871379852295, 7.251430988311768, 7.98499059677124, 8.718549728393555, 9.452109336853027, 10.1856689453125, 10.919228553771973, 11.652788162231445, 12.386346817016602, 13.11990737915039, 13.853466033935547, 14.58702564239502, 15.320585250854492, 16.05414581298828, 16.787704467773438, 17.521265029907227, 18.254823684692383, 18.988384246826172, 19.721942901611328, 20.455501556396484, 21.189062118530273, 21.92262077331543]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 9.0, 10.0, 14.0, 14.0, 19.0, 19.0, 14.0, 28.0, 17.0, 27.0, 29.0, 51.0, 36.0, 36.0, 40.0, 49.0, 51.0, 50.0, 41.0, 50.0, 33.0, 36.0, 36.0, 40.0, 24.0, 36.0, 32.0, 18.0, 17.0, 23.0, 16.0, 18.0, 5.0, 13.0, 15.0, 7.0, 8.0, 5.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.810589790344238, -8.527017593383789, -8.243444442749023, -7.959872245788574, -7.676299571990967, -7.392726898193359, -7.10915470123291, -6.825582027435303, -6.542009353637695, -6.258436679840088, -5.9748640060424805, -5.691291809082031, -5.407719135284424, -5.124146461486816, -4.840574264526367, -4.55700159072876, -4.273428916931152, -3.989856243133545, -3.7062838077545166, -3.4227113723754883, -3.139138698577881, -2.8555660247802734, -2.571993589401245, -2.288421154022217, -2.0048484802246094, -1.7212759256362915, -1.4377033710479736, -1.1541308164596558, -0.8705582618713379, -0.58698570728302, -0.30341315269470215, -0.019840598106384277, 0.2637319564819336, 0.5473045110702515, 0.8308770656585693, 1.1144496202468872, 1.398022174835205, 1.681594729423523, 1.9651672840118408, 2.248739719390869, 2.5323123931884766, 2.815885066986084, 3.0994575023651123, 3.3830299377441406, 3.666602611541748, 3.9501752853393555, 4.233747482299805, 4.517320156097412, 4.8008928298950195, 5.084465503692627, 5.368038177490234, 5.651610374450684, 5.935183048248291, 6.218755722045898, 6.502327919006348, 6.785900592803955, 7.0694732666015625, 7.35304594039917, 7.636618614196777, 7.920190811157227, 8.203763961791992, 8.487336158752441, 8.77090835571289, 9.054481506347656, 9.338053703308105]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 6.0, 2.0, 15.0, 18.0, 26.0, 37.0, 56.0, 76.0, 95.0, 140.0, 246.0, 385.0, 582.0, 976.0, 1832.0, 3084.0, 5583.0, 10401.0, 20757.0, 42792.0, 93038.0, 215440.0, 529385.0, 1138360.0, 1166090.0, 551700.0, 224289.0, 95870.0, 44702.0, 22163.0, 11593.0, 6191.0, 3370.0, 1922.0, 1154.0, 723.0, 433.0, 243.0, 178.0, 99.0, 75.0, 45.0, 32.0, 29.0, 18.0, 15.0, 6.0, 2.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-18.578125, -17.998046875, -17.41796875, -16.837890625, -16.2578125, -15.677734375, -15.09765625, -14.517578125, -13.9375, -13.357421875, -12.77734375, -12.197265625, -11.6171875, -11.037109375, -10.45703125, -9.876953125, -9.296875, -8.716796875, -8.13671875, -7.556640625, -6.9765625, -6.396484375, -5.81640625, -5.236328125, -4.65625, -4.076171875, -3.49609375, -2.916015625, -2.3359375, -1.755859375, -1.17578125, -0.595703125, -0.015625, 0.564453125, 1.14453125, 1.724609375, 2.3046875, 2.884765625, 3.46484375, 4.044921875, 4.625, 5.205078125, 5.78515625, 6.365234375, 6.9453125, 7.525390625, 8.10546875, 8.685546875, 9.265625, 9.845703125, 10.42578125, 11.005859375, 11.5859375, 12.166015625, 12.74609375, 13.326171875, 13.90625, 14.486328125, 15.06640625, 15.646484375, 16.2265625, 16.806640625, 17.38671875, 17.966796875, 18.546875]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 7.0, 10.0, 5.0, 14.0, 16.0, 19.0, 18.0, 12.0, 26.0, 39.0, 28.0, 23.0, 37.0, 37.0, 32.0, 38.0, 34.0, 42.0, 41.0, 57.0, 43.0, 51.0, 48.0, 35.0, 33.0, 27.0, 35.0, 35.0, 31.0, 18.0, 16.0, 17.0, 10.0, 10.0, 12.0, 12.0, 5.0, 6.0, 6.0, 5.0, 2.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.1015625, -6.87933349609375, -6.6571044921875, -6.43487548828125, -6.212646484375, -5.99041748046875, -5.7681884765625, -5.54595947265625, -5.32373046875, -5.10150146484375, -4.8792724609375, -4.65704345703125, -4.434814453125, -4.21258544921875, -3.9903564453125, -3.76812744140625, -3.5458984375, -3.32366943359375, -3.1014404296875, -2.87921142578125, -2.656982421875, -2.43475341796875, -2.2125244140625, -1.99029541015625, -1.76806640625, -1.54583740234375, -1.3236083984375, -1.10137939453125, -0.879150390625, -0.65692138671875, -0.4346923828125, -0.21246337890625, 0.009765625, 0.23199462890625, 0.4542236328125, 0.67645263671875, 0.898681640625, 1.12091064453125, 1.3431396484375, 1.56536865234375, 1.78759765625, 2.00982666015625, 2.2320556640625, 2.45428466796875, 2.676513671875, 2.89874267578125, 3.1209716796875, 3.34320068359375, 3.5654296875, 3.78765869140625, 4.0098876953125, 4.23211669921875, 4.454345703125, 4.67657470703125, 4.8988037109375, 5.12103271484375, 5.34326171875, 5.56549072265625, 5.7877197265625, 6.00994873046875, 6.232177734375, 6.45440673828125, 6.6766357421875, 6.89886474609375, 7.12109375]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 8.0, 8.0, 13.0, 21.0, 42.0, 65.0, 91.0, 146.0, 236.0, 333.0, 566.0, 902.0, 1471.0, 2358.0, 3987.0, 6940.0, 11424.0, 20366.0, 36080.0, 65018.0, 120805.0, 226193.0, 421760.0, 721622.0, 920162.0, 718435.0, 420285.0, 224840.0, 119826.0, 64875.0, 36088.0, 20102.0, 11835.0, 6865.0, 4089.0, 2491.0, 1479.0, 880.0, 606.0, 368.0, 222.0, 132.0, 88.0, 57.0, 41.0, 26.0, 12.0, 14.0, 8.0, 2.0, 2.0, 3.0, 2.0, 1.0], "bins": [-16.40625, -15.9306640625, -15.455078125, -14.9794921875, -14.50390625, -14.0283203125, -13.552734375, -13.0771484375, -12.6015625, -12.1259765625, -11.650390625, -11.1748046875, -10.69921875, -10.2236328125, -9.748046875, -9.2724609375, -8.796875, -8.3212890625, -7.845703125, -7.3701171875, -6.89453125, -6.4189453125, -5.943359375, -5.4677734375, -4.9921875, -4.5166015625, -4.041015625, -3.5654296875, -3.08984375, -2.6142578125, -2.138671875, -1.6630859375, -1.1875, -0.7119140625, -0.236328125, 0.2392578125, 0.71484375, 1.1904296875, 1.666015625, 2.1416015625, 2.6171875, 3.0927734375, 3.568359375, 4.0439453125, 4.51953125, 4.9951171875, 5.470703125, 5.9462890625, 6.421875, 6.8974609375, 7.373046875, 7.8486328125, 8.32421875, 8.7998046875, 9.275390625, 9.7509765625, 10.2265625, 10.7021484375, 11.177734375, 11.6533203125, 12.12890625, 12.6044921875, 13.080078125, 13.5556640625, 14.03125]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 6.0, 10.0, 7.0, 10.0, 15.0, 25.0, 18.0, 38.0, 45.0, 65.0, 92.0, 119.0, 166.0, 174.0, 234.0, 269.0, 287.0, 311.0, 293.0, 301.0, 281.0, 259.0, 232.0, 178.0, 133.0, 111.0, 74.0, 86.0, 66.0, 36.0, 32.0, 30.0, 15.0, 13.0, 13.0, 8.0, 8.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.74609375, -5.5792236328125, -5.412353515625, -5.2454833984375, -5.07861328125, -4.9117431640625, -4.744873046875, -4.5780029296875, -4.4111328125, -4.2442626953125, -4.077392578125, -3.9105224609375, -3.74365234375, -3.5767822265625, -3.409912109375, -3.2430419921875, -3.076171875, -2.9093017578125, -2.742431640625, -2.5755615234375, -2.40869140625, -2.2418212890625, -2.074951171875, -1.9080810546875, -1.7412109375, -1.5743408203125, -1.407470703125, -1.2406005859375, -1.07373046875, -0.9068603515625, -0.739990234375, -0.5731201171875, -0.40625, -0.2393798828125, -0.072509765625, 0.0943603515625, 0.26123046875, 0.4281005859375, 0.594970703125, 0.7618408203125, 0.9287109375, 1.0955810546875, 1.262451171875, 1.4293212890625, 1.59619140625, 1.7630615234375, 1.929931640625, 2.0968017578125, 2.263671875, 2.4305419921875, 2.597412109375, 2.7642822265625, 2.93115234375, 3.0980224609375, 3.264892578125, 3.4317626953125, 3.5986328125, 3.7655029296875, 3.932373046875, 4.0992431640625, 4.26611328125, 4.4329833984375, 4.599853515625, 4.7667236328125, 4.93359375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 10.0, 8.0, 6.0, 12.0, 14.0, 33.0, 33.0, 22.0, 41.0, 54.0, 54.0, 68.0, 71.0, 61.0, 77.0, 73.0, 56.0, 53.0, 42.0, 35.0, 32.0, 32.0, 15.0, 20.0, 10.0, 4.0, 12.0, 11.0, 4.0, 4.0, 6.0, 3.0, 4.0, 3.0, 2.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.09366798400879, -18.480443954467773, -17.867218017578125, -17.25399398803711, -16.64076805114746, -16.027544021606445, -15.414319038391113, -14.801094055175781, -14.18786907196045, -13.574644088745117, -12.961419105529785, -12.348194122314453, -11.734970092773438, -11.121744155883789, -10.508520126342773, -9.895295143127441, -9.28207015991211, -8.668845176696777, -8.055620193481445, -7.4423956871032715, -6.8291707038879395, -6.215945720672607, -5.602721214294434, -4.989496231079102, -4.3762712478637695, -3.7630462646484375, -3.1498215198516846, -2.5365967750549316, -1.9233717918395996, -1.3101468086242676, -0.6969220638275146, -0.08369731903076172, 0.5295276641845703, 1.1427525281906128, 1.7559773921966553, 2.369202136993408, 2.9824271202087402, 3.5956521034240723, 4.208876609802246, 4.822101593017578, 5.43532657623291, 6.048551559448242, 6.661776542663574, 7.275001049041748, 7.88822603225708, 8.50145149230957, 9.114675521850586, 9.727900505065918, 10.34112548828125, 10.954350471496582, 11.567575454711914, 12.180800437927246, 12.794025421142578, 13.407249450683594, 14.020474433898926, 14.633699417114258, 15.24692440032959, 15.860149383544922, 16.473373413085938, 17.086599349975586, 17.6998233795166, 18.31304931640625, 18.926273345947266, 19.53949737548828, 20.15272331237793]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 7.0, 3.0, 5.0, 9.0, 13.0, 13.0, 14.0, 11.0, 22.0, 30.0, 32.0, 19.0, 33.0, 37.0, 35.0, 44.0, 45.0, 39.0, 45.0, 45.0, 59.0, 56.0, 41.0, 36.0, 37.0, 42.0, 24.0, 24.0, 24.0, 17.0, 19.0, 28.0, 18.0, 10.0, 14.0, 5.0, 11.0, 9.0, 5.0, 4.0, 8.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.348005294799805, -8.07004165649414, -7.792078018188477, -7.5141143798828125, -7.236151218414307, -6.958187580108643, -6.6802239418029785, -6.4022603034973145, -6.124297142028809, -5.8463335037231445, -5.5683698654174805, -5.290406227111816, -5.0124430656433105, -4.7344794273376465, -4.456515789031982, -4.178552150726318, -3.9005885124206543, -3.6226248741149902, -3.3446614742279053, -3.066697835922241, -2.7887344360351562, -2.510770797729492, -2.232807159423828, -1.9548436403274536, -1.676880121231079, -1.3989166021347046, -1.12095308303833, -0.842989444732666, -0.5650259256362915, -0.287062406539917, -0.00909876823425293, 0.2688647508621216, 0.5468282699584961, 0.8247917890548706, 1.1027553081512451, 1.3807189464569092, 1.6586824655532837, 1.9366459846496582, 2.2146096229553223, 2.4925732612609863, 2.7705366611480713, 3.0485002994537354, 3.3264636993408203, 3.6044273376464844, 3.8823909759521484, 4.1603546142578125, 4.438318252563477, 4.716281414031982, 4.9942450523376465, 5.2722086906433105, 5.550172328948975, 5.8281354904174805, 6.1060991287231445, 6.384062767028809, 6.662026405334473, 6.939990043640137, 7.217953681945801, 7.495917320251465, 7.773880958557129, 8.051844596862793, 8.329808235168457, 8.607770919799805, 8.885734558105469, 9.163698196411133, 9.441661834716797]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 8.0, 9.0, 11.0, 22.0, 28.0, 54.0, 79.0, 132.0, 206.0, 329.0, 567.0, 920.0, 1618.0, 3055.0, 5831.0, 11472.0, 22080.0, 42717.0, 80288.0, 136228.0, 192485.0, 199576.0, 152880.0, 93059.0, 50670.0, 25750.0, 13353.0, 6939.0, 3566.0, 1928.0, 1112.0, 625.0, 332.0, 210.0, 137.0, 92.0, 53.0, 35.0, 25.0, 16.0, 15.0, 7.0, 7.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0], "bins": [-9.296875, -9.0162353515625, -8.735595703125, -8.4549560546875, -8.17431640625, -7.8936767578125, -7.613037109375, -7.3323974609375, -7.0517578125, -6.7711181640625, -6.490478515625, -6.2098388671875, -5.92919921875, -5.6485595703125, -5.367919921875, -5.0872802734375, -4.806640625, -4.5260009765625, -4.245361328125, -3.9647216796875, -3.68408203125, -3.4034423828125, -3.122802734375, -2.8421630859375, -2.5615234375, -2.2808837890625, -2.000244140625, -1.7196044921875, -1.43896484375, -1.1583251953125, -0.877685546875, -0.5970458984375, -0.31640625, -0.0357666015625, 0.244873046875, 0.5255126953125, 0.80615234375, 1.0867919921875, 1.367431640625, 1.6480712890625, 1.9287109375, 2.2093505859375, 2.489990234375, 2.7706298828125, 3.05126953125, 3.3319091796875, 3.612548828125, 3.8931884765625, 4.173828125, 4.4544677734375, 4.735107421875, 5.0157470703125, 5.29638671875, 5.5770263671875, 5.857666015625, 6.1383056640625, 6.4189453125, 6.6995849609375, 6.980224609375, 7.2608642578125, 7.54150390625, 7.8221435546875, 8.102783203125, 8.3834228515625, 8.6640625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 9.0, 11.0, 13.0, 15.0, 11.0, 24.0, 19.0, 27.0, 25.0, 33.0, 27.0, 33.0, 32.0, 48.0, 34.0, 37.0, 54.0, 36.0, 50.0, 49.0, 40.0, 34.0, 36.0, 40.0, 32.0, 29.0, 27.0, 26.0, 20.0, 14.0, 17.0, 24.0, 5.0, 14.0, 18.0, 6.0, 4.0, 3.0, 5.0, 4.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.1484375, -7.850830078125, -7.55322265625, -7.255615234375, -6.9580078125, -6.660400390625, -6.36279296875, -6.065185546875, -5.767578125, -5.469970703125, -5.17236328125, -4.874755859375, -4.5771484375, -4.279541015625, -3.98193359375, -3.684326171875, -3.38671875, -3.089111328125, -2.79150390625, -2.493896484375, -2.1962890625, -1.898681640625, -1.60107421875, -1.303466796875, -1.005859375, -0.708251953125, -0.41064453125, -0.113037109375, 0.1845703125, 0.482177734375, 0.77978515625, 1.077392578125, 1.375, 1.672607421875, 1.97021484375, 2.267822265625, 2.5654296875, 2.863037109375, 3.16064453125, 3.458251953125, 3.755859375, 4.053466796875, 4.35107421875, 4.648681640625, 4.9462890625, 5.243896484375, 5.54150390625, 5.839111328125, 6.13671875, 6.434326171875, 6.73193359375, 7.029541015625, 7.3271484375, 7.624755859375, 7.92236328125, 8.219970703125, 8.517578125, 8.815185546875, 9.11279296875, 9.410400390625, 9.7080078125, 10.005615234375, 10.30322265625, 10.600830078125, 10.8984375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 8.0, 14.0, 23.0, 32.0, 47.0, 100.0, 118.0, 187.0, 311.0, 587.0, 953.0, 1695.0, 3265.0, 6600.0, 13247.0, 28096.0, 60577.0, 127494.0, 228609.0, 258409.0, 164087.0, 80825.0, 38001.0, 17462.0, 8398.0, 4197.0, 2226.0, 1193.0, 718.0, 413.0, 259.0, 140.0, 90.0, 56.0, 43.0, 19.0, 18.0, 9.0, 8.0, 6.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2734375, -10.88720703125, -10.5009765625, -10.11474609375, -9.728515625, -9.34228515625, -8.9560546875, -8.56982421875, -8.18359375, -7.79736328125, -7.4111328125, -7.02490234375, -6.638671875, -6.25244140625, -5.8662109375, -5.47998046875, -5.09375, -4.70751953125, -4.3212890625, -3.93505859375, -3.548828125, -3.16259765625, -2.7763671875, -2.39013671875, -2.00390625, -1.61767578125, -1.2314453125, -0.84521484375, -0.458984375, -0.07275390625, 0.3134765625, 0.69970703125, 1.0859375, 1.47216796875, 1.8583984375, 2.24462890625, 2.630859375, 3.01708984375, 3.4033203125, 3.78955078125, 4.17578125, 4.56201171875, 4.9482421875, 5.33447265625, 5.720703125, 6.10693359375, 6.4931640625, 6.87939453125, 7.265625, 7.65185546875, 8.0380859375, 8.42431640625, 8.810546875, 9.19677734375, 9.5830078125, 9.96923828125, 10.35546875, 10.74169921875, 11.1279296875, 11.51416015625, 11.900390625, 12.28662109375, 12.6728515625, 13.05908203125, 13.4453125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 7.0, 5.0, 4.0, 8.0, 17.0, 12.0, 7.0, 14.0, 22.0, 13.0, 21.0, 18.0, 17.0, 33.0, 33.0, 30.0, 28.0, 40.0, 35.0, 32.0, 32.0, 31.0, 38.0, 45.0, 42.0, 39.0, 40.0, 44.0, 39.0, 27.0, 32.0, 30.0, 23.0, 26.0, 16.0, 21.0, 16.0, 16.0, 15.0, 13.0, 4.0, 5.0, 4.0, 0.0, 6.0, 4.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-5.390625, -5.22869873046875, -5.0667724609375, -4.90484619140625, -4.742919921875, -4.58099365234375, -4.4190673828125, -4.25714111328125, -4.09521484375, -3.93328857421875, -3.7713623046875, -3.60943603515625, -3.447509765625, -3.28558349609375, -3.1236572265625, -2.96173095703125, -2.7998046875, -2.63787841796875, -2.4759521484375, -2.31402587890625, -2.152099609375, -1.99017333984375, -1.8282470703125, -1.66632080078125, -1.50439453125, -1.34246826171875, -1.1805419921875, -1.01861572265625, -0.856689453125, -0.69476318359375, -0.5328369140625, -0.37091064453125, -0.208984375, -0.04705810546875, 0.1148681640625, 0.27679443359375, 0.438720703125, 0.60064697265625, 0.7625732421875, 0.92449951171875, 1.08642578125, 1.24835205078125, 1.4102783203125, 1.57220458984375, 1.734130859375, 1.89605712890625, 2.0579833984375, 2.21990966796875, 2.3818359375, 2.54376220703125, 2.7056884765625, 2.86761474609375, 3.029541015625, 3.19146728515625, 3.3533935546875, 3.51531982421875, 3.67724609375, 3.83917236328125, 4.0010986328125, 4.16302490234375, 4.324951171875, 4.48687744140625, 4.6488037109375, 4.81072998046875, 4.97265625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 10.0, 9.0, 15.0, 10.0, 21.0, 28.0, 41.0, 58.0, 72.0, 104.0, 178.0, 251.0, 452.0, 666.0, 1256.0, 2184.0, 4515.0, 9895.0, 23368.0, 60254.0, 159746.0, 335123.0, 267527.0, 109246.0, 41607.0, 16828.0, 7162.0, 3492.0, 1843.0, 991.0, 556.0, 320.0, 231.0, 154.0, 103.0, 59.0, 44.0, 47.0, 26.0, 18.0, 8.0, 12.0, 8.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.6328125, -8.36962890625, -8.1064453125, -7.84326171875, -7.580078125, -7.31689453125, -7.0537109375, -6.79052734375, -6.52734375, -6.26416015625, -6.0009765625, -5.73779296875, -5.474609375, -5.21142578125, -4.9482421875, -4.68505859375, -4.421875, -4.15869140625, -3.8955078125, -3.63232421875, -3.369140625, -3.10595703125, -2.8427734375, -2.57958984375, -2.31640625, -2.05322265625, -1.7900390625, -1.52685546875, -1.263671875, -1.00048828125, -0.7373046875, -0.47412109375, -0.2109375, 0.05224609375, 0.3154296875, 0.57861328125, 0.841796875, 1.10498046875, 1.3681640625, 1.63134765625, 1.89453125, 2.15771484375, 2.4208984375, 2.68408203125, 2.947265625, 3.21044921875, 3.4736328125, 3.73681640625, 4.0, 4.26318359375, 4.5263671875, 4.78955078125, 5.052734375, 5.31591796875, 5.5791015625, 5.84228515625, 6.10546875, 6.36865234375, 6.6318359375, 6.89501953125, 7.158203125, 7.42138671875, 7.6845703125, 7.94775390625, 8.2109375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 3.0, 3.0, 7.0, 4.0, 7.0, 14.0, 25.0, 29.0, 25.0, 39.0, 50.0, 47.0, 72.0, 91.0, 79.0, 90.0, 83.0, 56.0, 53.0, 48.0, 42.0, 38.0, 24.0, 25.0, 13.0, 6.0, 6.0, 5.0, 3.0, 2.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000331878662109375, -0.000321120023727417, -0.000310361385345459, -0.000299602746963501, -0.00028884410858154297, -0.00027808547019958496, -0.00026732683181762695, -0.00025656819343566895, -0.00024580955505371094, -0.00023505091667175293, -0.00022429227828979492, -0.00021353363990783691, -0.0002027750015258789, -0.0001920163631439209, -0.0001812577247619629, -0.00017049908638000488, -0.00015974044799804688, -0.00014898180961608887, -0.00013822317123413086, -0.00012746453285217285, -0.00011670589447021484, -0.00010594725608825684, -9.518861770629883e-05, -8.442997932434082e-05, -7.367134094238281e-05, -6.29127025604248e-05, -5.21540641784668e-05, -4.139542579650879e-05, -3.063678741455078e-05, -1.9878149032592773e-05, -9.119510650634766e-06, 1.6391277313232422e-06, 1.239776611328125e-05, 2.3156404495239258e-05, 3.3915042877197266e-05, 4.4673681259155273e-05, 5.543231964111328e-05, 6.619095802307129e-05, 7.69495964050293e-05, 8.77082347869873e-05, 9.846687316894531e-05, 0.00010922551155090332, 0.00011998414993286133, 0.00013074278831481934, 0.00014150142669677734, 0.00015226006507873535, 0.00016301870346069336, 0.00017377734184265137, 0.00018453598022460938, 0.00019529461860656738, 0.0002060532569885254, 0.0002168118953704834, 0.0002275705337524414, 0.00023832917213439941, 0.0002490878105163574, 0.00025984644889831543, 0.00027060508728027344, 0.00028136372566223145, 0.00029212236404418945, 0.00030288100242614746, 0.00031363964080810547, 0.0003243982791900635, 0.0003351569175720215, 0.0003459155559539795, 0.0003566741943359375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 9.0, 12.0, 16.0, 25.0, 32.0, 54.0, 88.0, 130.0, 192.0, 279.0, 508.0, 790.0, 1422.0, 2519.0, 4805.0, 9615.0, 20909.0, 47211.0, 104500.0, 202442.0, 264023.0, 199587.0, 102411.0, 46173.0, 20671.0, 9493.0, 4655.0, 2431.0, 1387.0, 798.0, 509.0, 313.0, 177.0, 122.0, 72.0, 58.0, 51.0, 21.0, 12.0, 14.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.63671875, -6.43243408203125, -6.2281494140625, -6.02386474609375, -5.819580078125, -5.61529541015625, -5.4110107421875, -5.20672607421875, -5.00244140625, -4.79815673828125, -4.5938720703125, -4.38958740234375, -4.185302734375, -3.98101806640625, -3.7767333984375, -3.57244873046875, -3.3681640625, -3.16387939453125, -2.9595947265625, -2.75531005859375, -2.551025390625, -2.34674072265625, -2.1424560546875, -1.93817138671875, -1.73388671875, -1.52960205078125, -1.3253173828125, -1.12103271484375, -0.916748046875, -0.71246337890625, -0.5081787109375, -0.30389404296875, -0.099609375, 0.10467529296875, 0.3089599609375, 0.51324462890625, 0.717529296875, 0.92181396484375, 1.1260986328125, 1.33038330078125, 1.53466796875, 1.73895263671875, 1.9432373046875, 2.14752197265625, 2.351806640625, 2.55609130859375, 2.7603759765625, 2.96466064453125, 3.1689453125, 3.37322998046875, 3.5775146484375, 3.78179931640625, 3.986083984375, 4.19036865234375, 4.3946533203125, 4.59893798828125, 4.80322265625, 5.00750732421875, 5.2117919921875, 5.41607666015625, 5.620361328125, 5.82464599609375, 6.0289306640625, 6.23321533203125, 6.4375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 6.0, 8.0, 6.0, 9.0, 8.0, 26.0, 31.0, 40.0, 37.0, 46.0, 53.0, 51.0, 53.0, 62.0, 64.0, 83.0, 57.0, 71.0, 49.0, 49.0, 32.0, 35.0, 33.0, 18.0, 23.0, 8.0, 12.0, 11.0, 2.0, 8.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3876953125, -1.339019775390625, -1.29034423828125, -1.241668701171875, -1.1929931640625, -1.144317626953125, -1.09564208984375, -1.046966552734375, -0.998291015625, -0.949615478515625, -0.90093994140625, -0.852264404296875, -0.8035888671875, -0.754913330078125, -0.70623779296875, -0.657562255859375, -0.60888671875, -0.560211181640625, -0.51153564453125, -0.462860107421875, -0.4141845703125, -0.365509033203125, -0.31683349609375, -0.268157958984375, -0.219482421875, -0.170806884765625, -0.12213134765625, -0.073455810546875, -0.0247802734375, 0.023895263671875, 0.07257080078125, 0.121246337890625, 0.169921875, 0.218597412109375, 0.26727294921875, 0.315948486328125, 0.3646240234375, 0.413299560546875, 0.46197509765625, 0.510650634765625, 0.559326171875, 0.608001708984375, 0.65667724609375, 0.705352783203125, 0.7540283203125, 0.802703857421875, 0.85137939453125, 0.900054931640625, 0.94873046875, 0.997406005859375, 1.04608154296875, 1.094757080078125, 1.1434326171875, 1.192108154296875, 1.24078369140625, 1.289459228515625, 1.338134765625, 1.386810302734375, 1.43548583984375, 1.484161376953125, 1.5328369140625, 1.581512451171875, 1.63018798828125, 1.678863525390625, 1.7275390625]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 12.0, 5.0, 8.0, 9.0, 20.0, 24.0, 30.0, 32.0, 27.0, 43.0, 55.0, 54.0, 54.0, 64.0, 71.0, 65.0, 72.0, 54.0, 49.0, 37.0, 35.0, 25.0, 32.0, 20.0, 18.0, 15.0, 9.0, 11.0, 9.0, 3.0, 7.0, 7.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.752038955688477, -17.176942825317383, -16.601844787597656, -16.026748657226562, -15.451651573181152, -14.876554489135742, -14.301458358764648, -13.726361274719238, -13.151264190673828, -12.576167106628418, -12.001070022583008, -11.425973892211914, -10.850876808166504, -10.275779724121094, -9.70068359375, -9.12558650970459, -8.55048942565918, -7.9753923416137695, -7.400295734405518, -6.825199127197266, -6.2501020431518555, -5.675004959106445, -5.099908351898193, -4.524811744689941, -3.9497146606445312, -3.3746178150177, -2.799520969390869, -2.224424123764038, -1.649327278137207, -1.074230432510376, -0.4991335868835449, 0.07596302032470703, 0.6510601043701172, 1.2261569499969482, 1.8012537956237793, 2.3763506412506104, 2.9514474868774414, 3.5265443325042725, 4.1016411781311035, 4.6767377853393555, 5.251834869384766, 5.826931953430176, 6.402028560638428, 6.97712516784668, 7.55222225189209, 8.1273193359375, 8.702415466308594, 9.277512550354004, 9.852609634399414, 10.427706718444824, 11.002803802490234, 11.577899932861328, 12.152997016906738, 12.728094100952148, 13.303190231323242, 13.878287315368652, 14.453384399414062, 15.028481483459473, 15.603578567504883, 16.178674697875977, 16.753772735595703, 17.328868865966797, 17.90396499633789, 18.479061126708984, 19.05415916442871]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 3.0, 4.0, 11.0, 13.0, 15.0, 14.0, 16.0, 24.0, 31.0, 31.0, 25.0, 33.0, 43.0, 40.0, 48.0, 30.0, 63.0, 52.0, 48.0, 50.0, 50.0, 34.0, 40.0, 46.0, 28.0, 18.0, 23.0, 25.0, 25.0, 20.0, 15.0, 14.0, 9.0, 12.0, 9.0, 8.0, 4.0, 9.0, 4.0, 4.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.358636856079102, -8.073909759521484, -7.789182186126709, -7.504454612731934, -7.219727516174316, -6.934999942779541, -6.650272369384766, -6.365545272827148, -6.080817699432373, -5.796090126037598, -5.5113630294799805, -5.226635456085205, -4.94190788269043, -4.6571807861328125, -4.372453212738037, -4.087725639343262, -3.8029985427856445, -3.5182712078094482, -3.233543872833252, -2.9488162994384766, -2.6640889644622803, -2.379361629486084, -2.0946340560913086, -1.8099067211151123, -1.525179386138916, -1.2404520511627197, -0.9557245969772339, -0.6709972023963928, -0.38626980781555176, -0.10154247283935547, 0.18318498134613037, 0.4679124355316162, 0.7526388168334961, 1.0373661518096924, 1.3220936059951782, 1.606821060180664, 1.8915483951568604, 2.1762757301330566, 2.461003303527832, 2.7457306385040283, 3.0304579734802246, 3.315185308456421, 3.599912643432617, 3.8846402168273926, 4.169367790222168, 4.454094886779785, 4.7388224601745605, 5.023550033569336, 5.308277130126953, 5.5930047035217285, 5.877731800079346, 6.162459373474121, 6.447186470031738, 6.731914043426514, 7.016641616821289, 7.301368713378906, 7.586096286773682, 7.870823860168457, 8.155550956726074, 8.440278053283691, 8.725006103515625, 9.009733200073242, 9.29446029663086, 9.579188346862793, 9.86391544342041]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 3.0, 10.0, 9.0, 10.0, 18.0, 46.0, 72.0, 104.0, 147.0, 250.0, 407.0, 675.0, 1110.0, 1880.0, 2968.0, 5178.0, 8590.0, 14277.0, 24333.0, 39856.0, 63910.0, 97137.0, 133156.0, 157221.0, 151091.0, 121782.0, 85174.0, 54654.0, 33784.0, 20256.0, 12248.0, 7147.0, 4426.0, 2543.0, 1499.0, 979.0, 597.0, 375.0, 246.0, 134.0, 110.0, 54.0, 35.0, 31.0, 14.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9453125, -9.5880126953125, -9.230712890625, -8.8734130859375, -8.51611328125, -8.1588134765625, -7.801513671875, -7.4442138671875, -7.0869140625, -6.7296142578125, -6.372314453125, -6.0150146484375, -5.65771484375, -5.3004150390625, -4.943115234375, -4.5858154296875, -4.228515625, -3.8712158203125, -3.513916015625, -3.1566162109375, -2.79931640625, -2.4420166015625, -2.084716796875, -1.7274169921875, -1.3701171875, -1.0128173828125, -0.655517578125, -0.2982177734375, 0.05908203125, 0.4163818359375, 0.773681640625, 1.1309814453125, 1.48828125, 1.8455810546875, 2.202880859375, 2.5601806640625, 2.91748046875, 3.2747802734375, 3.632080078125, 3.9893798828125, 4.3466796875, 4.7039794921875, 5.061279296875, 5.4185791015625, 5.77587890625, 6.1331787109375, 6.490478515625, 6.8477783203125, 7.205078125, 7.5623779296875, 7.919677734375, 8.2769775390625, 8.63427734375, 8.9915771484375, 9.348876953125, 9.7061767578125, 10.0634765625, 10.4207763671875, 10.778076171875, 11.1353759765625, 11.49267578125, 11.8499755859375, 12.207275390625, 12.5645751953125, 12.921875]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 9.0, 5.0, 7.0, 9.0, 10.0, 20.0, 8.0, 13.0, 11.0, 16.0, 23.0, 29.0, 33.0, 24.0, 29.0, 44.0, 42.0, 25.0, 50.0, 46.0, 38.0, 50.0, 51.0, 50.0, 41.0, 36.0, 29.0, 28.0, 32.0, 38.0, 24.0, 26.0, 18.0, 16.0, 13.0, 10.0, 12.0, 7.0, 8.0, 9.0, 4.0, 4.0, 1.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.7265625, -9.42431640625, -9.1220703125, -8.81982421875, -8.517578125, -8.21533203125, -7.9130859375, -7.61083984375, -7.30859375, -7.00634765625, -6.7041015625, -6.40185546875, -6.099609375, -5.79736328125, -5.4951171875, -5.19287109375, -4.890625, -4.58837890625, -4.2861328125, -3.98388671875, -3.681640625, -3.37939453125, -3.0771484375, -2.77490234375, -2.47265625, -2.17041015625, -1.8681640625, -1.56591796875, -1.263671875, -0.96142578125, -0.6591796875, -0.35693359375, -0.0546875, 0.24755859375, 0.5498046875, 0.85205078125, 1.154296875, 1.45654296875, 1.7587890625, 2.06103515625, 2.36328125, 2.66552734375, 2.9677734375, 3.27001953125, 3.572265625, 3.87451171875, 4.1767578125, 4.47900390625, 4.78125, 5.08349609375, 5.3857421875, 5.68798828125, 5.990234375, 6.29248046875, 6.5947265625, 6.89697265625, 7.19921875, 7.50146484375, 7.8037109375, 8.10595703125, 8.408203125, 8.71044921875, 9.0126953125, 9.31494140625, 9.6171875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 8.0, 15.0, 15.0, 24.0, 45.0, 80.0, 104.0, 160.0, 265.0, 366.0, 588.0, 911.0, 1521.0, 2493.0, 3915.0, 6168.0, 10112.0, 16608.0, 26311.0, 40850.0, 62254.0, 89542.0, 117350.0, 136074.0, 137422.0, 119894.0, 93086.0, 65860.0, 43190.0, 27601.0, 17217.0, 10762.0, 6602.0, 4207.0, 2543.0, 1591.0, 1021.0, 626.0, 400.0, 258.0, 187.0, 105.0, 70.0, 43.0, 36.0, 20.0, 11.0, 10.0, 11.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.46875, -10.1422119140625, -9.815673828125, -9.4891357421875, -9.16259765625, -8.8360595703125, -8.509521484375, -8.1829833984375, -7.8564453125, -7.5299072265625, -7.203369140625, -6.8768310546875, -6.55029296875, -6.2237548828125, -5.897216796875, -5.5706787109375, -5.244140625, -4.9176025390625, -4.591064453125, -4.2645263671875, -3.93798828125, -3.6114501953125, -3.284912109375, -2.9583740234375, -2.6318359375, -2.3052978515625, -1.978759765625, -1.6522216796875, -1.32568359375, -0.9991455078125, -0.672607421875, -0.3460693359375, -0.01953125, 0.3070068359375, 0.633544921875, 0.9600830078125, 1.28662109375, 1.6131591796875, 1.939697265625, 2.2662353515625, 2.5927734375, 2.9193115234375, 3.245849609375, 3.5723876953125, 3.89892578125, 4.2254638671875, 4.552001953125, 4.8785400390625, 5.205078125, 5.5316162109375, 5.858154296875, 6.1846923828125, 6.51123046875, 6.8377685546875, 7.164306640625, 7.4908447265625, 7.8173828125, 8.1439208984375, 8.470458984375, 8.7969970703125, 9.12353515625, 9.4500732421875, 9.776611328125, 10.1031494140625, 10.4296875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 3.0, 5.0, 7.0, 7.0, 7.0, 10.0, 14.0, 10.0, 8.0, 17.0, 28.0, 24.0, 37.0, 40.0, 36.0, 39.0, 36.0, 35.0, 43.0, 44.0, 36.0, 49.0, 50.0, 50.0, 38.0, 43.0, 28.0, 30.0, 30.0, 32.0, 25.0, 14.0, 22.0, 20.0, 14.0, 13.0, 9.0, 9.0, 8.0, 6.0, 5.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.35546875, -5.1781005859375, -5.000732421875, -4.8233642578125, -4.64599609375, -4.4686279296875, -4.291259765625, -4.1138916015625, -3.9365234375, -3.7591552734375, -3.581787109375, -3.4044189453125, -3.22705078125, -3.0496826171875, -2.872314453125, -2.6949462890625, -2.517578125, -2.3402099609375, -2.162841796875, -1.9854736328125, -1.80810546875, -1.6307373046875, -1.453369140625, -1.2760009765625, -1.0986328125, -0.9212646484375, -0.743896484375, -0.5665283203125, -0.38916015625, -0.2117919921875, -0.034423828125, 0.1429443359375, 0.3203125, 0.4976806640625, 0.675048828125, 0.8524169921875, 1.02978515625, 1.2071533203125, 1.384521484375, 1.5618896484375, 1.7392578125, 1.9166259765625, 2.093994140625, 2.2713623046875, 2.44873046875, 2.6260986328125, 2.803466796875, 2.9808349609375, 3.158203125, 3.3355712890625, 3.512939453125, 3.6903076171875, 3.86767578125, 4.0450439453125, 4.222412109375, 4.3997802734375, 4.5771484375, 4.7545166015625, 4.931884765625, 5.1092529296875, 5.28662109375, 5.4639892578125, 5.641357421875, 5.8187255859375, 5.99609375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 10.0, 6.0, 14.0, 10.0, 16.0, 21.0, 26.0, 48.0, 80.0, 103.0, 150.0, 225.0, 360.0, 504.0, 778.0, 1300.0, 2085.0, 3508.0, 6243.0, 10815.0, 20394.0, 37239.0, 66385.0, 112221.0, 165778.0, 192223.0, 165537.0, 112497.0, 66268.0, 37090.0, 20220.0, 11113.0, 6165.0, 3539.0, 2070.0, 1246.0, 775.0, 512.0, 315.0, 208.0, 147.0, 94.0, 63.0, 47.0, 27.0, 22.0, 23.0, 15.0, 8.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0], "bins": [-6.23046875, -6.04986572265625, -5.8692626953125, -5.68865966796875, -5.508056640625, -5.32745361328125, -5.1468505859375, -4.96624755859375, -4.78564453125, -4.60504150390625, -4.4244384765625, -4.24383544921875, -4.063232421875, -3.88262939453125, -3.7020263671875, -3.52142333984375, -3.3408203125, -3.16021728515625, -2.9796142578125, -2.79901123046875, -2.618408203125, -2.43780517578125, -2.2572021484375, -2.07659912109375, -1.89599609375, -1.71539306640625, -1.5347900390625, -1.35418701171875, -1.173583984375, -0.99298095703125, -0.8123779296875, -0.63177490234375, -0.451171875, -0.27056884765625, -0.0899658203125, 0.09063720703125, 0.271240234375, 0.45184326171875, 0.6324462890625, 0.81304931640625, 0.99365234375, 1.17425537109375, 1.3548583984375, 1.53546142578125, 1.716064453125, 1.89666748046875, 2.0772705078125, 2.25787353515625, 2.4384765625, 2.61907958984375, 2.7996826171875, 2.98028564453125, 3.160888671875, 3.34149169921875, 3.5220947265625, 3.70269775390625, 3.88330078125, 4.06390380859375, 4.2445068359375, 4.42510986328125, 4.605712890625, 4.78631591796875, 4.9669189453125, 5.14752197265625, 5.328125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 9.0, 8.0, 4.0, 8.0, 10.0, 19.0, 14.0, 25.0, 44.0, 42.0, 49.0, 56.0, 67.0, 65.0, 88.0, 70.0, 62.0, 59.0, 57.0, 48.0, 43.0, 42.0, 20.0, 24.0, 18.0, 18.0, 10.0, 5.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006918907165527344, -0.0006720125675201416, -0.0006521344184875488, -0.0006322562694549561, -0.0006123781204223633, -0.0005924999713897705, -0.0005726218223571777, -0.000552743673324585, -0.0005328655242919922, -0.0005129873752593994, -0.0004931092262268066, -0.00047323107719421387, -0.0004533529281616211, -0.0004334747791290283, -0.00041359663009643555, -0.0003937184810638428, -0.00037384033203125, -0.0003539621829986572, -0.00033408403396606445, -0.0003142058849334717, -0.0002943277359008789, -0.00027444958686828613, -0.00025457143783569336, -0.00023469328880310059, -0.0002148151397705078, -0.00019493699073791504, -0.00017505884170532227, -0.0001551806926727295, -0.00013530254364013672, -0.00011542439460754395, -9.554624557495117e-05, -7.56680965423584e-05, -5.5789947509765625e-05, -3.591179847717285e-05, -1.6033649444580078e-05, 3.844499588012695e-06, 2.372264862060547e-05, 4.360079765319824e-05, 6.347894668579102e-05, 8.335709571838379e-05, 0.00010323524475097656, 0.00012311339378356934, 0.0001429915428161621, 0.00016286969184875488, 0.00018274784088134766, 0.00020262598991394043, 0.0002225041389465332, 0.00024238228797912598, 0.00026226043701171875, 0.0002821385860443115, 0.0003020167350769043, 0.00032189488410949707, 0.00034177303314208984, 0.0003616511821746826, 0.0003815293312072754, 0.00040140748023986816, 0.00042128562927246094, 0.0004411637783050537, 0.0004610419273376465, 0.00048092007637023926, 0.000500798225402832, 0.0005206763744354248, 0.0005405545234680176, 0.0005604326725006104, 0.0005803108215332031]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 8.0, 4.0, 8.0, 18.0, 20.0, 29.0, 41.0, 83.0, 130.0, 142.0, 245.0, 341.0, 620.0, 939.0, 1552.0, 2508.0, 4238.0, 7322.0, 12581.0, 22236.0, 39696.0, 69184.0, 113847.0, 164196.0, 186134.0, 159360.0, 108949.0, 66204.0, 37799.0, 21000.0, 11887.0, 6825.0, 4002.0, 2391.0, 1454.0, 918.0, 565.0, 374.0, 230.0, 155.0, 106.0, 79.0, 39.0, 24.0, 23.0, 14.0, 15.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-5.625, -5.45684814453125, -5.2886962890625, -5.12054443359375, -4.952392578125, -4.78424072265625, -4.6160888671875, -4.44793701171875, -4.27978515625, -4.11163330078125, -3.9434814453125, -3.77532958984375, -3.607177734375, -3.43902587890625, -3.2708740234375, -3.10272216796875, -2.9345703125, -2.76641845703125, -2.5982666015625, -2.43011474609375, -2.261962890625, -2.09381103515625, -1.9256591796875, -1.75750732421875, -1.58935546875, -1.42120361328125, -1.2530517578125, -1.08489990234375, -0.916748046875, -0.74859619140625, -0.5804443359375, -0.41229248046875, -0.244140625, -0.07598876953125, 0.0921630859375, 0.26031494140625, 0.428466796875, 0.59661865234375, 0.7647705078125, 0.93292236328125, 1.10107421875, 1.26922607421875, 1.4373779296875, 1.60552978515625, 1.773681640625, 1.94183349609375, 2.1099853515625, 2.27813720703125, 2.4462890625, 2.61444091796875, 2.7825927734375, 2.95074462890625, 3.118896484375, 3.28704833984375, 3.4552001953125, 3.62335205078125, 3.79150390625, 3.95965576171875, 4.1278076171875, 4.29595947265625, 4.464111328125, 4.63226318359375, 4.8004150390625, 4.96856689453125, 5.13671875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 1.0, 4.0, 8.0, 13.0, 7.0, 13.0, 13.0, 17.0, 22.0, 27.0, 25.0, 31.0, 37.0, 42.0, 55.0, 64.0, 45.0, 73.0, 64.0, 64.0, 48.0, 55.0, 41.0, 40.0, 30.0, 48.0, 26.0, 15.0, 17.0, 10.0, 11.0, 6.0, 6.0, 6.0, 5.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4228515625, -1.374725341796875, -1.32659912109375, -1.278472900390625, -1.2303466796875, -1.182220458984375, -1.13409423828125, -1.085968017578125, -1.037841796875, -0.989715576171875, -0.94158935546875, -0.893463134765625, -0.8453369140625, -0.797210693359375, -0.74908447265625, -0.700958251953125, -0.65283203125, -0.604705810546875, -0.55657958984375, -0.508453369140625, -0.4603271484375, -0.412200927734375, -0.36407470703125, -0.315948486328125, -0.267822265625, -0.219696044921875, -0.17156982421875, -0.123443603515625, -0.0753173828125, -0.027191162109375, 0.02093505859375, 0.069061279296875, 0.1171875, 0.165313720703125, 0.21343994140625, 0.261566162109375, 0.3096923828125, 0.357818603515625, 0.40594482421875, 0.454071044921875, 0.502197265625, 0.550323486328125, 0.59844970703125, 0.646575927734375, 0.6947021484375, 0.742828369140625, 0.79095458984375, 0.839080810546875, 0.88720703125, 0.935333251953125, 0.98345947265625, 1.031585693359375, 1.0797119140625, 1.127838134765625, 1.17596435546875, 1.224090576171875, 1.272216796875, 1.320343017578125, 1.36846923828125, 1.416595458984375, 1.4647216796875, 1.512847900390625, 1.56097412109375, 1.609100341796875, 1.6572265625]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 3.0, 3.0, 5.0, 8.0, 7.0, 12.0, 12.0, 23.0, 25.0, 28.0, 26.0, 48.0, 44.0, 53.0, 57.0, 75.0, 63.0, 72.0, 77.0, 64.0, 60.0, 40.0, 32.0, 26.0, 27.0, 26.0, 14.0, 12.0, 11.0, 8.0, 14.0, 1.0, 3.0, 7.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.33849334716797, -17.729873657226562, -17.121252059936523, -16.512632369995117, -15.904010772705078, -15.295391082763672, -14.68677043914795, -14.078149795532227, -13.469529151916504, -12.860908508300781, -12.252287864685059, -11.643667221069336, -11.03504753112793, -10.42642593383789, -9.817806243896484, -9.209185600280762, -8.600564956665039, -7.991944313049316, -7.383323669433594, -6.774703502655029, -6.166082859039307, -5.557462215423584, -4.9488420486450195, -4.340221405029297, -3.731600761413574, -3.1229801177978516, -2.514359712600708, -1.905739188194275, -1.2971186637878418, -0.6884980201721191, -0.07987761497497559, 0.528742790222168, 1.1373653411865234, 1.7459858655929565, 2.3546063899993896, 2.963226795196533, 3.571847438812256, 4.1804680824279785, 4.789088249206543, 5.397708892822266, 6.006329536437988, 6.614950180053711, 7.223570823669434, 7.832190990447998, 8.440811157226562, 9.049432754516602, 9.658052444458008, 10.26667308807373, 10.875293731689453, 11.483914375305176, 12.092535018920898, 12.701155662536621, 13.309776306152344, 13.91839599609375, 14.527016639709473, 15.135637283325195, 15.744257926940918, 16.35287857055664, 16.961498260498047, 17.570119857788086, 18.178739547729492, 18.78736114501953, 19.395980834960938, 20.004600524902344, 20.613222122192383]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 5.0, 13.0, 12.0, 16.0, 13.0, 18.0, 28.0, 29.0, 23.0, 36.0, 31.0, 41.0, 51.0, 40.0, 52.0, 43.0, 54.0, 36.0, 45.0, 43.0, 50.0, 41.0, 36.0, 23.0, 22.0, 22.0, 20.0, 25.0, 18.0, 21.0, 11.0, 14.0, 7.0, 13.0, 10.0, 7.0, 7.0, 3.0, 4.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.433783531188965, -8.144537925720215, -7.855292797088623, -7.566047668457031, -7.276802062988281, -6.987556457519531, -6.6983113288879395, -6.409066200256348, -6.119820594787598, -5.830574989318848, -5.541329860687256, -5.252084732055664, -4.962839126586914, -4.673593521118164, -4.384348392486572, -4.0951032638549805, -3.8058576583862305, -3.5166122913360596, -3.2273669242858887, -2.9381215572357178, -2.648876190185547, -2.359630823135376, -2.070385456085205, -1.7811400890350342, -1.4918947219848633, -1.2026493549346924, -0.9134039878845215, -0.6241586208343506, -0.3349132537841797, -0.04566788673400879, 0.2435774803161621, 0.532822847366333, 0.8220691680908203, 1.1113145351409912, 1.400559902191162, 1.689805269241333, 1.979050636291504, 2.268296003341675, 2.5575413703918457, 2.8467867374420166, 3.1360321044921875, 3.4252774715423584, 3.7145228385925293, 4.003767967224121, 4.293013572692871, 4.582259178161621, 4.871504306793213, 5.160749435424805, 5.449995040893555, 5.739240646362305, 6.0284857749938965, 6.317730903625488, 6.606976509094238, 6.896222114562988, 7.18546724319458, 7.474712371826172, 7.763957977294922, 8.053203582763672, 8.342449188232422, 8.631693840026855, 8.920939445495605, 9.210185050964355, 9.499429702758789, 9.788675308227539, 10.077920913696289]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 18.0, 19.0, 27.0, 49.0, 96.0, 138.0, 215.0, 333.0, 599.0, 1103.0, 2050.0, 4011.0, 8126.0, 17486.0, 39255.0, 95415.0, 249939.0, 696532.0, 1447838.0, 1024094.0, 368907.0, 135293.0, 54827.0, 24062.0, 11402.0, 5603.0, 2924.0, 1630.0, 882.0, 535.0, 291.0, 188.0, 117.0, 84.0, 58.0, 43.0, 29.0, 19.0, 12.0, 9.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.21875, -17.536376953125, -16.85400390625, -16.171630859375, -15.4892578125, -14.806884765625, -14.12451171875, -13.442138671875, -12.759765625, -12.077392578125, -11.39501953125, -10.712646484375, -10.0302734375, -9.347900390625, -8.66552734375, -7.983154296875, -7.30078125, -6.618408203125, -5.93603515625, -5.253662109375, -4.5712890625, -3.888916015625, -3.20654296875, -2.524169921875, -1.841796875, -1.159423828125, -0.47705078125, 0.205322265625, 0.8876953125, 1.570068359375, 2.25244140625, 2.934814453125, 3.6171875, 4.299560546875, 4.98193359375, 5.664306640625, 6.3466796875, 7.029052734375, 7.71142578125, 8.393798828125, 9.076171875, 9.758544921875, 10.44091796875, 11.123291015625, 11.8056640625, 12.488037109375, 13.17041015625, 13.852783203125, 14.53515625, 15.217529296875, 15.89990234375, 16.582275390625, 17.2646484375, 17.947021484375, 18.62939453125, 19.311767578125, 19.994140625, 20.676513671875, 21.35888671875, 22.041259765625, 22.7236328125, 23.406005859375, 24.08837890625, 24.770751953125, 25.453125]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 9.0, 12.0, 12.0, 5.0, 10.0, 15.0, 21.0, 23.0, 30.0, 37.0, 36.0, 41.0, 46.0, 54.0, 43.0, 52.0, 37.0, 38.0, 53.0, 45.0, 56.0, 39.0, 38.0, 35.0, 29.0, 29.0, 26.0, 27.0, 18.0, 11.0, 20.0, 9.0, 6.0, 15.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.76953125, -6.52386474609375, -6.2781982421875, -6.03253173828125, -5.786865234375, -5.54119873046875, -5.2955322265625, -5.04986572265625, -4.80419921875, -4.55853271484375, -4.3128662109375, -4.06719970703125, -3.821533203125, -3.57586669921875, -3.3302001953125, -3.08453369140625, -2.8388671875, -2.59320068359375, -2.3475341796875, -2.10186767578125, -1.856201171875, -1.61053466796875, -1.3648681640625, -1.11920166015625, -0.87353515625, -0.62786865234375, -0.3822021484375, -0.13653564453125, 0.109130859375, 0.35479736328125, 0.6004638671875, 0.84613037109375, 1.091796875, 1.33746337890625, 1.5831298828125, 1.82879638671875, 2.074462890625, 2.32012939453125, 2.5657958984375, 2.81146240234375, 3.05712890625, 3.30279541015625, 3.5484619140625, 3.79412841796875, 4.039794921875, 4.28546142578125, 4.5311279296875, 4.77679443359375, 5.0224609375, 5.26812744140625, 5.5137939453125, 5.75946044921875, 6.005126953125, 6.25079345703125, 6.4964599609375, 6.74212646484375, 6.98779296875, 7.23345947265625, 7.4791259765625, 7.72479248046875, 7.970458984375, 8.21612548828125, 8.4617919921875, 8.70745849609375, 8.953125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 2.0, 5.0, 7.0, 14.0, 24.0, 32.0, 46.0, 56.0, 93.0, 161.0, 252.0, 447.0, 723.0, 1250.0, 2294.0, 4227.0, 8081.0, 15567.0, 32151.0, 66691.0, 144174.0, 317426.0, 678610.0, 1111245.0, 928393.0, 473193.0, 216063.0, 98877.0, 46489.0, 22643.0, 11554.0, 6057.0, 3197.0, 1752.0, 998.0, 576.0, 338.0, 221.0, 132.0, 72.0, 53.0, 35.0, 16.0, 17.0, 11.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.859375, -20.241455078125, -19.62353515625, -19.005615234375, -18.3876953125, -17.769775390625, -17.15185546875, -16.533935546875, -15.916015625, -15.298095703125, -14.68017578125, -14.062255859375, -13.4443359375, -12.826416015625, -12.20849609375, -11.590576171875, -10.97265625, -10.354736328125, -9.73681640625, -9.118896484375, -8.5009765625, -7.883056640625, -7.26513671875, -6.647216796875, -6.029296875, -5.411376953125, -4.79345703125, -4.175537109375, -3.5576171875, -2.939697265625, -2.32177734375, -1.703857421875, -1.0859375, -0.468017578125, 0.14990234375, 0.767822265625, 1.3857421875, 2.003662109375, 2.62158203125, 3.239501953125, 3.857421875, 4.475341796875, 5.09326171875, 5.711181640625, 6.3291015625, 6.947021484375, 7.56494140625, 8.182861328125, 8.80078125, 9.418701171875, 10.03662109375, 10.654541015625, 11.2724609375, 11.890380859375, 12.50830078125, 13.126220703125, 13.744140625, 14.362060546875, 14.97998046875, 15.597900390625, 16.2158203125, 16.833740234375, 17.45166015625, 18.069580078125, 18.6875]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 8.0, 7.0, 12.0, 15.0, 28.0, 36.0, 60.0, 64.0, 94.0, 132.0, 179.0, 239.0, 300.0, 323.0, 384.0, 397.0, 315.0, 327.0, 276.0, 215.0, 174.0, 144.0, 97.0, 78.0, 48.0, 33.0, 34.0, 20.0, 10.0, 8.0, 4.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.1171875, -7.91162109375, -7.7060546875, -7.50048828125, -7.294921875, -7.08935546875, -6.8837890625, -6.67822265625, -6.47265625, -6.26708984375, -6.0615234375, -5.85595703125, -5.650390625, -5.44482421875, -5.2392578125, -5.03369140625, -4.828125, -4.62255859375, -4.4169921875, -4.21142578125, -4.005859375, -3.80029296875, -3.5947265625, -3.38916015625, -3.18359375, -2.97802734375, -2.7724609375, -2.56689453125, -2.361328125, -2.15576171875, -1.9501953125, -1.74462890625, -1.5390625, -1.33349609375, -1.1279296875, -0.92236328125, -0.716796875, -0.51123046875, -0.3056640625, -0.10009765625, 0.10546875, 0.31103515625, 0.5166015625, 0.72216796875, 0.927734375, 1.13330078125, 1.3388671875, 1.54443359375, 1.75, 1.95556640625, 2.1611328125, 2.36669921875, 2.572265625, 2.77783203125, 2.9833984375, 3.18896484375, 3.39453125, 3.60009765625, 3.8056640625, 4.01123046875, 4.216796875, 4.42236328125, 4.6279296875, 4.83349609375, 5.0390625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 4.0, 5.0, 8.0, 5.0, 10.0, 14.0, 18.0, 21.0, 26.0, 28.0, 48.0, 52.0, 48.0, 75.0, 81.0, 68.0, 88.0, 65.0, 61.0, 58.0, 49.0, 33.0, 40.0, 20.0, 15.0, 17.0, 7.0, 12.0, 8.0, 7.0, 4.0, 0.0, 2.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.16599464416504, -20.458349227905273, -19.750701904296875, -19.04305648803711, -18.335411071777344, -17.627765655517578, -16.92011833190918, -16.212472915649414, -15.504826545715332, -14.79718017578125, -14.089534759521484, -13.381888389587402, -12.67424201965332, -11.966596603393555, -11.258950233459473, -10.55130386352539, -9.843658447265625, -9.136012077331543, -8.428366661071777, -7.720720291137695, -7.0130743980407715, -6.305428504943848, -5.597782135009766, -4.890136241912842, -4.182490348815918, -3.474844455718994, -2.767198324203491, -2.0595521926879883, -1.3519062995910645, -0.6442604064941406, 0.0633859634399414, 0.7710318565368652, 1.4786758422851562, 2.18632173538208, 2.893967866897583, 3.601613998413086, 4.30925989151001, 5.016905784606934, 5.724552154541016, 6.4321980476379395, 7.139843940734863, 7.847489833831787, 8.555135726928711, 9.262782096862793, 9.970428466796875, 10.67807388305664, 11.385720252990723, 12.093366622924805, 12.80101203918457, 13.508658409118652, 14.216303825378418, 14.9239501953125, 15.631595611572266, 16.33924102783203, 17.04688835144043, 17.754533767700195, 18.462181091308594, 19.16982650756836, 19.877473831176758, 20.585119247436523, 21.29276466369629, 22.000411987304688, 22.708057403564453, 23.41570281982422, 24.123348236083984]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 7.0, 5.0, 7.0, 9.0, 14.0, 22.0, 23.0, 17.0, 28.0, 32.0, 31.0, 37.0, 26.0, 48.0, 37.0, 35.0, 46.0, 32.0, 46.0, 44.0, 46.0, 45.0, 49.0, 35.0, 35.0, 31.0, 35.0, 24.0, 22.0, 28.0, 18.0, 16.0, 9.0, 15.0, 3.0, 9.0, 5.0, 9.0, 4.0, 5.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.962663173675537, -7.675048351287842, -7.387433052062988, -7.099818229675293, -6.812203407287598, -6.524588584899902, -6.236973285675049, -5.9493584632873535, -5.6617431640625, -5.374128341674805, -5.086513042449951, -4.798898220062256, -4.5112833976745605, -4.223668098449707, -3.9360532760620117, -3.6484384536743164, -3.360823631286621, -3.0732085704803467, -2.7855937480926514, -2.497978687286377, -2.2103638648986816, -1.9227488040924072, -1.6351337432861328, -1.3475189208984375, -1.059903860092163, -0.7722889184951782, -0.4846739172935486, -0.19705891609191895, 0.09055602550506592, 0.3781709671020508, 0.6657860279083252, 0.9534008502960205, 1.2410163879394531, 1.528631329536438, 1.8162462711334229, 2.1038613319396973, 2.3914761543273926, 2.679091215133667, 2.9667062759399414, 3.2543210983276367, 3.541936159133911, 3.8295512199401855, 4.117166042327881, 4.404781341552734, 4.69239616394043, 4.980010986328125, 5.26762580871582, 5.555240631103516, 5.842855930328369, 6.1304707527160645, 6.418086051940918, 6.705700874328613, 6.993315696716309, 7.280930519104004, 7.568545818328857, 7.856160640716553, 8.143775939941406, 8.431390762329102, 8.719005584716797, 9.006620407104492, 9.294236183166504, 9.5818510055542, 9.869465827941895, 10.15708065032959, 10.444695472717285]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 1.0, 6.0, 4.0, 6.0, 10.0, 18.0, 24.0, 38.0, 35.0, 51.0, 76.0, 101.0, 145.0, 205.0, 267.0, 391.0, 601.0, 868.0, 1552.0, 2615.0, 4570.0, 8702.0, 17252.0, 37218.0, 81199.0, 164321.0, 251651.0, 227007.0, 130291.0, 61070.0, 28257.0, 13407.0, 6895.0, 3723.0, 2100.0, 1288.0, 840.0, 546.0, 380.0, 225.0, 181.0, 121.0, 78.0, 66.0, 44.0, 39.0, 18.0, 13.0, 14.0, 7.0, 4.0, 10.0, 4.0, 6.0, 3.0, 0.0, 1.0], "bins": [-14.578125, -14.1470947265625, -13.716064453125, -13.2850341796875, -12.85400390625, -12.4229736328125, -11.991943359375, -11.5609130859375, -11.1298828125, -10.6988525390625, -10.267822265625, -9.8367919921875, -9.40576171875, -8.9747314453125, -8.543701171875, -8.1126708984375, -7.681640625, -7.2506103515625, -6.819580078125, -6.3885498046875, -5.95751953125, -5.5264892578125, -5.095458984375, -4.6644287109375, -4.2333984375, -3.8023681640625, -3.371337890625, -2.9403076171875, -2.50927734375, -2.0782470703125, -1.647216796875, -1.2161865234375, -0.78515625, -0.3541259765625, 0.076904296875, 0.5079345703125, 0.93896484375, 1.3699951171875, 1.801025390625, 2.2320556640625, 2.6630859375, 3.0941162109375, 3.525146484375, 3.9561767578125, 4.38720703125, 4.8182373046875, 5.249267578125, 5.6802978515625, 6.111328125, 6.5423583984375, 6.973388671875, 7.4044189453125, 7.83544921875, 8.2664794921875, 8.697509765625, 9.1285400390625, 9.5595703125, 9.9906005859375, 10.421630859375, 10.8526611328125, 11.28369140625, 11.7147216796875, 12.145751953125, 12.5767822265625, 13.0078125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 4.0, 5.0, 7.0, 3.0, 5.0, 8.0, 10.0, 11.0, 20.0, 19.0, 17.0, 16.0, 25.0, 25.0, 24.0, 33.0, 26.0, 35.0, 34.0, 37.0, 36.0, 37.0, 35.0, 37.0, 42.0, 40.0, 47.0, 44.0, 30.0, 34.0, 32.0, 29.0, 24.0, 27.0, 20.0, 12.0, 19.0, 15.0, 11.0, 11.0, 8.0, 7.0, 7.0, 8.0, 7.0, 3.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-8.5390625, -8.2655029296875, -7.991943359375, -7.7183837890625, -7.44482421875, -7.1712646484375, -6.897705078125, -6.6241455078125, -6.3505859375, -6.0770263671875, -5.803466796875, -5.5299072265625, -5.25634765625, -4.9827880859375, -4.709228515625, -4.4356689453125, -4.162109375, -3.8885498046875, -3.614990234375, -3.3414306640625, -3.06787109375, -2.7943115234375, -2.520751953125, -2.2471923828125, -1.9736328125, -1.7000732421875, -1.426513671875, -1.1529541015625, -0.87939453125, -0.6058349609375, -0.332275390625, -0.0587158203125, 0.21484375, 0.4884033203125, 0.761962890625, 1.0355224609375, 1.30908203125, 1.5826416015625, 1.856201171875, 2.1297607421875, 2.4033203125, 2.6768798828125, 2.950439453125, 3.2239990234375, 3.49755859375, 3.7711181640625, 4.044677734375, 4.3182373046875, 4.591796875, 4.8653564453125, 5.138916015625, 5.4124755859375, 5.68603515625, 5.9595947265625, 6.233154296875, 6.5067138671875, 6.7802734375, 7.0538330078125, 7.327392578125, 7.6009521484375, 7.87451171875, 8.1480712890625, 8.421630859375, 8.6951904296875, 8.96875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 4.0, 9.0, 18.0, 17.0, 23.0, 39.0, 31.0, 56.0, 79.0, 106.0, 172.0, 209.0, 298.0, 419.0, 690.0, 1065.0, 1839.0, 3412.0, 7570.0, 19542.0, 59221.0, 191086.0, 404617.0, 238431.0, 76038.0, 24595.0, 9176.0, 4168.0, 2101.0, 1271.0, 717.0, 472.0, 312.0, 215.0, 139.0, 110.0, 67.0, 55.0, 48.0, 35.0, 27.0, 12.0, 7.0, 9.0, 9.0, 4.0, 7.0, 1.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.84375, -20.1396484375, -19.435546875, -18.7314453125, -18.02734375, -17.3232421875, -16.619140625, -15.9150390625, -15.2109375, -14.5068359375, -13.802734375, -13.0986328125, -12.39453125, -11.6904296875, -10.986328125, -10.2822265625, -9.578125, -8.8740234375, -8.169921875, -7.4658203125, -6.76171875, -6.0576171875, -5.353515625, -4.6494140625, -3.9453125, -3.2412109375, -2.537109375, -1.8330078125, -1.12890625, -0.4248046875, 0.279296875, 0.9833984375, 1.6875, 2.3916015625, 3.095703125, 3.7998046875, 4.50390625, 5.2080078125, 5.912109375, 6.6162109375, 7.3203125, 8.0244140625, 8.728515625, 9.4326171875, 10.13671875, 10.8408203125, 11.544921875, 12.2490234375, 12.953125, 13.6572265625, 14.361328125, 15.0654296875, 15.76953125, 16.4736328125, 17.177734375, 17.8818359375, 18.5859375, 19.2900390625, 19.994140625, 20.6982421875, 21.40234375, 22.1064453125, 22.810546875, 23.5146484375, 24.21875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 2.0, 4.0, 11.0, 8.0, 11.0, 15.0, 13.0, 12.0, 25.0, 24.0, 29.0, 37.0, 37.0, 41.0, 42.0, 43.0, 38.0, 36.0, 47.0, 47.0, 39.0, 42.0, 40.0, 49.0, 48.0, 25.0, 31.0, 25.0, 28.0, 23.0, 16.0, 16.0, 16.0, 16.0, 15.0, 12.0, 5.0, 4.0, 4.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.5859375, -5.40032958984375, -5.2147216796875, -5.02911376953125, -4.843505859375, -4.65789794921875, -4.4722900390625, -4.28668212890625, -4.10107421875, -3.91546630859375, -3.7298583984375, -3.54425048828125, -3.358642578125, -3.17303466796875, -2.9874267578125, -2.80181884765625, -2.6162109375, -2.43060302734375, -2.2449951171875, -2.05938720703125, -1.873779296875, -1.68817138671875, -1.5025634765625, -1.31695556640625, -1.13134765625, -0.94573974609375, -0.7601318359375, -0.57452392578125, -0.388916015625, -0.20330810546875, -0.0177001953125, 0.16790771484375, 0.353515625, 0.53912353515625, 0.7247314453125, 0.91033935546875, 1.095947265625, 1.28155517578125, 1.4671630859375, 1.65277099609375, 1.83837890625, 2.02398681640625, 2.2095947265625, 2.39520263671875, 2.580810546875, 2.76641845703125, 2.9520263671875, 3.13763427734375, 3.3232421875, 3.50885009765625, 3.6944580078125, 3.88006591796875, 4.065673828125, 4.25128173828125, 4.4368896484375, 4.62249755859375, 4.80810546875, 4.99371337890625, 5.1793212890625, 5.36492919921875, 5.550537109375, 5.73614501953125, 5.9217529296875, 6.10736083984375, 6.29296875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 2.0, 7.0, 7.0, 22.0, 18.0, 20.0, 38.0, 45.0, 70.0, 83.0, 120.0, 166.0, 227.0, 266.0, 397.0, 549.0, 797.0, 1115.0, 1570.0, 2308.0, 3639.0, 6298.0, 13909.0, 48610.0, 243899.0, 528143.0, 139653.0, 30719.0, 10421.0, 5185.0, 3069.0, 2059.0, 1429.0, 1043.0, 730.0, 536.0, 362.0, 301.0, 189.0, 140.0, 111.0, 81.0, 68.0, 38.0, 29.0, 23.0, 13.0, 11.0, 6.0, 6.0, 6.0, 2.0, 3.0, 2.0], "bins": [-17.140625, -16.655517578125, -16.17041015625, -15.685302734375, -15.2001953125, -14.715087890625, -14.22998046875, -13.744873046875, -13.259765625, -12.774658203125, -12.28955078125, -11.804443359375, -11.3193359375, -10.834228515625, -10.34912109375, -9.864013671875, -9.37890625, -8.893798828125, -8.40869140625, -7.923583984375, -7.4384765625, -6.953369140625, -6.46826171875, -5.983154296875, -5.498046875, -5.012939453125, -4.52783203125, -4.042724609375, -3.5576171875, -3.072509765625, -2.58740234375, -2.102294921875, -1.6171875, -1.132080078125, -0.64697265625, -0.161865234375, 0.3232421875, 0.808349609375, 1.29345703125, 1.778564453125, 2.263671875, 2.748779296875, 3.23388671875, 3.718994140625, 4.2041015625, 4.689208984375, 5.17431640625, 5.659423828125, 6.14453125, 6.629638671875, 7.11474609375, 7.599853515625, 8.0849609375, 8.570068359375, 9.05517578125, 9.540283203125, 10.025390625, 10.510498046875, 10.99560546875, 11.480712890625, 11.9658203125, 12.450927734375, 12.93603515625, 13.421142578125, 13.90625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 4.0, 9.0, 15.0, 33.0, 49.0, 119.0, 195.0, 243.0, 162.0, 78.0, 41.0, 18.0, 12.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.00164794921875, -0.0016115084290504456, -0.0015750676393508911, -0.0015386268496513367, -0.0015021860599517822, -0.0014657452702522278, -0.0014293044805526733, -0.001392863690853119, -0.0013564229011535645, -0.00131998211145401, -0.0012835413217544556, -0.0012471005320549011, -0.0012106597423553467, -0.0011742189526557922, -0.0011377781629562378, -0.0011013373732566833, -0.001064896583557129, -0.0010284557938575745, -0.00099201500415802, -0.0009555742144584656, -0.0009191334247589111, -0.0008826926350593567, -0.0008462518453598022, -0.0008098110556602478, -0.0007733702659606934, -0.0007369294762611389, -0.0007004886865615845, -0.00066404789686203, -0.0006276071071624756, -0.0005911663174629211, -0.0005547255277633667, -0.0005182847380638123, -0.0004818439483642578, -0.00044540315866470337, -0.0004089623689651489, -0.0003725215792655945, -0.00033608078956604004, -0.0002996399998664856, -0.00026319921016693115, -0.0002267584204673767, -0.00019031763076782227, -0.00015387684106826782, -0.00011743605136871338, -8.099526166915894e-05, -4.455447196960449e-05, -8.113682270050049e-06, 2.8327107429504395e-05, 6.476789712905884e-05, 0.00010120868682861328, 0.00013764947652816772, 0.00017409026622772217, 0.0002105310559272766, 0.00024697184562683105, 0.0002834126353263855, 0.00031985342502593994, 0.0003562942147254944, 0.00039273500442504883, 0.00042917579412460327, 0.0004656165838241577, 0.0005020573735237122, 0.0005384981632232666, 0.000574938952922821, 0.0006113797426223755, 0.0006478205323219299, 0.0006842613220214844]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 7.0, 11.0, 9.0, 22.0, 19.0, 41.0, 46.0, 66.0, 96.0, 126.0, 164.0, 177.0, 284.0, 353.0, 448.0, 617.0, 867.0, 1123.0, 1411.0, 1849.0, 2648.0, 3688.0, 6422.0, 19218.0, 112551.0, 505271.0, 313304.0, 49546.0, 11120.0, 4871.0, 3067.0, 2219.0, 1654.0, 1254.0, 974.0, 734.0, 550.0, 427.0, 344.0, 272.0, 174.0, 143.0, 81.0, 79.0, 58.0, 34.0, 30.0, 24.0, 16.0, 14.0, 10.0, 6.0, 10.0, 3.0, 2.0, 0.0, 1.0, 5.0], "bins": [-16.171875, -15.6630859375, -15.154296875, -14.6455078125, -14.13671875, -13.6279296875, -13.119140625, -12.6103515625, -12.1015625, -11.5927734375, -11.083984375, -10.5751953125, -10.06640625, -9.5576171875, -9.048828125, -8.5400390625, -8.03125, -7.5224609375, -7.013671875, -6.5048828125, -5.99609375, -5.4873046875, -4.978515625, -4.4697265625, -3.9609375, -3.4521484375, -2.943359375, -2.4345703125, -1.92578125, -1.4169921875, -0.908203125, -0.3994140625, 0.109375, 0.6181640625, 1.126953125, 1.6357421875, 2.14453125, 2.6533203125, 3.162109375, 3.6708984375, 4.1796875, 4.6884765625, 5.197265625, 5.7060546875, 6.21484375, 6.7236328125, 7.232421875, 7.7412109375, 8.25, 8.7587890625, 9.267578125, 9.7763671875, 10.28515625, 10.7939453125, 11.302734375, 11.8115234375, 12.3203125, 12.8291015625, 13.337890625, 13.8466796875, 14.35546875, 14.8642578125, 15.373046875, 15.8818359375, 16.390625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 3.0, 7.0, 10.0, 23.0, 55.0, 97.0, 144.0, 189.0, 195.0, 120.0, 71.0, 31.0, 19.0, 9.0, 3.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7109375, -3.57171630859375, -3.4324951171875, -3.29327392578125, -3.154052734375, -3.01483154296875, -2.8756103515625, -2.73638916015625, -2.59716796875, -2.45794677734375, -2.3187255859375, -2.17950439453125, -2.040283203125, -1.90106201171875, -1.7618408203125, -1.62261962890625, -1.4833984375, -1.34417724609375, -1.2049560546875, -1.06573486328125, -0.926513671875, -0.78729248046875, -0.6480712890625, -0.50885009765625, -0.36962890625, -0.23040771484375, -0.0911865234375, 0.04803466796875, 0.187255859375, 0.32647705078125, 0.4656982421875, 0.60491943359375, 0.744140625, 0.88336181640625, 1.0225830078125, 1.16180419921875, 1.301025390625, 1.44024658203125, 1.5794677734375, 1.71868896484375, 1.85791015625, 1.99713134765625, 2.1363525390625, 2.27557373046875, 2.414794921875, 2.55401611328125, 2.6932373046875, 2.83245849609375, 2.9716796875, 3.11090087890625, 3.2501220703125, 3.38934326171875, 3.528564453125, 3.66778564453125, 3.8070068359375, 3.94622802734375, 4.08544921875, 4.22467041015625, 4.3638916015625, 4.50311279296875, 4.642333984375, 4.78155517578125, 4.9207763671875, 5.05999755859375, 5.19921875]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 6.0, 6.0, 4.0, 3.0, 15.0, 19.0, 18.0, 23.0, 22.0, 38.0, 30.0, 47.0, 70.0, 69.0, 72.0, 73.0, 86.0, 66.0, 59.0, 63.0, 52.0, 32.0, 26.0, 21.0, 18.0, 15.0, 14.0, 4.0, 8.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 7.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.578258514404297, -19.88836097717285, -19.198463439941406, -18.50856590270996, -17.818668365478516, -17.12877082824707, -16.438873291015625, -15.74897575378418, -15.059078216552734, -14.369180679321289, -13.679283142089844, -12.989385604858398, -12.299488067626953, -11.609590530395508, -10.919692993164062, -10.229795455932617, -9.539897918701172, -8.850000381469727, -8.160102844238281, -7.470205307006836, -6.780307769775391, -6.090410232543945, -5.4005126953125, -4.710615158081055, -4.020717620849609, -3.330820083618164, -2.6409225463867188, -1.9510250091552734, -1.2611274719238281, -0.5712299346923828, 0.1186676025390625, 0.8085651397705078, 1.4984607696533203, 2.1883583068847656, 2.878255844116211, 3.5681533813476562, 4.258050918579102, 4.947948455810547, 5.637845993041992, 6.3277435302734375, 7.017641067504883, 7.707538604736328, 8.397436141967773, 9.087333679199219, 9.777231216430664, 10.46712875366211, 11.157026290893555, 11.846923828125, 12.536821365356445, 13.22671890258789, 13.916616439819336, 14.606513977050781, 15.296411514282227, 15.986309051513672, 16.676206588745117, 17.366104125976562, 18.056001663208008, 18.745899200439453, 19.4357967376709, 20.125694274902344, 20.81559181213379, 21.505489349365234, 22.19538688659668, 22.885284423828125, 23.57518196105957]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 6.0, 6.0, 7.0, 5.0, 10.0, 17.0, 11.0, 22.0, 31.0, 19.0, 37.0, 31.0, 33.0, 26.0, 43.0, 43.0, 41.0, 47.0, 41.0, 40.0, 52.0, 44.0, 35.0, 52.0, 40.0, 33.0, 31.0, 31.0, 28.0, 25.0, 21.0, 15.0, 18.0, 12.0, 5.0, 12.0, 8.0, 5.0, 4.0, 3.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.086185455322266, -7.793124675750732, -7.500064373016357, -7.207003593444824, -6.913943290710449, -6.620882511138916, -6.327821731567383, -6.034761428833008, -5.741701126098633, -5.4486403465271, -5.155580043792725, -4.862519264221191, -4.569458961486816, -4.276398181915283, -3.983337640762329, -3.690277099609375, -3.397216320037842, -3.1041557788848877, -2.8110952377319336, -2.5180344581604004, -2.2249741554260254, -1.9319134950637817, -1.638852834701538, -1.345792293548584, -1.0527317523956299, -0.7596712112426758, -0.4666106104850769, -0.17355000972747803, 0.11951053142547607, 0.4125710725784302, 0.7056317329406738, 0.9986922740936279, 1.291752815246582, 1.5848133563995361, 1.8778738975524902, 2.1709346771240234, 2.4639949798583984, 2.7570557594299316, 3.0501163005828857, 3.34317684173584, 3.636237382888794, 3.929297924041748, 4.222358703613281, 4.515419006347656, 4.8084797859191895, 5.1015400886535645, 5.394600868225098, 5.687661170959473, 5.980721950531006, 6.273782730102539, 6.566843032836914, 6.859903812408447, 7.152964115142822, 7.4460248947143555, 7.7390851974487305, 8.032146453857422, 8.325206756591797, 8.618267059326172, 8.911328315734863, 9.204388618469238, 9.497448921203613, 9.790509223937988, 10.08357048034668, 10.376630783081055, 10.66969108581543]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 7.0, 5.0, 18.0, 8.0, 28.0, 34.0, 58.0, 79.0, 133.0, 186.0, 339.0, 510.0, 825.0, 1373.0, 2397.0, 4175.0, 7255.0, 13002.0, 23031.0, 40163.0, 68985.0, 108627.0, 149823.0, 172127.0, 157698.0, 117596.0, 75396.0, 44996.0, 25755.0, 14300.0, 8271.0, 4616.0, 2678.0, 1574.0, 942.0, 565.0, 328.0, 245.0, 142.0, 106.0, 62.0, 28.0, 24.0, 12.0, 10.0, 11.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.6171875, -13.199462890625, -12.78173828125, -12.364013671875, -11.9462890625, -11.528564453125, -11.11083984375, -10.693115234375, -10.275390625, -9.857666015625, -9.43994140625, -9.022216796875, -8.6044921875, -8.186767578125, -7.76904296875, -7.351318359375, -6.93359375, -6.515869140625, -6.09814453125, -5.680419921875, -5.2626953125, -4.844970703125, -4.42724609375, -4.009521484375, -3.591796875, -3.174072265625, -2.75634765625, -2.338623046875, -1.9208984375, -1.503173828125, -1.08544921875, -0.667724609375, -0.25, 0.167724609375, 0.58544921875, 1.003173828125, 1.4208984375, 1.838623046875, 2.25634765625, 2.674072265625, 3.091796875, 3.509521484375, 3.92724609375, 4.344970703125, 4.7626953125, 5.180419921875, 5.59814453125, 6.015869140625, 6.43359375, 6.851318359375, 7.26904296875, 7.686767578125, 8.1044921875, 8.522216796875, 8.93994140625, 9.357666015625, 9.775390625, 10.193115234375, 10.61083984375, 11.028564453125, 11.4462890625, 11.864013671875, 12.28173828125, 12.699462890625, 13.1171875]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 8.0, 17.0, 11.0, 19.0, 15.0, 19.0, 20.0, 35.0, 25.0, 27.0, 38.0, 37.0, 43.0, 52.0, 52.0, 55.0, 45.0, 46.0, 43.0, 50.0, 50.0, 37.0, 34.0, 36.0, 28.0, 17.0, 27.0, 9.0, 23.0, 12.0, 24.0, 11.0, 6.0, 8.0, 4.0, 1.0, 3.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9375, -9.5906982421875, -9.243896484375, -8.8970947265625, -8.55029296875, -8.2034912109375, -7.856689453125, -7.5098876953125, -7.1630859375, -6.8162841796875, -6.469482421875, -6.1226806640625, -5.77587890625, -5.4290771484375, -5.082275390625, -4.7354736328125, -4.388671875, -4.0418701171875, -3.695068359375, -3.3482666015625, -3.00146484375, -2.6546630859375, -2.307861328125, -1.9610595703125, -1.6142578125, -1.2674560546875, -0.920654296875, -0.5738525390625, -0.22705078125, 0.1197509765625, 0.466552734375, 0.8133544921875, 1.16015625, 1.5069580078125, 1.853759765625, 2.2005615234375, 2.54736328125, 2.8941650390625, 3.240966796875, 3.5877685546875, 3.9345703125, 4.2813720703125, 4.628173828125, 4.9749755859375, 5.32177734375, 5.6685791015625, 6.015380859375, 6.3621826171875, 6.708984375, 7.0557861328125, 7.402587890625, 7.7493896484375, 8.09619140625, 8.4429931640625, 8.789794921875, 9.1365966796875, 9.4833984375, 9.8302001953125, 10.177001953125, 10.5238037109375, 10.87060546875, 11.2174072265625, 11.564208984375, 11.9110107421875, 12.2578125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 5.0, 10.0, 7.0, 23.0, 28.0, 38.0, 53.0, 97.0, 121.0, 192.0, 340.0, 584.0, 956.0, 1619.0, 2750.0, 4834.0, 8322.0, 14699.0, 25574.0, 43380.0, 71347.0, 108012.0, 144377.0, 162831.0, 150217.0, 115359.0, 77824.0, 48045.0, 28700.0, 16232.0, 9292.0, 5325.0, 3064.0, 1690.0, 1004.0, 605.0, 380.0, 221.0, 129.0, 98.0, 56.0, 33.0, 28.0, 19.0, 13.0, 8.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-14.53125, -14.1112060546875, -13.691162109375, -13.2711181640625, -12.85107421875, -12.4310302734375, -12.010986328125, -11.5909423828125, -11.1708984375, -10.7508544921875, -10.330810546875, -9.9107666015625, -9.49072265625, -9.0706787109375, -8.650634765625, -8.2305908203125, -7.810546875, -7.3905029296875, -6.970458984375, -6.5504150390625, -6.13037109375, -5.7103271484375, -5.290283203125, -4.8702392578125, -4.4501953125, -4.0301513671875, -3.610107421875, -3.1900634765625, -2.77001953125, -2.3499755859375, -1.929931640625, -1.5098876953125, -1.08984375, -0.6697998046875, -0.249755859375, 0.1702880859375, 0.59033203125, 1.0103759765625, 1.430419921875, 1.8504638671875, 2.2705078125, 2.6905517578125, 3.110595703125, 3.5306396484375, 3.95068359375, 4.3707275390625, 4.790771484375, 5.2108154296875, 5.630859375, 6.0509033203125, 6.470947265625, 6.8909912109375, 7.31103515625, 7.7310791015625, 8.151123046875, 8.5711669921875, 8.9912109375, 9.4112548828125, 9.831298828125, 10.2513427734375, 10.67138671875, 11.0914306640625, 11.511474609375, 11.9315185546875, 12.3515625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 9.0, 5.0, 15.0, 9.0, 9.0, 11.0, 14.0, 12.0, 15.0, 24.0, 25.0, 36.0, 20.0, 19.0, 32.0, 29.0, 29.0, 39.0, 37.0, 39.0, 35.0, 35.0, 46.0, 37.0, 50.0, 40.0, 27.0, 35.0, 34.0, 29.0, 33.0, 25.0, 20.0, 14.0, 16.0, 22.0, 16.0, 11.0, 11.0, 11.0, 4.0, 9.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.2890625, -5.10894775390625, -4.9288330078125, -4.74871826171875, -4.568603515625, -4.38848876953125, -4.2083740234375, -4.02825927734375, -3.84814453125, -3.66802978515625, -3.4879150390625, -3.30780029296875, -3.127685546875, -2.94757080078125, -2.7674560546875, -2.58734130859375, -2.4072265625, -2.22711181640625, -2.0469970703125, -1.86688232421875, -1.686767578125, -1.50665283203125, -1.3265380859375, -1.14642333984375, -0.96630859375, -0.78619384765625, -0.6060791015625, -0.42596435546875, -0.245849609375, -0.06573486328125, 0.1143798828125, 0.29449462890625, 0.474609375, 0.65472412109375, 0.8348388671875, 1.01495361328125, 1.195068359375, 1.37518310546875, 1.5552978515625, 1.73541259765625, 1.91552734375, 2.09564208984375, 2.2757568359375, 2.45587158203125, 2.635986328125, 2.81610107421875, 2.9962158203125, 3.17633056640625, 3.3564453125, 3.53656005859375, 3.7166748046875, 3.89678955078125, 4.076904296875, 4.25701904296875, 4.4371337890625, 4.61724853515625, 4.79736328125, 4.97747802734375, 5.1575927734375, 5.33770751953125, 5.517822265625, 5.69793701171875, 5.8780517578125, 6.05816650390625, 6.23828125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 1.0, 8.0, 8.0, 14.0, 19.0, 17.0, 48.0, 48.0, 72.0, 146.0, 194.0, 276.0, 416.0, 607.0, 1026.0, 1534.0, 2422.0, 4004.0, 6872.0, 12709.0, 23837.0, 49500.0, 101850.0, 188921.0, 245067.0, 194109.0, 106702.0, 51856.0, 25261.0, 12975.0, 7019.0, 4059.0, 2438.0, 1545.0, 935.0, 680.0, 455.0, 269.0, 195.0, 148.0, 87.0, 65.0, 54.0, 28.0, 24.0, 10.0, 13.0, 4.0, 3.0, 2.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.6484375, -8.3741455078125, -8.099853515625, -7.8255615234375, -7.55126953125, -7.2769775390625, -7.002685546875, -6.7283935546875, -6.4541015625, -6.1798095703125, -5.905517578125, -5.6312255859375, -5.35693359375, -5.0826416015625, -4.808349609375, -4.5340576171875, -4.259765625, -3.9854736328125, -3.711181640625, -3.4368896484375, -3.16259765625, -2.8883056640625, -2.614013671875, -2.3397216796875, -2.0654296875, -1.7911376953125, -1.516845703125, -1.2425537109375, -0.96826171875, -0.6939697265625, -0.419677734375, -0.1453857421875, 0.12890625, 0.4031982421875, 0.677490234375, 0.9517822265625, 1.22607421875, 1.5003662109375, 1.774658203125, 2.0489501953125, 2.3232421875, 2.5975341796875, 2.871826171875, 3.1461181640625, 3.42041015625, 3.6947021484375, 3.968994140625, 4.2432861328125, 4.517578125, 4.7918701171875, 5.066162109375, 5.3404541015625, 5.61474609375, 5.8890380859375, 6.163330078125, 6.4376220703125, 6.7119140625, 6.9862060546875, 7.260498046875, 7.5347900390625, 7.80908203125, 8.0833740234375, 8.357666015625, 8.6319580078125, 8.90625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 3.0, 9.0, 6.0, 12.0, 16.0, 12.0, 34.0, 31.0, 38.0, 64.0, 77.0, 80.0, 73.0, 84.0, 99.0, 77.0, 65.0, 52.0, 47.0, 35.0, 19.0, 17.0, 16.0, 5.0, 5.0, 10.0, 6.0, 6.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008287429809570312, -0.0007984191179275513, -0.0007680952548980713, -0.0007377713918685913, -0.0007074475288391113, -0.0006771236658096313, -0.0006467998027801514, -0.0006164759397506714, -0.0005861520767211914, -0.0005558282136917114, -0.0005255043506622314, -0.0004951804876327515, -0.0004648566246032715, -0.0004345327615737915, -0.0004042088985443115, -0.00037388503551483154, -0.00034356117248535156, -0.0003132373094558716, -0.0002829134464263916, -0.0002525895833969116, -0.00022226572036743164, -0.00019194185733795166, -0.00016161799430847168, -0.0001312941312789917, -0.00010097026824951172, -7.064640522003174e-05, -4.032254219055176e-05, -9.998679161071777e-06, 2.0325183868408203e-05, 5.0649046897888184e-05, 8.097290992736816e-05, 0.00011129677295684814, 0.00014162063598632812, 0.0001719444990158081, 0.00020226836204528809, 0.00023259222507476807, 0.00026291608810424805, 0.00029323995113372803, 0.000323563814163208, 0.000353887677192688, 0.00038421154022216797, 0.00041453540325164795, 0.00044485926628112793, 0.0004751831293106079, 0.0005055069923400879, 0.0005358308553695679, 0.0005661547183990479, 0.0005964785814285278, 0.0006268024444580078, 0.0006571263074874878, 0.0006874501705169678, 0.0007177740335464478, 0.0007480978965759277, 0.0007784217596054077, 0.0008087456226348877, 0.0008390694856643677, 0.0008693933486938477, 0.0008997172117233276, 0.0009300410747528076, 0.0009603649377822876, 0.0009906888008117676, 0.0010210126638412476, 0.0010513365268707275, 0.0010816603899002075, 0.0011119842529296875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 8.0, 13.0, 10.0, 22.0, 34.0, 43.0, 64.0, 98.0, 144.0, 217.0, 327.0, 496.0, 691.0, 1053.0, 1561.0, 2398.0, 3625.0, 5863.0, 9362.0, 15890.0, 26395.0, 45224.0, 76144.0, 120523.0, 164908.0, 178663.0, 146301.0, 98728.0, 59872.0, 35353.0, 20957.0, 12422.0, 7598.0, 4688.0, 3029.0, 1918.0, 1243.0, 866.0, 582.0, 403.0, 270.0, 182.0, 92.0, 98.0, 51.0, 48.0, 27.0, 16.0, 22.0, 9.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.09375, -5.9049072265625, -5.716064453125, -5.5272216796875, -5.33837890625, -5.1495361328125, -4.960693359375, -4.7718505859375, -4.5830078125, -4.3941650390625, -4.205322265625, -4.0164794921875, -3.82763671875, -3.6387939453125, -3.449951171875, -3.2611083984375, -3.072265625, -2.8834228515625, -2.694580078125, -2.5057373046875, -2.31689453125, -2.1280517578125, -1.939208984375, -1.7503662109375, -1.5615234375, -1.3726806640625, -1.183837890625, -0.9949951171875, -0.80615234375, -0.6173095703125, -0.428466796875, -0.2396240234375, -0.05078125, 0.1380615234375, 0.326904296875, 0.5157470703125, 0.70458984375, 0.8934326171875, 1.082275390625, 1.2711181640625, 1.4599609375, 1.6488037109375, 1.837646484375, 2.0264892578125, 2.21533203125, 2.4041748046875, 2.593017578125, 2.7818603515625, 2.970703125, 3.1595458984375, 3.348388671875, 3.5372314453125, 3.72607421875, 3.9149169921875, 4.103759765625, 4.2926025390625, 4.4814453125, 4.6702880859375, 4.859130859375, 5.0479736328125, 5.23681640625, 5.4256591796875, 5.614501953125, 5.8033447265625, 5.9921875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 6.0, 2.0, 6.0, 6.0, 4.0, 11.0, 9.0, 15.0, 17.0, 22.0, 19.0, 23.0, 30.0, 42.0, 49.0, 44.0, 43.0, 69.0, 65.0, 67.0, 70.0, 54.0, 48.0, 57.0, 30.0, 22.0, 33.0, 31.0, 31.0, 19.0, 14.0, 13.0, 8.0, 3.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.103515625, -2.042724609375, -1.98193359375, -1.921142578125, -1.8603515625, -1.799560546875, -1.73876953125, -1.677978515625, -1.6171875, -1.556396484375, -1.49560546875, -1.434814453125, -1.3740234375, -1.313232421875, -1.25244140625, -1.191650390625, -1.130859375, -1.070068359375, -1.00927734375, -0.948486328125, -0.8876953125, -0.826904296875, -0.76611328125, -0.705322265625, -0.64453125, -0.583740234375, -0.52294921875, -0.462158203125, -0.4013671875, -0.340576171875, -0.27978515625, -0.218994140625, -0.158203125, -0.097412109375, -0.03662109375, 0.024169921875, 0.0849609375, 0.145751953125, 0.20654296875, 0.267333984375, 0.328125, 0.388916015625, 0.44970703125, 0.510498046875, 0.5712890625, 0.632080078125, 0.69287109375, 0.753662109375, 0.814453125, 0.875244140625, 0.93603515625, 0.996826171875, 1.0576171875, 1.118408203125, 1.17919921875, 1.239990234375, 1.30078125, 1.361572265625, 1.42236328125, 1.483154296875, 1.5439453125, 1.604736328125, 1.66552734375, 1.726318359375, 1.787109375]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 5.0, 5.0, 12.0, 10.0, 14.0, 18.0, 17.0, 20.0, 23.0, 30.0, 42.0, 48.0, 65.0, 65.0, 73.0, 62.0, 80.0, 78.0, 65.0, 54.0, 39.0, 38.0, 22.0, 25.0, 21.0, 14.0, 13.0, 14.0, 6.0, 11.0, 1.0, 3.0, 4.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.22071647644043, -18.55204963684082, -17.883380889892578, -17.21471405029297, -16.54604721069336, -15.877379417419434, -15.208711624145508, -14.540044784545898, -13.871376991271973, -13.202709197998047, -12.534042358398438, -11.865374565124512, -11.196706771850586, -10.528039932250977, -9.85937213897705, -9.190704345703125, -8.522037506103516, -7.853370189666748, -7.1847028732299805, -6.516035079956055, -5.847367763519287, -5.1787004470825195, -4.510032653808594, -3.841365337371826, -3.1726980209350586, -2.504030704498291, -1.8353631496429443, -1.1666955947875977, -0.4980282783508301, 0.1706390380859375, 0.8393068313598633, 1.5079741477966309, 2.1766414642333984, 2.845308780670166, 3.5139763355255127, 4.182643890380859, 4.851311206817627, 5.5199785232543945, 6.18864631652832, 6.857313632965088, 7.5259809494018555, 8.194648742675781, 8.86331558227539, 9.531983375549316, 10.200651168823242, 10.869318008422852, 11.537985801696777, 12.206653594970703, 12.875320434570312, 13.543988227844238, 14.212655067443848, 14.881322860717773, 15.549989700317383, 16.218658447265625, 16.887325286865234, 17.555992126464844, 18.224658966064453, 18.893325805664062, 19.561994552612305, 20.230661392211914, 20.899328231811523, 21.567996978759766, 22.236663818359375, 22.905330657958984, 23.573999404907227]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 8.0, 6.0, 11.0, 10.0, 10.0, 11.0, 5.0, 22.0, 15.0, 14.0, 20.0, 15.0, 28.0, 28.0, 31.0, 23.0, 43.0, 36.0, 20.0, 40.0, 38.0, 32.0, 37.0, 51.0, 37.0, 36.0, 27.0, 31.0, 36.0, 38.0, 31.0, 34.0, 20.0, 19.0, 23.0, 24.0, 9.0, 18.0, 17.0, 2.0, 10.0, 9.0, 4.0, 3.0, 3.0, 2.0, 5.0, 7.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.744450569152832, -7.483931541442871, -7.22341251373291, -6.962893962860107, -6.7023749351501465, -6.4418559074401855, -6.181337356567383, -5.920818328857422, -5.660299301147461, -5.3997802734375, -5.139261245727539, -4.878742694854736, -4.618223667144775, -4.3577046394348145, -4.097186088562012, -3.836667060852051, -3.57614803314209, -3.315629005432129, -3.055110216140747, -2.7945914268493652, -2.5340723991394043, -2.2735533714294434, -2.0130345821380615, -1.7525156736373901, -1.4919967651367188, -1.2314778566360474, -0.970958948135376, -0.7104400396347046, -0.4499211311340332, -0.18940222263336182, 0.07111668586730957, 0.33163559436798096, 0.5921535491943359, 0.8526724576950073, 1.1131913661956787, 1.37371027469635, 1.6342291831970215, 1.8947480916976929, 2.1552670001983643, 2.415785789489746, 2.676304817199707, 2.936823844909668, 3.19734263420105, 3.4578614234924316, 3.7183804512023926, 3.9788994789123535, 4.239418029785156, 4.499937057495117, 4.760456085205078, 5.020975112915039, 5.281494140625, 5.542012691497803, 5.802531719207764, 6.063050746917725, 6.323569297790527, 6.584088325500488, 6.844607353210449, 7.10512638092041, 7.365645408630371, 7.626163959503174, 7.886682987213135, 8.147201538085938, 8.407720565795898, 8.66823959350586, 8.92875862121582]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 8.0, 27.0, 34.0, 60.0, 96.0, 154.0, 237.0, 307.0, 541.0, 903.0, 1395.0, 2593.0, 4367.0, 7605.0, 14153.0, 27345.0, 54478.0, 114518.0, 254984.0, 585474.0, 1133987.0, 1063404.0, 510661.0, 217767.0, 97877.0, 47018.0, 23839.0, 12736.0, 7205.0, 4109.0, 2406.0, 1399.0, 887.0, 548.0, 373.0, 245.0, 171.0, 97.0, 85.0, 42.0, 40.0, 20.0, 21.0, 15.0, 13.0, 6.0, 13.0, 8.0, 3.0, 4.0, 0.0, 2.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.7421875, -13.1676025390625, -12.593017578125, -12.0184326171875, -11.44384765625, -10.8692626953125, -10.294677734375, -9.7200927734375, -9.1455078125, -8.5709228515625, -7.996337890625, -7.4217529296875, -6.84716796875, -6.2725830078125, -5.697998046875, -5.1234130859375, -4.548828125, -3.9742431640625, -3.399658203125, -2.8250732421875, -2.25048828125, -1.6759033203125, -1.101318359375, -0.5267333984375, 0.0478515625, 0.6224365234375, 1.197021484375, 1.7716064453125, 2.34619140625, 2.9207763671875, 3.495361328125, 4.0699462890625, 4.64453125, 5.2191162109375, 5.793701171875, 6.3682861328125, 6.94287109375, 7.5174560546875, 8.092041015625, 8.6666259765625, 9.2412109375, 9.8157958984375, 10.390380859375, 10.9649658203125, 11.53955078125, 12.1141357421875, 12.688720703125, 13.2633056640625, 13.837890625, 14.4124755859375, 14.987060546875, 15.5616455078125, 16.13623046875, 16.7108154296875, 17.285400390625, 17.8599853515625, 18.4345703125, 19.0091552734375, 19.583740234375, 20.1583251953125, 20.73291015625, 21.3074951171875, 21.882080078125, 22.4566650390625, 23.03125]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 7.0, 10.0, 12.0, 16.0, 14.0, 15.0, 24.0, 21.0, 18.0, 18.0, 37.0, 42.0, 33.0, 38.0, 50.0, 49.0, 39.0, 47.0, 48.0, 43.0, 45.0, 56.0, 47.0, 37.0, 36.0, 34.0, 19.0, 23.0, 17.0, 22.0, 20.0, 8.0, 14.0, 9.0, 9.0, 9.0, 3.0, 3.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5390625, -7.2803955078125, -7.021728515625, -6.7630615234375, -6.50439453125, -6.2457275390625, -5.987060546875, -5.7283935546875, -5.4697265625, -5.2110595703125, -4.952392578125, -4.6937255859375, -4.43505859375, -4.1763916015625, -3.917724609375, -3.6590576171875, -3.400390625, -3.1417236328125, -2.883056640625, -2.6243896484375, -2.36572265625, -2.1070556640625, -1.848388671875, -1.5897216796875, -1.3310546875, -1.0723876953125, -0.813720703125, -0.5550537109375, -0.29638671875, -0.0377197265625, 0.220947265625, 0.4796142578125, 0.73828125, 0.9969482421875, 1.255615234375, 1.5142822265625, 1.77294921875, 2.0316162109375, 2.290283203125, 2.5489501953125, 2.8076171875, 3.0662841796875, 3.324951171875, 3.5836181640625, 3.84228515625, 4.1009521484375, 4.359619140625, 4.6182861328125, 4.876953125, 5.1356201171875, 5.394287109375, 5.6529541015625, 5.91162109375, 6.1702880859375, 6.428955078125, 6.6876220703125, 6.9462890625, 7.2049560546875, 7.463623046875, 7.7222900390625, 7.98095703125, 8.2396240234375, 8.498291015625, 8.7569580078125, 9.015625]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 9.0, 1.0, 9.0, 21.0, 27.0, 32.0, 46.0, 65.0, 103.0, 171.0, 225.0, 370.0, 614.0, 973.0, 1569.0, 2681.0, 4457.0, 7570.0, 13582.0, 24706.0, 46361.0, 88545.0, 173028.0, 334746.0, 623080.0, 942603.0, 856483.0, 510840.0, 267856.0, 137360.0, 70748.0, 37817.0, 20372.0, 11242.0, 6387.0, 3732.0, 2171.0, 1378.0, 837.0, 530.0, 334.0, 213.0, 134.0, 74.0, 58.0, 46.0, 23.0, 17.0, 15.0, 11.0, 5.0, 7.0, 2.0, 3.0, 1.0, 2.0], "bins": [-18.328125, -17.786376953125, -17.24462890625, -16.702880859375, -16.1611328125, -15.619384765625, -15.07763671875, -14.535888671875, -13.994140625, -13.452392578125, -12.91064453125, -12.368896484375, -11.8271484375, -11.285400390625, -10.74365234375, -10.201904296875, -9.66015625, -9.118408203125, -8.57666015625, -8.034912109375, -7.4931640625, -6.951416015625, -6.40966796875, -5.867919921875, -5.326171875, -4.784423828125, -4.24267578125, -3.700927734375, -3.1591796875, -2.617431640625, -2.07568359375, -1.533935546875, -0.9921875, -0.450439453125, 0.09130859375, 0.633056640625, 1.1748046875, 1.716552734375, 2.25830078125, 2.800048828125, 3.341796875, 3.883544921875, 4.42529296875, 4.967041015625, 5.5087890625, 6.050537109375, 6.59228515625, 7.134033203125, 7.67578125, 8.217529296875, 8.75927734375, 9.301025390625, 9.8427734375, 10.384521484375, 10.92626953125, 11.468017578125, 12.009765625, 12.551513671875, 13.09326171875, 13.635009765625, 14.1767578125, 14.718505859375, 15.26025390625, 15.802001953125, 16.34375]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 5.0, 15.0, 20.0, 18.0, 24.0, 37.0, 39.0, 39.0, 73.0, 78.0, 106.0, 97.0, 111.0, 152.0, 201.0, 188.0, 234.0, 253.0, 268.0, 247.0, 258.0, 220.0, 240.0, 205.0, 183.0, 144.0, 115.0, 108.0, 84.0, 73.0, 48.0, 42.0, 18.0, 26.0, 26.0, 14.0, 12.0, 13.0, 8.0, 7.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.49609375, -4.3480224609375, -4.199951171875, -4.0518798828125, -3.90380859375, -3.7557373046875, -3.607666015625, -3.4595947265625, -3.3115234375, -3.1634521484375, -3.015380859375, -2.8673095703125, -2.71923828125, -2.5711669921875, -2.423095703125, -2.2750244140625, -2.126953125, -1.9788818359375, -1.830810546875, -1.6827392578125, -1.53466796875, -1.3865966796875, -1.238525390625, -1.0904541015625, -0.9423828125, -0.7943115234375, -0.646240234375, -0.4981689453125, -0.35009765625, -0.2020263671875, -0.053955078125, 0.0941162109375, 0.2421875, 0.3902587890625, 0.538330078125, 0.6864013671875, 0.83447265625, 0.9825439453125, 1.130615234375, 1.2786865234375, 1.4267578125, 1.5748291015625, 1.722900390625, 1.8709716796875, 2.01904296875, 2.1671142578125, 2.315185546875, 2.4632568359375, 2.611328125, 2.7593994140625, 2.907470703125, 3.0555419921875, 3.20361328125, 3.3516845703125, 3.499755859375, 3.6478271484375, 3.7958984375, 3.9439697265625, 4.092041015625, 4.2401123046875, 4.38818359375, 4.5362548828125, 4.684326171875, 4.8323974609375, 4.98046875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 8.0, 8.0, 4.0, 13.0, 11.0, 12.0, 15.0, 16.0, 27.0, 32.0, 37.0, 39.0, 51.0, 72.0, 71.0, 61.0, 86.0, 68.0, 62.0, 58.0, 49.0, 37.0, 28.0, 26.0, 23.0, 20.0, 12.0, 9.0, 12.0, 8.0, 6.0, 3.0, 1.0, 8.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.71157455444336, -19.039499282836914, -18.36742401123047, -17.695348739624023, -17.023273468017578, -16.351198196411133, -15.679121971130371, -15.007046699523926, -14.33497142791748, -13.662896156311035, -12.99082088470459, -12.318744659423828, -11.646669387817383, -10.974594116210938, -10.302518844604492, -9.630443572998047, -8.958368301391602, -8.286293029785156, -7.614217758178711, -6.942142009735107, -6.270066738128662, -5.597991466522217, -4.925915718078613, -4.253840446472168, -3.5817651748657227, -2.9096899032592773, -2.237614393234253, -1.5655388832092285, -0.8934636116027832, -0.2213883399963379, 0.4506874084472656, 1.122762680053711, 1.794839859008789, 2.4669151306152344, 3.138990640640259, 3.811066150665283, 4.4831414222717285, 5.155216693878174, 5.827292442321777, 6.499367713928223, 7.171442985534668, 7.843518257141113, 8.515593528747559, 9.18766975402832, 9.859745025634766, 10.531820297241211, 11.203895568847656, 11.875970840454102, 12.548046112060547, 13.220121383666992, 13.892196655273438, 14.564271926879883, 15.236347198486328, 15.908422470092773, 16.58049774169922, 17.252574920654297, 17.92464828491211, 18.596723556518555, 19.268798828125, 19.940874099731445, 20.61294937133789, 21.285024642944336, 21.95709991455078, 22.62917709350586, 23.301252365112305]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 5.0, 3.0, 4.0, 6.0, 5.0, 10.0, 14.0, 19.0, 18.0, 16.0, 19.0, 28.0, 29.0, 21.0, 40.0, 41.0, 31.0, 43.0, 42.0, 44.0, 41.0, 58.0, 54.0, 42.0, 35.0, 33.0, 37.0, 39.0, 27.0, 29.0, 30.0, 24.0, 19.0, 22.0, 16.0, 13.0, 9.0, 11.0, 5.0, 6.0, 7.0, 0.0, 8.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.642413139343262, -9.33700942993164, -9.03160572052002, -8.726202011108398, -8.420797348022461, -8.11539363861084, -7.809989929199219, -7.504586219787598, -7.199182510375977, -6.8937788009643555, -6.588375091552734, -6.282970905303955, -5.977567195892334, -5.672163486480713, -5.366759300231934, -5.0613555908203125, -4.755951881408691, -4.45054817199707, -4.145144462585449, -3.83974027633667, -3.534336566925049, -3.2289328575134277, -2.9235289096832275, -2.6181249618530273, -2.3127212524414062, -2.007317543029785, -1.701913595199585, -1.3965097665786743, -1.0911059379577637, -0.785702109336853, -0.4802982807159424, -0.1748943328857422, 0.1305093765258789, 0.43591320514678955, 0.7413170337677002, 1.0467208623886108, 1.3521246910095215, 1.6575285196304321, 1.9629323482513428, 2.268336296081543, 2.573740005493164, 2.879143714904785, 3.1845476627349854, 3.4899516105651855, 3.7953553199768066, 4.100759029388428, 4.406163215637207, 4.711566925048828, 5.016970634460449, 5.32237434387207, 5.627778053283691, 5.933182239532471, 6.238585948944092, 6.543989658355713, 6.849393844604492, 7.154797554016113, 7.460201263427734, 7.7656049728393555, 8.071008682250977, 8.376412391662598, 8.681816101074219, 8.987220764160156, 9.292624473571777, 9.598028182983398, 9.90343189239502]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 9.0, 11.0, 7.0, 9.0, 23.0, 37.0, 42.0, 60.0, 81.0, 144.0, 210.0, 299.0, 461.0, 822.0, 1302.0, 2210.0, 4300.0, 8350.0, 17642.0, 38591.0, 84483.0, 168683.0, 250725.0, 224094.0, 129689.0, 61331.0, 27650.0, 12988.0, 6362.0, 3262.0, 1849.0, 1035.0, 590.0, 389.0, 265.0, 170.0, 127.0, 85.0, 44.0, 41.0, 25.0, 22.0, 10.0, 11.0, 9.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.546875, -12.139404296875, -11.73193359375, -11.324462890625, -10.9169921875, -10.509521484375, -10.10205078125, -9.694580078125, -9.287109375, -8.879638671875, -8.47216796875, -8.064697265625, -7.6572265625, -7.249755859375, -6.84228515625, -6.434814453125, -6.02734375, -5.619873046875, -5.21240234375, -4.804931640625, -4.3974609375, -3.989990234375, -3.58251953125, -3.175048828125, -2.767578125, -2.360107421875, -1.95263671875, -1.545166015625, -1.1376953125, -0.730224609375, -0.32275390625, 0.084716796875, 0.4921875, 0.899658203125, 1.30712890625, 1.714599609375, 2.1220703125, 2.529541015625, 2.93701171875, 3.344482421875, 3.751953125, 4.159423828125, 4.56689453125, 4.974365234375, 5.3818359375, 5.789306640625, 6.19677734375, 6.604248046875, 7.01171875, 7.419189453125, 7.82666015625, 8.234130859375, 8.6416015625, 9.049072265625, 9.45654296875, 9.864013671875, 10.271484375, 10.678955078125, 11.08642578125, 11.493896484375, 11.9013671875, 12.308837890625, 12.71630859375, 13.123779296875, 13.53125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 9.0, 5.0, 4.0, 12.0, 10.0, 15.0, 17.0, 16.0, 18.0, 27.0, 30.0, 23.0, 32.0, 37.0, 47.0, 49.0, 40.0, 40.0, 52.0, 49.0, 46.0, 51.0, 43.0, 41.0, 46.0, 31.0, 21.0, 26.0, 26.0, 25.0, 18.0, 14.0, 18.0, 19.0, 12.0, 7.0, 7.0, 6.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.296875, -9.94677734375, -9.5966796875, -9.24658203125, -8.896484375, -8.54638671875, -8.1962890625, -7.84619140625, -7.49609375, -7.14599609375, -6.7958984375, -6.44580078125, -6.095703125, -5.74560546875, -5.3955078125, -5.04541015625, -4.6953125, -4.34521484375, -3.9951171875, -3.64501953125, -3.294921875, -2.94482421875, -2.5947265625, -2.24462890625, -1.89453125, -1.54443359375, -1.1943359375, -0.84423828125, -0.494140625, -0.14404296875, 0.2060546875, 0.55615234375, 0.90625, 1.25634765625, 1.6064453125, 1.95654296875, 2.306640625, 2.65673828125, 3.0068359375, 3.35693359375, 3.70703125, 4.05712890625, 4.4072265625, 4.75732421875, 5.107421875, 5.45751953125, 5.8076171875, 6.15771484375, 6.5078125, 6.85791015625, 7.2080078125, 7.55810546875, 7.908203125, 8.25830078125, 8.6083984375, 8.95849609375, 9.30859375, 9.65869140625, 10.0087890625, 10.35888671875, 10.708984375, 11.05908203125, 11.4091796875, 11.75927734375, 12.109375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 4.0, 11.0, 12.0, 23.0, 33.0, 41.0, 49.0, 100.0, 150.0, 231.0, 334.0, 468.0, 781.0, 1279.0, 2125.0, 3800.0, 6989.0, 13311.0, 26638.0, 55028.0, 113970.0, 213836.0, 262710.0, 173486.0, 87292.0, 41804.0, 20388.0, 10171.0, 5562.0, 3166.0, 1749.0, 1071.0, 661.0, 420.0, 263.0, 194.0, 122.0, 85.0, 60.0, 37.0, 34.0, 20.0, 11.0, 15.0, 9.0, 4.0, 9.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.1015625, -13.67822265625, -13.2548828125, -12.83154296875, -12.408203125, -11.98486328125, -11.5615234375, -11.13818359375, -10.71484375, -10.29150390625, -9.8681640625, -9.44482421875, -9.021484375, -8.59814453125, -8.1748046875, -7.75146484375, -7.328125, -6.90478515625, -6.4814453125, -6.05810546875, -5.634765625, -5.21142578125, -4.7880859375, -4.36474609375, -3.94140625, -3.51806640625, -3.0947265625, -2.67138671875, -2.248046875, -1.82470703125, -1.4013671875, -0.97802734375, -0.5546875, -0.13134765625, 0.2919921875, 0.71533203125, 1.138671875, 1.56201171875, 1.9853515625, 2.40869140625, 2.83203125, 3.25537109375, 3.6787109375, 4.10205078125, 4.525390625, 4.94873046875, 5.3720703125, 5.79541015625, 6.21875, 6.64208984375, 7.0654296875, 7.48876953125, 7.912109375, 8.33544921875, 8.7587890625, 9.18212890625, 9.60546875, 10.02880859375, 10.4521484375, 10.87548828125, 11.298828125, 11.72216796875, 12.1455078125, 12.56884765625, 12.9921875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 7.0, 9.0, 9.0, 9.0, 14.0, 15.0, 10.0, 27.0, 24.0, 19.0, 28.0, 47.0, 50.0, 50.0, 40.0, 51.0, 53.0, 55.0, 54.0, 47.0, 39.0, 53.0, 38.0, 40.0, 47.0, 25.0, 28.0, 33.0, 19.0, 13.0, 7.0, 7.0, 12.0, 7.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.01171875, -5.78448486328125, -5.5572509765625, -5.33001708984375, -5.102783203125, -4.87554931640625, -4.6483154296875, -4.42108154296875, -4.19384765625, -3.96661376953125, -3.7393798828125, -3.51214599609375, -3.284912109375, -3.05767822265625, -2.8304443359375, -2.60321044921875, -2.3759765625, -2.14874267578125, -1.9215087890625, -1.69427490234375, -1.467041015625, -1.23980712890625, -1.0125732421875, -0.78533935546875, -0.55810546875, -0.33087158203125, -0.1036376953125, 0.12359619140625, 0.350830078125, 0.57806396484375, 0.8052978515625, 1.03253173828125, 1.259765625, 1.48699951171875, 1.7142333984375, 1.94146728515625, 2.168701171875, 2.39593505859375, 2.6231689453125, 2.85040283203125, 3.07763671875, 3.30487060546875, 3.5321044921875, 3.75933837890625, 3.986572265625, 4.21380615234375, 4.4410400390625, 4.66827392578125, 4.8955078125, 5.12274169921875, 5.3499755859375, 5.57720947265625, 5.804443359375, 6.03167724609375, 6.2589111328125, 6.48614501953125, 6.71337890625, 6.94061279296875, 7.1678466796875, 7.39508056640625, 7.622314453125, 7.84954833984375, 8.0767822265625, 8.30401611328125, 8.53125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 6.0, 13.0, 26.0, 14.0, 26.0, 32.0, 51.0, 71.0, 99.0, 145.0, 245.0, 352.0, 564.0, 920.0, 1430.0, 2515.0, 4468.0, 8459.0, 17344.0, 37362.0, 85058.0, 189990.0, 305712.0, 212550.0, 97515.0, 42626.0, 19561.0, 9549.0, 4982.0, 2627.0, 1593.0, 917.0, 591.0, 359.0, 269.0, 167.0, 88.0, 71.0, 58.0, 31.0, 27.0, 16.0, 13.0, 10.0, 10.0, 8.0, 6.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-7.68359375, -7.44775390625, -7.2119140625, -6.97607421875, -6.740234375, -6.50439453125, -6.2685546875, -6.03271484375, -5.796875, -5.56103515625, -5.3251953125, -5.08935546875, -4.853515625, -4.61767578125, -4.3818359375, -4.14599609375, -3.91015625, -3.67431640625, -3.4384765625, -3.20263671875, -2.966796875, -2.73095703125, -2.4951171875, -2.25927734375, -2.0234375, -1.78759765625, -1.5517578125, -1.31591796875, -1.080078125, -0.84423828125, -0.6083984375, -0.37255859375, -0.13671875, 0.09912109375, 0.3349609375, 0.57080078125, 0.806640625, 1.04248046875, 1.2783203125, 1.51416015625, 1.75, 1.98583984375, 2.2216796875, 2.45751953125, 2.693359375, 2.92919921875, 3.1650390625, 3.40087890625, 3.63671875, 3.87255859375, 4.1083984375, 4.34423828125, 4.580078125, 4.81591796875, 5.0517578125, 5.28759765625, 5.5234375, 5.75927734375, 5.9951171875, 6.23095703125, 6.466796875, 6.70263671875, 6.9384765625, 7.17431640625, 7.41015625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 9.0, 9.0, 11.0, 11.0, 17.0, 18.0, 26.0, 35.0, 55.0, 51.0, 67.0, 80.0, 60.0, 73.0, 84.0, 72.0, 67.0, 48.0, 54.0, 40.0, 23.0, 18.0, 15.0, 11.0, 7.0, 4.0, 5.0, 8.0, 9.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.000423431396484375, -0.0004111379384994507, -0.00039884448051452637, -0.00038655102252960205, -0.00037425756454467773, -0.0003619641065597534, -0.0003496706485748291, -0.0003373771905899048, -0.00032508373260498047, -0.00031279027462005615, -0.00030049681663513184, -0.0002882033586502075, -0.0002759099006652832, -0.0002636164426803589, -0.00025132298469543457, -0.00023902952671051025, -0.00022673606872558594, -0.00021444261074066162, -0.0002021491527557373, -0.000189855694770813, -0.00017756223678588867, -0.00016526877880096436, -0.00015297532081604004, -0.00014068186283111572, -0.0001283884048461914, -0.00011609494686126709, -0.00010380148887634277, -9.150803089141846e-05, -7.921457290649414e-05, -6.692111492156982e-05, -5.462765693664551e-05, -4.233419895172119e-05, -3.0040740966796875e-05, -1.774728298187256e-05, -5.453824996948242e-06, 6.839632987976074e-06, 1.913309097290039e-05, 3.142654895782471e-05, 4.3720006942749023e-05, 5.601346492767334e-05, 6.830692291259766e-05, 8.060038089752197e-05, 9.289383888244629e-05, 0.0001051872968673706, 0.00011748075485229492, 0.00012977421283721924, 0.00014206767082214355, 0.00015436112880706787, 0.0001666545867919922, 0.0001789480447769165, 0.00019124150276184082, 0.00020353496074676514, 0.00021582841873168945, 0.00022812187671661377, 0.00024041533470153809, 0.0002527087926864624, 0.0002650022506713867, 0.00027729570865631104, 0.00028958916664123535, 0.00030188262462615967, 0.000314176082611084, 0.0003264695405960083, 0.0003387629985809326, 0.00035105645656585693, 0.00036334991455078125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 8.0, 5.0, 9.0, 16.0, 22.0, 31.0, 39.0, 67.0, 62.0, 128.0, 189.0, 277.0, 483.0, 730.0, 1246.0, 2268.0, 4791.0, 10893.0, 29134.0, 83362.0, 212005.0, 327488.0, 227316.0, 92763.0, 32154.0, 11986.0, 5106.0, 2472.0, 1313.0, 780.0, 496.0, 339.0, 164.0, 130.0, 88.0, 63.0, 26.0, 24.0, 23.0, 14.0, 19.0, 7.0, 7.0, 6.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.75, -8.47265625, -8.1953125, -7.91796875, -7.640625, -7.36328125, -7.0859375, -6.80859375, -6.53125, -6.25390625, -5.9765625, -5.69921875, -5.421875, -5.14453125, -4.8671875, -4.58984375, -4.3125, -4.03515625, -3.7578125, -3.48046875, -3.203125, -2.92578125, -2.6484375, -2.37109375, -2.09375, -1.81640625, -1.5390625, -1.26171875, -0.984375, -0.70703125, -0.4296875, -0.15234375, 0.125, 0.40234375, 0.6796875, 0.95703125, 1.234375, 1.51171875, 1.7890625, 2.06640625, 2.34375, 2.62109375, 2.8984375, 3.17578125, 3.453125, 3.73046875, 4.0078125, 4.28515625, 4.5625, 4.83984375, 5.1171875, 5.39453125, 5.671875, 5.94921875, 6.2265625, 6.50390625, 6.78125, 7.05859375, 7.3359375, 7.61328125, 7.890625, 8.16796875, 8.4453125, 8.72265625, 9.0]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 8.0, 4.0, 4.0, 9.0, 17.0, 15.0, 45.0, 35.0, 26.0, 54.0, 63.0, 70.0, 79.0, 92.0, 90.0, 67.0, 70.0, 58.0, 46.0, 31.0, 21.0, 31.0, 14.0, 11.0, 6.0, 6.0, 12.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6171875, -1.56268310546875, -1.5081787109375, -1.45367431640625, -1.399169921875, -1.34466552734375, -1.2901611328125, -1.23565673828125, -1.18115234375, -1.12664794921875, -1.0721435546875, -1.01763916015625, -0.963134765625, -0.90863037109375, -0.8541259765625, -0.79962158203125, -0.7451171875, -0.69061279296875, -0.6361083984375, -0.58160400390625, -0.527099609375, -0.47259521484375, -0.4180908203125, -0.36358642578125, -0.30908203125, -0.25457763671875, -0.2000732421875, -0.14556884765625, -0.091064453125, -0.03656005859375, 0.0179443359375, 0.07244873046875, 0.126953125, 0.18145751953125, 0.2359619140625, 0.29046630859375, 0.344970703125, 0.39947509765625, 0.4539794921875, 0.50848388671875, 0.56298828125, 0.61749267578125, 0.6719970703125, 0.72650146484375, 0.781005859375, 0.83551025390625, 0.8900146484375, 0.94451904296875, 0.9990234375, 1.05352783203125, 1.1080322265625, 1.16253662109375, 1.217041015625, 1.27154541015625, 1.3260498046875, 1.38055419921875, 1.43505859375, 1.48956298828125, 1.5440673828125, 1.59857177734375, 1.653076171875, 1.70758056640625, 1.7620849609375, 1.81658935546875, 1.87109375]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 9.0, 5.0, 11.0, 19.0, 16.0, 31.0, 23.0, 25.0, 43.0, 51.0, 54.0, 74.0, 73.0, 89.0, 65.0, 69.0, 52.0, 58.0, 47.0, 25.0, 32.0, 20.0, 29.0, 7.0, 15.0, 14.0, 5.0, 3.0, 7.0, 2.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.77476692199707, -19.087709426879883, -18.400651931762695, -17.71359634399414, -17.026538848876953, -16.339481353759766, -15.652423858642578, -14.96536636352539, -14.27830982208252, -13.591252326965332, -12.904195785522461, -12.217138290405273, -11.530080795288086, -10.843024253845215, -10.155966758728027, -9.468910217285156, -8.781852722167969, -8.094795227050781, -7.40773868560791, -6.720681190490723, -6.033624172210693, -5.346567153930664, -4.659509658813477, -3.9724526405334473, -3.285395622253418, -2.5983386039733887, -1.9112813472747803, -1.2242240905761719, -0.5371670722961426, 0.14988994598388672, 0.8369474411010742, 1.5240044593811035, 2.2110595703125, 2.8981165885925293, 3.5851738452911377, 4.272231101989746, 4.959288120269775, 5.646345138549805, 6.333402633666992, 7.0204596519470215, 7.707516670227051, 8.394574165344238, 9.08163070678711, 9.768688201904297, 10.455745697021484, 11.142802238464355, 11.829859733581543, 12.516916275024414, 13.203973770141602, 13.891031265258789, 14.57808780670166, 15.265145301818848, 15.952201843261719, 16.639259338378906, 17.326316833496094, 18.01337432861328, 18.70043182373047, 19.387489318847656, 20.074546813964844, 20.76160430908203, 21.448659896850586, 22.135717391967773, 22.82277488708496, 23.50983238220215, 24.196887969970703]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 6.0, 2.0, 6.0, 3.0, 12.0, 12.0, 19.0, 15.0, 18.0, 17.0, 22.0, 27.0, 30.0, 35.0, 38.0, 37.0, 34.0, 45.0, 44.0, 47.0, 54.0, 53.0, 47.0, 41.0, 28.0, 34.0, 33.0, 35.0, 29.0, 30.0, 30.0, 15.0, 25.0, 13.0, 17.0, 11.0, 6.0, 11.0, 5.0, 6.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.260191917419434, -8.958500862121582, -8.65680980682373, -8.355118751525879, -8.053426742553711, -7.751736164093018, -7.450044631958008, -7.148353576660156, -6.846662521362305, -6.544971466064453, -6.243280410766602, -5.941588878631592, -5.63989782333374, -5.338206768035889, -5.036515235900879, -4.734824180603027, -4.433133125305176, -4.131442070007324, -3.8297507762908936, -3.528059482574463, -3.2263684272766113, -2.9246773719787598, -2.622986078262329, -2.3212947845458984, -2.019603729248047, -1.7179125547409058, -1.4162213802337646, -1.1145302057266235, -0.8128390312194824, -0.5111478567123413, -0.2094566822052002, 0.09223461151123047, 0.39392662048339844, 0.6956177949905396, 0.9973089694976807, 1.2990001440048218, 1.600691318511963, 1.902382493019104, 2.204073667526245, 2.505764961242676, 2.8074560165405273, 3.109147071838379, 3.4108383655548096, 3.7125296592712402, 4.014220714569092, 4.315911769866943, 4.617603302001953, 4.919294357299805, 5.220985412597656, 5.522676467895508, 5.824367523193359, 6.126059055328369, 6.427750110626221, 6.729441165924072, 7.031132698059082, 7.332823753356934, 7.634514808654785, 7.936205863952637, 8.237896919250488, 8.53958797454834, 8.841279983520508, 9.14297103881836, 9.444662094116211, 9.746353149414062, 10.048044204711914]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 7.0, 4.0, 10.0, 12.0, 12.0, 29.0, 37.0, 66.0, 124.0, 198.0, 328.0, 601.0, 1189.0, 2226.0, 4381.0, 8619.0, 17752.0, 35645.0, 71264.0, 129424.0, 195040.0, 213724.0, 165721.0, 99137.0, 51979.0, 25428.0, 12583.0, 6075.0, 3207.0, 1677.0, 880.0, 487.0, 274.0, 173.0, 98.0, 48.0, 35.0, 23.0, 14.0, 8.0, 6.0, 7.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.765625, -16.150634765625, -15.53564453125, -14.920654296875, -14.3056640625, -13.690673828125, -13.07568359375, -12.460693359375, -11.845703125, -11.230712890625, -10.61572265625, -10.000732421875, -9.3857421875, -8.770751953125, -8.15576171875, -7.540771484375, -6.92578125, -6.310791015625, -5.69580078125, -5.080810546875, -4.4658203125, -3.850830078125, -3.23583984375, -2.620849609375, -2.005859375, -1.390869140625, -0.77587890625, -0.160888671875, 0.4541015625, 1.069091796875, 1.68408203125, 2.299072265625, 2.9140625, 3.529052734375, 4.14404296875, 4.759033203125, 5.3740234375, 5.989013671875, 6.60400390625, 7.218994140625, 7.833984375, 8.448974609375, 9.06396484375, 9.678955078125, 10.2939453125, 10.908935546875, 11.52392578125, 12.138916015625, 12.75390625, 13.368896484375, 13.98388671875, 14.598876953125, 15.2138671875, 15.828857421875, 16.44384765625, 17.058837890625, 17.673828125, 18.288818359375, 18.90380859375, 19.518798828125, 20.1337890625, 20.748779296875, 21.36376953125, 21.978759765625, 22.59375]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 4.0, 4.0, 3.0, 9.0, 9.0, 13.0, 14.0, 15.0, 18.0, 22.0, 22.0, 21.0, 25.0, 32.0, 33.0, 35.0, 37.0, 41.0, 38.0, 34.0, 41.0, 44.0, 39.0, 48.0, 38.0, 41.0, 21.0, 38.0, 40.0, 26.0, 26.0, 25.0, 22.0, 22.0, 12.0, 9.0, 18.0, 10.0, 10.0, 7.0, 9.0, 7.0, 3.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-10.34375, -10.0341796875, -9.724609375, -9.4150390625, -9.10546875, -8.7958984375, -8.486328125, -8.1767578125, -7.8671875, -7.5576171875, -7.248046875, -6.9384765625, -6.62890625, -6.3193359375, -6.009765625, -5.7001953125, -5.390625, -5.0810546875, -4.771484375, -4.4619140625, -4.15234375, -3.8427734375, -3.533203125, -3.2236328125, -2.9140625, -2.6044921875, -2.294921875, -1.9853515625, -1.67578125, -1.3662109375, -1.056640625, -0.7470703125, -0.4375, -0.1279296875, 0.181640625, 0.4912109375, 0.80078125, 1.1103515625, 1.419921875, 1.7294921875, 2.0390625, 2.3486328125, 2.658203125, 2.9677734375, 3.27734375, 3.5869140625, 3.896484375, 4.2060546875, 4.515625, 4.8251953125, 5.134765625, 5.4443359375, 5.75390625, 6.0634765625, 6.373046875, 6.6826171875, 6.9921875, 7.3017578125, 7.611328125, 7.9208984375, 8.23046875, 8.5400390625, 8.849609375, 9.1591796875, 9.46875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 8.0, 14.0, 18.0, 36.0, 44.0, 70.0, 125.0, 169.0, 247.0, 361.0, 601.0, 889.0, 1309.0, 2035.0, 3097.0, 4656.0, 7360.0, 11432.0, 17372.0, 26151.0, 38887.0, 56408.0, 77272.0, 99693.0, 118358.0, 125136.0, 117054.0, 98301.0, 75418.0, 54502.0, 37540.0, 25676.0, 16774.0, 11025.0, 7130.0, 4587.0, 3062.0, 1974.0, 1294.0, 833.0, 567.0, 361.0, 248.0, 163.0, 95.0, 68.0, 50.0, 27.0, 24.0, 15.0, 8.0, 8.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-12.359375, -11.9786376953125, -11.597900390625, -11.2171630859375, -10.83642578125, -10.4556884765625, -10.074951171875, -9.6942138671875, -9.3134765625, -8.9327392578125, -8.552001953125, -8.1712646484375, -7.79052734375, -7.4097900390625, -7.029052734375, -6.6483154296875, -6.267578125, -5.8868408203125, -5.506103515625, -5.1253662109375, -4.74462890625, -4.3638916015625, -3.983154296875, -3.6024169921875, -3.2216796875, -2.8409423828125, -2.460205078125, -2.0794677734375, -1.69873046875, -1.3179931640625, -0.937255859375, -0.5565185546875, -0.17578125, 0.2049560546875, 0.585693359375, 0.9664306640625, 1.34716796875, 1.7279052734375, 2.108642578125, 2.4893798828125, 2.8701171875, 3.2508544921875, 3.631591796875, 4.0123291015625, 4.39306640625, 4.7738037109375, 5.154541015625, 5.5352783203125, 5.916015625, 6.2967529296875, 6.677490234375, 7.0582275390625, 7.43896484375, 7.8197021484375, 8.200439453125, 8.5811767578125, 8.9619140625, 9.3426513671875, 9.723388671875, 10.1041259765625, 10.48486328125, 10.8656005859375, 11.246337890625, 11.6270751953125, 12.0078125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 5.0, 4.0, 11.0, 10.0, 11.0, 12.0, 19.0, 13.0, 11.0, 13.0, 25.0, 23.0, 28.0, 25.0, 37.0, 27.0, 41.0, 45.0, 43.0, 43.0, 43.0, 43.0, 31.0, 45.0, 51.0, 31.0, 42.0, 30.0, 32.0, 37.0, 34.0, 17.0, 20.0, 18.0, 16.0, 12.0, 14.0, 10.0, 9.0, 2.0, 7.0, 3.0, 0.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.4453125, -6.244140625, -6.04296875, -5.841796875, -5.640625, -5.439453125, -5.23828125, -5.037109375, -4.8359375, -4.634765625, -4.43359375, -4.232421875, -4.03125, -3.830078125, -3.62890625, -3.427734375, -3.2265625, -3.025390625, -2.82421875, -2.623046875, -2.421875, -2.220703125, -2.01953125, -1.818359375, -1.6171875, -1.416015625, -1.21484375, -1.013671875, -0.8125, -0.611328125, -0.41015625, -0.208984375, -0.0078125, 0.193359375, 0.39453125, 0.595703125, 0.796875, 0.998046875, 1.19921875, 1.400390625, 1.6015625, 1.802734375, 2.00390625, 2.205078125, 2.40625, 2.607421875, 2.80859375, 3.009765625, 3.2109375, 3.412109375, 3.61328125, 3.814453125, 4.015625, 4.216796875, 4.41796875, 4.619140625, 4.8203125, 5.021484375, 5.22265625, 5.423828125, 5.625, 5.826171875, 6.02734375, 6.228515625, 6.4296875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 3.0, 4.0, 5.0, 18.0, 22.0, 31.0, 30.0, 49.0, 65.0, 87.0, 147.0, 222.0, 366.0, 548.0, 885.0, 1530.0, 2667.0, 4613.0, 8132.0, 15203.0, 29253.0, 57656.0, 110582.0, 186015.0, 227365.0, 180950.0, 106214.0, 54970.0, 27779.0, 14420.0, 7801.0, 4525.0, 2487.0, 1518.0, 871.0, 536.0, 335.0, 206.0, 157.0, 101.0, 56.0, 47.0, 36.0, 30.0, 6.0, 5.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.734375, -11.3729248046875, -11.011474609375, -10.6500244140625, -10.28857421875, -9.9271240234375, -9.565673828125, -9.2042236328125, -8.8427734375, -8.4813232421875, -8.119873046875, -7.7584228515625, -7.39697265625, -7.0355224609375, -6.674072265625, -6.3126220703125, -5.951171875, -5.5897216796875, -5.228271484375, -4.8668212890625, -4.50537109375, -4.1439208984375, -3.782470703125, -3.4210205078125, -3.0595703125, -2.6981201171875, -2.336669921875, -1.9752197265625, -1.61376953125, -1.2523193359375, -0.890869140625, -0.5294189453125, -0.16796875, 0.1934814453125, 0.554931640625, 0.9163818359375, 1.27783203125, 1.6392822265625, 2.000732421875, 2.3621826171875, 2.7236328125, 3.0850830078125, 3.446533203125, 3.8079833984375, 4.16943359375, 4.5308837890625, 4.892333984375, 5.2537841796875, 5.615234375, 5.9766845703125, 6.338134765625, 6.6995849609375, 7.06103515625, 7.4224853515625, 7.783935546875, 8.1453857421875, 8.5068359375, 8.8682861328125, 9.229736328125, 9.5911865234375, 9.95263671875, 10.3140869140625, 10.675537109375, 11.0369873046875, 11.3984375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 9.0, 15.0, 9.0, 6.0, 12.0, 11.0, 29.0, 30.0, 35.0, 60.0, 42.0, 57.0, 69.0, 75.0, 65.0, 75.0, 74.0, 45.0, 56.0, 40.0, 37.0, 33.0, 21.0, 20.0, 11.0, 10.0, 16.0, 8.0, 7.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0011281967163085938, -0.0010912269353866577, -0.0010542571544647217, -0.0010172873735427856, -0.0009803175926208496, -0.0009433478116989136, -0.0009063780307769775, -0.0008694082498550415, -0.0008324384689331055, -0.0007954686880111694, -0.0007584989070892334, -0.0007215291261672974, -0.0006845593452453613, -0.0006475895643234253, -0.0006106197834014893, -0.0005736500024795532, -0.0005366802215576172, -0.0004997104406356812, -0.0004627406597137451, -0.0004257708787918091, -0.00038880109786987305, -0.000351831316947937, -0.000314861536026001, -0.00027789175510406494, -0.0002409219741821289, -0.00020395219326019287, -0.00016698241233825684, -0.0001300126314163208, -9.304285049438477e-05, -5.607306957244873e-05, -1.9103288650512695e-05, 1.786649227142334e-05, 5.4836273193359375e-05, 9.180605411529541e-05, 0.00012877583503723145, 0.00016574561595916748, 0.00020271539688110352, 0.00023968517780303955, 0.0002766549587249756, 0.0003136247396469116, 0.00035059452056884766, 0.0003875643014907837, 0.0004245340824127197, 0.00046150386333465576, 0.0004984736442565918, 0.0005354434251785278, 0.0005724132061004639, 0.0006093829870223999, 0.0006463527679443359, 0.000683322548866272, 0.000720292329788208, 0.000757262110710144, 0.0007942318916320801, 0.0008312016725540161, 0.0008681714534759521, 0.0009051412343978882, 0.0009421110153198242, 0.0009790807962417603, 0.0010160505771636963, 0.0010530203580856323, 0.0010899901390075684, 0.0011269599199295044, 0.0011639297008514404, 0.0012008994817733765, 0.0012378692626953125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 9.0, 8.0, 20.0, 23.0, 32.0, 50.0, 56.0, 83.0, 116.0, 199.0, 311.0, 458.0, 716.0, 1145.0, 1884.0, 3169.0, 5289.0, 9035.0, 15929.0, 28232.0, 49698.0, 84454.0, 131496.0, 172771.0, 177100.0, 141466.0, 93614.0, 55985.0, 31840.0, 18341.0, 10076.0, 5875.0, 3441.0, 2090.0, 1288.0, 780.0, 484.0, 314.0, 218.0, 126.0, 101.0, 72.0, 60.0, 28.0, 24.0, 15.0, 15.0, 7.0, 7.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.015625, -7.7579345703125, -7.500244140625, -7.2425537109375, -6.98486328125, -6.7271728515625, -6.469482421875, -6.2117919921875, -5.9541015625, -5.6964111328125, -5.438720703125, -5.1810302734375, -4.92333984375, -4.6656494140625, -4.407958984375, -4.1502685546875, -3.892578125, -3.6348876953125, -3.377197265625, -3.1195068359375, -2.86181640625, -2.6041259765625, -2.346435546875, -2.0887451171875, -1.8310546875, -1.5733642578125, -1.315673828125, -1.0579833984375, -0.80029296875, -0.5426025390625, -0.284912109375, -0.0272216796875, 0.23046875, 0.4881591796875, 0.745849609375, 1.0035400390625, 1.26123046875, 1.5189208984375, 1.776611328125, 2.0343017578125, 2.2919921875, 2.5496826171875, 2.807373046875, 3.0650634765625, 3.32275390625, 3.5804443359375, 3.838134765625, 4.0958251953125, 4.353515625, 4.6112060546875, 4.868896484375, 5.1265869140625, 5.38427734375, 5.6419677734375, 5.899658203125, 6.1573486328125, 6.4150390625, 6.6727294921875, 6.930419921875, 7.1881103515625, 7.44580078125, 7.7034912109375, 7.961181640625, 8.2188720703125, 8.4765625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 5.0, 9.0, 5.0, 12.0, 14.0, 13.0, 14.0, 22.0, 21.0, 39.0, 37.0, 43.0, 42.0, 49.0, 52.0, 60.0, 47.0, 54.0, 61.0, 61.0, 45.0, 35.0, 41.0, 41.0, 33.0, 34.0, 27.0, 17.0, 18.0, 9.0, 10.0, 4.0, 2.0, 2.0, 3.0, 2.0, 5.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.42578125, -2.35546875, -2.28515625, -2.21484375, -2.14453125, -2.07421875, -2.00390625, -1.93359375, -1.86328125, -1.79296875, -1.72265625, -1.65234375, -1.58203125, -1.51171875, -1.44140625, -1.37109375, -1.30078125, -1.23046875, -1.16015625, -1.08984375, -1.01953125, -0.94921875, -0.87890625, -0.80859375, -0.73828125, -0.66796875, -0.59765625, -0.52734375, -0.45703125, -0.38671875, -0.31640625, -0.24609375, -0.17578125, -0.10546875, -0.03515625, 0.03515625, 0.10546875, 0.17578125, 0.24609375, 0.31640625, 0.38671875, 0.45703125, 0.52734375, 0.59765625, 0.66796875, 0.73828125, 0.80859375, 0.87890625, 0.94921875, 1.01953125, 1.08984375, 1.16015625, 1.23046875, 1.30078125, 1.37109375, 1.44140625, 1.51171875, 1.58203125, 1.65234375, 1.72265625, 1.79296875, 1.86328125, 1.93359375, 2.00390625, 2.07421875]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 6.0, 9.0, 12.0, 15.0, 18.0, 15.0, 30.0, 38.0, 35.0, 59.0, 64.0, 58.0, 77.0, 69.0, 75.0, 76.0, 68.0, 53.0, 43.0, 35.0, 29.0, 22.0, 20.0, 13.0, 15.0, 5.0, 9.0, 9.0, 4.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.27089500427246, -18.551015853881836, -17.83113670349121, -17.11125946044922, -16.391380310058594, -15.671501159667969, -14.951622009277344, -14.231742858886719, -13.51186466217041, -12.791985511779785, -12.072107315063477, -11.352228164672852, -10.632349014282227, -9.912470817565918, -9.192591667175293, -8.472713470458984, -7.752834320068359, -7.032955646514893, -6.313076972961426, -5.593197822570801, -4.873319149017334, -4.153440475463867, -3.433561325073242, -2.7136826515197754, -1.9938039779663086, -1.2739251852035522, -0.5540463924407959, 0.16583251953125, 0.8857111930847168, 1.6055898666381836, 2.3254690170288086, 3.0453476905822754, 3.765228271484375, 4.485106945037842, 5.204985618591309, 5.924864768981934, 6.6447434425354, 7.364622116088867, 8.084501266479492, 8.804380416870117, 9.524258613586426, 10.24413776397705, 10.96401596069336, 11.683895111083984, 12.40377426147461, 13.123652458190918, 13.843531608581543, 14.563409805297852, 15.283288955688477, 16.0031681060791, 16.723047256469727, 17.44292449951172, 18.162803649902344, 18.88268280029297, 19.602561950683594, 20.32244110107422, 21.042320251464844, 21.76219940185547, 22.482078552246094, 23.20195770263672, 23.92183494567871, 24.641714096069336, 25.36159324645996, 26.081472396850586, 26.801349639892578]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 10.0, 4.0, 9.0, 8.0, 12.0, 17.0, 15.0, 23.0, 24.0, 24.0, 31.0, 21.0, 36.0, 42.0, 45.0, 32.0, 42.0, 43.0, 47.0, 44.0, 40.0, 45.0, 35.0, 39.0, 38.0, 29.0, 24.0, 35.0, 19.0, 23.0, 22.0, 15.0, 23.0, 11.0, 16.0, 13.0, 10.0, 12.0, 7.0, 3.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.428163528442383, -9.131139755249023, -8.834115982055664, -8.537092208862305, -8.240068435668945, -7.943045139312744, -7.646021366119385, -7.348998069763184, -7.051974296569824, -6.754950523376465, -6.4579267501831055, -6.160902976989746, -5.863879680633545, -5.5668559074401855, -5.269832134246826, -4.972808837890625, -4.675784587860107, -4.378760814666748, -4.081737041473389, -3.7847135066986084, -3.487689971923828, -3.1906661987304688, -2.8936424255371094, -2.596618890762329, -2.2995951175689697, -2.0025713443756104, -1.70554780960083, -1.4085240364074707, -1.1115003824234009, -0.814476728439331, -0.5174529552459717, -0.2204294204711914, 0.07659435272216797, 0.3736180365085602, 0.6706417202949524, 0.967665433883667, 1.2646890878677368, 1.5617127418518066, 1.858736515045166, 2.1557600498199463, 2.4527838230133057, 2.749807596206665, 3.0468311309814453, 3.3438549041748047, 3.640878677368164, 3.9379022121429443, 4.234926223754883, 4.531949520111084, 4.828973293304443, 5.125997066497803, 5.423020839691162, 5.720044136047363, 6.017067909240723, 6.314091682434082, 6.611115455627441, 6.908139228820801, 7.20516300201416, 7.5021867752075195, 7.799210548400879, 8.096234321594238, 8.393258094787598, 8.69028091430664, 8.9873046875, 9.28432846069336, 9.581352233886719]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 12.0, 12.0, 19.0, 48.0, 62.0, 92.0, 142.0, 250.0, 468.0, 812.0, 1442.0, 2578.0, 4815.0, 9495.0, 19446.0, 40661.0, 91648.0, 218491.0, 562537.0, 1221540.0, 1159082.0, 507554.0, 197779.0, 82172.0, 36799.0, 17538.0, 8674.0, 4359.0, 2430.0, 1369.0, 748.0, 477.0, 274.0, 150.0, 85.0, 62.0, 37.0, 21.0, 22.0, 22.0, 18.0, 9.0, 14.0, 9.0, 5.0, 4.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6328125, -14.9515380859375, -14.270263671875, -13.5889892578125, -12.90771484375, -12.2264404296875, -11.545166015625, -10.8638916015625, -10.1826171875, -9.5013427734375, -8.820068359375, -8.1387939453125, -7.45751953125, -6.7762451171875, -6.094970703125, -5.4136962890625, -4.732421875, -4.0511474609375, -3.369873046875, -2.6885986328125, -2.00732421875, -1.3260498046875, -0.644775390625, 0.0364990234375, 0.7177734375, 1.3990478515625, 2.080322265625, 2.7615966796875, 3.44287109375, 4.1241455078125, 4.805419921875, 5.4866943359375, 6.16796875, 6.8492431640625, 7.530517578125, 8.2117919921875, 8.89306640625, 9.5743408203125, 10.255615234375, 10.9368896484375, 11.6181640625, 12.2994384765625, 12.980712890625, 13.6619873046875, 14.34326171875, 15.0245361328125, 15.705810546875, 16.3870849609375, 17.068359375, 17.7496337890625, 18.430908203125, 19.1121826171875, 19.79345703125, 20.4747314453125, 21.156005859375, 21.8372802734375, 22.5185546875, 23.1998291015625, 23.881103515625, 24.5623779296875, 25.24365234375, 25.9249267578125, 26.606201171875, 27.2874755859375, 27.96875]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 8.0, 7.0, 12.0, 13.0, 12.0, 21.0, 24.0, 23.0, 27.0, 40.0, 29.0, 35.0, 36.0, 41.0, 62.0, 57.0, 47.0, 50.0, 39.0, 46.0, 35.0, 49.0, 40.0, 45.0, 29.0, 23.0, 18.0, 23.0, 14.0, 13.0, 14.0, 14.0, 7.0, 8.0, 8.0, 7.0, 9.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4453125, -8.174560546875, -7.90380859375, -7.633056640625, -7.3623046875, -7.091552734375, -6.82080078125, -6.550048828125, -6.279296875, -6.008544921875, -5.73779296875, -5.467041015625, -5.1962890625, -4.925537109375, -4.65478515625, -4.384033203125, -4.11328125, -3.842529296875, -3.57177734375, -3.301025390625, -3.0302734375, -2.759521484375, -2.48876953125, -2.218017578125, -1.947265625, -1.676513671875, -1.40576171875, -1.135009765625, -0.8642578125, -0.593505859375, -0.32275390625, -0.052001953125, 0.21875, 0.489501953125, 0.76025390625, 1.031005859375, 1.3017578125, 1.572509765625, 1.84326171875, 2.114013671875, 2.384765625, 2.655517578125, 2.92626953125, 3.197021484375, 3.4677734375, 3.738525390625, 4.00927734375, 4.280029296875, 4.55078125, 4.821533203125, 5.09228515625, 5.363037109375, 5.6337890625, 5.904541015625, 6.17529296875, 6.446044921875, 6.716796875, 6.987548828125, 7.25830078125, 7.529052734375, 7.7998046875, 8.070556640625, 8.34130859375, 8.612060546875, 8.8828125]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 9.0, 17.0, 18.0, 28.0, 37.0, 66.0, 98.0, 142.0, 239.0, 341.0, 509.0, 852.0, 1360.0, 2239.0, 3479.0, 5997.0, 10244.0, 17611.0, 32275.0, 60352.0, 113445.0, 215016.0, 405964.0, 701669.0, 922602.0, 745870.0, 442421.0, 238656.0, 124413.0, 65861.0, 35293.0, 19535.0, 11051.0, 6508.0, 3704.0, 2295.0, 1378.0, 938.0, 590.0, 395.0, 273.0, 166.0, 115.0, 73.0, 46.0, 27.0, 23.0, 13.0, 11.0, 7.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0], "bins": [-17.75, -17.205078125, -16.66015625, -16.115234375, -15.5703125, -15.025390625, -14.48046875, -13.935546875, -13.390625, -12.845703125, -12.30078125, -11.755859375, -11.2109375, -10.666015625, -10.12109375, -9.576171875, -9.03125, -8.486328125, -7.94140625, -7.396484375, -6.8515625, -6.306640625, -5.76171875, -5.216796875, -4.671875, -4.126953125, -3.58203125, -3.037109375, -2.4921875, -1.947265625, -1.40234375, -0.857421875, -0.3125, 0.232421875, 0.77734375, 1.322265625, 1.8671875, 2.412109375, 2.95703125, 3.501953125, 4.046875, 4.591796875, 5.13671875, 5.681640625, 6.2265625, 6.771484375, 7.31640625, 7.861328125, 8.40625, 8.951171875, 9.49609375, 10.041015625, 10.5859375, 11.130859375, 11.67578125, 12.220703125, 12.765625, 13.310546875, 13.85546875, 14.400390625, 14.9453125, 15.490234375, 16.03515625, 16.580078125, 17.125]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 11.0, 11.0, 19.0, 16.0, 23.0, 35.0, 52.0, 59.0, 56.0, 99.0, 135.0, 125.0, 173.0, 239.0, 285.0, 303.0, 324.0, 273.0, 286.0, 281.0, 251.0, 210.0, 184.0, 131.0, 126.0, 80.0, 68.0, 48.0, 42.0, 27.0, 29.0, 20.0, 11.0, 11.0, 12.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.33203125, -6.1473388671875, -5.962646484375, -5.7779541015625, -5.59326171875, -5.4085693359375, -5.223876953125, -5.0391845703125, -4.8544921875, -4.6697998046875, -4.485107421875, -4.3004150390625, -4.11572265625, -3.9310302734375, -3.746337890625, -3.5616455078125, -3.376953125, -3.1922607421875, -3.007568359375, -2.8228759765625, -2.63818359375, -2.4534912109375, -2.268798828125, -2.0841064453125, -1.8994140625, -1.7147216796875, -1.530029296875, -1.3453369140625, -1.16064453125, -0.9759521484375, -0.791259765625, -0.6065673828125, -0.421875, -0.2371826171875, -0.052490234375, 0.1322021484375, 0.31689453125, 0.5015869140625, 0.686279296875, 0.8709716796875, 1.0556640625, 1.2403564453125, 1.425048828125, 1.6097412109375, 1.79443359375, 1.9791259765625, 2.163818359375, 2.3485107421875, 2.533203125, 2.7178955078125, 2.902587890625, 3.0872802734375, 3.27197265625, 3.4566650390625, 3.641357421875, 3.8260498046875, 4.0107421875, 4.1954345703125, 4.380126953125, 4.5648193359375, 4.74951171875, 4.9342041015625, 5.118896484375, 5.3035888671875, 5.48828125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 3.0, 8.0, 5.0, 9.0, 13.0, 17.0, 14.0, 19.0, 28.0, 27.0, 41.0, 49.0, 48.0, 63.0, 56.0, 68.0, 82.0, 60.0, 52.0, 67.0, 47.0, 38.0, 36.0, 35.0, 19.0, 21.0, 17.0, 13.0, 5.0, 9.0, 6.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.768938064575195, -20.087682723999023, -19.406429290771484, -18.725173950195312, -18.04391860961914, -17.36266326904297, -16.68140983581543, -16.000154495239258, -15.318899154663086, -14.63764476776123, -13.956389427185059, -13.275135040283203, -12.593879699707031, -11.912625312805176, -11.23137092590332, -10.550115585327148, -9.868861198425293, -9.187606811523438, -8.506351470947266, -7.82509708404541, -7.143841743469238, -6.462587356567383, -5.781332492828369, -5.1000776290893555, -4.418822765350342, -3.737567901611328, -3.0563130378723145, -2.37505841255188, -1.6938035488128662, -1.0125486850738525, -0.33129405975341797, 0.3499608039855957, 1.0312156677246094, 1.712470531463623, 2.3937253952026367, 3.0749800205230713, 3.756234884262085, 4.4374895095825195, 5.118744373321533, 5.799999237060547, 6.4812541007995605, 7.162508964538574, 7.843763828277588, 8.525018692016602, 9.206273078918457, 9.887528419494629, 10.568782806396484, 11.250038146972656, 11.931292533874512, 12.612546920776367, 13.293802261352539, 13.975056648254395, 14.656311988830566, 15.337566375732422, 16.018821716308594, 16.700077056884766, 17.381330490112305, 18.062585830688477, 18.743839263916016, 19.425094604492188, 20.10634994506836, 20.78760528564453, 21.46885871887207, 22.150114059448242, 22.831369400024414]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 8.0, 3.0, 4.0, 11.0, 10.0, 6.0, 13.0, 13.0, 15.0, 14.0, 27.0, 21.0, 20.0, 28.0, 23.0, 31.0, 39.0, 35.0, 41.0, 25.0, 48.0, 41.0, 41.0, 42.0, 34.0, 37.0, 40.0, 29.0, 34.0, 27.0, 27.0, 27.0, 19.0, 35.0, 18.0, 15.0, 16.0, 17.0, 14.0, 10.0, 14.0, 11.0, 8.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.9055757522583, -8.616514205932617, -8.327452659606934, -8.03839111328125, -7.749330043792725, -7.460268497467041, -7.171207427978516, -6.882145881652832, -6.593084335327148, -6.304022789001465, -6.014961242675781, -5.725900173187256, -5.436838626861572, -5.147777080535889, -4.858716011047363, -4.56965446472168, -4.280592918395996, -3.9915313720703125, -3.702470064163208, -3.4134087562561035, -3.12434720993042, -2.8352856636047363, -2.546224355697632, -2.2571630477905273, -1.9681015014648438, -1.6790400743484497, -1.3899786472320557, -1.1009172201156616, -0.8118557929992676, -0.5227943658828735, -0.2337329387664795, 0.055328369140625, 0.3443889617919922, 0.6334503889083862, 0.9225118160247803, 1.2115732431411743, 1.5006346702575684, 1.7896960973739624, 2.0787575244903564, 2.367818832397461, 2.6568803787231445, 2.945941925048828, 3.2350032329559326, 3.524064540863037, 3.8131260871887207, 4.102187633514404, 4.39124870300293, 4.680310249328613, 4.969371795654297, 5.2584333419799805, 5.547494888305664, 5.8365559577941895, 6.125617504119873, 6.414679050445557, 6.703740119934082, 6.992801666259766, 7.281863212585449, 7.570924758911133, 7.859986305236816, 8.1490478515625, 8.438108444213867, 8.72716999053955, 9.016231536865234, 9.305293083190918, 9.594354629516602]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 6.0, 6.0, 5.0, 12.0, 14.0, 20.0, 35.0, 43.0, 69.0, 89.0, 128.0, 183.0, 255.0, 385.0, 543.0, 759.0, 1159.0, 1733.0, 2870.0, 4818.0, 8386.0, 15661.0, 29984.0, 58548.0, 107101.0, 172408.0, 210186.0, 180176.0, 115927.0, 63809.0, 32901.0, 17255.0, 9319.0, 5015.0, 3064.0, 1860.0, 1196.0, 803.0, 568.0, 346.0, 287.0, 179.0, 146.0, 98.0, 70.0, 45.0, 27.0, 21.0, 11.0, 14.0, 10.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5703125, -10.1868896484375, -9.803466796875, -9.4200439453125, -9.03662109375, -8.6531982421875, -8.269775390625, -7.8863525390625, -7.5029296875, -7.1195068359375, -6.736083984375, -6.3526611328125, -5.96923828125, -5.5858154296875, -5.202392578125, -4.8189697265625, -4.435546875, -4.0521240234375, -3.668701171875, -3.2852783203125, -2.90185546875, -2.5184326171875, -2.135009765625, -1.7515869140625, -1.3681640625, -0.9847412109375, -0.601318359375, -0.2178955078125, 0.16552734375, 0.5489501953125, 0.932373046875, 1.3157958984375, 1.69921875, 2.0826416015625, 2.466064453125, 2.8494873046875, 3.23291015625, 3.6163330078125, 3.999755859375, 4.3831787109375, 4.7666015625, 5.1500244140625, 5.533447265625, 5.9168701171875, 6.30029296875, 6.6837158203125, 7.067138671875, 7.4505615234375, 7.833984375, 8.2174072265625, 8.600830078125, 8.9842529296875, 9.36767578125, 9.7510986328125, 10.134521484375, 10.5179443359375, 10.9013671875, 11.2847900390625, 11.668212890625, 12.0516357421875, 12.43505859375, 12.8184814453125, 13.201904296875, 13.5853271484375, 13.96875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0, 4.0, 7.0, 17.0, 16.0, 8.0, 17.0, 18.0, 20.0, 24.0, 36.0, 34.0, 34.0, 48.0, 44.0, 41.0, 50.0, 35.0, 46.0, 41.0, 43.0, 37.0, 44.0, 32.0, 35.0, 30.0, 34.0, 24.0, 32.0, 26.0, 14.0, 21.0, 15.0, 10.0, 8.0, 15.0, 10.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.7578125, -10.3970947265625, -10.036376953125, -9.6756591796875, -9.31494140625, -8.9542236328125, -8.593505859375, -8.2327880859375, -7.8720703125, -7.5113525390625, -7.150634765625, -6.7899169921875, -6.42919921875, -6.0684814453125, -5.707763671875, -5.3470458984375, -4.986328125, -4.6256103515625, -4.264892578125, -3.9041748046875, -3.54345703125, -3.1827392578125, -2.822021484375, -2.4613037109375, -2.1005859375, -1.7398681640625, -1.379150390625, -1.0184326171875, -0.65771484375, -0.2969970703125, 0.063720703125, 0.4244384765625, 0.78515625, 1.1458740234375, 1.506591796875, 1.8673095703125, 2.22802734375, 2.5887451171875, 2.949462890625, 3.3101806640625, 3.6708984375, 4.0316162109375, 4.392333984375, 4.7530517578125, 5.11376953125, 5.4744873046875, 5.835205078125, 6.1959228515625, 6.556640625, 6.9173583984375, 7.278076171875, 7.6387939453125, 7.99951171875, 8.3602294921875, 8.720947265625, 9.0816650390625, 9.4423828125, 9.8031005859375, 10.163818359375, 10.5245361328125, 10.88525390625, 11.2459716796875, 11.606689453125, 11.9674072265625, 12.328125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 14.0, 12.0, 12.0, 14.0, 28.0, 37.0, 47.0, 53.0, 62.0, 101.0, 135.0, 182.0, 234.0, 339.0, 513.0, 963.0, 1924.0, 5046.0, 16143.0, 64834.0, 286758.0, 475723.0, 146123.0, 33000.0, 9274.0, 3259.0, 1488.0, 718.0, 386.0, 303.0, 222.0, 149.0, 112.0, 100.0, 58.0, 49.0, 41.0, 25.0, 11.0, 26.0, 4.0, 9.0, 6.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.203125, -28.205322265625, -27.20751953125, -26.209716796875, -25.2119140625, -24.214111328125, -23.21630859375, -22.218505859375, -21.220703125, -20.222900390625, -19.22509765625, -18.227294921875, -17.2294921875, -16.231689453125, -15.23388671875, -14.236083984375, -13.23828125, -12.240478515625, -11.24267578125, -10.244873046875, -9.2470703125, -8.249267578125, -7.25146484375, -6.253662109375, -5.255859375, -4.258056640625, -3.26025390625, -2.262451171875, -1.2646484375, -0.266845703125, 0.73095703125, 1.728759765625, 2.7265625, 3.724365234375, 4.72216796875, 5.719970703125, 6.7177734375, 7.715576171875, 8.71337890625, 9.711181640625, 10.708984375, 11.706787109375, 12.70458984375, 13.702392578125, 14.7001953125, 15.697998046875, 16.69580078125, 17.693603515625, 18.69140625, 19.689208984375, 20.68701171875, 21.684814453125, 22.6826171875, 23.680419921875, 24.67822265625, 25.676025390625, 26.673828125, 27.671630859375, 28.66943359375, 29.667236328125, 30.6650390625, 31.662841796875, 32.66064453125, 33.658447265625, 34.65625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 4.0, 3.0, 4.0, 2.0, 2.0, 4.0, 2.0, 9.0, 6.0, 13.0, 8.0, 15.0, 18.0, 20.0, 28.0, 22.0, 24.0, 25.0, 27.0, 30.0, 46.0, 32.0, 39.0, 40.0, 39.0, 48.0, 45.0, 49.0, 36.0, 29.0, 40.0, 24.0, 41.0, 26.0, 28.0, 23.0, 22.0, 19.0, 18.0, 13.0, 12.0, 14.0, 13.0, 8.0, 14.0, 9.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.68359375, -5.492919921875, -5.30224609375, -5.111572265625, -4.9208984375, -4.730224609375, -4.53955078125, -4.348876953125, -4.158203125, -3.967529296875, -3.77685546875, -3.586181640625, -3.3955078125, -3.204833984375, -3.01416015625, -2.823486328125, -2.6328125, -2.442138671875, -2.25146484375, -2.060791015625, -1.8701171875, -1.679443359375, -1.48876953125, -1.298095703125, -1.107421875, -0.916748046875, -0.72607421875, -0.535400390625, -0.3447265625, -0.154052734375, 0.03662109375, 0.227294921875, 0.41796875, 0.608642578125, 0.79931640625, 0.989990234375, 1.1806640625, 1.371337890625, 1.56201171875, 1.752685546875, 1.943359375, 2.134033203125, 2.32470703125, 2.515380859375, 2.7060546875, 2.896728515625, 3.08740234375, 3.278076171875, 3.46875, 3.659423828125, 3.85009765625, 4.040771484375, 4.2314453125, 4.422119140625, 4.61279296875, 4.803466796875, 4.994140625, 5.184814453125, 5.37548828125, 5.566162109375, 5.7568359375, 5.947509765625, 6.13818359375, 6.328857421875, 6.51953125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 2.0, 5.0, 18.0, 17.0, 23.0, 45.0, 55.0, 86.0, 119.0, 162.0, 226.0, 320.0, 458.0, 730.0, 1018.0, 1481.0, 2234.0, 3656.0, 6863.0, 19218.0, 81617.0, 399956.0, 408475.0, 84306.0, 19959.0, 7002.0, 3571.0, 2224.0, 1458.0, 1026.0, 686.0, 469.0, 315.0, 240.0, 155.0, 103.0, 76.0, 56.0, 46.0, 29.0, 12.0, 13.0, 14.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-20.09375, -19.519775390625, -18.94580078125, -18.371826171875, -17.7978515625, -17.223876953125, -16.64990234375, -16.075927734375, -15.501953125, -14.927978515625, -14.35400390625, -13.780029296875, -13.2060546875, -12.632080078125, -12.05810546875, -11.484130859375, -10.91015625, -10.336181640625, -9.76220703125, -9.188232421875, -8.6142578125, -8.040283203125, -7.46630859375, -6.892333984375, -6.318359375, -5.744384765625, -5.17041015625, -4.596435546875, -4.0224609375, -3.448486328125, -2.87451171875, -2.300537109375, -1.7265625, -1.152587890625, -0.57861328125, -0.004638671875, 0.5693359375, 1.143310546875, 1.71728515625, 2.291259765625, 2.865234375, 3.439208984375, 4.01318359375, 4.587158203125, 5.1611328125, 5.735107421875, 6.30908203125, 6.883056640625, 7.45703125, 8.031005859375, 8.60498046875, 9.178955078125, 9.7529296875, 10.326904296875, 10.90087890625, 11.474853515625, 12.048828125, 12.622802734375, 13.19677734375, 13.770751953125, 14.3447265625, 14.918701171875, 15.49267578125, 16.066650390625, 16.640625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 14.0, 14.0, 10.0, 22.0, 55.0, 78.0, 120.0, 151.0, 142.0, 136.0, 97.0, 64.0, 38.0, 22.0, 10.0, 9.0, 5.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011377334594726562, -0.0011100620031356812, -0.001082390546798706, -0.001054719090461731, -0.0010270476341247559, -0.0009993761777877808, -0.0009717047214508057, -0.0009440332651138306, -0.0009163618087768555, -0.0008886903524398804, -0.0008610188961029053, -0.0008333474397659302, -0.0008056759834289551, -0.00077800452709198, -0.0007503330707550049, -0.0007226616144180298, -0.0006949901580810547, -0.0006673187017440796, -0.0006396472454071045, -0.0006119757890701294, -0.0005843043327331543, -0.0005566328763961792, -0.0005289614200592041, -0.000501289963722229, -0.0004736185073852539, -0.0004459470510482788, -0.0004182755947113037, -0.0003906041383743286, -0.0003629326820373535, -0.0003352612257003784, -0.0003075897693634033, -0.0002799183130264282, -0.0002522468566894531, -0.00022457540035247803, -0.00019690394401550293, -0.00016923248767852783, -0.00014156103134155273, -0.00011388957500457764, -8.621811866760254e-05, -5.854666233062744e-05, -3.0875205993652344e-05, -3.203749656677246e-06, 2.446770668029785e-05, 5.213916301727295e-05, 7.981061935424805e-05, 0.00010748207569122314, 0.00013515353202819824, 0.00016282498836517334, 0.00019049644470214844, 0.00021816790103912354, 0.00024583935737609863, 0.00027351081371307373, 0.00030118227005004883, 0.0003288537263870239, 0.000356525182723999, 0.0003841966390609741, 0.0004118680953979492, 0.0004395395517349243, 0.0004672110080718994, 0.0004948824644088745, 0.0005225539207458496, 0.0005502253770828247, 0.0005778968334197998, 0.0006055682897567749, 0.00063323974609375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 2.0, 4.0, 7.0, 10.0, 9.0, 21.0, 16.0, 21.0, 35.0, 55.0, 64.0, 100.0, 166.0, 196.0, 274.0, 363.0, 514.0, 721.0, 951.0, 1327.0, 1801.0, 2541.0, 3843.0, 7418.0, 24394.0, 125070.0, 452066.0, 326521.0, 68192.0, 14916.0, 5541.0, 3286.0, 2219.0, 1556.0, 1219.0, 858.0, 617.0, 445.0, 323.0, 254.0, 156.0, 133.0, 103.0, 74.0, 41.0, 43.0, 28.0, 14.0, 12.0, 10.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-16.140625, -15.599365234375, -15.05810546875, -14.516845703125, -13.9755859375, -13.434326171875, -12.89306640625, -12.351806640625, -11.810546875, -11.269287109375, -10.72802734375, -10.186767578125, -9.6455078125, -9.104248046875, -8.56298828125, -8.021728515625, -7.48046875, -6.939208984375, -6.39794921875, -5.856689453125, -5.3154296875, -4.774169921875, -4.23291015625, -3.691650390625, -3.150390625, -2.609130859375, -2.06787109375, -1.526611328125, -0.9853515625, -0.444091796875, 0.09716796875, 0.638427734375, 1.1796875, 1.720947265625, 2.26220703125, 2.803466796875, 3.3447265625, 3.885986328125, 4.42724609375, 4.968505859375, 5.509765625, 6.051025390625, 6.59228515625, 7.133544921875, 7.6748046875, 8.216064453125, 8.75732421875, 9.298583984375, 9.83984375, 10.381103515625, 10.92236328125, 11.463623046875, 12.0048828125, 12.546142578125, 13.08740234375, 13.628662109375, 14.169921875, 14.711181640625, 15.25244140625, 15.793701171875, 16.3349609375, 16.876220703125, 17.41748046875, 17.958740234375, 18.5]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 10.0, 16.0, 22.0, 30.0, 47.0, 101.0, 127.0, 134.0, 151.0, 126.0, 89.0, 51.0, 37.0, 20.0, 8.0, 9.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.44140625, -4.314208984375, -4.18701171875, -4.059814453125, -3.9326171875, -3.805419921875, -3.67822265625, -3.551025390625, -3.423828125, -3.296630859375, -3.16943359375, -3.042236328125, -2.9150390625, -2.787841796875, -2.66064453125, -2.533447265625, -2.40625, -2.279052734375, -2.15185546875, -2.024658203125, -1.8974609375, -1.770263671875, -1.64306640625, -1.515869140625, -1.388671875, -1.261474609375, -1.13427734375, -1.007080078125, -0.8798828125, -0.752685546875, -0.62548828125, -0.498291015625, -0.37109375, -0.243896484375, -0.11669921875, 0.010498046875, 0.1376953125, 0.264892578125, 0.39208984375, 0.519287109375, 0.646484375, 0.773681640625, 0.90087890625, 1.028076171875, 1.1552734375, 1.282470703125, 1.40966796875, 1.536865234375, 1.6640625, 1.791259765625, 1.91845703125, 2.045654296875, 2.1728515625, 2.300048828125, 2.42724609375, 2.554443359375, 2.681640625, 2.808837890625, 2.93603515625, 3.063232421875, 3.1904296875, 3.317626953125, 3.44482421875, 3.572021484375, 3.69921875]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 1.0, 5.0, 3.0, 4.0, 6.0, 8.0, 12.0, 19.0, 14.0, 24.0, 28.0, 24.0, 41.0, 33.0, 47.0, 63.0, 63.0, 66.0, 82.0, 65.0, 59.0, 43.0, 51.0, 43.0, 35.0, 25.0, 32.0, 24.0, 11.0, 11.0, 15.0, 11.0, 3.0, 8.0, 9.0, 0.0, 7.0, 0.0, 4.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.522510528564453, -16.86768341064453, -16.212858200073242, -15.558032035827637, -14.903205871582031, -14.248379707336426, -13.59355354309082, -12.938727378845215, -12.28390121459961, -11.629075050354004, -10.974248886108398, -10.319422721862793, -9.664596557617188, -9.009770393371582, -8.354944229125977, -7.700118064880371, -7.045291900634766, -6.39046573638916, -5.735639572143555, -5.080813407897949, -4.425987243652344, -3.7711610794067383, -3.116334915161133, -2.4615087509155273, -1.8066825866699219, -1.1518564224243164, -0.49703025817871094, 0.15779590606689453, 0.8126220703125, 1.4674482345581055, 2.122274398803711, 2.7771005630493164, 3.4319286346435547, 4.08675479888916, 4.741580963134766, 5.396407127380371, 6.051233291625977, 6.706059455871582, 7.3608856201171875, 8.015711784362793, 8.670537948608398, 9.325364112854004, 9.98019027709961, 10.635016441345215, 11.28984260559082, 11.944668769836426, 12.599494934082031, 13.254321098327637, 13.909147262573242, 14.563973426818848, 15.218799591064453, 15.873625755310059, 16.528451919555664, 17.183277130126953, 17.838104248046875, 18.492931365966797, 19.147756576538086, 19.802581787109375, 20.457408905029297, 21.11223602294922, 21.767061233520508, 22.421886444091797, 23.07671356201172, 23.73154067993164, 24.38636589050293]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 4.0, 1.0, 12.0, 8.0, 7.0, 19.0, 12.0, 12.0, 18.0, 23.0, 18.0, 23.0, 23.0, 31.0, 26.0, 32.0, 37.0, 39.0, 33.0, 44.0, 45.0, 34.0, 38.0, 48.0, 34.0, 35.0, 40.0, 29.0, 36.0, 27.0, 22.0, 25.0, 14.0, 26.0, 15.0, 15.0, 17.0, 14.0, 22.0, 8.0, 7.0, 9.0, 8.0, 4.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.298133850097656, -8.011815071105957, -7.725496292114258, -7.439177513122559, -7.152858734130859, -6.86653995513916, -6.580220699310303, -6.2939019203186035, -6.007583141326904, -5.721264362335205, -5.434945583343506, -5.148626804351807, -4.862307548522949, -4.57598876953125, -4.289669990539551, -4.003351211547852, -3.7170324325561523, -3.430713653564453, -3.144394874572754, -2.8580758571624756, -2.5717570781707764, -2.285438299179077, -1.9991194009780884, -1.7128005027770996, -1.4264817237854004, -1.1401629447937012, -0.8538440465927124, -0.5675252079963684, -0.2812063694000244, 0.005112409591674805, 0.2914313077926636, 0.5777502059936523, 0.8640689849853516, 1.1503877639770508, 1.4367066621780396, 1.7230255603790283, 2.0093443393707275, 2.2956631183624268, 2.581982135772705, 2.8683009147644043, 3.1546196937561035, 3.4409384727478027, 3.727257251739502, 4.013576030731201, 4.299895286560059, 4.586214065551758, 4.872532844543457, 5.158851623535156, 5.4451704025268555, 5.731489181518555, 6.017807960510254, 6.304126739501953, 6.590445518493652, 6.876764297485352, 7.163083553314209, 7.449402332305908, 7.735721111297607, 8.022040367126465, 8.308359146118164, 8.594677925109863, 8.880996704101562, 9.167315483093262, 9.453634262084961, 9.73995304107666, 10.02627182006836]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 5.0, 5.0, 6.0, 8.0, 11.0, 21.0, 28.0, 50.0, 97.0, 179.0, 314.0, 478.0, 1031.0, 2023.0, 4468.0, 9856.0, 22085.0, 49816.0, 106576.0, 191657.0, 243619.0, 200656.0, 115732.0, 55214.0, 24283.0, 10727.0, 4857.0, 2348.0, 1082.0, 572.0, 347.0, 167.0, 91.0, 51.0, 35.0, 18.0, 16.0, 14.0, 7.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.53125, -22.76123046875, -21.9912109375, -21.22119140625, -20.451171875, -19.68115234375, -18.9111328125, -18.14111328125, -17.37109375, -16.60107421875, -15.8310546875, -15.06103515625, -14.291015625, -13.52099609375, -12.7509765625, -11.98095703125, -11.2109375, -10.44091796875, -9.6708984375, -8.90087890625, -8.130859375, -7.36083984375, -6.5908203125, -5.82080078125, -5.05078125, -4.28076171875, -3.5107421875, -2.74072265625, -1.970703125, -1.20068359375, -0.4306640625, 0.33935546875, 1.109375, 1.87939453125, 2.6494140625, 3.41943359375, 4.189453125, 4.95947265625, 5.7294921875, 6.49951171875, 7.26953125, 8.03955078125, 8.8095703125, 9.57958984375, 10.349609375, 11.11962890625, 11.8896484375, 12.65966796875, 13.4296875, 14.19970703125, 14.9697265625, 15.73974609375, 16.509765625, 17.27978515625, 18.0498046875, 18.81982421875, 19.58984375, 20.35986328125, 21.1298828125, 21.89990234375, 22.669921875, 23.43994140625, 24.2099609375, 24.97998046875, 25.75]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 5.0, 7.0, 8.0, 16.0, 13.0, 25.0, 25.0, 15.0, 18.0, 37.0, 25.0, 37.0, 47.0, 44.0, 59.0, 56.0, 54.0, 58.0, 49.0, 53.0, 50.0, 31.0, 34.0, 31.0, 37.0, 34.0, 24.0, 24.0, 17.0, 24.0, 10.0, 9.0, 7.0, 9.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9140625, -9.5062255859375, -9.098388671875, -8.6905517578125, -8.28271484375, -7.8748779296875, -7.467041015625, -7.0592041015625, -6.6513671875, -6.2435302734375, -5.835693359375, -5.4278564453125, -5.02001953125, -4.6121826171875, -4.204345703125, -3.7965087890625, -3.388671875, -2.9808349609375, -2.572998046875, -2.1651611328125, -1.75732421875, -1.3494873046875, -0.941650390625, -0.5338134765625, -0.1259765625, 0.2818603515625, 0.689697265625, 1.0975341796875, 1.50537109375, 1.9132080078125, 2.321044921875, 2.7288818359375, 3.13671875, 3.5445556640625, 3.952392578125, 4.3602294921875, 4.76806640625, 5.1759033203125, 5.583740234375, 5.9915771484375, 6.3994140625, 6.8072509765625, 7.215087890625, 7.6229248046875, 8.03076171875, 8.4385986328125, 8.846435546875, 9.2542724609375, 9.662109375, 10.0699462890625, 10.477783203125, 10.8856201171875, 11.29345703125, 11.7012939453125, 12.109130859375, 12.5169677734375, 12.9248046875, 13.3326416015625, 13.740478515625, 14.1483154296875, 14.55615234375, 14.9639892578125, 15.371826171875, 15.7796630859375, 16.1875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 7.0, 9.0, 4.0, 22.0, 21.0, 29.0, 32.0, 52.0, 96.0, 137.0, 216.0, 302.0, 526.0, 731.0, 1140.0, 1783.0, 2701.0, 4409.0, 6682.0, 10563.0, 16257.0, 25016.0, 37983.0, 55527.0, 76937.0, 99498.0, 118346.0, 126291.0, 118813.0, 100309.0, 77414.0, 56051.0, 38819.0, 25400.0, 16689.0, 10635.0, 6780.0, 4314.0, 2770.0, 1868.0, 1176.0, 715.0, 472.0, 345.0, 214.0, 151.0, 105.0, 75.0, 41.0, 27.0, 23.0, 11.0, 9.0, 8.0, 7.0, 6.0, 1.0, 0.0, 5.0], "bins": [-13.0078125, -12.6077880859375, -12.207763671875, -11.8077392578125, -11.40771484375, -11.0076904296875, -10.607666015625, -10.2076416015625, -9.8076171875, -9.4075927734375, -9.007568359375, -8.6075439453125, -8.20751953125, -7.8074951171875, -7.407470703125, -7.0074462890625, -6.607421875, -6.2073974609375, -5.807373046875, -5.4073486328125, -5.00732421875, -4.6072998046875, -4.207275390625, -3.8072509765625, -3.4072265625, -3.0072021484375, -2.607177734375, -2.2071533203125, -1.80712890625, -1.4071044921875, -1.007080078125, -0.6070556640625, -0.20703125, 0.1929931640625, 0.593017578125, 0.9930419921875, 1.39306640625, 1.7930908203125, 2.193115234375, 2.5931396484375, 2.9931640625, 3.3931884765625, 3.793212890625, 4.1932373046875, 4.59326171875, 4.9932861328125, 5.393310546875, 5.7933349609375, 6.193359375, 6.5933837890625, 6.993408203125, 7.3934326171875, 7.79345703125, 8.1934814453125, 8.593505859375, 8.9935302734375, 9.3935546875, 9.7935791015625, 10.193603515625, 10.5936279296875, 10.99365234375, 11.3936767578125, 11.793701171875, 12.1937255859375, 12.59375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 2.0, 6.0, 5.0, 8.0, 2.0, 8.0, 12.0, 14.0, 17.0, 9.0, 19.0, 19.0, 27.0, 21.0, 35.0, 29.0, 28.0, 29.0, 39.0, 43.0, 54.0, 42.0, 40.0, 42.0, 34.0, 38.0, 45.0, 45.0, 40.0, 31.0, 22.0, 29.0, 29.0, 29.0, 18.0, 21.0, 16.0, 9.0, 7.0, 7.0, 6.0, 6.0, 6.0, 5.0, 4.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.47265625, -6.2720947265625, -6.071533203125, -5.8709716796875, -5.67041015625, -5.4698486328125, -5.269287109375, -5.0687255859375, -4.8681640625, -4.6676025390625, -4.467041015625, -4.2664794921875, -4.06591796875, -3.8653564453125, -3.664794921875, -3.4642333984375, -3.263671875, -3.0631103515625, -2.862548828125, -2.6619873046875, -2.46142578125, -2.2608642578125, -2.060302734375, -1.8597412109375, -1.6591796875, -1.4586181640625, -1.258056640625, -1.0574951171875, -0.85693359375, -0.6563720703125, -0.455810546875, -0.2552490234375, -0.0546875, 0.1458740234375, 0.346435546875, 0.5469970703125, 0.74755859375, 0.9481201171875, 1.148681640625, 1.3492431640625, 1.5498046875, 1.7503662109375, 1.950927734375, 2.1514892578125, 2.35205078125, 2.5526123046875, 2.753173828125, 2.9537353515625, 3.154296875, 3.3548583984375, 3.555419921875, 3.7559814453125, 3.95654296875, 4.1571044921875, 4.357666015625, 4.5582275390625, 4.7587890625, 4.9593505859375, 5.159912109375, 5.3604736328125, 5.56103515625, 5.7615966796875, 5.962158203125, 6.1627197265625, 6.36328125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 12.0, 21.0, 17.0, 17.0, 30.0, 58.0, 63.0, 121.0, 163.0, 248.0, 339.0, 449.0, 642.0, 964.0, 1292.0, 1971.0, 2881.0, 4419.0, 6555.0, 10464.0, 16818.0, 28832.0, 51259.0, 93271.0, 163058.0, 218812.0, 184976.0, 111549.0, 60731.0, 33922.0, 19858.0, 12051.0, 7425.0, 4889.0, 3290.0, 2127.0, 1514.0, 1062.0, 734.0, 501.0, 343.0, 257.0, 177.0, 120.0, 78.0, 60.0, 29.0, 31.0, 25.0, 8.0, 10.0, 4.0, 3.0, 1.0, 6.0, 2.0, 0.0, 1.0], "bins": [-10.828125, -10.4859619140625, -10.143798828125, -9.8016357421875, -9.45947265625, -9.1173095703125, -8.775146484375, -8.4329833984375, -8.0908203125, -7.7486572265625, -7.406494140625, -7.0643310546875, -6.72216796875, -6.3800048828125, -6.037841796875, -5.6956787109375, -5.353515625, -5.0113525390625, -4.669189453125, -4.3270263671875, -3.98486328125, -3.6427001953125, -3.300537109375, -2.9583740234375, -2.6162109375, -2.2740478515625, -1.931884765625, -1.5897216796875, -1.24755859375, -0.9053955078125, -0.563232421875, -0.2210693359375, 0.12109375, 0.4632568359375, 0.805419921875, 1.1475830078125, 1.48974609375, 1.8319091796875, 2.174072265625, 2.5162353515625, 2.8583984375, 3.2005615234375, 3.542724609375, 3.8848876953125, 4.22705078125, 4.5692138671875, 4.911376953125, 5.2535400390625, 5.595703125, 5.9378662109375, 6.280029296875, 6.6221923828125, 6.96435546875, 7.3065185546875, 7.648681640625, 7.9908447265625, 8.3330078125, 8.6751708984375, 9.017333984375, 9.3594970703125, 9.70166015625, 10.0438232421875, 10.385986328125, 10.7281494140625, 11.0703125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 8.0, 10.0, 6.0, 7.0, 11.0, 8.0, 12.0, 22.0, 14.0, 29.0, 28.0, 57.0, 50.0, 56.0, 57.0, 71.0, 77.0, 100.0, 73.0, 55.0, 44.0, 44.0, 27.0, 22.0, 17.0, 24.0, 15.0, 8.0, 13.0, 10.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00109100341796875, -0.0010495781898498535, -0.001008152961730957, -0.0009667277336120605, -0.0009253025054931641, -0.0008838772773742676, -0.0008424520492553711, -0.0008010268211364746, -0.0007596015930175781, -0.0007181763648986816, -0.0006767511367797852, -0.0006353259086608887, -0.0005939006805419922, -0.0005524754524230957, -0.0005110502243041992, -0.00046962499618530273, -0.00042819976806640625, -0.00038677453994750977, -0.0003453493118286133, -0.0003039240837097168, -0.0002624988555908203, -0.00022107362747192383, -0.00017964839935302734, -0.00013822317123413086, -9.679794311523438e-05, -5.537271499633789e-05, -1.3947486877441406e-05, 2.7477741241455078e-05, 6.890296936035156e-05, 0.00011032819747924805, 0.00015175342559814453, 0.00019317865371704102, 0.0002346038818359375, 0.000276029109954834, 0.00031745433807373047, 0.00035887956619262695, 0.00040030479431152344, 0.0004417300224304199, 0.0004831552505493164, 0.0005245804786682129, 0.0005660057067871094, 0.0006074309349060059, 0.0006488561630249023, 0.0006902813911437988, 0.0007317066192626953, 0.0007731318473815918, 0.0008145570755004883, 0.0008559823036193848, 0.0008974075317382812, 0.0009388327598571777, 0.0009802579879760742, 0.0010216832160949707, 0.0010631084442138672, 0.0011045336723327637, 0.0011459589004516602, 0.0011873841285705566, 0.0012288093566894531, 0.0012702345848083496, 0.001311659812927246, 0.0013530850410461426, 0.001394510269165039, 0.0014359354972839355, 0.001477360725402832, 0.0015187859535217285, 0.001560211181640625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 10.0, 16.0, 5.0, 29.0, 39.0, 52.0, 86.0, 112.0, 176.0, 278.0, 392.0, 575.0, 912.0, 1446.0, 2186.0, 3577.0, 5569.0, 9457.0, 16076.0, 28420.0, 51911.0, 95075.0, 160080.0, 210813.0, 187389.0, 119923.0, 66760.0, 36362.0, 20359.0, 11595.0, 6928.0, 4250.0, 2686.0, 1730.0, 1117.0, 745.0, 489.0, 306.0, 205.0, 148.0, 87.0, 55.0, 41.0, 37.0, 15.0, 16.0, 8.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-9.2734375, -8.971435546875, -8.66943359375, -8.367431640625, -8.0654296875, -7.763427734375, -7.46142578125, -7.159423828125, -6.857421875, -6.555419921875, -6.25341796875, -5.951416015625, -5.6494140625, -5.347412109375, -5.04541015625, -4.743408203125, -4.44140625, -4.139404296875, -3.83740234375, -3.535400390625, -3.2333984375, -2.931396484375, -2.62939453125, -2.327392578125, -2.025390625, -1.723388671875, -1.42138671875, -1.119384765625, -0.8173828125, -0.515380859375, -0.21337890625, 0.088623046875, 0.390625, 0.692626953125, 0.99462890625, 1.296630859375, 1.5986328125, 1.900634765625, 2.20263671875, 2.504638671875, 2.806640625, 3.108642578125, 3.41064453125, 3.712646484375, 4.0146484375, 4.316650390625, 4.61865234375, 4.920654296875, 5.22265625, 5.524658203125, 5.82666015625, 6.128662109375, 6.4306640625, 6.732666015625, 7.03466796875, 7.336669921875, 7.638671875, 7.940673828125, 8.24267578125, 8.544677734375, 8.8466796875, 9.148681640625, 9.45068359375, 9.752685546875, 10.0546875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 3.0, 10.0, 10.0, 16.0, 13.0, 22.0, 25.0, 25.0, 36.0, 45.0, 60.0, 73.0, 70.0, 77.0, 84.0, 72.0, 68.0, 46.0, 53.0, 35.0, 26.0, 24.0, 25.0, 11.0, 9.0, 9.0, 13.0, 6.0, 7.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.20703125, -3.10699462890625, -3.0069580078125, -2.90692138671875, -2.806884765625, -2.70684814453125, -2.6068115234375, -2.50677490234375, -2.40673828125, -2.30670166015625, -2.2066650390625, -2.10662841796875, -2.006591796875, -1.90655517578125, -1.8065185546875, -1.70648193359375, -1.6064453125, -1.50640869140625, -1.4063720703125, -1.30633544921875, -1.206298828125, -1.10626220703125, -1.0062255859375, -0.90618896484375, -0.80615234375, -0.70611572265625, -0.6060791015625, -0.50604248046875, -0.406005859375, -0.30596923828125, -0.2059326171875, -0.10589599609375, -0.005859375, 0.09417724609375, 0.1942138671875, 0.29425048828125, 0.394287109375, 0.49432373046875, 0.5943603515625, 0.69439697265625, 0.79443359375, 0.89447021484375, 0.9945068359375, 1.09454345703125, 1.194580078125, 1.29461669921875, 1.3946533203125, 1.49468994140625, 1.5947265625, 1.69476318359375, 1.7947998046875, 1.89483642578125, 1.994873046875, 2.09490966796875, 2.1949462890625, 2.29498291015625, 2.39501953125, 2.49505615234375, 2.5950927734375, 2.69512939453125, 2.795166015625, 2.89520263671875, 2.9952392578125, 3.09527587890625, 3.1953125]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 3.0, 8.0, 5.0, 5.0, 12.0, 17.0, 16.0, 20.0, 22.0, 27.0, 35.0, 48.0, 41.0, 58.0, 56.0, 64.0, 77.0, 77.0, 58.0, 48.0, 51.0, 45.0, 44.0, 31.0, 30.0, 23.0, 18.0, 12.0, 7.0, 8.0, 6.0, 9.0, 6.0, 2.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-21.015472412109375, -20.329940795898438, -19.644407272338867, -18.958873748779297, -18.27334213256836, -17.587810516357422, -16.90227699279785, -16.21674346923828, -15.531211853027344, -14.84567928314209, -14.160146713256836, -13.474614143371582, -12.789081573486328, -12.103549003601074, -11.41801643371582, -10.732483863830566, -10.046951293945312, -9.361418724060059, -8.675886154174805, -7.990353584289551, -7.304821014404297, -6.619288444519043, -5.933755874633789, -5.248223304748535, -4.562690734863281, -3.8771581649780273, -3.1916255950927734, -2.5060930252075195, -1.8205604553222656, -1.1350278854370117, -0.4494953155517578, 0.2360372543334961, 0.92156982421875, 1.607102394104004, 2.292634963989258, 2.9781675338745117, 3.6637001037597656, 4.3492326736450195, 5.034765243530273, 5.720297813415527, 6.405830383300781, 7.091362953186035, 7.776895523071289, 8.462428092956543, 9.147960662841797, 9.83349323272705, 10.519025802612305, 11.204558372497559, 11.890090942382812, 12.575623512268066, 13.26115608215332, 13.946688652038574, 14.632221221923828, 15.317753791809082, 16.003286361694336, 16.688819885253906, 17.374351501464844, 18.05988311767578, 18.74541664123535, 19.430950164794922, 20.11648178100586, 20.802013397216797, 21.487546920776367, 22.173080444335938, 22.858612060546875]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 6.0, 8.0, 3.0, 3.0, 4.0, 9.0, 5.0, 9.0, 11.0, 11.0, 17.0, 21.0, 23.0, 18.0, 30.0, 30.0, 17.0, 25.0, 37.0, 39.0, 41.0, 33.0, 36.0, 43.0, 37.0, 41.0, 36.0, 44.0, 40.0, 34.0, 26.0, 34.0, 31.0, 24.0, 25.0, 25.0, 18.0, 16.0, 14.0, 15.0, 13.0, 17.0, 5.0, 8.0, 7.0, 3.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-10.551229476928711, -10.25379467010498, -9.956360816955566, -9.658926010131836, -9.361491203308105, -9.064057350158691, -8.766622543334961, -8.469188690185547, -8.171753883361816, -7.874319553375244, -7.576884746551514, -7.279450416564941, -6.982016086578369, -6.684581756591797, -6.387146949768066, -6.089712619781494, -5.792277812957764, -5.494843482971191, -5.197408676147461, -4.899974346160889, -4.602540016174316, -4.305105209350586, -4.007670879364014, -3.7102365493774414, -3.41280198097229, -3.1153674125671387, -2.8179330825805664, -2.520498514175415, -2.2230639457702637, -1.9256296157836914, -1.62819504737854, -1.3307607173919678, -1.0333261489868164, -0.7358916997909546, -0.438457190990448, -0.1410226821899414, 0.1564117670059204, 0.4538462162017822, 0.7512807846069336, 1.0487151145935059, 1.3461496829986572, 1.643584132194519, 1.9410185813903809, 2.2384531497955322, 2.5358877182006836, 2.833322048187256, 3.1307566165924072, 3.4281909465789795, 3.725625514984131, 4.023059844970703, 4.320494651794434, 4.617928981781006, 4.915363311767578, 5.212798118591309, 5.510232448577881, 5.807666778564453, 6.105101585388184, 6.402535915374756, 6.699970722198486, 6.997405052185059, 7.294839382171631, 7.592273712158203, 7.889708518981934, 8.187143325805664, 8.484577178955078]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 6.0, 3.0, 5.0, 10.0, 15.0, 22.0, 31.0, 47.0, 60.0, 84.0, 137.0, 221.0, 340.0, 558.0, 964.0, 1584.0, 3008.0, 5452.0, 10598.0, 22913.0, 50169.0, 118510.0, 298956.0, 761194.0, 1316778.0, 942052.0, 390717.0, 152590.0, 62293.0, 27534.0, 12859.0, 6501.0, 3307.0, 1939.0, 1072.0, 631.0, 393.0, 250.0, 140.0, 126.0, 60.0, 50.0, 31.0, 22.0, 17.0, 13.0, 10.0, 3.0, 3.0, 2.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-19.90625, -19.18603515625, -18.4658203125, -17.74560546875, -17.025390625, -16.30517578125, -15.5849609375, -14.86474609375, -14.14453125, -13.42431640625, -12.7041015625, -11.98388671875, -11.263671875, -10.54345703125, -9.8232421875, -9.10302734375, -8.3828125, -7.66259765625, -6.9423828125, -6.22216796875, -5.501953125, -4.78173828125, -4.0615234375, -3.34130859375, -2.62109375, -1.90087890625, -1.1806640625, -0.46044921875, 0.259765625, 0.97998046875, 1.7001953125, 2.42041015625, 3.140625, 3.86083984375, 4.5810546875, 5.30126953125, 6.021484375, 6.74169921875, 7.4619140625, 8.18212890625, 8.90234375, 9.62255859375, 10.3427734375, 11.06298828125, 11.783203125, 12.50341796875, 13.2236328125, 13.94384765625, 14.6640625, 15.38427734375, 16.1044921875, 16.82470703125, 17.544921875, 18.26513671875, 18.9853515625, 19.70556640625, 20.42578125, 21.14599609375, 21.8662109375, 22.58642578125, 23.306640625, 24.02685546875, 24.7470703125, 25.46728515625, 26.1875]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 1.0, 4.0, 8.0, 6.0, 5.0, 11.0, 12.0, 26.0, 16.0, 30.0, 29.0, 37.0, 38.0, 41.0, 55.0, 56.0, 49.0, 54.0, 58.0, 58.0, 63.0, 61.0, 43.0, 34.0, 44.0, 34.0, 25.0, 22.0, 31.0, 18.0, 10.0, 9.0, 7.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7578125, -9.399169921875, -9.04052734375, -8.681884765625, -8.3232421875, -7.964599609375, -7.60595703125, -7.247314453125, -6.888671875, -6.530029296875, -6.17138671875, -5.812744140625, -5.4541015625, -5.095458984375, -4.73681640625, -4.378173828125, -4.01953125, -3.660888671875, -3.30224609375, -2.943603515625, -2.5849609375, -2.226318359375, -1.86767578125, -1.509033203125, -1.150390625, -0.791748046875, -0.43310546875, -0.074462890625, 0.2841796875, 0.642822265625, 1.00146484375, 1.360107421875, 1.71875, 2.077392578125, 2.43603515625, 2.794677734375, 3.1533203125, 3.511962890625, 3.87060546875, 4.229248046875, 4.587890625, 4.946533203125, 5.30517578125, 5.663818359375, 6.0224609375, 6.381103515625, 6.73974609375, 7.098388671875, 7.45703125, 7.815673828125, 8.17431640625, 8.532958984375, 8.8916015625, 9.250244140625, 9.60888671875, 9.967529296875, 10.326171875, 10.684814453125, 11.04345703125, 11.402099609375, 11.7607421875, 12.119384765625, 12.47802734375, 12.836669921875, 13.1953125]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 11.0, 20.0, 21.0, 36.0, 79.0, 98.0, 160.0, 259.0, 435.0, 809.0, 1465.0, 2569.0, 4827.0, 9538.0, 19315.0, 42011.0, 93380.0, 215331.0, 485968.0, 952529.0, 1123965.0, 678551.0, 311800.0, 136639.0, 59593.0, 27360.0, 13170.0, 6606.0, 3385.0, 1905.0, 948.0, 639.0, 321.0, 204.0, 128.0, 77.0, 49.0, 33.0, 25.0, 8.0, 6.0, 6.0, 0.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.625, -25.869140625, -25.11328125, -24.357421875, -23.6015625, -22.845703125, -22.08984375, -21.333984375, -20.578125, -19.822265625, -19.06640625, -18.310546875, -17.5546875, -16.798828125, -16.04296875, -15.287109375, -14.53125, -13.775390625, -13.01953125, -12.263671875, -11.5078125, -10.751953125, -9.99609375, -9.240234375, -8.484375, -7.728515625, -6.97265625, -6.216796875, -5.4609375, -4.705078125, -3.94921875, -3.193359375, -2.4375, -1.681640625, -0.92578125, -0.169921875, 0.5859375, 1.341796875, 2.09765625, 2.853515625, 3.609375, 4.365234375, 5.12109375, 5.876953125, 6.6328125, 7.388671875, 8.14453125, 8.900390625, 9.65625, 10.412109375, 11.16796875, 11.923828125, 12.6796875, 13.435546875, 14.19140625, 14.947265625, 15.703125, 16.458984375, 17.21484375, 17.970703125, 18.7265625, 19.482421875, 20.23828125, 20.994140625, 21.75]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 8.0, 11.0, 14.0, 20.0, 15.0, 28.0, 39.0, 60.0, 70.0, 112.0, 146.0, 182.0, 246.0, 273.0, 278.0, 326.0, 312.0, 364.0, 308.0, 283.0, 212.0, 180.0, 159.0, 121.0, 80.0, 58.0, 49.0, 48.0, 25.0, 10.0, 12.0, 9.0, 5.0, 3.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.609375, -8.38525390625, -8.1611328125, -7.93701171875, -7.712890625, -7.48876953125, -7.2646484375, -7.04052734375, -6.81640625, -6.59228515625, -6.3681640625, -6.14404296875, -5.919921875, -5.69580078125, -5.4716796875, -5.24755859375, -5.0234375, -4.79931640625, -4.5751953125, -4.35107421875, -4.126953125, -3.90283203125, -3.6787109375, -3.45458984375, -3.23046875, -3.00634765625, -2.7822265625, -2.55810546875, -2.333984375, -2.10986328125, -1.8857421875, -1.66162109375, -1.4375, -1.21337890625, -0.9892578125, -0.76513671875, -0.541015625, -0.31689453125, -0.0927734375, 0.13134765625, 0.35546875, 0.57958984375, 0.8037109375, 1.02783203125, 1.251953125, 1.47607421875, 1.7001953125, 1.92431640625, 2.1484375, 2.37255859375, 2.5966796875, 2.82080078125, 3.044921875, 3.26904296875, 3.4931640625, 3.71728515625, 3.94140625, 4.16552734375, 4.3896484375, 4.61376953125, 4.837890625, 5.06201171875, 5.2861328125, 5.51025390625, 5.734375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 14.0, 13.0, 14.0, 18.0, 29.0, 38.0, 46.0, 52.0, 75.0, 66.0, 73.0, 90.0, 73.0, 77.0, 63.0, 62.0, 33.0, 45.0, 23.0, 22.0, 16.0, 16.0, 6.0, 5.0, 10.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.674388885498047, -23.811080932617188, -22.947772979736328, -22.08446502685547, -21.22115707397461, -20.35784912109375, -19.494543075561523, -18.631235122680664, -17.767927169799805, -16.904619216918945, -16.041311264038086, -15.178004264831543, -14.314696311950684, -13.451388359069824, -12.588081359863281, -11.724773406982422, -10.861465454101562, -9.998157501220703, -9.134849548339844, -8.2715425491333, -7.408234596252441, -6.544926643371582, -5.681619167327881, -4.81831169128418, -3.9550037384033203, -3.09169602394104, -2.2283883094787598, -1.3650805950164795, -0.5017728805541992, 0.36153507232666016, 1.2248425483703613, 2.0881500244140625, 2.951457977294922, 3.814765691757202, 4.678073406219482, 5.541380882263184, 6.404688835144043, 7.267996788024902, 8.131303787231445, 8.994611740112305, 9.857919692993164, 10.721227645874023, 11.584535598754883, 12.447842597961426, 13.311150550842285, 14.174458503723145, 15.037765502929688, 15.901073455810547, 16.764381408691406, 17.627689361572266, 18.490997314453125, 19.354305267333984, 20.217613220214844, 21.080921173095703, 21.94422721862793, 22.80753517150879, 23.67084312438965, 24.534151077270508, 25.397459030151367, 26.260766983032227, 27.124073028564453, 27.987380981445312, 28.850688934326172, 29.71399688720703, 30.57730484008789]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 4.0, 6.0, 3.0, 8.0, 5.0, 12.0, 5.0, 8.0, 14.0, 22.0, 18.0, 12.0, 11.0, 30.0, 30.0, 30.0, 29.0, 33.0, 31.0, 36.0, 40.0, 40.0, 43.0, 43.0, 37.0, 41.0, 40.0, 33.0, 33.0, 38.0, 18.0, 37.0, 22.0, 22.0, 22.0, 21.0, 18.0, 17.0, 12.0, 11.0, 15.0, 15.0, 7.0, 10.0, 5.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-10.755313873291016, -10.445636749267578, -10.13595962524414, -9.826282501220703, -9.516605377197266, -9.206928253173828, -8.89725112915039, -8.587574005126953, -8.277896881103516, -7.968219757080078, -7.658542633056641, -7.348865509033203, -7.039188385009766, -6.729511260986328, -6.419834613800049, -6.110157489776611, -5.800480842590332, -5.4908037185668945, -5.181126594543457, -4.8714494705200195, -4.561772346496582, -4.2520952224731445, -3.9424185752868652, -3.6327414512634277, -3.3230643272399902, -3.0133872032165527, -2.7037100791931152, -2.394033193588257, -2.0843560695648193, -1.7746789455413818, -1.4650019407272339, -1.155324935913086, -0.8456487655639648, -0.5359717011451721, -0.2262946367263794, 0.08338242769241333, 0.39305949211120605, 0.7027366161346436, 1.0124136209487915, 1.3220906257629395, 1.631767749786377, 1.9414448738098145, 2.251121997833252, 2.5607988834381104, 2.870476007461548, 3.1801531314849854, 3.4898300170898438, 3.7995071411132812, 4.109184265136719, 4.418861389160156, 4.728538513183594, 5.038215637207031, 5.347892761230469, 5.657569885253906, 5.9672465324401855, 6.276923656463623, 6.5866007804870605, 6.896277904510498, 7.2059550285339355, 7.515632152557373, 7.825308799743652, 8.13498592376709, 8.444663047790527, 8.754340171813965, 9.064017295837402]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 9.0, 6.0, 8.0, 9.0, 11.0, 18.0, 27.0, 47.0, 70.0, 88.0, 118.0, 247.0, 319.0, 512.0, 858.0, 1682.0, 2787.0, 5615.0, 11143.0, 23089.0, 48031.0, 96707.0, 170518.0, 228127.0, 201876.0, 127258.0, 65861.0, 31815.0, 15205.0, 7600.0, 3853.0, 2070.0, 1155.0, 673.0, 388.0, 230.0, 154.0, 101.0, 81.0, 49.0, 46.0, 36.0, 18.0, 17.0, 10.0, 7.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.7265625, -12.312255859375, -11.89794921875, -11.483642578125, -11.0693359375, -10.655029296875, -10.24072265625, -9.826416015625, -9.412109375, -8.997802734375, -8.58349609375, -8.169189453125, -7.7548828125, -7.340576171875, -6.92626953125, -6.511962890625, -6.09765625, -5.683349609375, -5.26904296875, -4.854736328125, -4.4404296875, -4.026123046875, -3.61181640625, -3.197509765625, -2.783203125, -2.368896484375, -1.95458984375, -1.540283203125, -1.1259765625, -0.711669921875, -0.29736328125, 0.116943359375, 0.53125, 0.945556640625, 1.35986328125, 1.774169921875, 2.1884765625, 2.602783203125, 3.01708984375, 3.431396484375, 3.845703125, 4.260009765625, 4.67431640625, 5.088623046875, 5.5029296875, 5.917236328125, 6.33154296875, 6.745849609375, 7.16015625, 7.574462890625, 7.98876953125, 8.403076171875, 8.8173828125, 9.231689453125, 9.64599609375, 10.060302734375, 10.474609375, 10.888916015625, 11.30322265625, 11.717529296875, 12.1318359375, 12.546142578125, 12.96044921875, 13.374755859375, 13.7890625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 6.0, 4.0, 3.0, 10.0, 8.0, 12.0, 10.0, 21.0, 16.0, 13.0, 22.0, 26.0, 37.0, 29.0, 35.0, 41.0, 37.0, 38.0, 32.0, 50.0, 52.0, 48.0, 48.0, 37.0, 41.0, 43.0, 42.0, 30.0, 31.0, 21.0, 21.0, 23.0, 23.0, 18.0, 17.0, 15.0, 9.0, 4.0, 8.0, 2.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.796875, -12.4193115234375, -12.041748046875, -11.6641845703125, -11.28662109375, -10.9090576171875, -10.531494140625, -10.1539306640625, -9.7763671875, -9.3988037109375, -9.021240234375, -8.6436767578125, -8.26611328125, -7.8885498046875, -7.510986328125, -7.1334228515625, -6.755859375, -6.3782958984375, -6.000732421875, -5.6231689453125, -5.24560546875, -4.8680419921875, -4.490478515625, -4.1129150390625, -3.7353515625, -3.3577880859375, -2.980224609375, -2.6026611328125, -2.22509765625, -1.8475341796875, -1.469970703125, -1.0924072265625, -0.71484375, -0.3372802734375, 0.040283203125, 0.4178466796875, 0.79541015625, 1.1729736328125, 1.550537109375, 1.9281005859375, 2.3056640625, 2.6832275390625, 3.060791015625, 3.4383544921875, 3.81591796875, 4.1934814453125, 4.571044921875, 4.9486083984375, 5.326171875, 5.7037353515625, 6.081298828125, 6.4588623046875, 6.83642578125, 7.2139892578125, 7.591552734375, 7.9691162109375, 8.3466796875, 8.7242431640625, 9.101806640625, 9.4793701171875, 9.85693359375, 10.2344970703125, 10.612060546875, 10.9896240234375, 11.3671875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 10.0, 14.0, 11.0, 16.0, 27.0, 45.0, 75.0, 119.0, 224.0, 342.0, 631.0, 1079.0, 1912.0, 3746.0, 7298.0, 15415.0, 33274.0, 72425.0, 150772.0, 256561.0, 243005.0, 137768.0, 65079.0, 30360.0, 13942.0, 6786.0, 3515.0, 1741.0, 970.0, 544.0, 312.0, 201.0, 132.0, 66.0, 41.0, 37.0, 23.0, 12.0, 8.0, 7.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.359375, -15.862548828125, -15.36572265625, -14.868896484375, -14.3720703125, -13.875244140625, -13.37841796875, -12.881591796875, -12.384765625, -11.887939453125, -11.39111328125, -10.894287109375, -10.3974609375, -9.900634765625, -9.40380859375, -8.906982421875, -8.41015625, -7.913330078125, -7.41650390625, -6.919677734375, -6.4228515625, -5.926025390625, -5.42919921875, -4.932373046875, -4.435546875, -3.938720703125, -3.44189453125, -2.945068359375, -2.4482421875, -1.951416015625, -1.45458984375, -0.957763671875, -0.4609375, 0.035888671875, 0.53271484375, 1.029541015625, 1.5263671875, 2.023193359375, 2.52001953125, 3.016845703125, 3.513671875, 4.010498046875, 4.50732421875, 5.004150390625, 5.5009765625, 5.997802734375, 6.49462890625, 6.991455078125, 7.48828125, 7.985107421875, 8.48193359375, 8.978759765625, 9.4755859375, 9.972412109375, 10.46923828125, 10.966064453125, 11.462890625, 11.959716796875, 12.45654296875, 12.953369140625, 13.4501953125, 13.947021484375, 14.44384765625, 14.940673828125, 15.4375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 19.0, 8.0, 13.0, 13.0, 14.0, 19.0, 15.0, 28.0, 28.0, 20.0, 30.0, 39.0, 34.0, 41.0, 41.0, 38.0, 38.0, 35.0, 44.0, 39.0, 44.0, 41.0, 33.0, 36.0, 35.0, 35.0, 27.0, 23.0, 19.0, 21.0, 15.0, 19.0, 13.0, 18.0, 11.0, 12.0, 8.0, 9.0, 6.0, 3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6953125, -5.4979248046875, -5.300537109375, -5.1031494140625, -4.90576171875, -4.7083740234375, -4.510986328125, -4.3135986328125, -4.1162109375, -3.9188232421875, -3.721435546875, -3.5240478515625, -3.32666015625, -3.1292724609375, -2.931884765625, -2.7344970703125, -2.537109375, -2.3397216796875, -2.142333984375, -1.9449462890625, -1.74755859375, -1.5501708984375, -1.352783203125, -1.1553955078125, -0.9580078125, -0.7606201171875, -0.563232421875, -0.3658447265625, -0.16845703125, 0.0289306640625, 0.226318359375, 0.4237060546875, 0.62109375, 0.8184814453125, 1.015869140625, 1.2132568359375, 1.41064453125, 1.6080322265625, 1.805419921875, 2.0028076171875, 2.2001953125, 2.3975830078125, 2.594970703125, 2.7923583984375, 2.98974609375, 3.1871337890625, 3.384521484375, 3.5819091796875, 3.779296875, 3.9766845703125, 4.174072265625, 4.3714599609375, 4.56884765625, 4.7662353515625, 4.963623046875, 5.1610107421875, 5.3583984375, 5.5557861328125, 5.753173828125, 5.9505615234375, 6.14794921875, 6.3453369140625, 6.542724609375, 6.7401123046875, 6.9375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 4.0, 9.0, 9.0, 13.0, 18.0, 27.0, 41.0, 61.0, 91.0, 121.0, 193.0, 263.0, 369.0, 596.0, 832.0, 1158.0, 1761.0, 2609.0, 3890.0, 5881.0, 9023.0, 13436.0, 20784.0, 32354.0, 50246.0, 77524.0, 115310.0, 155103.0, 164577.0, 131786.0, 90966.0, 59402.0, 38364.0, 24656.0, 15910.0, 10437.0, 6907.0, 4517.0, 3028.0, 2004.0, 1347.0, 938.0, 627.0, 411.0, 283.0, 205.0, 148.0, 95.0, 83.0, 59.0, 31.0, 14.0, 16.0, 6.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0], "bins": [-4.796875, -4.64788818359375, -4.4989013671875, -4.34991455078125, -4.200927734375, -4.05194091796875, -3.9029541015625, -3.75396728515625, -3.60498046875, -3.45599365234375, -3.3070068359375, -3.15802001953125, -3.009033203125, -2.86004638671875, -2.7110595703125, -2.56207275390625, -2.4130859375, -2.26409912109375, -2.1151123046875, -1.96612548828125, -1.817138671875, -1.66815185546875, -1.5191650390625, -1.37017822265625, -1.22119140625, -1.07220458984375, -0.9232177734375, -0.77423095703125, -0.625244140625, -0.47625732421875, -0.3272705078125, -0.17828369140625, -0.029296875, 0.11968994140625, 0.2686767578125, 0.41766357421875, 0.566650390625, 0.71563720703125, 0.8646240234375, 1.01361083984375, 1.16259765625, 1.31158447265625, 1.4605712890625, 1.60955810546875, 1.758544921875, 1.90753173828125, 2.0565185546875, 2.20550537109375, 2.3544921875, 2.50347900390625, 2.6524658203125, 2.80145263671875, 2.950439453125, 3.09942626953125, 3.2484130859375, 3.39739990234375, 3.54638671875, 3.69537353515625, 3.8443603515625, 3.99334716796875, 4.142333984375, 4.29132080078125, 4.4403076171875, 4.58929443359375, 4.73828125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 1.0, 4.0, 4.0, 10.0, 10.0, 9.0, 20.0, 26.0, 24.0, 28.0, 24.0, 42.0, 52.0, 61.0, 65.0, 57.0, 62.0, 51.0, 55.0, 71.0, 52.0, 53.0, 41.0, 39.0, 23.0, 19.0, 17.0, 14.0, 16.0, 9.0, 9.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00033473968505859375, -0.00032487884163856506, -0.0003150179982185364, -0.0003051571547985077, -0.000295296311378479, -0.0002854354679584503, -0.00027557462453842163, -0.00026571378111839294, -0.00025585293769836426, -0.00024599209427833557, -0.00023613125085830688, -0.0002262704074382782, -0.0002164095640182495, -0.00020654872059822083, -0.00019668787717819214, -0.00018682703375816345, -0.00017696619033813477, -0.00016710534691810608, -0.0001572445034980774, -0.0001473836600780487, -0.00013752281665802002, -0.00012766197323799133, -0.00011780112981796265, -0.00010794028639793396, -9.807944297790527e-05, -8.821859955787659e-05, -7.83577561378479e-05, -6.849691271781921e-05, -5.863606929779053e-05, -4.877522587776184e-05, -3.8914382457733154e-05, -2.9053539037704468e-05, -1.919269561767578e-05, -9.331852197647095e-06, 5.289912223815918e-07, 1.0389834642410278e-05, 2.0250678062438965e-05, 3.011152148246765e-05, 3.997236490249634e-05, 4.9833208322525024e-05, 5.969405174255371e-05, 6.95548951625824e-05, 7.941573858261108e-05, 8.927658200263977e-05, 9.913742542266846e-05, 0.00010899826884269714, 0.00011885911226272583, 0.00012871995568275452, 0.0001385807991027832, 0.0001484416425228119, 0.00015830248594284058, 0.00016816332936286926, 0.00017802417278289795, 0.00018788501620292664, 0.00019774585962295532, 0.000207606703042984, 0.0002174675464630127, 0.00022732838988304138, 0.00023718923330307007, 0.00024705007672309875, 0.00025691092014312744, 0.00026677176356315613, 0.0002766326069831848, 0.0002864934504032135, 0.0002963542938232422]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 2.0, 8.0, 26.0, 37.0, 48.0, 70.0, 94.0, 124.0, 228.0, 321.0, 447.0, 752.0, 1101.0, 1756.0, 2736.0, 4284.0, 6593.0, 10535.0, 16142.0, 25430.0, 38980.0, 59299.0, 85086.0, 114902.0, 135758.0, 138299.0, 121389.0, 93390.0, 66255.0, 44093.0, 28831.0, 18630.0, 11784.0, 7607.0, 4683.0, 3090.0, 1965.0, 1259.0, 878.0, 517.0, 351.0, 287.0, 157.0, 103.0, 78.0, 50.0, 31.0, 27.0, 15.0, 10.0, 9.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-4.4296875, -4.2918701171875, -4.154052734375, -4.0162353515625, -3.87841796875, -3.7406005859375, -3.602783203125, -3.4649658203125, -3.3271484375, -3.1893310546875, -3.051513671875, -2.9136962890625, -2.77587890625, -2.6380615234375, -2.500244140625, -2.3624267578125, -2.224609375, -2.0867919921875, -1.948974609375, -1.8111572265625, -1.67333984375, -1.5355224609375, -1.397705078125, -1.2598876953125, -1.1220703125, -0.9842529296875, -0.846435546875, -0.7086181640625, -0.57080078125, -0.4329833984375, -0.295166015625, -0.1573486328125, -0.01953125, 0.1182861328125, 0.256103515625, 0.3939208984375, 0.53173828125, 0.6695556640625, 0.807373046875, 0.9451904296875, 1.0830078125, 1.2208251953125, 1.358642578125, 1.4964599609375, 1.63427734375, 1.7720947265625, 1.909912109375, 2.0477294921875, 2.185546875, 2.3233642578125, 2.461181640625, 2.5989990234375, 2.73681640625, 2.8746337890625, 3.012451171875, 3.1502685546875, 3.2880859375, 3.4259033203125, 3.563720703125, 3.7015380859375, 3.83935546875, 3.9771728515625, 4.114990234375, 4.2528076171875, 4.390625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 6.0, 6.0, 7.0, 10.0, 6.0, 12.0, 22.0, 22.0, 22.0, 29.0, 36.0, 32.0, 35.0, 49.0, 41.0, 50.0, 43.0, 59.0, 59.0, 53.0, 61.0, 51.0, 29.0, 43.0, 40.0, 33.0, 33.0, 19.0, 18.0, 17.0, 13.0, 6.0, 11.0, 8.0, 11.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.609375, -1.5604705810546875, -1.511566162109375, -1.4626617431640625, -1.41375732421875, -1.3648529052734375, -1.315948486328125, -1.2670440673828125, -1.2181396484375, -1.1692352294921875, -1.120330810546875, -1.0714263916015625, -1.02252197265625, -0.9736175537109375, -0.924713134765625, -0.8758087158203125, -0.826904296875, -0.7779998779296875, -0.729095458984375, -0.6801910400390625, -0.63128662109375, -0.5823822021484375, -0.533477783203125, -0.4845733642578125, -0.4356689453125, -0.3867645263671875, -0.337860107421875, -0.2889556884765625, -0.24005126953125, -0.1911468505859375, -0.142242431640625, -0.0933380126953125, -0.04443359375, 0.0044708251953125, 0.053375244140625, 0.1022796630859375, 0.15118408203125, 0.2000885009765625, 0.248992919921875, 0.2978973388671875, 0.3468017578125, 0.3957061767578125, 0.444610595703125, 0.4935150146484375, 0.54241943359375, 0.5913238525390625, 0.640228271484375, 0.6891326904296875, 0.738037109375, 0.7869415283203125, 0.835845947265625, 0.8847503662109375, 0.93365478515625, 0.9825592041015625, 1.031463623046875, 1.0803680419921875, 1.1292724609375, 1.1781768798828125, 1.227081298828125, 1.2759857177734375, 1.32489013671875, 1.3737945556640625, 1.422698974609375, 1.4716033935546875, 1.5205078125]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 5.0, 6.0, 17.0, 14.0, 11.0, 14.0, 26.0, 35.0, 38.0, 57.0, 68.0, 66.0, 85.0, 80.0, 68.0, 74.0, 76.0, 61.0, 42.0, 36.0, 27.0, 29.0, 14.0, 20.0, 9.0, 6.0, 5.0, 4.0, 8.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.879331588745117, -22.02912139892578, -21.178913116455078, -20.328702926635742, -19.478492736816406, -18.628284454345703, -17.778074264526367, -16.92786407470703, -16.077655792236328, -15.227446556091309, -14.377236366271973, -13.527027130126953, -12.676817893981934, -11.826608657836914, -10.976398468017578, -10.126189231872559, -9.275979042053223, -8.425769805908203, -7.575560092926025, -6.725350379943848, -5.875141143798828, -5.02493143081665, -4.174721717834473, -3.324512481689453, -2.4743027687072754, -1.6240932941436768, -0.7738837003707886, 0.07632589340209961, 0.9265353679656982, 1.7767448425292969, 2.6269545555114746, 3.477163791656494, 4.327373504638672, 5.17758321762085, 6.027792453765869, 6.878002166748047, 7.728211402893066, 8.578420639038086, 9.428630828857422, 10.278840065002441, 11.129049301147461, 11.97925853729248, 12.829468727111816, 13.679677963256836, 14.529887199401855, 15.380096435546875, 16.23030662536621, 17.080516815185547, 17.93072509765625, 18.780935287475586, 19.63114356994629, 20.481353759765625, 21.33156394958496, 22.181772232055664, 23.031982421875, 23.882190704345703, 24.732402801513672, 25.582612991333008, 26.43282127380371, 27.283031463623047, 28.133241653442383, 28.983449935913086, 29.833660125732422, 30.683868408203125, 31.53407859802246]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 6.0, 2.0, 8.0, 7.0, 3.0, 7.0, 10.0, 12.0, 16.0, 22.0, 15.0, 10.0, 24.0, 21.0, 26.0, 29.0, 33.0, 40.0, 33.0, 33.0, 39.0, 42.0, 37.0, 38.0, 37.0, 47.0, 36.0, 36.0, 32.0, 24.0, 27.0, 31.0, 22.0, 24.0, 24.0, 18.0, 18.0, 18.0, 10.0, 20.0, 8.0, 15.0, 10.0, 5.0, 8.0, 4.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0], "bins": [-10.28503704071045, -9.988395690917969, -9.691754341125488, -9.395112991333008, -9.098471641540527, -8.801830291748047, -8.505188941955566, -8.208547592163086, -7.911906719207764, -7.615265369415283, -7.318624019622803, -7.021982669830322, -6.725341796875, -6.4287004470825195, -6.132059097290039, -5.835417747497559, -5.538776397705078, -5.242135047912598, -4.945493698120117, -4.648852348327637, -4.352210998535156, -4.055569648742676, -3.7589287757873535, -3.462287425994873, -3.1656460762023926, -2.869004726409912, -2.5723633766174316, -2.2757222652435303, -1.9790809154510498, -1.6824395656585693, -1.3857983350753784, -1.0891571044921875, -0.7925148010253906, -0.49587351083755493, -0.19923222064971924, 0.09740906953811646, 0.39405035972595215, 0.6906917095184326, 0.9873329401016235, 1.2839741706848145, 1.580615520477295, 1.8772568702697754, 2.173898220062256, 2.4705393314361572, 2.7671806812286377, 3.063822031021118, 3.3604631423950195, 3.6571044921875, 3.9537458419799805, 4.250387191772461, 4.547028541564941, 4.843669891357422, 5.140311241149902, 5.436952590942383, 5.733593463897705, 6.0302348136901855, 6.326876163482666, 6.6235175132751465, 6.920158863067627, 7.216800212860107, 7.51344108581543, 7.81008243560791, 8.10672378540039, 8.403365135192871, 8.700006484985352]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 5.0, 5.0, 9.0, 15.0, 12.0, 26.0, 34.0, 33.0, 41.0, 81.0, 131.0, 166.0, 236.0, 348.0, 525.0, 904.0, 1701.0, 3280.0, 6861.0, 15148.0, 34465.0, 75735.0, 150797.0, 231406.0, 232204.0, 152055.0, 77147.0, 35027.0, 15627.0, 6860.0, 3429.0, 1682.0, 932.0, 539.0, 354.0, 221.0, 158.0, 105.0, 68.0, 43.0, 36.0, 31.0, 19.0, 11.0, 17.0, 5.0, 11.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-24.234375, -23.477294921875, -22.72021484375, -21.963134765625, -21.2060546875, -20.448974609375, -19.69189453125, -18.934814453125, -18.177734375, -17.420654296875, -16.66357421875, -15.906494140625, -15.1494140625, -14.392333984375, -13.63525390625, -12.878173828125, -12.12109375, -11.364013671875, -10.60693359375, -9.849853515625, -9.0927734375, -8.335693359375, -7.57861328125, -6.821533203125, -6.064453125, -5.307373046875, -4.55029296875, -3.793212890625, -3.0361328125, -2.279052734375, -1.52197265625, -0.764892578125, -0.0078125, 0.749267578125, 1.50634765625, 2.263427734375, 3.0205078125, 3.777587890625, 4.53466796875, 5.291748046875, 6.048828125, 6.805908203125, 7.56298828125, 8.320068359375, 9.0771484375, 9.834228515625, 10.59130859375, 11.348388671875, 12.10546875, 12.862548828125, 13.61962890625, 14.376708984375, 15.1337890625, 15.890869140625, 16.64794921875, 17.405029296875, 18.162109375, 18.919189453125, 19.67626953125, 20.433349609375, 21.1904296875, 21.947509765625, 22.70458984375, 23.461669921875, 24.21875]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 6.0, 11.0, 6.0, 9.0, 17.0, 16.0, 27.0, 30.0, 22.0, 29.0, 45.0, 34.0, 44.0, 45.0, 35.0, 41.0, 36.0, 43.0, 49.0, 42.0, 39.0, 40.0, 39.0, 26.0, 28.0, 31.0, 18.0, 28.0, 21.0, 20.0, 20.0, 13.0, 17.0, 13.0, 8.0, 7.0, 12.0, 3.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.296875, -11.950927734375, -11.60498046875, -11.259033203125, -10.9130859375, -10.567138671875, -10.22119140625, -9.875244140625, -9.529296875, -9.183349609375, -8.83740234375, -8.491455078125, -8.1455078125, -7.799560546875, -7.45361328125, -7.107666015625, -6.76171875, -6.415771484375, -6.06982421875, -5.723876953125, -5.3779296875, -5.031982421875, -4.68603515625, -4.340087890625, -3.994140625, -3.648193359375, -3.30224609375, -2.956298828125, -2.6103515625, -2.264404296875, -1.91845703125, -1.572509765625, -1.2265625, -0.880615234375, -0.53466796875, -0.188720703125, 0.1572265625, 0.503173828125, 0.84912109375, 1.195068359375, 1.541015625, 1.886962890625, 2.23291015625, 2.578857421875, 2.9248046875, 3.270751953125, 3.61669921875, 3.962646484375, 4.30859375, 4.654541015625, 5.00048828125, 5.346435546875, 5.6923828125, 6.038330078125, 6.38427734375, 6.730224609375, 7.076171875, 7.422119140625, 7.76806640625, 8.114013671875, 8.4599609375, 8.805908203125, 9.15185546875, 9.497802734375, 9.84375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 10.0, 11.0, 10.0, 20.0, 38.0, 57.0, 77.0, 126.0, 165.0, 234.0, 432.0, 598.0, 958.0, 1528.0, 2402.0, 3898.0, 6609.0, 10872.0, 18862.0, 31501.0, 50961.0, 79491.0, 114062.0, 143272.0, 154409.0, 137340.0, 104526.0, 71617.0, 45212.0, 27703.0, 16384.0, 9840.0, 5827.0, 3590.0, 2107.0, 1364.0, 831.0, 533.0, 358.0, 261.0, 163.0, 88.0, 73.0, 53.0, 29.0, 17.0, 18.0, 10.0, 6.0, 4.0, 4.0, 4.0, 0.0, 0.0, 2.0], "bins": [-15.4453125, -14.9825439453125, -14.519775390625, -14.0570068359375, -13.59423828125, -13.1314697265625, -12.668701171875, -12.2059326171875, -11.7431640625, -11.2803955078125, -10.817626953125, -10.3548583984375, -9.89208984375, -9.4293212890625, -8.966552734375, -8.5037841796875, -8.041015625, -7.5782470703125, -7.115478515625, -6.6527099609375, -6.18994140625, -5.7271728515625, -5.264404296875, -4.8016357421875, -4.3388671875, -3.8760986328125, -3.413330078125, -2.9505615234375, -2.48779296875, -2.0250244140625, -1.562255859375, -1.0994873046875, -0.63671875, -0.1739501953125, 0.288818359375, 0.7515869140625, 1.21435546875, 1.6771240234375, 2.139892578125, 2.6026611328125, 3.0654296875, 3.5281982421875, 3.990966796875, 4.4537353515625, 4.91650390625, 5.3792724609375, 5.842041015625, 6.3048095703125, 6.767578125, 7.2303466796875, 7.693115234375, 8.1558837890625, 8.61865234375, 9.0814208984375, 9.544189453125, 10.0069580078125, 10.4697265625, 10.9324951171875, 11.395263671875, 11.8580322265625, 12.32080078125, 12.7835693359375, 13.246337890625, 13.7091064453125, 14.171875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 11.0, 7.0, 15.0, 11.0, 4.0, 15.0, 17.0, 18.0, 22.0, 25.0, 26.0, 18.0, 40.0, 31.0, 30.0, 30.0, 31.0, 32.0, 44.0, 41.0, 33.0, 29.0, 53.0, 35.0, 40.0, 27.0, 39.0, 43.0, 33.0, 33.0, 23.0, 27.0, 24.0, 19.0, 7.0, 12.0, 11.0, 7.0, 6.0, 13.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-6.41015625, -6.21337890625, -6.0166015625, -5.81982421875, -5.623046875, -5.42626953125, -5.2294921875, -5.03271484375, -4.8359375, -4.63916015625, -4.4423828125, -4.24560546875, -4.048828125, -3.85205078125, -3.6552734375, -3.45849609375, -3.26171875, -3.06494140625, -2.8681640625, -2.67138671875, -2.474609375, -2.27783203125, -2.0810546875, -1.88427734375, -1.6875, -1.49072265625, -1.2939453125, -1.09716796875, -0.900390625, -0.70361328125, -0.5068359375, -0.31005859375, -0.11328125, 0.08349609375, 0.2802734375, 0.47705078125, 0.673828125, 0.87060546875, 1.0673828125, 1.26416015625, 1.4609375, 1.65771484375, 1.8544921875, 2.05126953125, 2.248046875, 2.44482421875, 2.6416015625, 2.83837890625, 3.03515625, 3.23193359375, 3.4287109375, 3.62548828125, 3.822265625, 4.01904296875, 4.2158203125, 4.41259765625, 4.609375, 4.80615234375, 5.0029296875, 5.19970703125, 5.396484375, 5.59326171875, 5.7900390625, 5.98681640625, 6.18359375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 6.0, 7.0, 20.0, 28.0, 34.0, 35.0, 67.0, 91.0, 141.0, 166.0, 235.0, 313.0, 482.0, 715.0, 1040.0, 1544.0, 2416.0, 3725.0, 6363.0, 11653.0, 22204.0, 43493.0, 89521.0, 177935.0, 260854.0, 206159.0, 107882.0, 52146.0, 25618.0, 13772.0, 7535.0, 4327.0, 2605.0, 1677.0, 1171.0, 743.0, 523.0, 365.0, 310.0, 189.0, 148.0, 94.0, 57.0, 44.0, 25.0, 20.0, 14.0, 17.0, 12.0, 4.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-12.2421875, -11.8551025390625, -11.468017578125, -11.0809326171875, -10.69384765625, -10.3067626953125, -9.919677734375, -9.5325927734375, -9.1455078125, -8.7584228515625, -8.371337890625, -7.9842529296875, -7.59716796875, -7.2100830078125, -6.822998046875, -6.4359130859375, -6.048828125, -5.6617431640625, -5.274658203125, -4.8875732421875, -4.50048828125, -4.1134033203125, -3.726318359375, -3.3392333984375, -2.9521484375, -2.5650634765625, -2.177978515625, -1.7908935546875, -1.40380859375, -1.0167236328125, -0.629638671875, -0.2425537109375, 0.14453125, 0.5316162109375, 0.918701171875, 1.3057861328125, 1.69287109375, 2.0799560546875, 2.467041015625, 2.8541259765625, 3.2412109375, 3.6282958984375, 4.015380859375, 4.4024658203125, 4.78955078125, 5.1766357421875, 5.563720703125, 5.9508056640625, 6.337890625, 6.7249755859375, 7.112060546875, 7.4991455078125, 7.88623046875, 8.2733154296875, 8.660400390625, 9.0474853515625, 9.4345703125, 9.8216552734375, 10.208740234375, 10.5958251953125, 10.98291015625, 11.3699951171875, 11.757080078125, 12.1441650390625, 12.53125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 8.0, 6.0, 9.0, 16.0, 14.0, 18.0, 22.0, 44.0, 32.0, 79.0, 83.0, 116.0, 128.0, 93.0, 89.0, 78.0, 38.0, 37.0, 17.0, 19.0, 13.0, 6.0, 11.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017423629760742188, -0.001691579818725586, -0.0016407966613769531, -0.0015900135040283203, -0.0015392303466796875, -0.0014884471893310547, -0.0014376640319824219, -0.001386880874633789, -0.0013360977172851562, -0.0012853145599365234, -0.0012345314025878906, -0.0011837482452392578, -0.001132965087890625, -0.0010821819305419922, -0.0010313987731933594, -0.0009806156158447266, -0.0009298324584960938, -0.0008790493011474609, -0.0008282661437988281, -0.0007774829864501953, -0.0007266998291015625, -0.0006759166717529297, -0.0006251335144042969, -0.0005743503570556641, -0.0005235671997070312, -0.00047278404235839844, -0.0004220008850097656, -0.0003712177276611328, -0.0003204345703125, -0.0002696514129638672, -0.00021886825561523438, -0.00016808509826660156, -0.00011730194091796875, -6.651878356933594e-05, -1.5735626220703125e-05, 3.504753112792969e-05, 8.58306884765625e-05, 0.0001366138458251953, 0.00018739700317382812, 0.00023818016052246094, 0.00028896331787109375, 0.00033974647521972656, 0.0003905296325683594, 0.0004413127899169922, 0.000492095947265625, 0.0005428791046142578, 0.0005936622619628906, 0.0006444454193115234, 0.0006952285766601562, 0.0007460117340087891, 0.0007967948913574219, 0.0008475780487060547, 0.0008983612060546875, 0.0009491443634033203, 0.0009999275207519531, 0.001050710678100586, 0.0011014938354492188, 0.0011522769927978516, 0.0012030601501464844, 0.0012538433074951172, 0.00130462646484375, 0.0013554096221923828, 0.0014061927795410156, 0.0014569759368896484, 0.0015077590942382812]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 4.0, 11.0, 1.0, 7.0, 12.0, 14.0, 34.0, 60.0, 48.0, 72.0, 116.0, 166.0, 235.0, 304.0, 442.0, 660.0, 972.0, 1549.0, 2572.0, 4522.0, 8827.0, 19355.0, 45028.0, 111724.0, 243822.0, 301712.0, 174452.0, 72739.0, 30012.0, 13330.0, 6479.0, 3387.0, 1984.0, 1280.0, 832.0, 528.0, 352.0, 247.0, 195.0, 131.0, 102.0, 66.0, 50.0, 38.0, 31.0, 19.0, 14.0, 6.0, 6.0, 5.0, 2.0, 5.0, 0.0, 0.0, 2.0], "bins": [-15.2578125, -14.8125, -14.3671875, -13.921875, -13.4765625, -13.03125, -12.5859375, -12.140625, -11.6953125, -11.25, -10.8046875, -10.359375, -9.9140625, -9.46875, -9.0234375, -8.578125, -8.1328125, -7.6875, -7.2421875, -6.796875, -6.3515625, -5.90625, -5.4609375, -5.015625, -4.5703125, -4.125, -3.6796875, -3.234375, -2.7890625, -2.34375, -1.8984375, -1.453125, -1.0078125, -0.5625, -0.1171875, 0.328125, 0.7734375, 1.21875, 1.6640625, 2.109375, 2.5546875, 3.0, 3.4453125, 3.890625, 4.3359375, 4.78125, 5.2265625, 5.671875, 6.1171875, 6.5625, 7.0078125, 7.453125, 7.8984375, 8.34375, 8.7890625, 9.234375, 9.6796875, 10.125, 10.5703125, 11.015625, 11.4609375, 11.90625, 12.3515625, 12.796875, 13.2421875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 3.0, 4.0, 9.0, 13.0, 6.0, 15.0, 17.0, 19.0, 24.0, 36.0, 39.0, 52.0, 48.0, 58.0, 61.0, 59.0, 57.0, 74.0, 60.0, 56.0, 57.0, 41.0, 33.0, 32.0, 21.0, 14.0, 16.0, 11.0, 10.0, 8.0, 7.0, 8.0, 7.0, 7.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.125, -3.034820556640625, -2.94464111328125, -2.854461669921875, -2.7642822265625, -2.674102783203125, -2.58392333984375, -2.493743896484375, -2.403564453125, -2.313385009765625, -2.22320556640625, -2.133026123046875, -2.0428466796875, -1.952667236328125, -1.86248779296875, -1.772308349609375, -1.68212890625, -1.591949462890625, -1.50177001953125, -1.411590576171875, -1.3214111328125, -1.231231689453125, -1.14105224609375, -1.050872802734375, -0.960693359375, -0.870513916015625, -0.78033447265625, -0.690155029296875, -0.5999755859375, -0.509796142578125, -0.41961669921875, -0.329437255859375, -0.2392578125, -0.149078369140625, -0.05889892578125, 0.031280517578125, 0.1214599609375, 0.211639404296875, 0.30181884765625, 0.391998291015625, 0.482177734375, 0.572357177734375, 0.66253662109375, 0.752716064453125, 0.8428955078125, 0.933074951171875, 1.02325439453125, 1.113433837890625, 1.20361328125, 1.293792724609375, 1.38397216796875, 1.474151611328125, 1.5643310546875, 1.654510498046875, 1.74468994140625, 1.834869384765625, 1.925048828125, 2.015228271484375, 2.10540771484375, 2.195587158203125, 2.2857666015625, 2.375946044921875, 2.46612548828125, 2.556304931640625, 2.646484375]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 1.0, 9.0, 5.0, 11.0, 15.0, 10.0, 15.0, 26.0, 32.0, 36.0, 40.0, 36.0, 49.0, 49.0, 66.0, 61.0, 60.0, 80.0, 77.0, 49.0, 42.0, 37.0, 41.0, 27.0, 26.0, 23.0, 25.0, 18.0, 11.0, 6.0, 10.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.293867111206055, -18.58577537536621, -17.877683639526367, -17.169593811035156, -16.461502075195312, -15.753410339355469, -15.045318603515625, -14.337226867675781, -13.629136085510254, -12.92104434967041, -12.212953567504883, -11.504861831665039, -10.796770095825195, -10.088679313659668, -9.380587577819824, -8.672496795654297, -7.964405059814453, -7.256313800811768, -6.548222541809082, -5.840130805969238, -5.132039546966553, -4.423948287963867, -3.7158565521240234, -3.007765293121338, -2.2996740341186523, -1.5915826559066772, -0.8834912776947021, -0.1753997802734375, 0.532691478729248, 1.2407827377319336, 1.9488744735717773, 2.656965732574463, 3.3650550842285156, 4.073146343231201, 4.781237602233887, 5.4893293380737305, 6.197420597076416, 6.905511856079102, 7.613603591918945, 8.321695327758789, 9.029786109924316, 9.73787784576416, 10.445968627929688, 11.154060363769531, 11.862152099609375, 12.570242881774902, 13.278334617614746, 13.986425399780273, 14.694517135620117, 15.402608871459961, 16.110700607299805, 16.818790435791016, 17.52688217163086, 18.234973907470703, 18.943065643310547, 19.65115737915039, 20.359249114990234, 21.067340850830078, 21.775432586669922, 22.483524322509766, 23.191614151000977, 23.89970588684082, 24.607797622680664, 25.315889358520508, 26.02397918701172]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 5.0, 6.0, 7.0, 10.0, 5.0, 4.0, 14.0, 10.0, 15.0, 24.0, 22.0, 24.0, 27.0, 19.0, 40.0, 33.0, 36.0, 33.0, 46.0, 37.0, 46.0, 28.0, 35.0, 56.0, 53.0, 43.0, 42.0, 36.0, 31.0, 29.0, 21.0, 26.0, 22.0, 26.0, 14.0, 19.0, 13.0, 9.0, 7.0, 4.0, 8.0, 5.0, 4.0, 8.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.718064308166504, -9.37883186340332, -9.03959846496582, -8.700366020202637, -8.361133575439453, -8.02190113067627, -7.682668209075928, -7.343435287475586, -7.004202842712402, -6.664970397949219, -6.325737476348877, -5.986504554748535, -5.647272109985352, -5.308039665222168, -4.968806743621826, -4.629573822021484, -4.290341377258301, -3.951108694076538, -3.6118760108947754, -3.2726433277130127, -2.93341064453125, -2.5941779613494873, -2.2549452781677246, -1.915712594985962, -1.5764799118041992, -1.2372472286224365, -0.8980145454406738, -0.5587818622589111, -0.21954917907714844, 0.11968350410461426, 0.45891618728637695, 0.7981488704681396, 1.1373815536499023, 1.476614236831665, 1.8158469200134277, 2.1550796031951904, 2.494312286376953, 2.833544969558716, 3.1727776527404785, 3.512010335922241, 3.851243019104004, 4.1904754638671875, 4.529708385467529, 4.868941307067871, 5.208173751831055, 5.547406196594238, 5.88663911819458, 6.225872039794922, 6.5651044845581055, 6.904336929321289, 7.243569850921631, 7.582802772521973, 7.922035217285156, 8.26126766204834, 8.600500106811523, 8.939733505249023, 9.278965950012207, 9.61819839477539, 9.95743179321289, 10.296664237976074, 10.635896682739258, 10.975129127502441, 11.314361572265625, 11.653594970703125, 11.992827415466309]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 1.0, 9.0, 10.0, 16.0, 24.0, 27.0, 33.0, 51.0, 66.0, 112.0, 146.0, 217.0, 344.0, 482.0, 836.0, 1163.0, 1852.0, 3073.0, 5224.0, 8874.0, 16601.0, 31389.0, 62480.0, 130923.0, 286982.0, 622053.0, 1053119.0, 970843.0, 528769.0, 242456.0, 110747.0, 53930.0, 27261.0, 14248.0, 8149.0, 4549.0, 2568.0, 1665.0, 1001.0, 665.0, 426.0, 264.0, 215.0, 122.0, 83.0, 70.0, 34.0, 36.0, 24.0, 18.0, 16.0, 9.0, 2.0, 1.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-19.6875, -19.02880859375, -18.3701171875, -17.71142578125, -17.052734375, -16.39404296875, -15.7353515625, -15.07666015625, -14.41796875, -13.75927734375, -13.1005859375, -12.44189453125, -11.783203125, -11.12451171875, -10.4658203125, -9.80712890625, -9.1484375, -8.48974609375, -7.8310546875, -7.17236328125, -6.513671875, -5.85498046875, -5.1962890625, -4.53759765625, -3.87890625, -3.22021484375, -2.5615234375, -1.90283203125, -1.244140625, -0.58544921875, 0.0732421875, 0.73193359375, 1.390625, 2.04931640625, 2.7080078125, 3.36669921875, 4.025390625, 4.68408203125, 5.3427734375, 6.00146484375, 6.66015625, 7.31884765625, 7.9775390625, 8.63623046875, 9.294921875, 9.95361328125, 10.6123046875, 11.27099609375, 11.9296875, 12.58837890625, 13.2470703125, 13.90576171875, 14.564453125, 15.22314453125, 15.8818359375, 16.54052734375, 17.19921875, 17.85791015625, 18.5166015625, 19.17529296875, 19.833984375, 20.49267578125, 21.1513671875, 21.81005859375, 22.46875]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 3.0, 8.0, 9.0, 12.0, 10.0, 15.0, 17.0, 21.0, 27.0, 31.0, 32.0, 30.0, 33.0, 38.0, 39.0, 48.0, 50.0, 48.0, 53.0, 49.0, 49.0, 39.0, 38.0, 50.0, 33.0, 29.0, 26.0, 32.0, 22.0, 15.0, 9.0, 14.0, 12.0, 10.0, 14.0, 6.0, 7.0, 5.0, 9.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3359375, -9.0272216796875, -8.718505859375, -8.4097900390625, -8.10107421875, -7.7923583984375, -7.483642578125, -7.1749267578125, -6.8662109375, -6.5574951171875, -6.248779296875, -5.9400634765625, -5.63134765625, -5.3226318359375, -5.013916015625, -4.7052001953125, -4.396484375, -4.0877685546875, -3.779052734375, -3.4703369140625, -3.16162109375, -2.8529052734375, -2.544189453125, -2.2354736328125, -1.9267578125, -1.6180419921875, -1.309326171875, -1.0006103515625, -0.69189453125, -0.3831787109375, -0.074462890625, 0.2342529296875, 0.54296875, 0.8516845703125, 1.160400390625, 1.4691162109375, 1.77783203125, 2.0865478515625, 2.395263671875, 2.7039794921875, 3.0126953125, 3.3214111328125, 3.630126953125, 3.9388427734375, 4.24755859375, 4.5562744140625, 4.864990234375, 5.1737060546875, 5.482421875, 5.7911376953125, 6.099853515625, 6.4085693359375, 6.71728515625, 7.0260009765625, 7.334716796875, 7.6434326171875, 7.9521484375, 8.2608642578125, 8.569580078125, 8.8782958984375, 9.18701171875, 9.4957275390625, 9.804443359375, 10.1131591796875, 10.421875]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 7.0, 6.0, 9.0, 12.0, 6.0, 19.0, 21.0, 40.0, 60.0, 60.0, 90.0, 146.0, 221.0, 348.0, 536.0, 879.0, 1406.0, 2259.0, 3802.0, 6575.0, 11286.0, 19651.0, 34508.0, 62868.0, 114539.0, 212807.0, 382621.0, 634483.0, 841551.0, 752811.0, 490491.0, 277905.0, 152857.0, 83064.0, 45143.0, 25451.0, 14633.0, 8431.0, 4835.0, 2924.0, 1811.0, 1130.0, 678.0, 449.0, 303.0, 192.0, 119.0, 95.0, 44.0, 38.0, 22.0, 12.0, 13.0, 11.0, 10.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-19.25, -18.643310546875, -18.03662109375, -17.429931640625, -16.8232421875, -16.216552734375, -15.60986328125, -15.003173828125, -14.396484375, -13.789794921875, -13.18310546875, -12.576416015625, -11.9697265625, -11.363037109375, -10.75634765625, -10.149658203125, -9.54296875, -8.936279296875, -8.32958984375, -7.722900390625, -7.1162109375, -6.509521484375, -5.90283203125, -5.296142578125, -4.689453125, -4.082763671875, -3.47607421875, -2.869384765625, -2.2626953125, -1.656005859375, -1.04931640625, -0.442626953125, 0.1640625, 0.770751953125, 1.37744140625, 1.984130859375, 2.5908203125, 3.197509765625, 3.80419921875, 4.410888671875, 5.017578125, 5.624267578125, 6.23095703125, 6.837646484375, 7.4443359375, 8.051025390625, 8.65771484375, 9.264404296875, 9.87109375, 10.477783203125, 11.08447265625, 11.691162109375, 12.2978515625, 12.904541015625, 13.51123046875, 14.117919921875, 14.724609375, 15.331298828125, 15.93798828125, 16.544677734375, 17.1513671875, 17.758056640625, 18.36474609375, 18.971435546875, 19.578125]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 9.0, 13.0, 13.0, 30.0, 22.0, 38.0, 32.0, 52.0, 84.0, 91.0, 119.0, 143.0, 188.0, 235.0, 248.0, 301.0, 269.0, 302.0, 320.0, 264.0, 262.0, 228.0, 177.0, 122.0, 112.0, 116.0, 67.0, 69.0, 30.0, 27.0, 26.0, 21.0, 9.0, 10.0, 8.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.0078125, -7.7862548828125, -7.564697265625, -7.3431396484375, -7.12158203125, -6.9000244140625, -6.678466796875, -6.4569091796875, -6.2353515625, -6.0137939453125, -5.792236328125, -5.5706787109375, -5.34912109375, -5.1275634765625, -4.906005859375, -4.6844482421875, -4.462890625, -4.2413330078125, -4.019775390625, -3.7982177734375, -3.57666015625, -3.3551025390625, -3.133544921875, -2.9119873046875, -2.6904296875, -2.4688720703125, -2.247314453125, -2.0257568359375, -1.80419921875, -1.5826416015625, -1.361083984375, -1.1395263671875, -0.91796875, -0.6964111328125, -0.474853515625, -0.2532958984375, -0.03173828125, 0.1898193359375, 0.411376953125, 0.6329345703125, 0.8544921875, 1.0760498046875, 1.297607421875, 1.5191650390625, 1.74072265625, 1.9622802734375, 2.183837890625, 2.4053955078125, 2.626953125, 2.8485107421875, 3.070068359375, 3.2916259765625, 3.51318359375, 3.7347412109375, 3.956298828125, 4.1778564453125, 4.3994140625, 4.6209716796875, 4.842529296875, 5.0640869140625, 5.28564453125, 5.5072021484375, 5.728759765625, 5.9503173828125, 6.171875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 11.0, 12.0, 9.0, 19.0, 14.0, 17.0, 20.0, 28.0, 18.0, 40.0, 44.0, 51.0, 55.0, 43.0, 46.0, 55.0, 47.0, 56.0, 52.0, 52.0, 48.0, 44.0, 41.0, 24.0, 21.0, 21.0, 25.0, 16.0, 13.0, 8.0, 6.0, 9.0, 4.0, 11.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.998210906982422, -16.371292114257812, -15.744372367858887, -15.117452621459961, -14.490533828735352, -13.863615036010742, -13.236695289611816, -12.60977554321289, -11.982856750488281, -11.355937957763672, -10.729018211364746, -10.10209846496582, -9.475179672241211, -8.848260879516602, -8.221341133117676, -7.594421863555908, -6.967502593994141, -6.340583324432373, -5.7136640548706055, -5.086744785308838, -4.45982551574707, -3.8329062461853027, -3.205986976623535, -2.5790677070617676, -1.9521484375, -1.3252291679382324, -0.6983098983764648, -0.07139062881469727, 0.5555286407470703, 1.182447910308838, 1.8093671798706055, 2.436286449432373, 3.063203811645508, 3.6901230812072754, 4.317042350769043, 4.9439616203308105, 5.570880889892578, 6.197800159454346, 6.824719429016113, 7.451638698577881, 8.078557968139648, 8.705476760864258, 9.332396507263184, 9.95931625366211, 10.586235046386719, 11.213153839111328, 11.840073585510254, 12.46699333190918, 13.093912124633789, 13.720830917358398, 14.347750663757324, 14.97467041015625, 15.60158920288086, 16.22850799560547, 16.855426788330078, 17.48234748840332, 18.10926628112793, 18.73618507385254, 19.36310577392578, 19.99002456665039, 20.616943359375, 21.24386215209961, 21.87078094482422, 22.49770164489746, 23.12462043762207]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 5.0, 6.0, 11.0, 12.0, 11.0, 20.0, 13.0, 16.0, 24.0, 25.0, 20.0, 33.0, 33.0, 46.0, 42.0, 34.0, 42.0, 35.0, 48.0, 45.0, 41.0, 38.0, 36.0, 34.0, 37.0, 38.0, 32.0, 35.0, 24.0, 27.0, 26.0, 17.0, 15.0, 12.0, 15.0, 7.0, 11.0, 10.0, 3.0, 2.0, 4.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6232271194458, -12.234650611877441, -11.846074104309082, -11.457497596740723, -11.06892204284668, -10.68034553527832, -10.291769027709961, -9.903192520141602, -9.514616012573242, -9.126039505004883, -8.737462997436523, -8.348886489868164, -7.960310459136963, -7.5717339515686035, -7.183157920837402, -6.794581413269043, -6.406004905700684, -6.017428398132324, -5.628851890563965, -5.240275859832764, -4.851699352264404, -4.463122844696045, -4.074546813964844, -3.6859703063964844, -3.297393798828125, -2.9088172912597656, -2.5202410221099854, -2.131664752960205, -1.7430882453918457, -1.3545118570327759, -0.965935468673706, -0.5773591995239258, -0.1887836456298828, 0.199792742729187, 0.5883691310882568, 0.9769455194473267, 1.3655219078063965, 1.7540982961654663, 2.142674684524536, 2.5312509536743164, 2.919827461242676, 3.308403968811035, 3.6969802379608154, 4.085556507110596, 4.474133014678955, 4.8627095222473145, 5.251285552978516, 5.639862060546875, 6.028438568115234, 6.417015075683594, 6.805591583251953, 7.194167613983154, 7.582744121551514, 7.971320629119873, 8.359896659851074, 8.748473167419434, 9.137049674987793, 9.525626182556152, 9.914202690124512, 10.302779197692871, 10.691354751586914, 11.079931259155273, 11.468507766723633, 11.857084274291992, 12.245660781860352]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 9.0, 12.0, 8.0, 18.0, 44.0, 44.0, 67.0, 84.0, 148.0, 202.0, 306.0, 535.0, 818.0, 1342.0, 2163.0, 3814.0, 6910.0, 13635.0, 30306.0, 76403.0, 188641.0, 310426.0, 234222.0, 101651.0, 40063.0, 17178.0, 8418.0, 4409.0, 2652.0, 1519.0, 870.0, 528.0, 372.0, 237.0, 145.0, 119.0, 66.0, 38.0, 41.0, 27.0, 15.0, 20.0, 5.0, 14.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.515625, -21.729736328125, -20.94384765625, -20.157958984375, -19.3720703125, -18.586181640625, -17.80029296875, -17.014404296875, -16.228515625, -15.442626953125, -14.65673828125, -13.870849609375, -13.0849609375, -12.299072265625, -11.51318359375, -10.727294921875, -9.94140625, -9.155517578125, -8.36962890625, -7.583740234375, -6.7978515625, -6.011962890625, -5.22607421875, -4.440185546875, -3.654296875, -2.868408203125, -2.08251953125, -1.296630859375, -0.5107421875, 0.275146484375, 1.06103515625, 1.846923828125, 2.6328125, 3.418701171875, 4.20458984375, 4.990478515625, 5.7763671875, 6.562255859375, 7.34814453125, 8.134033203125, 8.919921875, 9.705810546875, 10.49169921875, 11.277587890625, 12.0634765625, 12.849365234375, 13.63525390625, 14.421142578125, 15.20703125, 15.992919921875, 16.77880859375, 17.564697265625, 18.3505859375, 19.136474609375, 19.92236328125, 20.708251953125, 21.494140625, 22.280029296875, 23.06591796875, 23.851806640625, 24.6376953125, 25.423583984375, 26.20947265625, 26.995361328125, 27.78125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 4.0, 4.0, 6.0, 10.0, 4.0, 13.0, 19.0, 13.0, 21.0, 16.0, 24.0, 23.0, 32.0, 37.0, 33.0, 38.0, 41.0, 44.0, 40.0, 41.0, 32.0, 43.0, 44.0, 42.0, 36.0, 41.0, 39.0, 32.0, 27.0, 25.0, 26.0, 26.0, 23.0, 16.0, 15.0, 10.0, 10.0, 12.0, 11.0, 6.0, 5.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0], "bins": [-14.453125, -14.03759765625, -13.6220703125, -13.20654296875, -12.791015625, -12.37548828125, -11.9599609375, -11.54443359375, -11.12890625, -10.71337890625, -10.2978515625, -9.88232421875, -9.466796875, -9.05126953125, -8.6357421875, -8.22021484375, -7.8046875, -7.38916015625, -6.9736328125, -6.55810546875, -6.142578125, -5.72705078125, -5.3115234375, -4.89599609375, -4.48046875, -4.06494140625, -3.6494140625, -3.23388671875, -2.818359375, -2.40283203125, -1.9873046875, -1.57177734375, -1.15625, -0.74072265625, -0.3251953125, 0.09033203125, 0.505859375, 0.92138671875, 1.3369140625, 1.75244140625, 2.16796875, 2.58349609375, 2.9990234375, 3.41455078125, 3.830078125, 4.24560546875, 4.6611328125, 5.07666015625, 5.4921875, 5.90771484375, 6.3232421875, 6.73876953125, 7.154296875, 7.56982421875, 7.9853515625, 8.40087890625, 8.81640625, 9.23193359375, 9.6474609375, 10.06298828125, 10.478515625, 10.89404296875, 11.3095703125, 11.72509765625, 12.140625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 9.0, 9.0, 7.0, 16.0, 18.0, 27.0, 32.0, 54.0, 59.0, 93.0, 116.0, 157.0, 226.0, 333.0, 422.0, 630.0, 928.0, 1436.0, 2473.0, 4365.0, 8644.0, 20467.0, 61866.0, 232867.0, 451484.0, 178812.0, 48238.0, 16795.0, 7581.0, 3820.0, 2255.0, 1423.0, 868.0, 590.0, 416.0, 284.0, 218.0, 125.0, 91.0, 88.0, 50.0, 49.0, 39.0, 24.0, 15.0, 12.0, 7.0, 3.0, 5.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.40625, -36.21484375, -35.0234375, -33.83203125, -32.640625, -31.44921875, -30.2578125, -29.06640625, -27.875, -26.68359375, -25.4921875, -24.30078125, -23.109375, -21.91796875, -20.7265625, -19.53515625, -18.34375, -17.15234375, -15.9609375, -14.76953125, -13.578125, -12.38671875, -11.1953125, -10.00390625, -8.8125, -7.62109375, -6.4296875, -5.23828125, -4.046875, -2.85546875, -1.6640625, -0.47265625, 0.71875, 1.91015625, 3.1015625, 4.29296875, 5.484375, 6.67578125, 7.8671875, 9.05859375, 10.25, 11.44140625, 12.6328125, 13.82421875, 15.015625, 16.20703125, 17.3984375, 18.58984375, 19.78125, 20.97265625, 22.1640625, 23.35546875, 24.546875, 25.73828125, 26.9296875, 28.12109375, 29.3125, 30.50390625, 31.6953125, 32.88671875, 34.078125, 35.26953125, 36.4609375, 37.65234375, 38.84375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 1.0, 5.0, 6.0, 9.0, 6.0, 14.0, 12.0, 16.0, 19.0, 19.0, 20.0, 23.0, 35.0, 26.0, 26.0, 40.0, 28.0, 38.0, 38.0, 45.0, 35.0, 47.0, 27.0, 44.0, 41.0, 38.0, 35.0, 35.0, 36.0, 30.0, 31.0, 25.0, 21.0, 17.0, 17.0, 15.0, 8.0, 14.0, 8.0, 5.0, 12.0, 9.0, 4.0, 3.0, 3.0, 4.0, 4.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0], "bins": [-7.62890625, -7.397216796875, -7.16552734375, -6.933837890625, -6.7021484375, -6.470458984375, -6.23876953125, -6.007080078125, -5.775390625, -5.543701171875, -5.31201171875, -5.080322265625, -4.8486328125, -4.616943359375, -4.38525390625, -4.153564453125, -3.921875, -3.690185546875, -3.45849609375, -3.226806640625, -2.9951171875, -2.763427734375, -2.53173828125, -2.300048828125, -2.068359375, -1.836669921875, -1.60498046875, -1.373291015625, -1.1416015625, -0.909912109375, -0.67822265625, -0.446533203125, -0.21484375, 0.016845703125, 0.24853515625, 0.480224609375, 0.7119140625, 0.943603515625, 1.17529296875, 1.406982421875, 1.638671875, 1.870361328125, 2.10205078125, 2.333740234375, 2.5654296875, 2.797119140625, 3.02880859375, 3.260498046875, 3.4921875, 3.723876953125, 3.95556640625, 4.187255859375, 4.4189453125, 4.650634765625, 4.88232421875, 5.114013671875, 5.345703125, 5.577392578125, 5.80908203125, 6.040771484375, 6.2724609375, 6.504150390625, 6.73583984375, 6.967529296875, 7.19921875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 7.0, 12.0, 10.0, 14.0, 21.0, 34.0, 51.0, 59.0, 84.0, 126.0, 180.0, 292.0, 399.0, 584.0, 853.0, 1227.0, 1850.0, 2689.0, 4400.0, 7232.0, 13801.0, 31358.0, 92852.0, 299693.0, 377313.0, 131713.0, 41387.0, 16993.0, 8624.0, 5015.0, 3120.0, 2081.0, 1416.0, 952.0, 625.0, 476.0, 321.0, 209.0, 147.0, 114.0, 81.0, 47.0, 31.0, 20.0, 8.0, 16.0, 10.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-17.0, -16.487060546875, -15.97412109375, -15.461181640625, -14.9482421875, -14.435302734375, -13.92236328125, -13.409423828125, -12.896484375, -12.383544921875, -11.87060546875, -11.357666015625, -10.8447265625, -10.331787109375, -9.81884765625, -9.305908203125, -8.79296875, -8.280029296875, -7.76708984375, -7.254150390625, -6.7412109375, -6.228271484375, -5.71533203125, -5.202392578125, -4.689453125, -4.176513671875, -3.66357421875, -3.150634765625, -2.6376953125, -2.124755859375, -1.61181640625, -1.098876953125, -0.5859375, -0.072998046875, 0.43994140625, 0.952880859375, 1.4658203125, 1.978759765625, 2.49169921875, 3.004638671875, 3.517578125, 4.030517578125, 4.54345703125, 5.056396484375, 5.5693359375, 6.082275390625, 6.59521484375, 7.108154296875, 7.62109375, 8.134033203125, 8.64697265625, 9.159912109375, 9.6728515625, 10.185791015625, 10.69873046875, 11.211669921875, 11.724609375, 12.237548828125, 12.75048828125, 13.263427734375, 13.7763671875, 14.289306640625, 14.80224609375, 15.315185546875, 15.828125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 7.0, 3.0, 2.0, 12.0, 13.0, 18.0, 26.0, 55.0, 76.0, 122.0, 143.0, 142.0, 120.0, 82.0, 55.0, 30.0, 19.0, 16.0, 9.0, 12.0, 3.0, 2.0, 2.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0008711814880371094, -0.0008402243256568909, -0.0008092671632766724, -0.0007783100008964539, -0.0007473528385162354, -0.0007163956761360168, -0.0006854385137557983, -0.0006544813513755798, -0.0006235241889953613, -0.0005925670266151428, -0.0005616098642349243, -0.0005306527018547058, -0.0004996955394744873, -0.0004687383770942688, -0.0004377812147140503, -0.0004068240523338318, -0.0003758668899536133, -0.0003449097275733948, -0.00031395256519317627, -0.00028299540281295776, -0.00025203824043273926, -0.00022108107805252075, -0.00019012391567230225, -0.00015916675329208374, -0.00012820959091186523, -9.725242853164673e-05, -6.629526615142822e-05, -3.533810377120972e-05, -4.380941390991211e-06, 2.6576220989227295e-05, 5.75333833694458e-05, 8.84905457496643e-05, 0.00011944770812988281, 0.00015040487051010132, 0.00018136203289031982, 0.00021231919527053833, 0.00024327635765075684, 0.00027423352003097534, 0.00030519068241119385, 0.00033614784479141235, 0.00036710500717163086, 0.00039806216955184937, 0.00042901933193206787, 0.0004599764943122864, 0.0004909336566925049, 0.0005218908190727234, 0.0005528479814529419, 0.0005838051438331604, 0.0006147623062133789, 0.0006457194685935974, 0.0006766766309738159, 0.0007076337933540344, 0.0007385909557342529, 0.0007695481181144714, 0.0008005052804946899, 0.0008314624428749084, 0.000862419605255127, 0.0008933767676353455, 0.000924333930015564, 0.0009552910923957825, 0.000986248254776001, 0.0010172054171562195, 0.001048162579536438, 0.0010791197419166565, 0.001110076904296875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 4.0, 8.0, 8.0, 9.0, 15.0, 15.0, 31.0, 29.0, 60.0, 97.0, 90.0, 135.0, 179.0, 266.0, 326.0, 498.0, 676.0, 1000.0, 1314.0, 1765.0, 2334.0, 3454.0, 4993.0, 7652.0, 13254.0, 29506.0, 85327.0, 242484.0, 351801.0, 184129.0, 60911.0, 22694.0, 11171.0, 6525.0, 4509.0, 3119.0, 2280.0, 1541.0, 1168.0, 889.0, 676.0, 458.0, 349.0, 230.0, 159.0, 121.0, 86.0, 64.0, 52.0, 37.0, 18.0, 16.0, 9.0, 10.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0], "bins": [-15.1171875, -14.635009765625, -14.15283203125, -13.670654296875, -13.1884765625, -12.706298828125, -12.22412109375, -11.741943359375, -11.259765625, -10.777587890625, -10.29541015625, -9.813232421875, -9.3310546875, -8.848876953125, -8.36669921875, -7.884521484375, -7.40234375, -6.920166015625, -6.43798828125, -5.955810546875, -5.4736328125, -4.991455078125, -4.50927734375, -4.027099609375, -3.544921875, -3.062744140625, -2.58056640625, -2.098388671875, -1.6162109375, -1.134033203125, -0.65185546875, -0.169677734375, 0.3125, 0.794677734375, 1.27685546875, 1.759033203125, 2.2412109375, 2.723388671875, 3.20556640625, 3.687744140625, 4.169921875, 4.652099609375, 5.13427734375, 5.616455078125, 6.0986328125, 6.580810546875, 7.06298828125, 7.545166015625, 8.02734375, 8.509521484375, 8.99169921875, 9.473876953125, 9.9560546875, 10.438232421875, 10.92041015625, 11.402587890625, 11.884765625, 12.366943359375, 12.84912109375, 13.331298828125, 13.8134765625, 14.295654296875, 14.77783203125, 15.260009765625, 15.7421875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 6.0, 7.0, 6.0, 7.0, 10.0, 18.0, 20.0, 33.0, 61.0, 108.0, 126.0, 135.0, 143.0, 120.0, 60.0, 44.0, 22.0, 17.0, 9.0, 10.0, 3.0, 4.0, 6.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.99609375, -4.8157958984375, -4.635498046875, -4.4552001953125, -4.27490234375, -4.0946044921875, -3.914306640625, -3.7340087890625, -3.5537109375, -3.3734130859375, -3.193115234375, -3.0128173828125, -2.83251953125, -2.6522216796875, -2.471923828125, -2.2916259765625, -2.111328125, -1.9310302734375, -1.750732421875, -1.5704345703125, -1.39013671875, -1.2098388671875, -1.029541015625, -0.8492431640625, -0.6689453125, -0.4886474609375, -0.308349609375, -0.1280517578125, 0.05224609375, 0.2325439453125, 0.412841796875, 0.5931396484375, 0.7734375, 0.9537353515625, 1.134033203125, 1.3143310546875, 1.49462890625, 1.6749267578125, 1.855224609375, 2.0355224609375, 2.2158203125, 2.3961181640625, 2.576416015625, 2.7567138671875, 2.93701171875, 3.1173095703125, 3.297607421875, 3.4779052734375, 3.658203125, 3.8385009765625, 4.018798828125, 4.1990966796875, 4.37939453125, 4.5596923828125, 4.739990234375, 4.9202880859375, 5.1005859375, 5.2808837890625, 5.461181640625, 5.6414794921875, 5.82177734375, 6.0020751953125, 6.182373046875, 6.3626708984375, 6.54296875]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 9.0, 2.0, 13.0, 11.0, 12.0, 16.0, 18.0, 15.0, 24.0, 23.0, 35.0, 39.0, 46.0, 58.0, 59.0, 54.0, 64.0, 48.0, 69.0, 62.0, 57.0, 43.0, 45.0, 29.0, 27.0, 40.0, 22.0, 17.0, 3.0, 8.0, 10.0, 8.0, 7.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.16149139404297, -19.467941284179688, -18.774391174316406, -18.080839157104492, -17.38728904724121, -16.69373893737793, -16.000186920166016, -15.306636810302734, -14.613086700439453, -13.919536590576172, -13.225985527038574, -12.532434463500977, -11.838884353637695, -11.145334243774414, -10.451783180236816, -9.758232116699219, -9.064682006835938, -8.371131896972656, -7.677580833435059, -6.984030246734619, -6.29047966003418, -5.59692907333374, -4.903378486633301, -4.209827899932861, -3.516277313232422, -2.8227267265319824, -2.129176139831543, -1.4356255531311035, -0.7420749664306641, -0.04852437973022461, 0.6450262069702148, 1.3385767936706543, 2.0321273803710938, 2.725677967071533, 3.4192285537719727, 4.112779140472412, 4.806329727172852, 5.499880313873291, 6.1934309005737305, 6.88698148727417, 7.580532073974609, 8.27408218383789, 8.967633247375488, 9.661184310913086, 10.354734420776367, 11.048284530639648, 11.741835594177246, 12.435386657714844, 13.128936767578125, 13.822486877441406, 14.516037940979004, 15.209589004516602, 15.903139114379883, 16.596689224243164, 17.290241241455078, 17.98379135131836, 18.67734146118164, 19.370891571044922, 20.064441680908203, 20.757993698120117, 21.4515438079834, 22.14509391784668, 22.838645935058594, 23.532196044921875, 24.225746154785156]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 0.0, 5.0, 6.0, 5.0, 8.0, 13.0, 9.0, 12.0, 12.0, 15.0, 22.0, 24.0, 19.0, 33.0, 27.0, 32.0, 38.0, 46.0, 34.0, 41.0, 42.0, 37.0, 39.0, 32.0, 47.0, 34.0, 38.0, 34.0, 43.0, 37.0, 30.0, 25.0, 28.0, 17.0, 26.0, 12.0, 17.0, 13.0, 14.0, 9.0, 8.0, 3.0, 2.0, 2.0, 4.0, 8.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.440733909606934, -12.069839477539062, -11.698945045471191, -11.32805061340332, -10.957157135009766, -10.586262702941895, -10.215368270874023, -9.844473838806152, -9.473579406738281, -9.10268497467041, -8.731790542602539, -8.360896110534668, -7.990002155303955, -7.619107723236084, -7.248213768005371, -6.8773193359375, -6.506424903869629, -6.135530471801758, -5.764636039733887, -5.393742084503174, -5.022847652435303, -4.651953220367432, -4.281059265136719, -3.9101648330688477, -3.5392704010009766, -3.1683759689331055, -2.7974817752838135, -2.4265875816345215, -2.0556931495666504, -1.6847988367080688, -1.3139045238494873, -0.9430103302001953, -0.5721149444580078, -0.20122063159942627, 0.16967368125915527, 0.5405679941177368, 0.9114623069763184, 1.2823566198349, 1.6532509326934814, 2.0241451263427734, 2.3950395584106445, 2.7659339904785156, 3.1368281841278076, 3.5077223777770996, 3.8786168098449707, 4.249511241912842, 4.620405197143555, 4.991299629211426, 5.362194061279297, 5.733088493347168, 6.103982925415039, 6.474876880645752, 6.845771312713623, 7.216665744781494, 7.587559700012207, 7.958454132080078, 8.32934856414795, 8.70024299621582, 9.071137428283691, 9.442031860351562, 9.812925338745117, 10.183819770812988, 10.55471420288086, 10.92560863494873, 11.296503067016602]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 9.0, 12.0, 20.0, 22.0, 24.0, 52.0, 70.0, 119.0, 172.0, 288.0, 394.0, 654.0, 998.0, 1620.0, 2649.0, 4147.0, 6606.0, 10747.0, 16956.0, 26570.0, 40557.0, 61366.0, 85718.0, 112100.0, 130219.0, 133303.0, 119228.0, 94835.0, 68534.0, 46980.0, 30792.0, 19592.0, 12397.0, 7808.0, 4811.0, 3105.0, 1956.0, 1155.0, 717.0, 449.0, 265.0, 174.0, 123.0, 88.0, 45.0, 38.0, 26.0, 16.0, 9.0, 8.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0], "bins": [-12.296875, -11.91455078125, -11.5322265625, -11.14990234375, -10.767578125, -10.38525390625, -10.0029296875, -9.62060546875, -9.23828125, -8.85595703125, -8.4736328125, -8.09130859375, -7.708984375, -7.32666015625, -6.9443359375, -6.56201171875, -6.1796875, -5.79736328125, -5.4150390625, -5.03271484375, -4.650390625, -4.26806640625, -3.8857421875, -3.50341796875, -3.12109375, -2.73876953125, -2.3564453125, -1.97412109375, -1.591796875, -1.20947265625, -0.8271484375, -0.44482421875, -0.0625, 0.31982421875, 0.7021484375, 1.08447265625, 1.466796875, 1.84912109375, 2.2314453125, 2.61376953125, 2.99609375, 3.37841796875, 3.7607421875, 4.14306640625, 4.525390625, 4.90771484375, 5.2900390625, 5.67236328125, 6.0546875, 6.43701171875, 6.8193359375, 7.20166015625, 7.583984375, 7.96630859375, 8.3486328125, 8.73095703125, 9.11328125, 9.49560546875, 9.8779296875, 10.26025390625, 10.642578125, 11.02490234375, 11.4072265625, 11.78955078125, 12.171875]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 8.0, 11.0, 6.0, 10.0, 14.0, 14.0, 14.0, 27.0, 19.0, 28.0, 26.0, 29.0, 41.0, 30.0, 32.0, 39.0, 35.0, 51.0, 46.0, 53.0, 40.0, 42.0, 37.0, 41.0, 44.0, 37.0, 38.0, 33.0, 14.0, 23.0, 15.0, 24.0, 16.0, 12.0, 19.0, 1.0, 4.0, 9.0, 7.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.953125, -12.5404052734375, -12.127685546875, -11.7149658203125, -11.30224609375, -10.8895263671875, -10.476806640625, -10.0640869140625, -9.6513671875, -9.2386474609375, -8.825927734375, -8.4132080078125, -8.00048828125, -7.5877685546875, -7.175048828125, -6.7623291015625, -6.349609375, -5.9368896484375, -5.524169921875, -5.1114501953125, -4.69873046875, -4.2860107421875, -3.873291015625, -3.4605712890625, -3.0478515625, -2.6351318359375, -2.222412109375, -1.8096923828125, -1.39697265625, -0.9842529296875, -0.571533203125, -0.1588134765625, 0.25390625, 0.6666259765625, 1.079345703125, 1.4920654296875, 1.90478515625, 2.3175048828125, 2.730224609375, 3.1429443359375, 3.5556640625, 3.9683837890625, 4.381103515625, 4.7938232421875, 5.20654296875, 5.6192626953125, 6.031982421875, 6.4447021484375, 6.857421875, 7.2701416015625, 7.682861328125, 8.0955810546875, 8.50830078125, 8.9210205078125, 9.333740234375, 9.7464599609375, 10.1591796875, 10.5718994140625, 10.984619140625, 11.3973388671875, 11.81005859375, 12.2227783203125, 12.635498046875, 13.0482177734375, 13.4609375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 12.0, 11.0, 17.0, 36.0, 45.0, 78.0, 96.0, 136.0, 222.0, 303.0, 490.0, 722.0, 1178.0, 1883.0, 2842.0, 4403.0, 7068.0, 10501.0, 16721.0, 26065.0, 38732.0, 57043.0, 79537.0, 101494.0, 120792.0, 127239.0, 118298.0, 99168.0, 75310.0, 53637.0, 36821.0, 23955.0, 15437.0, 10225.0, 6396.0, 4224.0, 2662.0, 1617.0, 1108.0, 700.0, 489.0, 259.0, 190.0, 134.0, 85.0, 60.0, 40.0, 20.0, 16.0, 10.0, 12.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-10.984375, -10.634765625, -10.28515625, -9.935546875, -9.5859375, -9.236328125, -8.88671875, -8.537109375, -8.1875, -7.837890625, -7.48828125, -7.138671875, -6.7890625, -6.439453125, -6.08984375, -5.740234375, -5.390625, -5.041015625, -4.69140625, -4.341796875, -3.9921875, -3.642578125, -3.29296875, -2.943359375, -2.59375, -2.244140625, -1.89453125, -1.544921875, -1.1953125, -0.845703125, -0.49609375, -0.146484375, 0.203125, 0.552734375, 0.90234375, 1.251953125, 1.6015625, 1.951171875, 2.30078125, 2.650390625, 3.0, 3.349609375, 3.69921875, 4.048828125, 4.3984375, 4.748046875, 5.09765625, 5.447265625, 5.796875, 6.146484375, 6.49609375, 6.845703125, 7.1953125, 7.544921875, 7.89453125, 8.244140625, 8.59375, 8.943359375, 9.29296875, 9.642578125, 9.9921875, 10.341796875, 10.69140625, 11.041015625, 11.390625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 6.0, 5.0, 5.0, 7.0, 5.0, 11.0, 13.0, 21.0, 15.0, 22.0, 26.0, 37.0, 33.0, 24.0, 37.0, 46.0, 38.0, 46.0, 32.0, 30.0, 37.0, 32.0, 49.0, 29.0, 41.0, 30.0, 31.0, 32.0, 42.0, 24.0, 29.0, 26.0, 20.0, 17.0, 13.0, 8.0, 20.0, 11.0, 7.0, 10.0, 6.0, 7.0, 5.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-7.4921875, -7.26995849609375, -7.0477294921875, -6.82550048828125, -6.603271484375, -6.38104248046875, -6.1588134765625, -5.93658447265625, -5.71435546875, -5.49212646484375, -5.2698974609375, -5.04766845703125, -4.825439453125, -4.60321044921875, -4.3809814453125, -4.15875244140625, -3.9365234375, -3.71429443359375, -3.4920654296875, -3.26983642578125, -3.047607421875, -2.82537841796875, -2.6031494140625, -2.38092041015625, -2.15869140625, -1.93646240234375, -1.7142333984375, -1.49200439453125, -1.269775390625, -1.04754638671875, -0.8253173828125, -0.60308837890625, -0.380859375, -0.15863037109375, 0.0635986328125, 0.28582763671875, 0.508056640625, 0.73028564453125, 0.9525146484375, 1.17474365234375, 1.39697265625, 1.61920166015625, 1.8414306640625, 2.06365966796875, 2.285888671875, 2.50811767578125, 2.7303466796875, 2.95257568359375, 3.1748046875, 3.39703369140625, 3.6192626953125, 3.84149169921875, 4.063720703125, 4.28594970703125, 4.5081787109375, 4.73040771484375, 4.95263671875, 5.17486572265625, 5.3970947265625, 5.61932373046875, 5.841552734375, 6.06378173828125, 6.2860107421875, 6.50823974609375, 6.73046875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 7.0, 9.0, 12.0, 10.0, 17.0, 31.0, 38.0, 78.0, 97.0, 139.0, 224.0, 294.0, 411.0, 683.0, 1012.0, 1532.0, 2437.0, 3805.0, 6075.0, 9750.0, 15544.0, 25139.0, 39473.0, 60272.0, 88270.0, 117255.0, 139236.0, 141343.0, 122371.0, 92680.0, 64914.0, 42664.0, 27100.0, 16959.0, 10397.0, 6417.0, 4220.0, 2743.0, 1734.0, 1074.0, 687.0, 445.0, 327.0, 201.0, 133.0, 104.0, 63.0, 41.0, 25.0, 13.0, 17.0, 10.0, 9.0, 5.0, 6.0, 4.0, 3.0, 3.0], "bins": [-6.19921875, -6.0118408203125, -5.824462890625, -5.6370849609375, -5.44970703125, -5.2623291015625, -5.074951171875, -4.8875732421875, -4.7001953125, -4.5128173828125, -4.325439453125, -4.1380615234375, -3.95068359375, -3.7633056640625, -3.575927734375, -3.3885498046875, -3.201171875, -3.0137939453125, -2.826416015625, -2.6390380859375, -2.45166015625, -2.2642822265625, -2.076904296875, -1.8895263671875, -1.7021484375, -1.5147705078125, -1.327392578125, -1.1400146484375, -0.95263671875, -0.7652587890625, -0.577880859375, -0.3905029296875, -0.203125, -0.0157470703125, 0.171630859375, 0.3590087890625, 0.54638671875, 0.7337646484375, 0.921142578125, 1.1085205078125, 1.2958984375, 1.4832763671875, 1.670654296875, 1.8580322265625, 2.04541015625, 2.2327880859375, 2.420166015625, 2.6075439453125, 2.794921875, 2.9822998046875, 3.169677734375, 3.3570556640625, 3.54443359375, 3.7318115234375, 3.919189453125, 4.1065673828125, 4.2939453125, 4.4813232421875, 4.668701171875, 4.8560791015625, 5.04345703125, 5.2308349609375, 5.418212890625, 5.6055908203125, 5.79296875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 7.0, 3.0, 14.0, 10.0, 15.0, 19.0, 15.0, 30.0, 35.0, 44.0, 49.0, 58.0, 62.0, 71.0, 82.0, 76.0, 77.0, 57.0, 48.0, 42.0, 36.0, 40.0, 26.0, 21.0, 15.0, 15.0, 9.0, 8.0, 6.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0008788108825683594, -0.0008503124117851257, -0.0008218139410018921, -0.0007933154702186584, -0.0007648169994354248, -0.0007363185286521912, -0.0007078200578689575, -0.0006793215870857239, -0.0006508231163024902, -0.0006223246455192566, -0.000593826174736023, -0.0005653277039527893, -0.0005368292331695557, -0.000508330762386322, -0.0004798322916030884, -0.00045133382081985474, -0.0004228353500366211, -0.00039433687925338745, -0.0003658384084701538, -0.00033733993768692017, -0.0003088414669036865, -0.0002803429961204529, -0.00025184452533721924, -0.0002233460545539856, -0.00019484758377075195, -0.0001663491129875183, -0.00013785064220428467, -0.00010935217142105103, -8.085370063781738e-05, -5.235522985458374e-05, -2.3856759071350098e-05, 4.641711711883545e-06, 3.314018249511719e-05, 6.163865327835083e-05, 9.013712406158447e-05, 0.00011863559484481812, 0.00014713406562805176, 0.0001756325364112854, 0.00020413100719451904, 0.00023262947797775269, 0.00026112794876098633, 0.00028962641954421997, 0.0003181248903274536, 0.00034662336111068726, 0.0003751218318939209, 0.00040362030267715454, 0.0004321187734603882, 0.0004606172442436218, 0.0004891157150268555, 0.0005176141858100891, 0.0005461126565933228, 0.0005746111273765564, 0.00060310959815979, 0.0006316080689430237, 0.0006601065397262573, 0.000688605010509491, 0.0007171034812927246, 0.0007456019520759583, 0.0007741004228591919, 0.0008025988936424255, 0.0008310973644256592, 0.0008595958352088928, 0.0008880943059921265, 0.0009165927767753601, 0.0009450912475585938]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 9.0, 11.0, 18.0, 26.0, 27.0, 52.0, 70.0, 112.0, 194.0, 313.0, 452.0, 713.0, 1133.0, 1801.0, 2911.0, 5053.0, 7676.0, 13016.0, 20967.0, 33646.0, 52131.0, 77653.0, 106268.0, 131775.0, 141052.0, 130608.0, 105571.0, 77126.0, 51866.0, 32834.0, 20423.0, 12657.0, 7724.0, 4749.0, 2900.0, 1864.0, 1172.0, 705.0, 472.0, 302.0, 194.0, 131.0, 73.0, 49.0, 25.0, 9.0, 13.0, 5.0, 5.0, 1.0, 0.0, 1.0, 3.0, 2.0], "bins": [-6.5625, -6.3721923828125, -6.181884765625, -5.9915771484375, -5.80126953125, -5.6109619140625, -5.420654296875, -5.2303466796875, -5.0400390625, -4.8497314453125, -4.659423828125, -4.4691162109375, -4.27880859375, -4.0885009765625, -3.898193359375, -3.7078857421875, -3.517578125, -3.3272705078125, -3.136962890625, -2.9466552734375, -2.75634765625, -2.5660400390625, -2.375732421875, -2.1854248046875, -1.9951171875, -1.8048095703125, -1.614501953125, -1.4241943359375, -1.23388671875, -1.0435791015625, -0.853271484375, -0.6629638671875, -0.47265625, -0.2823486328125, -0.092041015625, 0.0982666015625, 0.28857421875, 0.4788818359375, 0.669189453125, 0.8594970703125, 1.0498046875, 1.2401123046875, 1.430419921875, 1.6207275390625, 1.81103515625, 2.0013427734375, 2.191650390625, 2.3819580078125, 2.572265625, 2.7625732421875, 2.952880859375, 3.1431884765625, 3.33349609375, 3.5238037109375, 3.714111328125, 3.9044189453125, 4.0947265625, 4.2850341796875, 4.475341796875, 4.6656494140625, 4.85595703125, 5.0462646484375, 5.236572265625, 5.4268798828125, 5.6171875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 5.0, 3.0, 4.0, 11.0, 11.0, 12.0, 7.0, 16.0, 14.0, 15.0, 16.0, 18.0, 27.0, 22.0, 38.0, 30.0, 39.0, 33.0, 54.0, 35.0, 44.0, 41.0, 44.0, 39.0, 50.0, 52.0, 36.0, 29.0, 30.0, 25.0, 29.0, 35.0, 23.0, 12.0, 19.0, 16.0, 16.0, 10.0, 8.0, 7.0, 8.0, 5.0, 7.0, 5.0, 0.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6494140625, -1.5979766845703125, -1.546539306640625, -1.4951019287109375, -1.44366455078125, -1.3922271728515625, -1.340789794921875, -1.2893524169921875, -1.2379150390625, -1.1864776611328125, -1.135040283203125, -1.0836029052734375, -1.03216552734375, -0.9807281494140625, -0.929290771484375, -0.8778533935546875, -0.826416015625, -0.7749786376953125, -0.723541259765625, -0.6721038818359375, -0.62066650390625, -0.5692291259765625, -0.517791748046875, -0.4663543701171875, -0.4149169921875, -0.3634796142578125, -0.312042236328125, -0.2606048583984375, -0.20916748046875, -0.1577301025390625, -0.106292724609375, -0.0548553466796875, -0.00341796875, 0.0480194091796875, 0.099456787109375, 0.1508941650390625, 0.20233154296875, 0.2537689208984375, 0.305206298828125, 0.3566436767578125, 0.4080810546875, 0.4595184326171875, 0.510955810546875, 0.5623931884765625, 0.61383056640625, 0.6652679443359375, 0.716705322265625, 0.7681427001953125, 0.819580078125, 0.8710174560546875, 0.922454833984375, 0.9738922119140625, 1.02532958984375, 1.0767669677734375, 1.128204345703125, 1.1796417236328125, 1.2310791015625, 1.2825164794921875, 1.333953857421875, 1.3853912353515625, 1.43682861328125, 1.4882659912109375, 1.539703369140625, 1.5911407470703125, 1.642578125]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 6.0, 12.0, 10.0, 15.0, 13.0, 16.0, 26.0, 21.0, 34.0, 31.0, 48.0, 46.0, 57.0, 50.0, 60.0, 52.0, 60.0, 56.0, 59.0, 39.0, 40.0, 39.0, 44.0, 28.0, 21.0, 22.0, 16.0, 16.0, 12.0, 11.0, 4.0, 6.0, 5.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-18.861387252807617, -18.211864471435547, -17.562341690063477, -16.912818908691406, -16.263296127319336, -15.613773345947266, -14.964249610900879, -14.314726829528809, -13.665204048156738, -13.015681266784668, -12.366158485412598, -11.716635704040527, -11.06711196899414, -10.41758918762207, -9.76806640625, -9.11854362487793, -8.46902084350586, -7.819498062133789, -7.169975280761719, -6.52045202255249, -5.87092924118042, -5.22140645980835, -4.571883201599121, -3.922360420227051, -3.2728376388549805, -2.62331485748291, -1.9737918376922607, -1.3242689371109009, -0.674746036529541, -0.025223255157470703, 0.6242997646331787, 1.2738227844238281, 1.9233474731445312, 2.5728702545166016, 3.222393274307251, 3.8719162940979004, 4.521439075469971, 5.170961856842041, 5.8204851150512695, 6.47000789642334, 7.11953067779541, 7.7690534591674805, 8.41857624053955, 9.068099021911621, 9.717622756958008, 10.367145538330078, 11.016668319702148, 11.666191101074219, 12.315713882446289, 12.96523666381836, 13.61475944519043, 14.2642822265625, 14.91380500793457, 15.56332778930664, 16.21285057067871, 16.86237335205078, 17.511898040771484, 18.161420822143555, 18.810943603515625, 19.460466384887695, 20.109989166259766, 20.759511947631836, 21.409034729003906, 22.05855941772461, 22.708080291748047]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 10.0, 7.0, 5.0, 6.0, 3.0, 12.0, 9.0, 4.0, 10.0, 19.0, 17.0, 16.0, 27.0, 23.0, 22.0, 24.0, 27.0, 33.0, 37.0, 39.0, 33.0, 39.0, 44.0, 40.0, 33.0, 40.0, 29.0, 31.0, 37.0, 37.0, 27.0, 36.0, 37.0, 26.0, 29.0, 18.0, 17.0, 18.0, 12.0, 5.0, 14.0, 17.0, 7.0, 9.0, 7.0, 4.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-10.427643775939941, -10.08294677734375, -9.738249778747559, -9.393552780151367, -9.048856735229492, -8.7041597366333, -8.35946273803711, -8.014765739440918, -7.670069217681885, -7.325372219085693, -6.98067569732666, -6.635978698730469, -6.291281700134277, -5.946585178375244, -5.601888179779053, -5.2571916580200195, -4.912494659423828, -4.567797660827637, -4.2231011390686035, -3.878404140472412, -3.5337073802948, -3.1890106201171875, -2.844313621520996, -2.499616861343384, -2.1549201011657715, -1.8102233409881592, -1.4655264616012573, -1.1208295822143555, -0.7761328220367432, -0.43143606185913086, -0.08673906326293945, 0.25795769691467285, 0.6026544570922852, 0.9473512768745422, 1.2920480966567993, 1.6367449760437012, 1.9814417362213135, 2.326138496398926, 2.670835494995117, 3.0155322551727295, 3.360229015350342, 3.704925775527954, 4.049622535705566, 4.394319534301758, 4.739016532897949, 5.083713054656982, 5.428410053253174, 5.773106575012207, 6.117803573608398, 6.46250057220459, 6.807197093963623, 7.1518940925598145, 7.496590614318848, 7.841287612915039, 8.18598461151123, 8.530681610107422, 8.875377655029297, 9.220074653625488, 9.56477165222168, 9.909467697143555, 10.254164695739746, 10.598861694335938, 10.943558692932129, 11.28825569152832, 11.632952690124512]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 1.0, 6.0, 4.0, 8.0, 17.0, 22.0, 29.0, 54.0, 72.0, 138.0, 171.0, 280.0, 478.0, 658.0, 1117.0, 1729.0, 2736.0, 4569.0, 7500.0, 13447.0, 25143.0, 49314.0, 101181.0, 219686.0, 475639.0, 882281.0, 1043729.0, 701520.0, 346834.0, 159304.0, 74740.0, 37003.0, 19018.0, 10308.0, 5939.0, 3506.0, 2097.0, 1371.0, 869.0, 555.0, 377.0, 249.0, 164.0, 118.0, 95.0, 64.0, 47.0, 28.0, 22.0, 20.0, 11.0, 7.0, 2.0, 1.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.640625, -19.935791015625, -19.23095703125, -18.526123046875, -17.8212890625, -17.116455078125, -16.41162109375, -15.706787109375, -15.001953125, -14.297119140625, -13.59228515625, -12.887451171875, -12.1826171875, -11.477783203125, -10.77294921875, -10.068115234375, -9.36328125, -8.658447265625, -7.95361328125, -7.248779296875, -6.5439453125, -5.839111328125, -5.13427734375, -4.429443359375, -3.724609375, -3.019775390625, -2.31494140625, -1.610107421875, -0.9052734375, -0.200439453125, 0.50439453125, 1.209228515625, 1.9140625, 2.618896484375, 3.32373046875, 4.028564453125, 4.7333984375, 5.438232421875, 6.14306640625, 6.847900390625, 7.552734375, 8.257568359375, 8.96240234375, 9.667236328125, 10.3720703125, 11.076904296875, 11.78173828125, 12.486572265625, 13.19140625, 13.896240234375, 14.60107421875, 15.305908203125, 16.0107421875, 16.715576171875, 17.42041015625, 18.125244140625, 18.830078125, 19.534912109375, 20.23974609375, 20.944580078125, 21.6494140625, 22.354248046875, 23.05908203125, 23.763916015625, 24.46875]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 2.0, 10.0, 8.0, 8.0, 11.0, 12.0, 11.0, 14.0, 28.0, 20.0, 23.0, 25.0, 28.0, 30.0, 31.0, 43.0, 29.0, 37.0, 44.0, 49.0, 49.0, 35.0, 34.0, 38.0, 44.0, 42.0, 45.0, 25.0, 31.0, 36.0, 23.0, 22.0, 15.0, 18.0, 16.0, 12.0, 13.0, 8.0, 6.0, 6.0, 7.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.359375, -9.0513916015625, -8.743408203125, -8.4354248046875, -8.12744140625, -7.8194580078125, -7.511474609375, -7.2034912109375, -6.8955078125, -6.5875244140625, -6.279541015625, -5.9715576171875, -5.66357421875, -5.3555908203125, -5.047607421875, -4.7396240234375, -4.431640625, -4.1236572265625, -3.815673828125, -3.5076904296875, -3.19970703125, -2.8917236328125, -2.583740234375, -2.2757568359375, -1.9677734375, -1.6597900390625, -1.351806640625, -1.0438232421875, -0.73583984375, -0.4278564453125, -0.119873046875, 0.1881103515625, 0.49609375, 0.8040771484375, 1.112060546875, 1.4200439453125, 1.72802734375, 2.0360107421875, 2.343994140625, 2.6519775390625, 2.9599609375, 3.2679443359375, 3.575927734375, 3.8839111328125, 4.19189453125, 4.4998779296875, 4.807861328125, 5.1158447265625, 5.423828125, 5.7318115234375, 6.039794921875, 6.3477783203125, 6.65576171875, 6.9637451171875, 7.271728515625, 7.5797119140625, 7.8876953125, 8.1956787109375, 8.503662109375, 8.8116455078125, 9.11962890625, 9.4276123046875, 9.735595703125, 10.0435791015625, 10.3515625]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 12.0, 17.0, 21.0, 48.0, 45.0, 61.0, 109.0, 150.0, 251.0, 354.0, 563.0, 898.0, 1407.0, 2147.0, 3647.0, 6040.0, 9870.0, 16943.0, 29287.0, 51554.0, 92424.0, 166679.0, 297522.0, 501227.0, 728089.0, 790793.0, 611937.0, 382971.0, 218117.0, 121613.0, 67545.0, 37791.0, 21606.0, 12694.0, 7507.0, 4521.0, 2772.0, 1826.0, 1176.0, 660.0, 459.0, 307.0, 184.0, 144.0, 95.0, 68.0, 44.0, 25.0, 26.0, 18.0, 13.0, 3.0, 5.0, 1.0, 2.0, 2.0], "bins": [-21.09375, -20.458984375, -19.82421875, -19.189453125, -18.5546875, -17.919921875, -17.28515625, -16.650390625, -16.015625, -15.380859375, -14.74609375, -14.111328125, -13.4765625, -12.841796875, -12.20703125, -11.572265625, -10.9375, -10.302734375, -9.66796875, -9.033203125, -8.3984375, -7.763671875, -7.12890625, -6.494140625, -5.859375, -5.224609375, -4.58984375, -3.955078125, -3.3203125, -2.685546875, -2.05078125, -1.416015625, -0.78125, -0.146484375, 0.48828125, 1.123046875, 1.7578125, 2.392578125, 3.02734375, 3.662109375, 4.296875, 4.931640625, 5.56640625, 6.201171875, 6.8359375, 7.470703125, 8.10546875, 8.740234375, 9.375, 10.009765625, 10.64453125, 11.279296875, 11.9140625, 12.548828125, 13.18359375, 13.818359375, 14.453125, 15.087890625, 15.72265625, 16.357421875, 16.9921875, 17.626953125, 18.26171875, 18.896484375, 19.53125]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 7.0, 7.0, 9.0, 11.0, 19.0, 21.0, 29.0, 37.0, 39.0, 66.0, 75.0, 97.0, 119.0, 163.0, 215.0, 242.0, 275.0, 314.0, 314.0, 311.0, 309.0, 278.0, 243.0, 184.0, 175.0, 124.0, 106.0, 88.0, 62.0, 38.0, 32.0, 20.0, 10.0, 11.0, 7.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.3125, -9.05865478515625, -8.8048095703125, -8.55096435546875, -8.297119140625, -8.04327392578125, -7.7894287109375, -7.53558349609375, -7.28173828125, -7.02789306640625, -6.7740478515625, -6.52020263671875, -6.266357421875, -6.01251220703125, -5.7586669921875, -5.50482177734375, -5.2509765625, -4.99713134765625, -4.7432861328125, -4.48944091796875, -4.235595703125, -3.98175048828125, -3.7279052734375, -3.47406005859375, -3.22021484375, -2.96636962890625, -2.7125244140625, -2.45867919921875, -2.204833984375, -1.95098876953125, -1.6971435546875, -1.44329833984375, -1.189453125, -0.93560791015625, -0.6817626953125, -0.42791748046875, -0.174072265625, 0.07977294921875, 0.3336181640625, 0.58746337890625, 0.84130859375, 1.09515380859375, 1.3489990234375, 1.60284423828125, 1.856689453125, 2.11053466796875, 2.3643798828125, 2.61822509765625, 2.8720703125, 3.12591552734375, 3.3797607421875, 3.63360595703125, 3.887451171875, 4.14129638671875, 4.3951416015625, 4.64898681640625, 4.90283203125, 5.15667724609375, 5.4105224609375, 5.66436767578125, 5.918212890625, 6.17205810546875, 6.4259033203125, 6.67974853515625, 6.93359375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 4.0, 10.0, 6.0, 14.0, 13.0, 18.0, 29.0, 24.0, 33.0, 31.0, 48.0, 54.0, 64.0, 49.0, 80.0, 69.0, 72.0, 69.0, 61.0, 52.0, 39.0, 36.0, 29.0, 15.0, 15.0, 13.0, 6.0, 10.0, 7.0, 12.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.033483505249023, -23.233503341674805, -22.433523178100586, -21.633543014526367, -20.83356285095215, -20.03358268737793, -19.233600616455078, -18.43362045288086, -17.63364028930664, -16.833660125732422, -16.033679962158203, -15.233699798583984, -14.433719635009766, -13.633739471435547, -12.833758354187012, -12.033778190612793, -11.23379898071289, -10.433818817138672, -9.633838653564453, -8.833858489990234, -8.033878326416016, -7.233897686004639, -6.433917045593262, -5.633936882019043, -4.833956718444824, -4.0339765548706055, -3.2339961528778076, -2.4340157508850098, -1.634035587310791, -0.8340554237365723, -0.03407478332519531, 0.7659053802490234, 1.5658836364746094, 2.365863800048828, 3.165844202041626, 3.965824604034424, 4.765804767608643, 5.565784931182861, 6.365765571594238, 7.165745735168457, 7.965725898742676, 8.765706062316895, 9.565686225891113, 10.365667343139648, 11.165647506713867, 11.965627670288086, 12.765607833862305, 13.565587997436523, 14.365568161010742, 15.165548324584961, 15.96552848815918, 16.7655086517334, 17.565488815307617, 18.365468978881836, 19.165451049804688, 19.965431213378906, 20.765411376953125, 21.565391540527344, 22.365371704101562, 23.16535186767578, 23.96533203125, 24.76531219482422, 25.565292358398438, 26.365272521972656, 27.165252685546875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 6.0, 6.0, 10.0, 8.0, 9.0, 15.0, 20.0, 22.0, 26.0, 25.0, 24.0, 30.0, 27.0, 31.0, 36.0, 37.0, 39.0, 45.0, 47.0, 50.0, 41.0, 48.0, 37.0, 32.0, 35.0, 39.0, 40.0, 32.0, 30.0, 28.0, 13.0, 19.0, 19.0, 19.0, 10.0, 9.0, 7.0, 3.0, 6.0, 3.0, 2.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.314404487609863, -13.856593132019043, -13.398782730102539, -12.940971374511719, -12.483160018920898, -12.025349617004395, -11.567538261413574, -11.10972785949707, -10.65191650390625, -10.19410514831543, -9.736294746398926, -9.278483390808105, -8.820672988891602, -8.362861633300781, -7.905050277709961, -7.447239398956299, -6.989428520202637, -6.531617641448975, -6.0738067626953125, -5.615995407104492, -5.15818452835083, -4.700373649597168, -4.242562294006348, -3.7847514152526855, -3.3269405364990234, -2.8691296577453613, -2.41131854057312, -1.9535075426101685, -1.4956965446472168, -1.0378856658935547, -0.5800745487213135, -0.12226343154907227, 0.33554840087890625, 0.7933593988418579, 1.2511703968048096, 1.7089813947677612, 2.166792392730713, 2.624603271484375, 3.082414388656616, 3.5402255058288574, 3.9980363845825195, 4.455847263336182, 4.913658142089844, 5.371469497680664, 5.829280376434326, 6.287091255187988, 6.744902610778809, 7.202713489532471, 7.660524368286133, 8.118335723876953, 8.576146125793457, 9.033957481384277, 9.491767883300781, 9.949579238891602, 10.407390594482422, 10.865201950073242, 11.323012351989746, 11.780823707580566, 12.23863410949707, 12.69644546508789, 13.154256820678711, 13.612067222595215, 14.069878578186035, 14.527688980102539, 14.98550033569336]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 8.0, 17.0, 12.0, 24.0, 33.0, 59.0, 71.0, 119.0, 187.0, 269.0, 383.0, 587.0, 929.0, 1441.0, 2291.0, 3521.0, 5814.0, 9684.0, 15611.0, 26221.0, 42874.0, 68183.0, 102067.0, 138034.0, 158214.0, 148092.0, 114778.0, 79270.0, 50507.0, 30747.0, 18664.0, 11373.0, 6786.0, 4245.0, 2665.0, 1654.0, 1062.0, 649.0, 444.0, 327.0, 212.0, 131.0, 93.0, 53.0, 46.0, 42.0, 17.0, 14.0, 8.0, 11.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-11.25, -10.894775390625, -10.53955078125, -10.184326171875, -9.8291015625, -9.473876953125, -9.11865234375, -8.763427734375, -8.408203125, -8.052978515625, -7.69775390625, -7.342529296875, -6.9873046875, -6.632080078125, -6.27685546875, -5.921630859375, -5.56640625, -5.211181640625, -4.85595703125, -4.500732421875, -4.1455078125, -3.790283203125, -3.43505859375, -3.079833984375, -2.724609375, -2.369384765625, -2.01416015625, -1.658935546875, -1.3037109375, -0.948486328125, -0.59326171875, -0.238037109375, 0.1171875, 0.472412109375, 0.82763671875, 1.182861328125, 1.5380859375, 1.893310546875, 2.24853515625, 2.603759765625, 2.958984375, 3.314208984375, 3.66943359375, 4.024658203125, 4.3798828125, 4.735107421875, 5.09033203125, 5.445556640625, 5.80078125, 6.156005859375, 6.51123046875, 6.866455078125, 7.2216796875, 7.576904296875, 7.93212890625, 8.287353515625, 8.642578125, 8.997802734375, 9.35302734375, 9.708251953125, 10.0634765625, 10.418701171875, 10.77392578125, 11.129150390625, 11.484375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 8.0, 7.0, 9.0, 4.0, 10.0, 19.0, 14.0, 14.0, 26.0, 24.0, 26.0, 35.0, 32.0, 45.0, 34.0, 36.0, 35.0, 52.0, 40.0, 51.0, 44.0, 44.0, 34.0, 34.0, 40.0, 32.0, 31.0, 30.0, 32.0, 29.0, 19.0, 24.0, 14.0, 13.0, 12.0, 10.0, 12.0, 5.0, 0.0, 1.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.75, -15.252197265625, -14.75439453125, -14.256591796875, -13.7587890625, -13.260986328125, -12.76318359375, -12.265380859375, -11.767578125, -11.269775390625, -10.77197265625, -10.274169921875, -9.7763671875, -9.278564453125, -8.78076171875, -8.282958984375, -7.78515625, -7.287353515625, -6.78955078125, -6.291748046875, -5.7939453125, -5.296142578125, -4.79833984375, -4.300537109375, -3.802734375, -3.304931640625, -2.80712890625, -2.309326171875, -1.8115234375, -1.313720703125, -0.81591796875, -0.318115234375, 0.1796875, 0.677490234375, 1.17529296875, 1.673095703125, 2.1708984375, 2.668701171875, 3.16650390625, 3.664306640625, 4.162109375, 4.659912109375, 5.15771484375, 5.655517578125, 6.1533203125, 6.651123046875, 7.14892578125, 7.646728515625, 8.14453125, 8.642333984375, 9.14013671875, 9.637939453125, 10.1357421875, 10.633544921875, 11.13134765625, 11.629150390625, 12.126953125, 12.624755859375, 13.12255859375, 13.620361328125, 14.1181640625, 14.615966796875, 15.11376953125, 15.611572265625, 16.109375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 11.0, 15.0, 13.0, 25.0, 38.0, 55.0, 105.0, 151.0, 265.0, 424.0, 735.0, 1323.0, 2383.0, 4437.0, 9008.0, 18910.0, 41919.0, 95740.0, 200285.0, 288946.0, 203566.0, 97799.0, 43096.0, 19712.0, 9283.0, 4698.0, 2367.0, 1321.0, 751.0, 478.0, 256.0, 159.0, 105.0, 55.0, 37.0, 26.0, 27.0, 12.0, 10.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.734375, -22.03515625, -21.3359375, -20.63671875, -19.9375, -19.23828125, -18.5390625, -17.83984375, -17.140625, -16.44140625, -15.7421875, -15.04296875, -14.34375, -13.64453125, -12.9453125, -12.24609375, -11.546875, -10.84765625, -10.1484375, -9.44921875, -8.75, -8.05078125, -7.3515625, -6.65234375, -5.953125, -5.25390625, -4.5546875, -3.85546875, -3.15625, -2.45703125, -1.7578125, -1.05859375, -0.359375, 0.33984375, 1.0390625, 1.73828125, 2.4375, 3.13671875, 3.8359375, 4.53515625, 5.234375, 5.93359375, 6.6328125, 7.33203125, 8.03125, 8.73046875, 9.4296875, 10.12890625, 10.828125, 11.52734375, 12.2265625, 12.92578125, 13.625, 14.32421875, 15.0234375, 15.72265625, 16.421875, 17.12109375, 17.8203125, 18.51953125, 19.21875, 19.91796875, 20.6171875, 21.31640625, 22.015625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 5.0, 5.0, 4.0, 12.0, 10.0, 6.0, 17.0, 14.0, 19.0, 18.0, 19.0, 24.0, 21.0, 23.0, 29.0, 36.0, 35.0, 48.0, 36.0, 42.0, 36.0, 38.0, 38.0, 39.0, 42.0, 43.0, 37.0, 41.0, 36.0, 30.0, 29.0, 22.0, 20.0, 14.0, 18.0, 21.0, 22.0, 8.0, 12.0, 11.0, 7.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.90625, -6.63134765625, -6.3564453125, -6.08154296875, -5.806640625, -5.53173828125, -5.2568359375, -4.98193359375, -4.70703125, -4.43212890625, -4.1572265625, -3.88232421875, -3.607421875, -3.33251953125, -3.0576171875, -2.78271484375, -2.5078125, -2.23291015625, -1.9580078125, -1.68310546875, -1.408203125, -1.13330078125, -0.8583984375, -0.58349609375, -0.30859375, -0.03369140625, 0.2412109375, 0.51611328125, 0.791015625, 1.06591796875, 1.3408203125, 1.61572265625, 1.890625, 2.16552734375, 2.4404296875, 2.71533203125, 2.990234375, 3.26513671875, 3.5400390625, 3.81494140625, 4.08984375, 4.36474609375, 4.6396484375, 4.91455078125, 5.189453125, 5.46435546875, 5.7392578125, 6.01416015625, 6.2890625, 6.56396484375, 6.8388671875, 7.11376953125, 7.388671875, 7.66357421875, 7.9384765625, 8.21337890625, 8.48828125, 8.76318359375, 9.0380859375, 9.31298828125, 9.587890625, 9.86279296875, 10.1376953125, 10.41259765625, 10.6875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 5.0, 7.0, 6.0, 11.0, 20.0, 17.0, 26.0, 46.0, 57.0, 81.0, 94.0, 179.0, 249.0, 412.0, 590.0, 969.0, 1542.0, 2621.0, 4288.0, 7244.0, 12904.0, 23481.0, 43300.0, 80662.0, 145764.0, 222260.0, 210114.0, 131359.0, 72307.0, 38517.0, 20865.0, 11636.0, 6619.0, 3966.0, 2421.0, 1444.0, 831.0, 525.0, 366.0, 263.0, 155.0, 123.0, 63.0, 54.0, 23.0, 25.0, 14.0, 9.0, 13.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-9.890625, -9.6072998046875, -9.323974609375, -9.0406494140625, -8.75732421875, -8.4739990234375, -8.190673828125, -7.9073486328125, -7.6240234375, -7.3406982421875, -7.057373046875, -6.7740478515625, -6.49072265625, -6.2073974609375, -5.924072265625, -5.6407470703125, -5.357421875, -5.0740966796875, -4.790771484375, -4.5074462890625, -4.22412109375, -3.9407958984375, -3.657470703125, -3.3741455078125, -3.0908203125, -2.8074951171875, -2.524169921875, -2.2408447265625, -1.95751953125, -1.6741943359375, -1.390869140625, -1.1075439453125, -0.82421875, -0.5408935546875, -0.257568359375, 0.0257568359375, 0.30908203125, 0.5924072265625, 0.875732421875, 1.1590576171875, 1.4423828125, 1.7257080078125, 2.009033203125, 2.2923583984375, 2.57568359375, 2.8590087890625, 3.142333984375, 3.4256591796875, 3.708984375, 3.9923095703125, 4.275634765625, 4.5589599609375, 4.84228515625, 5.1256103515625, 5.408935546875, 5.6922607421875, 5.9755859375, 6.2589111328125, 6.542236328125, 6.8255615234375, 7.10888671875, 7.3922119140625, 7.675537109375, 7.9588623046875, 8.2421875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 7.0, 6.0, 8.0, 9.0, 12.0, 28.0, 31.0, 43.0, 54.0, 73.0, 69.0, 91.0, 73.0, 108.0, 74.0, 82.0, 53.0, 43.0, 34.0, 34.0, 17.0, 10.0, 11.0, 7.0, 8.0, 5.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0006556510925292969, -0.0006361603736877441, -0.0006166696548461914, -0.0005971789360046387, -0.0005776882171630859, -0.0005581974983215332, -0.0005387067794799805, -0.0005192160606384277, -0.000499725341796875, -0.00048023462295532227, -0.00046074390411376953, -0.0004412531852722168, -0.00042176246643066406, -0.00040227174758911133, -0.0003827810287475586, -0.00036329030990600586, -0.0003437995910644531, -0.0003243088722229004, -0.00030481815338134766, -0.0002853274345397949, -0.0002658367156982422, -0.00024634599685668945, -0.00022685527801513672, -0.00020736455917358398, -0.00018787384033203125, -0.00016838312149047852, -0.00014889240264892578, -0.00012940168380737305, -0.00010991096496582031, -9.042024612426758e-05, -7.092952728271484e-05, -5.143880844116211e-05, -3.1948089599609375e-05, -1.245737075805664e-05, 7.033348083496094e-06, 2.6524066925048828e-05, 4.601478576660156e-05, 6.55055046081543e-05, 8.499622344970703e-05, 0.00010448694229125977, 0.0001239776611328125, 0.00014346837997436523, 0.00016295909881591797, 0.0001824498176574707, 0.00020194053649902344, 0.00022143125534057617, 0.0002409219741821289, 0.00026041269302368164, 0.0002799034118652344, 0.0002993941307067871, 0.00031888484954833984, 0.0003383755683898926, 0.0003578662872314453, 0.00037735700607299805, 0.0003968477249145508, 0.0004163384437561035, 0.00043582916259765625, 0.000455319881439209, 0.0004748106002807617, 0.0004943013191223145, 0.0005137920379638672, 0.0005332827568054199, 0.0005527734756469727, 0.0005722641944885254, 0.0005917549133300781]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 11.0, 15.0, 25.0, 28.0, 44.0, 67.0, 99.0, 141.0, 240.0, 279.0, 519.0, 747.0, 1142.0, 1747.0, 2606.0, 4151.0, 6194.0, 9608.0, 14765.0, 22736.0, 35416.0, 52876.0, 77548.0, 106870.0, 131283.0, 140603.0, 127000.0, 100057.0, 71941.0, 48654.0, 32040.0, 20709.0, 13321.0, 8531.0, 5666.0, 3667.0, 2419.0, 1620.0, 1103.0, 667.0, 488.0, 279.0, 230.0, 140.0, 87.0, 75.0, 37.0, 20.0, 9.0, 11.0, 14.0, 2.0, 5.0, 1.0, 5.0, 2.0, 0.0, 2.0], "bins": [-6.33203125, -6.13031005859375, -5.9285888671875, -5.72686767578125, -5.525146484375, -5.32342529296875, -5.1217041015625, -4.91998291015625, -4.71826171875, -4.51654052734375, -4.3148193359375, -4.11309814453125, -3.911376953125, -3.70965576171875, -3.5079345703125, -3.30621337890625, -3.1044921875, -2.90277099609375, -2.7010498046875, -2.49932861328125, -2.297607421875, -2.09588623046875, -1.8941650390625, -1.69244384765625, -1.49072265625, -1.28900146484375, -1.0872802734375, -0.88555908203125, -0.683837890625, -0.48211669921875, -0.2803955078125, -0.07867431640625, 0.123046875, 0.32476806640625, 0.5264892578125, 0.72821044921875, 0.929931640625, 1.13165283203125, 1.3333740234375, 1.53509521484375, 1.73681640625, 1.93853759765625, 2.1402587890625, 2.34197998046875, 2.543701171875, 2.74542236328125, 2.9471435546875, 3.14886474609375, 3.3505859375, 3.55230712890625, 3.7540283203125, 3.95574951171875, 4.157470703125, 4.35919189453125, 4.5609130859375, 4.76263427734375, 4.96435546875, 5.16607666015625, 5.3677978515625, 5.56951904296875, 5.771240234375, 5.97296142578125, 6.1746826171875, 6.37640380859375, 6.578125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 10.0, 5.0, 5.0, 8.0, 10.0, 7.0, 13.0, 10.0, 22.0, 15.0, 20.0, 19.0, 21.0, 28.0, 37.0, 39.0, 39.0, 45.0, 43.0, 45.0, 37.0, 53.0, 55.0, 47.0, 41.0, 40.0, 36.0, 33.0, 37.0, 26.0, 24.0, 19.0, 19.0, 19.0, 17.0, 12.0, 10.0, 3.0, 7.0, 8.0, 3.0, 5.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.8759765625, -1.8157958984375, -1.755615234375, -1.6954345703125, -1.63525390625, -1.5750732421875, -1.514892578125, -1.4547119140625, -1.39453125, -1.3343505859375, -1.274169921875, -1.2139892578125, -1.15380859375, -1.0936279296875, -1.033447265625, -0.9732666015625, -0.9130859375, -0.8529052734375, -0.792724609375, -0.7325439453125, -0.67236328125, -0.6121826171875, -0.552001953125, -0.4918212890625, -0.431640625, -0.3714599609375, -0.311279296875, -0.2510986328125, -0.19091796875, -0.1307373046875, -0.070556640625, -0.0103759765625, 0.0498046875, 0.1099853515625, 0.170166015625, 0.2303466796875, 0.29052734375, 0.3507080078125, 0.410888671875, 0.4710693359375, 0.53125, 0.5914306640625, 0.651611328125, 0.7117919921875, 0.77197265625, 0.8321533203125, 0.892333984375, 0.9525146484375, 1.0126953125, 1.0728759765625, 1.133056640625, 1.1932373046875, 1.25341796875, 1.3135986328125, 1.373779296875, 1.4339599609375, 1.494140625, 1.5543212890625, 1.614501953125, 1.6746826171875, 1.73486328125, 1.7950439453125, 1.855224609375, 1.9154052734375, 1.9755859375]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 7.0, 5.0, 6.0, 12.0, 22.0, 22.0, 24.0, 29.0, 27.0, 35.0, 37.0, 58.0, 65.0, 53.0, 77.0, 76.0, 69.0, 66.0, 58.0, 43.0, 43.0, 37.0, 25.0, 20.0, 16.0, 10.0, 6.0, 7.0, 9.0, 13.0, 4.0, 4.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.444873809814453, -22.66288185119629, -21.880887985229492, -21.098896026611328, -20.31690216064453, -19.534910202026367, -18.752918243408203, -17.970924377441406, -17.188932418823242, -16.406940460205078, -15.624946594238281, -14.842954635620117, -14.060961723327637, -13.278968811035156, -12.496976852416992, -11.714983940124512, -10.932991027832031, -10.15099811553955, -9.36900520324707, -8.587013244628906, -7.805020332336426, -7.023027420043945, -6.241034984588623, -5.459042549133301, -4.67704963684082, -3.895056962966919, -3.1130642890930176, -2.331071615219116, -1.5490789413452148, -0.7670862674713135, 0.01490640640258789, 0.7968988418579102, 1.5788917541503906, 2.360884428024292, 3.1428771018981934, 3.9248697757720947, 4.706862449645996, 5.488855361938477, 6.270847797393799, 7.052840232849121, 7.834833145141602, 8.616826057434082, 9.398818969726562, 10.180810928344727, 10.962803840637207, 11.744796752929688, 12.526788711547852, 13.308781623840332, 14.090774536132812, 14.872767448425293, 15.654760360717773, 16.436752319335938, 17.218746185302734, 18.0007381439209, 18.782730102539062, 19.56472396850586, 20.346715927124023, 21.128707885742188, 21.910701751708984, 22.69269371032715, 23.474685668945312, 24.25667953491211, 25.038671493530273, 25.820663452148438, 26.602657318115234]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 10.0, 5.0, 7.0, 6.0, 12.0, 18.0, 12.0, 16.0, 27.0, 26.0, 27.0, 20.0, 23.0, 26.0, 35.0, 33.0, 47.0, 35.0, 39.0, 56.0, 41.0, 48.0, 39.0, 43.0, 33.0, 32.0, 37.0, 39.0, 28.0, 32.0, 24.0, 23.0, 19.0, 15.0, 17.0, 5.0, 13.0, 6.0, 6.0, 5.0, 4.0, 0.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.84384536743164, -13.400592803955078, -12.957340240478516, -12.514087677001953, -12.07083511352539, -11.627582550048828, -11.184329986572266, -10.741076469421387, -10.297823905944824, -9.854571342468262, -9.4113187789917, -8.968066215515137, -8.524813652038574, -8.081560134887695, -7.638308048248291, -7.19505500793457, -6.751802921295166, -6.3085503578186035, -5.865297794342041, -5.42204475402832, -4.978792190551758, -4.535539627075195, -4.092287063598633, -3.649034261703491, -3.2057816982269287, -2.762529134750366, -2.3192763328552246, -1.876023769378662, -1.43277108669281, -0.989518404006958, -0.5462658405303955, -0.1030130386352539, 0.3402395248413086, 0.7834922075271606, 1.2267448902130127, 1.6699974536895752, 2.113250255584717, 2.5565028190612793, 2.999755382537842, 3.4430081844329834, 3.886260747909546, 4.3295135498046875, 4.77276611328125, 5.2160186767578125, 5.659271240234375, 6.1025238037109375, 6.5457763671875, 6.989029407501221, 7.432281970977783, 7.875534534454346, 8.318787574768066, 8.762040138244629, 9.205292701721191, 9.648545265197754, 10.091797828674316, 10.535050392150879, 10.978302955627441, 11.421555519104004, 11.864808082580566, 12.308060646057129, 12.751313209533691, 13.19456672668457, 13.637819290161133, 14.081071853637695, 14.524324417114258]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 14.0, 16.0, 26.0, 31.0, 59.0, 67.0, 127.0, 176.0, 309.0, 445.0, 717.0, 1136.0, 1675.0, 2701.0, 4162.0, 6395.0, 9588.0, 14736.0, 22470.0, 32949.0, 47720.0, 65845.0, 86206.0, 104971.0, 117713.0, 117800.0, 107628.0, 88046.0, 66700.0, 48415.0, 33718.0, 22594.0, 15037.0, 9936.0, 6496.0, 4184.0, 2790.0, 1756.0, 1146.0, 732.0, 459.0, 311.0, 189.0, 145.0, 80.0, 47.0, 30.0, 19.0, 23.0, 6.0, 8.0, 5.0, 5.0, 1.0, 2.0, 5.0], "bins": [-12.15625, -11.7882080078125, -11.420166015625, -11.0521240234375, -10.68408203125, -10.3160400390625, -9.947998046875, -9.5799560546875, -9.2119140625, -8.8438720703125, -8.475830078125, -8.1077880859375, -7.73974609375, -7.3717041015625, -7.003662109375, -6.6356201171875, -6.267578125, -5.8995361328125, -5.531494140625, -5.1634521484375, -4.79541015625, -4.4273681640625, -4.059326171875, -3.6912841796875, -3.3232421875, -2.9552001953125, -2.587158203125, -2.2191162109375, -1.85107421875, -1.4830322265625, -1.114990234375, -0.7469482421875, -0.37890625, -0.0108642578125, 0.357177734375, 0.7252197265625, 1.09326171875, 1.4613037109375, 1.829345703125, 2.1973876953125, 2.5654296875, 2.9334716796875, 3.301513671875, 3.6695556640625, 4.03759765625, 4.4056396484375, 4.773681640625, 5.1417236328125, 5.509765625, 5.8778076171875, 6.245849609375, 6.6138916015625, 6.98193359375, 7.3499755859375, 7.718017578125, 8.0860595703125, 8.4541015625, 8.8221435546875, 9.190185546875, 9.5582275390625, 9.92626953125, 10.2943115234375, 10.662353515625, 11.0303955078125, 11.3984375]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 7.0, 9.0, 11.0, 16.0, 24.0, 18.0, 19.0, 23.0, 19.0, 33.0, 25.0, 34.0, 36.0, 34.0, 39.0, 38.0, 47.0, 47.0, 46.0, 53.0, 38.0, 39.0, 43.0, 34.0, 27.0, 36.0, 26.0, 22.0, 17.0, 23.0, 15.0, 16.0, 17.0, 9.0, 12.0, 11.0, 8.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.5234375, -15.05126953125, -14.5791015625, -14.10693359375, -13.634765625, -13.16259765625, -12.6904296875, -12.21826171875, -11.74609375, -11.27392578125, -10.8017578125, -10.32958984375, -9.857421875, -9.38525390625, -8.9130859375, -8.44091796875, -7.96875, -7.49658203125, -7.0244140625, -6.55224609375, -6.080078125, -5.60791015625, -5.1357421875, -4.66357421875, -4.19140625, -3.71923828125, -3.2470703125, -2.77490234375, -2.302734375, -1.83056640625, -1.3583984375, -0.88623046875, -0.4140625, 0.05810546875, 0.5302734375, 1.00244140625, 1.474609375, 1.94677734375, 2.4189453125, 2.89111328125, 3.36328125, 3.83544921875, 4.3076171875, 4.77978515625, 5.251953125, 5.72412109375, 6.1962890625, 6.66845703125, 7.140625, 7.61279296875, 8.0849609375, 8.55712890625, 9.029296875, 9.50146484375, 9.9736328125, 10.44580078125, 10.91796875, 11.39013671875, 11.8623046875, 12.33447265625, 12.806640625, 13.27880859375, 13.7509765625, 14.22314453125, 14.6953125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 8.0, 19.0, 22.0, 35.0, 61.0, 81.0, 124.0, 198.0, 300.0, 494.0, 703.0, 1114.0, 1685.0, 2505.0, 3761.0, 5699.0, 8317.0, 12193.0, 17883.0, 25515.0, 35981.0, 49046.0, 64995.0, 80572.0, 95684.0, 104528.0, 105260.0, 97678.0, 84531.0, 68415.0, 52534.0, 39218.0, 28306.0, 19448.0, 13628.0, 9284.0, 6439.0, 4226.0, 2773.0, 1820.0, 1221.0, 785.0, 505.0, 339.0, 243.0, 136.0, 90.0, 67.0, 30.0, 20.0, 22.0, 12.0, 7.0, 3.0, 0.0, 3.0], "bins": [-11.15625, -10.829345703125, -10.50244140625, -10.175537109375, -9.8486328125, -9.521728515625, -9.19482421875, -8.867919921875, -8.541015625, -8.214111328125, -7.88720703125, -7.560302734375, -7.2333984375, -6.906494140625, -6.57958984375, -6.252685546875, -5.92578125, -5.598876953125, -5.27197265625, -4.945068359375, -4.6181640625, -4.291259765625, -3.96435546875, -3.637451171875, -3.310546875, -2.983642578125, -2.65673828125, -2.329833984375, -2.0029296875, -1.676025390625, -1.34912109375, -1.022216796875, -0.6953125, -0.368408203125, -0.04150390625, 0.285400390625, 0.6123046875, 0.939208984375, 1.26611328125, 1.593017578125, 1.919921875, 2.246826171875, 2.57373046875, 2.900634765625, 3.2275390625, 3.554443359375, 3.88134765625, 4.208251953125, 4.53515625, 4.862060546875, 5.18896484375, 5.515869140625, 5.8427734375, 6.169677734375, 6.49658203125, 6.823486328125, 7.150390625, 7.477294921875, 7.80419921875, 8.131103515625, 8.4580078125, 8.784912109375, 9.11181640625, 9.438720703125, 9.765625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 6.0, 4.0, 5.0, 4.0, 7.0, 14.0, 6.0, 9.0, 8.0, 11.0, 8.0, 7.0, 22.0, 19.0, 31.0, 26.0, 41.0, 44.0, 30.0, 27.0, 47.0, 33.0, 39.0, 43.0, 44.0, 50.0, 39.0, 42.0, 44.0, 35.0, 27.0, 27.0, 29.0, 27.0, 24.0, 14.0, 27.0, 12.0, 17.0, 14.0, 6.0, 8.0, 6.0, 6.0, 3.0, 5.0, 5.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.671875, -8.4036865234375, -8.135498046875, -7.8673095703125, -7.59912109375, -7.3309326171875, -7.062744140625, -6.7945556640625, -6.5263671875, -6.2581787109375, -5.989990234375, -5.7218017578125, -5.45361328125, -5.1854248046875, -4.917236328125, -4.6490478515625, -4.380859375, -4.1126708984375, -3.844482421875, -3.5762939453125, -3.30810546875, -3.0399169921875, -2.771728515625, -2.5035400390625, -2.2353515625, -1.9671630859375, -1.698974609375, -1.4307861328125, -1.16259765625, -0.8944091796875, -0.626220703125, -0.3580322265625, -0.08984375, 0.1783447265625, 0.446533203125, 0.7147216796875, 0.98291015625, 1.2510986328125, 1.519287109375, 1.7874755859375, 2.0556640625, 2.3238525390625, 2.592041015625, 2.8602294921875, 3.12841796875, 3.3966064453125, 3.664794921875, 3.9329833984375, 4.201171875, 4.4693603515625, 4.737548828125, 5.0057373046875, 5.27392578125, 5.5421142578125, 5.810302734375, 6.0784912109375, 6.3466796875, 6.6148681640625, 6.883056640625, 7.1512451171875, 7.41943359375, 7.6876220703125, 7.955810546875, 8.2239990234375, 8.4921875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 8.0, 11.0, 15.0, 22.0, 30.0, 53.0, 82.0, 126.0, 179.0, 314.0, 441.0, 688.0, 1129.0, 1835.0, 2945.0, 4536.0, 7319.0, 12100.0, 19082.0, 29466.0, 44700.0, 65070.0, 89578.0, 113554.0, 129324.0, 129194.0, 113988.0, 90598.0, 65726.0, 45113.0, 29640.0, 19273.0, 12210.0, 7489.0, 4840.0, 2832.0, 1884.0, 1137.0, 779.0, 407.0, 285.0, 205.0, 121.0, 76.0, 65.0, 29.0, 18.0, 19.0, 15.0, 3.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0], "bins": [-5.53125, -5.36370849609375, -5.1961669921875, -5.02862548828125, -4.861083984375, -4.69354248046875, -4.5260009765625, -4.35845947265625, -4.19091796875, -4.02337646484375, -3.8558349609375, -3.68829345703125, -3.520751953125, -3.35321044921875, -3.1856689453125, -3.01812744140625, -2.8505859375, -2.68304443359375, -2.5155029296875, -2.34796142578125, -2.180419921875, -2.01287841796875, -1.8453369140625, -1.67779541015625, -1.51025390625, -1.34271240234375, -1.1751708984375, -1.00762939453125, -0.840087890625, -0.67254638671875, -0.5050048828125, -0.33746337890625, -0.169921875, -0.00238037109375, 0.1651611328125, 0.33270263671875, 0.500244140625, 0.66778564453125, 0.8353271484375, 1.00286865234375, 1.17041015625, 1.33795166015625, 1.5054931640625, 1.67303466796875, 1.840576171875, 2.00811767578125, 2.1756591796875, 2.34320068359375, 2.5107421875, 2.67828369140625, 2.8458251953125, 3.01336669921875, 3.180908203125, 3.34844970703125, 3.5159912109375, 3.68353271484375, 3.85107421875, 4.01861572265625, 4.1861572265625, 4.35369873046875, 4.521240234375, 4.68878173828125, 4.8563232421875, 5.02386474609375, 5.19140625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 9.0, 6.0, 2.0, 9.0, 16.0, 15.0, 18.0, 29.0, 21.0, 38.0, 38.0, 37.0, 50.0, 58.0, 71.0, 53.0, 60.0, 60.0, 42.0, 60.0, 50.0, 47.0, 34.0, 28.0, 24.0, 29.0, 21.0, 19.0, 17.0, 10.0, 7.0, 4.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0006580352783203125, -0.0006364732980728149, -0.0006149113178253174, -0.0005933493375778198, -0.0005717873573303223, -0.0005502253770828247, -0.0005286633968353271, -0.0005071014165878296, -0.00048553943634033203, -0.00046397745609283447, -0.0004424154758453369, -0.00042085349559783936, -0.0003992915153503418, -0.00037772953510284424, -0.0003561675548553467, -0.0003346055746078491, -0.00031304359436035156, -0.000291481614112854, -0.00026991963386535645, -0.0002483576536178589, -0.00022679567337036133, -0.00020523369312286377, -0.0001836717128753662, -0.00016210973262786865, -0.0001405477523803711, -0.00011898577213287354, -9.742379188537598e-05, -7.586181163787842e-05, -5.429983139038086e-05, -3.27378511428833e-05, -1.1175870895385742e-05, 1.0386109352111816e-05, 3.1948089599609375e-05, 5.3510069847106934e-05, 7.507205009460449e-05, 9.663403034210205e-05, 0.00011819601058959961, 0.00013975799083709717, 0.00016131997108459473, 0.00018288195133209229, 0.00020444393157958984, 0.0002260059118270874, 0.00024756789207458496, 0.0002691298723220825, 0.0002906918525695801, 0.00031225383281707764, 0.0003338158130645752, 0.00035537779331207275, 0.0003769397735595703, 0.00039850175380706787, 0.00042006373405456543, 0.000441625714302063, 0.00046318769454956055, 0.0004847496747970581, 0.0005063116550445557, 0.0005278736352920532, 0.0005494356155395508, 0.0005709975957870483, 0.0005925595760345459, 0.0006141215562820435, 0.000635683536529541, 0.0006572455167770386, 0.0006788074970245361, 0.0007003694772720337, 0.0007219314575195312]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 5.0, 7.0, 12.0, 19.0, 23.0, 45.0, 55.0, 97.0, 148.0, 214.0, 332.0, 515.0, 714.0, 1118.0, 1682.0, 2484.0, 3790.0, 5733.0, 8552.0, 12787.0, 18554.0, 27741.0, 39744.0, 55165.0, 73760.0, 92397.0, 107478.0, 114636.0, 110094.0, 96329.0, 77932.0, 59380.0, 43470.0, 30150.0, 20857.0, 14030.0, 9417.0, 6390.0, 4235.0, 2751.0, 1888.0, 1270.0, 905.0, 550.0, 366.0, 258.0, 183.0, 91.0, 91.0, 46.0, 18.0, 23.0, 12.0, 9.0, 5.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.5703125, -4.42108154296875, -4.2718505859375, -4.12261962890625, -3.973388671875, -3.82415771484375, -3.6749267578125, -3.52569580078125, -3.37646484375, -3.22723388671875, -3.0780029296875, -2.92877197265625, -2.779541015625, -2.63031005859375, -2.4810791015625, -2.33184814453125, -2.1826171875, -2.03338623046875, -1.8841552734375, -1.73492431640625, -1.585693359375, -1.43646240234375, -1.2872314453125, -1.13800048828125, -0.98876953125, -0.83953857421875, -0.6903076171875, -0.54107666015625, -0.391845703125, -0.24261474609375, -0.0933837890625, 0.05584716796875, 0.205078125, 0.35430908203125, 0.5035400390625, 0.65277099609375, 0.802001953125, 0.95123291015625, 1.1004638671875, 1.24969482421875, 1.39892578125, 1.54815673828125, 1.6973876953125, 1.84661865234375, 1.995849609375, 2.14508056640625, 2.2943115234375, 2.44354248046875, 2.5927734375, 2.74200439453125, 2.8912353515625, 3.04046630859375, 3.189697265625, 3.33892822265625, 3.4881591796875, 3.63739013671875, 3.78662109375, 3.93585205078125, 4.0850830078125, 4.23431396484375, 4.383544921875, 4.53277587890625, 4.6820068359375, 4.83123779296875, 4.98046875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 9.0, 7.0, 8.0, 8.0, 7.0, 12.0, 11.0, 17.0, 19.0, 22.0, 21.0, 34.0, 29.0, 39.0, 26.0, 42.0, 39.0, 41.0, 38.0, 39.0, 56.0, 49.0, 48.0, 38.0, 32.0, 32.0, 31.0, 42.0, 38.0, 32.0, 22.0, 16.0, 16.0, 12.0, 13.0, 12.0, 13.0, 5.0, 5.0, 4.0, 6.0, 3.0, 4.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.9794921875, -1.9201507568359375, -1.860809326171875, -1.8014678955078125, -1.74212646484375, -1.6827850341796875, -1.623443603515625, -1.5641021728515625, -1.5047607421875, -1.4454193115234375, -1.386077880859375, -1.3267364501953125, -1.26739501953125, -1.2080535888671875, -1.148712158203125, -1.0893707275390625, -1.030029296875, -0.9706878662109375, -0.911346435546875, -0.8520050048828125, -0.79266357421875, -0.7333221435546875, -0.673980712890625, -0.6146392822265625, -0.5552978515625, -0.4959564208984375, -0.436614990234375, -0.3772735595703125, -0.31793212890625, -0.2585906982421875, -0.199249267578125, -0.1399078369140625, -0.08056640625, -0.0212249755859375, 0.038116455078125, 0.0974578857421875, 0.15679931640625, 0.2161407470703125, 0.275482177734375, 0.3348236083984375, 0.3941650390625, 0.4535064697265625, 0.512847900390625, 0.5721893310546875, 0.63153076171875, 0.6908721923828125, 0.750213623046875, 0.8095550537109375, 0.868896484375, 0.9282379150390625, 0.987579345703125, 1.0469207763671875, 1.10626220703125, 1.1656036376953125, 1.224945068359375, 1.2842864990234375, 1.3436279296875, 1.4029693603515625, 1.462310791015625, 1.5216522216796875, 1.58099365234375, 1.6403350830078125, 1.699676513671875, 1.7590179443359375, 1.818359375]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 6.0, 6.0, 8.0, 5.0, 15.0, 5.0, 13.0, 11.0, 23.0, 28.0, 31.0, 46.0, 49.0, 51.0, 60.0, 54.0, 61.0, 77.0, 66.0, 69.0, 58.0, 49.0, 42.0, 34.0, 16.0, 26.0, 16.0, 18.0, 11.0, 8.0, 7.0, 11.0, 3.0, 5.0, 8.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.74799919128418, -22.989160537719727, -22.230321884155273, -21.471485137939453, -20.712646484375, -19.953807830810547, -19.194969177246094, -18.43613052368164, -17.677291870117188, -16.918453216552734, -16.15961456298828, -15.400776863098145, -14.641939163208008, -13.883100509643555, -13.124261856079102, -12.365423202514648, -11.606586456298828, -10.847747802734375, -10.088910102844238, -9.330071449279785, -8.571233749389648, -7.812395095825195, -7.053556442260742, -6.294718265533447, -5.535880088806152, -4.777041912078857, -4.0182037353515625, -3.2593650817871094, -2.5005269050598145, -1.7416887283325195, -0.9828500747680664, -0.22401189804077148, 0.5348281860351562, 1.2936664819717407, 2.052504777908325, 2.811343193054199, 3.570181369781494, 4.329019546508789, 5.087858200073242, 5.846696376800537, 6.605534553527832, 7.364372730255127, 8.123210906982422, 8.882049560546875, 9.640888214111328, 10.399725914001465, 11.158564567565918, 11.917402267456055, 12.676240921020508, 13.435079574584961, 14.193917274475098, 14.95275592803955, 15.711593627929688, 16.47043228149414, 17.229270935058594, 17.988109588623047, 18.7469482421875, 19.505786895751953, 20.264625549316406, 21.02346420288086, 21.78230094909668, 22.541139602661133, 23.299978256225586, 24.05881690979004, 24.81765365600586]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 9.0, 6.0, 4.0, 9.0, 10.0, 13.0, 19.0, 16.0, 24.0, 26.0, 26.0, 35.0, 37.0, 44.0, 44.0, 45.0, 43.0, 42.0, 49.0, 47.0, 41.0, 48.0, 47.0, 37.0, 35.0, 40.0, 31.0, 37.0, 26.0, 20.0, 18.0, 11.0, 13.0, 18.0, 6.0, 7.0, 6.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.983983993530273, -15.481595993041992, -14.979207992553711, -14.47681999206543, -13.974432945251465, -13.472044944763184, -12.969656944274902, -12.467268943786621, -11.964881896972656, -11.462493896484375, -10.960105895996094, -10.457717895507812, -9.955330848693848, -9.452942848205566, -8.950554847717285, -8.448166847229004, -7.945778846740723, -7.443390846252441, -6.941003322601318, -6.438615322113037, -5.936227798461914, -5.433839797973633, -4.931451797485352, -4.42906379699707, -3.9266762733459473, -3.424288511276245, -2.921900749206543, -2.4195127487182617, -1.9171249866485596, -1.4147372245788574, -0.9123492240905762, -0.409961462020874, 0.09242630004882812, 0.594814121723175, 1.097201943397522, 1.5995898246765137, 2.101977586746216, 2.604365348815918, 3.106753349304199, 3.6091411113739014, 4.1115288734436035, 4.613916873931885, 5.116304397583008, 5.618692398071289, 6.12108039855957, 6.623467922210693, 7.125855922698975, 7.628243446350098, 8.130631446838379, 8.63301944732666, 9.135407447814941, 9.637794494628906, 10.140182495117188, 10.642570495605469, 11.14495849609375, 11.647346496582031, 12.149734497070312, 12.652122497558594, 13.154510498046875, 13.656898498535156, 14.159285545349121, 14.661673545837402, 15.164061546325684, 15.666449546813965, 16.16883659362793]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 8.0, 23.0, 21.0, 31.0, 41.0, 68.0, 111.0, 183.0, 263.0, 344.0, 580.0, 876.0, 1367.0, 2113.0, 3431.0, 5850.0, 10023.0, 17868.0, 32856.0, 63297.0, 125981.0, 258339.0, 508127.0, 845495.0, 945040.0, 663911.0, 355428.0, 173634.0, 84422.0, 42582.0, 22138.0, 12071.0, 6912.0, 4017.0, 2460.0, 1584.0, 982.0, 616.0, 385.0, 285.0, 176.0, 136.0, 77.0, 44.0, 32.0, 21.0, 16.0, 8.0, 11.0, 3.0, 2.0, 2.0], "bins": [-26.890625, -26.148193359375, -25.40576171875, -24.663330078125, -23.9208984375, -23.178466796875, -22.43603515625, -21.693603515625, -20.951171875, -20.208740234375, -19.46630859375, -18.723876953125, -17.9814453125, -17.239013671875, -16.49658203125, -15.754150390625, -15.01171875, -14.269287109375, -13.52685546875, -12.784423828125, -12.0419921875, -11.299560546875, -10.55712890625, -9.814697265625, -9.072265625, -8.329833984375, -7.58740234375, -6.844970703125, -6.1025390625, -5.360107421875, -4.61767578125, -3.875244140625, -3.1328125, -2.390380859375, -1.64794921875, -0.905517578125, -0.1630859375, 0.579345703125, 1.32177734375, 2.064208984375, 2.806640625, 3.549072265625, 4.29150390625, 5.033935546875, 5.7763671875, 6.518798828125, 7.26123046875, 8.003662109375, 8.74609375, 9.488525390625, 10.23095703125, 10.973388671875, 11.7158203125, 12.458251953125, 13.20068359375, 13.943115234375, 14.685546875, 15.427978515625, 16.17041015625, 16.912841796875, 17.6552734375, 18.397705078125, 19.14013671875, 19.882568359375, 20.625]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 8.0, 2.0, 3.0, 16.0, 16.0, 14.0, 21.0, 19.0, 27.0, 30.0, 33.0, 43.0, 46.0, 44.0, 45.0, 46.0, 57.0, 37.0, 43.0, 57.0, 60.0, 42.0, 47.0, 42.0, 40.0, 41.0, 24.0, 18.0, 18.0, 16.0, 7.0, 14.0, 7.0, 2.0, 7.0, 4.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2578125, -13.79248046875, -13.3271484375, -12.86181640625, -12.396484375, -11.93115234375, -11.4658203125, -11.00048828125, -10.53515625, -10.06982421875, -9.6044921875, -9.13916015625, -8.673828125, -8.20849609375, -7.7431640625, -7.27783203125, -6.8125, -6.34716796875, -5.8818359375, -5.41650390625, -4.951171875, -4.48583984375, -4.0205078125, -3.55517578125, -3.08984375, -2.62451171875, -2.1591796875, -1.69384765625, -1.228515625, -0.76318359375, -0.2978515625, 0.16748046875, 0.6328125, 1.09814453125, 1.5634765625, 2.02880859375, 2.494140625, 2.95947265625, 3.4248046875, 3.89013671875, 4.35546875, 4.82080078125, 5.2861328125, 5.75146484375, 6.216796875, 6.68212890625, 7.1474609375, 7.61279296875, 8.078125, 8.54345703125, 9.0087890625, 9.47412109375, 9.939453125, 10.40478515625, 10.8701171875, 11.33544921875, 11.80078125, 12.26611328125, 12.7314453125, 13.19677734375, 13.662109375, 14.12744140625, 14.5927734375, 15.05810546875, 15.5234375]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 5.0, 9.0, 16.0, 25.0, 27.0, 59.0, 61.0, 110.0, 176.0, 279.0, 414.0, 567.0, 941.0, 1552.0, 2330.0, 3890.0, 6632.0, 11408.0, 19723.0, 35033.0, 64320.0, 119541.0, 221537.0, 399993.0, 647676.0, 826738.0, 734623.0, 484396.0, 277344.0, 150579.0, 80938.0, 44293.0, 24632.0, 13834.0, 8090.0, 4760.0, 2843.0, 1714.0, 1092.0, 758.0, 457.0, 324.0, 182.0, 140.0, 83.0, 48.0, 34.0, 23.0, 17.0, 8.0, 5.0, 5.0, 5.0, 0.0, 1.0], "bins": [-27.453125, -26.66162109375, -25.8701171875, -25.07861328125, -24.287109375, -23.49560546875, -22.7041015625, -21.91259765625, -21.12109375, -20.32958984375, -19.5380859375, -18.74658203125, -17.955078125, -17.16357421875, -16.3720703125, -15.58056640625, -14.7890625, -13.99755859375, -13.2060546875, -12.41455078125, -11.623046875, -10.83154296875, -10.0400390625, -9.24853515625, -8.45703125, -7.66552734375, -6.8740234375, -6.08251953125, -5.291015625, -4.49951171875, -3.7080078125, -2.91650390625, -2.125, -1.33349609375, -0.5419921875, 0.24951171875, 1.041015625, 1.83251953125, 2.6240234375, 3.41552734375, 4.20703125, 4.99853515625, 5.7900390625, 6.58154296875, 7.373046875, 8.16455078125, 8.9560546875, 9.74755859375, 10.5390625, 11.33056640625, 12.1220703125, 12.91357421875, 13.705078125, 14.49658203125, 15.2880859375, 16.07958984375, 16.87109375, 17.66259765625, 18.4541015625, 19.24560546875, 20.037109375, 20.82861328125, 21.6201171875, 22.41162109375, 23.203125]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 7.0, 0.0, 6.0, 5.0, 17.0, 15.0, 22.0, 18.0, 38.0, 51.0, 73.0, 80.0, 134.0, 164.0, 197.0, 262.0, 299.0, 317.0, 346.0, 344.0, 335.0, 275.0, 254.0, 208.0, 147.0, 130.0, 100.0, 68.0, 59.0, 26.0, 25.0, 13.0, 16.0, 7.0, 6.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.4296875, -12.10009765625, -11.7705078125, -11.44091796875, -11.111328125, -10.78173828125, -10.4521484375, -10.12255859375, -9.79296875, -9.46337890625, -9.1337890625, -8.80419921875, -8.474609375, -8.14501953125, -7.8154296875, -7.48583984375, -7.15625, -6.82666015625, -6.4970703125, -6.16748046875, -5.837890625, -5.50830078125, -5.1787109375, -4.84912109375, -4.51953125, -4.18994140625, -3.8603515625, -3.53076171875, -3.201171875, -2.87158203125, -2.5419921875, -2.21240234375, -1.8828125, -1.55322265625, -1.2236328125, -0.89404296875, -0.564453125, -0.23486328125, 0.0947265625, 0.42431640625, 0.75390625, 1.08349609375, 1.4130859375, 1.74267578125, 2.072265625, 2.40185546875, 2.7314453125, 3.06103515625, 3.390625, 3.72021484375, 4.0498046875, 4.37939453125, 4.708984375, 5.03857421875, 5.3681640625, 5.69775390625, 6.02734375, 6.35693359375, 6.6865234375, 7.01611328125, 7.345703125, 7.67529296875, 8.0048828125, 8.33447265625, 8.6640625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 6.0, 6.0, 3.0, 8.0, 20.0, 8.0, 15.0, 27.0, 24.0, 25.0, 36.0, 35.0, 52.0, 58.0, 59.0, 58.0, 64.0, 50.0, 69.0, 55.0, 45.0, 55.0, 51.0, 38.0, 27.0, 25.0, 16.0, 13.0, 9.0, 12.0, 8.0, 6.0, 4.0, 4.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.259218215942383, -20.40230941772461, -19.545400619506836, -18.688491821289062, -17.83158302307129, -16.974674224853516, -16.117765426635742, -15.260856628417969, -14.403947830200195, -13.547039031982422, -12.690130233764648, -11.833221435546875, -10.976312637329102, -10.119403839111328, -9.262495040893555, -8.405586242675781, -7.548677444458008, -6.691768646240234, -5.834859848022461, -4.9779510498046875, -4.121042251586914, -3.2641334533691406, -2.407224655151367, -1.5503158569335938, -0.6934070587158203, 0.16350173950195312, 1.0204105377197266, 1.8773193359375, 2.7342281341552734, 3.591136932373047, 4.44804573059082, 5.304954528808594, 6.161865234375, 7.018774032592773, 7.875682830810547, 8.73259162902832, 9.589500427246094, 10.446409225463867, 11.30331802368164, 12.160226821899414, 13.017135620117188, 13.874044418334961, 14.730953216552734, 15.587862014770508, 16.44477081298828, 17.301679611206055, 18.158588409423828, 19.0154972076416, 19.872406005859375, 20.72931480407715, 21.586223602294922, 22.443132400512695, 23.30004119873047, 24.156949996948242, 25.013858795166016, 25.87076759338379, 26.727676391601562, 27.584585189819336, 28.44149398803711, 29.298402786254883, 30.155311584472656, 31.01222038269043, 31.869129180908203, 32.726036071777344, 33.58294677734375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 5.0, 14.0, 11.0, 12.0, 19.0, 15.0, 26.0, 24.0, 35.0, 32.0, 26.0, 37.0, 43.0, 51.0, 40.0, 42.0, 43.0, 44.0, 45.0, 42.0, 33.0, 33.0, 42.0, 23.0, 16.0, 23.0, 31.0, 24.0, 26.0, 20.0, 23.0, 23.0, 13.0, 11.0, 6.0, 7.0, 5.0, 2.0, 4.0, 4.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-16.862382888793945, -16.340221405029297, -15.818058967590332, -15.295896530151367, -14.773735046386719, -14.25157356262207, -13.729411125183105, -13.20724868774414, -12.685087203979492, -12.162925720214844, -11.640763282775879, -11.118600845336914, -10.596439361572266, -10.074277877807617, -9.552115440368652, -9.029953002929688, -8.507791519165039, -7.985629558563232, -7.463467597961426, -6.941305637359619, -6.4191436767578125, -5.896981716156006, -5.374819755554199, -4.852657794952393, -4.330495834350586, -3.8083338737487793, -3.2861719131469727, -2.764009952545166, -2.2418479919433594, -1.7196860313415527, -1.197524070739746, -0.6753621101379395, -0.1532001495361328, 0.36896181106567383, 0.8911237716674805, 1.413285732269287, 1.9354476928710938, 2.4576096534729004, 2.979771614074707, 3.5019335746765137, 4.02409553527832, 4.546257495880127, 5.068419456481934, 5.59058141708374, 6.112743377685547, 6.6349053382873535, 7.15706729888916, 7.679229259490967, 8.201391220092773, 8.723552703857422, 9.245715141296387, 9.767877578735352, 10.2900390625, 10.812200546264648, 11.334362983703613, 11.856525421142578, 12.378686904907227, 12.900848388671875, 13.42301082611084, 13.945173263549805, 14.467334747314453, 14.989496231079102, 15.511658668518066, 16.03382110595703, 16.55598258972168]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 3.0, 10.0, 17.0, 27.0, 34.0, 70.0, 90.0, 143.0, 204.0, 286.0, 495.0, 766.0, 1129.0, 1651.0, 2731.0, 4353.0, 6848.0, 10828.0, 17083.0, 26636.0, 40408.0, 59362.0, 82861.0, 108603.0, 127139.0, 132023.0, 119024.0, 95661.0, 70375.0, 48608.0, 32795.0, 21211.0, 13530.0, 8719.0, 5390.0, 3440.0, 2140.0, 1367.0, 912.0, 503.0, 373.0, 243.0, 139.0, 109.0, 66.0, 55.0, 35.0, 17.0, 15.0, 9.0, 8.0, 7.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.859375, -10.5225830078125, -10.185791015625, -9.8489990234375, -9.51220703125, -9.1754150390625, -8.838623046875, -8.5018310546875, -8.1650390625, -7.8282470703125, -7.491455078125, -7.1546630859375, -6.81787109375, -6.4810791015625, -6.144287109375, -5.8074951171875, -5.470703125, -5.1339111328125, -4.797119140625, -4.4603271484375, -4.12353515625, -3.7867431640625, -3.449951171875, -3.1131591796875, -2.7763671875, -2.4395751953125, -2.102783203125, -1.7659912109375, -1.42919921875, -1.0924072265625, -0.755615234375, -0.4188232421875, -0.08203125, 0.2547607421875, 0.591552734375, 0.9283447265625, 1.26513671875, 1.6019287109375, 1.938720703125, 2.2755126953125, 2.6123046875, 2.9490966796875, 3.285888671875, 3.6226806640625, 3.95947265625, 4.2962646484375, 4.633056640625, 4.9698486328125, 5.306640625, 5.6434326171875, 5.980224609375, 6.3170166015625, 6.65380859375, 6.9906005859375, 7.327392578125, 7.6641845703125, 8.0009765625, 8.3377685546875, 8.674560546875, 9.0113525390625, 9.34814453125, 9.6849365234375, 10.021728515625, 10.3585205078125, 10.6953125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 4.0, 8.0, 6.0, 8.0, 15.0, 19.0, 14.0, 25.0, 25.0, 30.0, 33.0, 47.0, 35.0, 40.0, 47.0, 57.0, 42.0, 41.0, 51.0, 53.0, 51.0, 41.0, 31.0, 34.0, 38.0, 31.0, 24.0, 23.0, 23.0, 12.0, 17.0, 25.0, 14.0, 13.0, 5.0, 9.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-21.90625, -21.2646484375, -20.623046875, -19.9814453125, -19.33984375, -18.6982421875, -18.056640625, -17.4150390625, -16.7734375, -16.1318359375, -15.490234375, -14.8486328125, -14.20703125, -13.5654296875, -12.923828125, -12.2822265625, -11.640625, -10.9990234375, -10.357421875, -9.7158203125, -9.07421875, -8.4326171875, -7.791015625, -7.1494140625, -6.5078125, -5.8662109375, -5.224609375, -4.5830078125, -3.94140625, -3.2998046875, -2.658203125, -2.0166015625, -1.375, -0.7333984375, -0.091796875, 0.5498046875, 1.19140625, 1.8330078125, 2.474609375, 3.1162109375, 3.7578125, 4.3994140625, 5.041015625, 5.6826171875, 6.32421875, 6.9658203125, 7.607421875, 8.2490234375, 8.890625, 9.5322265625, 10.173828125, 10.8154296875, 11.45703125, 12.0986328125, 12.740234375, 13.3818359375, 14.0234375, 14.6650390625, 15.306640625, 15.9482421875, 16.58984375, 17.2314453125, 17.873046875, 18.5146484375, 19.15625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 4.0, 6.0, 11.0, 8.0, 11.0, 27.0, 30.0, 33.0, 67.0, 102.0, 125.0, 183.0, 359.0, 508.0, 838.0, 1309.0, 2201.0, 3696.0, 6457.0, 11832.0, 21036.0, 40246.0, 74590.0, 133764.0, 203508.0, 213516.0, 148264.0, 85358.0, 45419.0, 23958.0, 13077.0, 7462.0, 4083.0, 2455.0, 1484.0, 885.0, 594.0, 352.0, 223.0, 140.0, 127.0, 69.0, 50.0, 26.0, 20.0, 17.0, 13.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-19.359375, -18.75634765625, -18.1533203125, -17.55029296875, -16.947265625, -16.34423828125, -15.7412109375, -15.13818359375, -14.53515625, -13.93212890625, -13.3291015625, -12.72607421875, -12.123046875, -11.52001953125, -10.9169921875, -10.31396484375, -9.7109375, -9.10791015625, -8.5048828125, -7.90185546875, -7.298828125, -6.69580078125, -6.0927734375, -5.48974609375, -4.88671875, -4.28369140625, -3.6806640625, -3.07763671875, -2.474609375, -1.87158203125, -1.2685546875, -0.66552734375, -0.0625, 0.54052734375, 1.1435546875, 1.74658203125, 2.349609375, 2.95263671875, 3.5556640625, 4.15869140625, 4.76171875, 5.36474609375, 5.9677734375, 6.57080078125, 7.173828125, 7.77685546875, 8.3798828125, 8.98291015625, 9.5859375, 10.18896484375, 10.7919921875, 11.39501953125, 11.998046875, 12.60107421875, 13.2041015625, 13.80712890625, 14.41015625, 15.01318359375, 15.6162109375, 16.21923828125, 16.822265625, 17.42529296875, 18.0283203125, 18.63134765625, 19.234375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 8.0, 11.0, 8.0, 12.0, 12.0, 12.0, 16.0, 19.0, 18.0, 26.0, 37.0, 26.0, 36.0, 37.0, 32.0, 32.0, 38.0, 44.0, 46.0, 36.0, 35.0, 37.0, 43.0, 41.0, 31.0, 33.0, 30.0, 27.0, 25.0, 37.0, 26.0, 25.0, 16.0, 15.0, 16.0, 9.0, 12.0, 15.0, 5.0, 3.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-10.5, -10.195068359375, -9.89013671875, -9.585205078125, -9.2802734375, -8.975341796875, -8.67041015625, -8.365478515625, -8.060546875, -7.755615234375, -7.45068359375, -7.145751953125, -6.8408203125, -6.535888671875, -6.23095703125, -5.926025390625, -5.62109375, -5.316162109375, -5.01123046875, -4.706298828125, -4.4013671875, -4.096435546875, -3.79150390625, -3.486572265625, -3.181640625, -2.876708984375, -2.57177734375, -2.266845703125, -1.9619140625, -1.656982421875, -1.35205078125, -1.047119140625, -0.7421875, -0.437255859375, -0.13232421875, 0.172607421875, 0.4775390625, 0.782470703125, 1.08740234375, 1.392333984375, 1.697265625, 2.002197265625, 2.30712890625, 2.612060546875, 2.9169921875, 3.221923828125, 3.52685546875, 3.831787109375, 4.13671875, 4.441650390625, 4.74658203125, 5.051513671875, 5.3564453125, 5.661376953125, 5.96630859375, 6.271240234375, 6.576171875, 6.881103515625, 7.18603515625, 7.490966796875, 7.7958984375, 8.100830078125, 8.40576171875, 8.710693359375, 9.015625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 9.0, 17.0, 22.0, 30.0, 51.0, 79.0, 98.0, 159.0, 268.0, 439.0, 648.0, 1021.0, 1663.0, 2650.0, 4393.0, 7453.0, 13238.0, 23613.0, 43280.0, 78814.0, 140225.0, 210374.0, 208467.0, 137406.0, 77168.0, 42326.0, 22696.0, 13029.0, 7406.0, 4418.0, 2582.0, 1605.0, 994.0, 643.0, 419.0, 280.0, 189.0, 135.0, 74.0, 55.0, 41.0, 22.0, 19.0, 20.0, 6.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.0, -10.66650390625, -10.3330078125, -9.99951171875, -9.666015625, -9.33251953125, -8.9990234375, -8.66552734375, -8.33203125, -7.99853515625, -7.6650390625, -7.33154296875, -6.998046875, -6.66455078125, -6.3310546875, -5.99755859375, -5.6640625, -5.33056640625, -4.9970703125, -4.66357421875, -4.330078125, -3.99658203125, -3.6630859375, -3.32958984375, -2.99609375, -2.66259765625, -2.3291015625, -1.99560546875, -1.662109375, -1.32861328125, -0.9951171875, -0.66162109375, -0.328125, 0.00537109375, 0.3388671875, 0.67236328125, 1.005859375, 1.33935546875, 1.6728515625, 2.00634765625, 2.33984375, 2.67333984375, 3.0068359375, 3.34033203125, 3.673828125, 4.00732421875, 4.3408203125, 4.67431640625, 5.0078125, 5.34130859375, 5.6748046875, 6.00830078125, 6.341796875, 6.67529296875, 7.0087890625, 7.34228515625, 7.67578125, 8.00927734375, 8.3427734375, 8.67626953125, 9.009765625, 9.34326171875, 9.6767578125, 10.01025390625, 10.34375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 8.0, 3.0, 2.0, 2.0, 2.0, 10.0, 7.0, 11.0, 14.0, 12.0, 18.0, 17.0, 24.0, 29.0, 32.0, 45.0, 37.0, 62.0, 56.0, 55.0, 56.0, 52.0, 57.0, 35.0, 56.0, 43.0, 34.0, 38.0, 40.0, 32.0, 27.0, 18.0, 18.0, 11.0, 8.0, 9.0, 6.0, 5.0, 3.0, 9.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0004820823669433594, -0.00046910718083381653, -0.0004561319947242737, -0.00044315680861473083, -0.000430181622505188, -0.00041720643639564514, -0.0004042312502861023, -0.00039125606417655945, -0.0003782808780670166, -0.00036530569195747375, -0.0003523305058479309, -0.00033935531973838806, -0.0003263801336288452, -0.00031340494751930237, -0.0003004297614097595, -0.0002874545753002167, -0.00027447938919067383, -0.000261504203081131, -0.00024852901697158813, -0.0002355538308620453, -0.00022257864475250244, -0.0002096034586429596, -0.00019662827253341675, -0.0001836530864238739, -0.00017067790031433105, -0.0001577027142047882, -0.00014472752809524536, -0.00013175234198570251, -0.00011877715587615967, -0.00010580196976661682, -9.282678365707397e-05, -7.985159754753113e-05, -6.687641143798828e-05, -5.3901225328445435e-05, -4.092603921890259e-05, -2.795085310935974e-05, -1.4975666999816895e-05, -2.000480890274048e-06, 1.0974705219268799e-05, 2.3949891328811646e-05, 3.692507743835449e-05, 4.990026354789734e-05, 6.287544965744019e-05, 7.585063576698303e-05, 8.882582187652588e-05, 0.00010180100798606873, 0.00011477619409561157, 0.00012775138020515442, 0.00014072656631469727, 0.0001537017524242401, 0.00016667693853378296, 0.0001796521246433258, 0.00019262731075286865, 0.0002056024968624115, 0.00021857768297195435, 0.0002315528690814972, 0.00024452805519104004, 0.0002575032413005829, 0.00027047842741012573, 0.0002834536135196686, 0.0002964287996292114, 0.00030940398573875427, 0.0003223791718482971, 0.00033535435795783997, 0.0003483295440673828]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 9.0, 13.0, 26.0, 25.0, 45.0, 81.0, 111.0, 191.0, 231.0, 362.0, 568.0, 844.0, 1279.0, 1934.0, 3078.0, 4364.0, 6812.0, 10313.0, 15740.0, 25034.0, 37716.0, 56820.0, 82909.0, 112185.0, 135559.0, 140732.0, 122699.0, 94344.0, 65945.0, 44368.0, 29538.0, 18731.0, 12305.0, 8075.0, 5330.0, 3426.0, 2254.0, 1516.0, 1065.0, 684.0, 432.0, 282.0, 194.0, 129.0, 91.0, 61.0, 41.0, 29.0, 14.0, 13.0, 9.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.3125, -8.0543212890625, -7.796142578125, -7.5379638671875, -7.27978515625, -7.0216064453125, -6.763427734375, -6.5052490234375, -6.2470703125, -5.9888916015625, -5.730712890625, -5.4725341796875, -5.21435546875, -4.9561767578125, -4.697998046875, -4.4398193359375, -4.181640625, -3.9234619140625, -3.665283203125, -3.4071044921875, -3.14892578125, -2.8907470703125, -2.632568359375, -2.3743896484375, -2.1162109375, -1.8580322265625, -1.599853515625, -1.3416748046875, -1.08349609375, -0.8253173828125, -0.567138671875, -0.3089599609375, -0.05078125, 0.2073974609375, 0.465576171875, 0.7237548828125, 0.98193359375, 1.2401123046875, 1.498291015625, 1.7564697265625, 2.0146484375, 2.2728271484375, 2.531005859375, 2.7891845703125, 3.04736328125, 3.3055419921875, 3.563720703125, 3.8218994140625, 4.080078125, 4.3382568359375, 4.596435546875, 4.8546142578125, 5.11279296875, 5.3709716796875, 5.629150390625, 5.8873291015625, 6.1455078125, 6.4036865234375, 6.661865234375, 6.9200439453125, 7.17822265625, 7.4364013671875, 7.694580078125, 7.9527587890625, 8.2109375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 4.0, 3.0, 3.0, 5.0, 10.0, 9.0, 8.0, 12.0, 12.0, 17.0, 19.0, 19.0, 30.0, 21.0, 40.0, 43.0, 38.0, 36.0, 52.0, 54.0, 38.0, 49.0, 49.0, 47.0, 46.0, 48.0, 35.0, 37.0, 35.0, 24.0, 27.0, 23.0, 16.0, 23.0, 13.0, 10.0, 6.0, 10.0, 2.0, 5.0, 7.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.595703125, -2.512664794921875, -2.42962646484375, -2.346588134765625, -2.2635498046875, -2.180511474609375, -2.09747314453125, -2.014434814453125, -1.931396484375, -1.848358154296875, -1.76531982421875, -1.682281494140625, -1.5992431640625, -1.516204833984375, -1.43316650390625, -1.350128173828125, -1.26708984375, -1.184051513671875, -1.10101318359375, -1.017974853515625, -0.9349365234375, -0.851898193359375, -0.76885986328125, -0.685821533203125, -0.602783203125, -0.519744873046875, -0.43670654296875, -0.353668212890625, -0.2706298828125, -0.187591552734375, -0.10455322265625, -0.021514892578125, 0.0615234375, 0.144561767578125, 0.22760009765625, 0.310638427734375, 0.3936767578125, 0.476715087890625, 0.55975341796875, 0.642791748046875, 0.725830078125, 0.808868408203125, 0.89190673828125, 0.974945068359375, 1.0579833984375, 1.141021728515625, 1.22406005859375, 1.307098388671875, 1.39013671875, 1.473175048828125, 1.55621337890625, 1.639251708984375, 1.7222900390625, 1.805328369140625, 1.88836669921875, 1.971405029296875, 2.054443359375, 2.137481689453125, 2.22052001953125, 2.303558349609375, 2.3865966796875, 2.469635009765625, 2.55267333984375, 2.635711669921875, 2.71875]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 4.0, 7.0, 4.0, 8.0, 11.0, 12.0, 20.0, 26.0, 28.0, 28.0, 34.0, 57.0, 63.0, 52.0, 76.0, 61.0, 62.0, 70.0, 64.0, 54.0, 60.0, 43.0, 30.0, 36.0, 21.0, 18.0, 14.0, 10.0, 10.0, 8.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.695209503173828, -23.747371673583984, -22.79953384399414, -21.851696014404297, -20.903858184814453, -19.95602035522461, -19.008182525634766, -18.060344696044922, -17.112506866455078, -16.164669036865234, -15.21683120727539, -14.268993377685547, -13.321155548095703, -12.37331771850586, -11.425479888916016, -10.477642059326172, -9.529803276062012, -8.581965446472168, -7.634127616882324, -6.6862897872924805, -5.738451957702637, -4.790613651275635, -3.842775821685791, -2.8949379920959473, -1.9471001625061035, -0.999262273311615, -0.051424384117126465, 0.8964135646820068, 1.8442513942718506, 2.7920894622802734, 3.739927291870117, 4.687765121459961, 5.635602951049805, 6.583440780639648, 7.531278610229492, 8.479116439819336, 9.42695426940918, 10.374792098999023, 11.322629928588867, 12.270467758178711, 13.218305587768555, 14.166143417358398, 15.113981246948242, 16.061819076538086, 17.00965690612793, 17.957494735717773, 18.905332565307617, 19.85317039489746, 20.801010131835938, 21.74884796142578, 22.696685791015625, 23.64452362060547, 24.592361450195312, 25.540199279785156, 26.488037109375, 27.435874938964844, 28.383712768554688, 29.33155059814453, 30.279388427734375, 31.22722625732422, 32.17506408691406, 33.122901916503906, 34.07073974609375, 35.018577575683594, 35.96641540527344]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 6.0, 4.0, 7.0, 9.0, 13.0, 11.0, 15.0, 11.0, 21.0, 19.0, 21.0, 31.0, 31.0, 32.0, 33.0, 50.0, 34.0, 43.0, 39.0, 51.0, 41.0, 49.0, 42.0, 39.0, 28.0, 34.0, 33.0, 21.0, 21.0, 20.0, 24.0, 27.0, 23.0, 23.0, 23.0, 14.0, 15.0, 13.0, 6.0, 4.0, 4.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-16.635669708251953, -16.127405166625977, -15.619141578674316, -15.11087703704834, -14.60261344909668, -14.094348907470703, -13.586084365844727, -13.07781982421875, -12.56955623626709, -12.061291694641113, -11.553028106689453, -11.044763565063477, -10.5364990234375, -10.02823543548584, -9.519970893859863, -9.011707305908203, -8.503442764282227, -7.995178699493408, -7.48691463470459, -6.978650093078613, -6.470386028289795, -5.962121963500977, -5.453857421875, -4.945593357086182, -4.437329292297363, -3.929065227508545, -3.4208009243011475, -2.91253662109375, -2.4042725563049316, -1.8960084915161133, -1.3877441883087158, -0.8794798851013184, -0.3712167739868164, 0.1370474100112915, 0.6453115940093994, 1.1535757780075073, 1.6618399620056152, 2.1701040267944336, 2.678368330001831, 3.1866326332092285, 3.694896697998047, 4.203160762786865, 4.711424827575684, 5.21968936920166, 5.7279534339904785, 6.236217498779297, 6.744482040405273, 7.252746105194092, 7.76101016998291, 8.269274711608887, 8.777538299560547, 9.285802841186523, 9.7940673828125, 10.30233097076416, 10.810595512390137, 11.318859100341797, 11.827123641967773, 12.33538818359375, 12.84365177154541, 13.351916313171387, 13.860179901123047, 14.368444442749023, 14.876708984375, 15.384973526000977, 15.893237113952637]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 4.0, 9.0, 18.0, 27.0, 49.0, 85.0, 153.0, 199.0, 286.0, 430.0, 715.0, 1148.0, 1829.0, 3014.0, 4797.0, 7595.0, 11806.0, 18695.0, 28795.0, 43623.0, 63515.0, 86814.0, 111006.0, 126479.0, 128356.0, 114977.0, 92019.0, 67648.0, 47218.0, 31150.0, 20398.0, 13234.0, 8295.0, 5219.0, 3223.0, 2176.0, 1289.0, 832.0, 506.0, 327.0, 195.0, 147.0, 97.0, 56.0, 28.0, 21.0, 19.0, 11.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0], "bins": [-15.5234375, -15.0682373046875, -14.613037109375, -14.1578369140625, -13.70263671875, -13.2474365234375, -12.792236328125, -12.3370361328125, -11.8818359375, -11.4266357421875, -10.971435546875, -10.5162353515625, -10.06103515625, -9.6058349609375, -9.150634765625, -8.6954345703125, -8.240234375, -7.7850341796875, -7.329833984375, -6.8746337890625, -6.41943359375, -5.9642333984375, -5.509033203125, -5.0538330078125, -4.5986328125, -4.1434326171875, -3.688232421875, -3.2330322265625, -2.77783203125, -2.3226318359375, -1.867431640625, -1.4122314453125, -0.95703125, -0.5018310546875, -0.046630859375, 0.4085693359375, 0.86376953125, 1.3189697265625, 1.774169921875, 2.2293701171875, 2.6845703125, 3.1397705078125, 3.594970703125, 4.0501708984375, 4.50537109375, 4.9605712890625, 5.415771484375, 5.8709716796875, 6.326171875, 6.7813720703125, 7.236572265625, 7.6917724609375, 8.14697265625, 8.6021728515625, 9.057373046875, 9.5125732421875, 9.9677734375, 10.4229736328125, 10.878173828125, 11.3333740234375, 11.78857421875, 12.2437744140625, 12.698974609375, 13.1541748046875, 13.609375]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 3.0, 8.0, 7.0, 13.0, 8.0, 13.0, 15.0, 18.0, 23.0, 20.0, 29.0, 49.0, 38.0, 29.0, 47.0, 47.0, 51.0, 43.0, 40.0, 47.0, 39.0, 41.0, 34.0, 34.0, 48.0, 29.0, 36.0, 28.0, 30.0, 23.0, 22.0, 14.0, 14.0, 9.0, 8.0, 10.0, 10.0, 9.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.0625, -17.471435546875, -16.88037109375, -16.289306640625, -15.6982421875, -15.107177734375, -14.51611328125, -13.925048828125, -13.333984375, -12.742919921875, -12.15185546875, -11.560791015625, -10.9697265625, -10.378662109375, -9.78759765625, -9.196533203125, -8.60546875, -8.014404296875, -7.42333984375, -6.832275390625, -6.2412109375, -5.650146484375, -5.05908203125, -4.468017578125, -3.876953125, -3.285888671875, -2.69482421875, -2.103759765625, -1.5126953125, -0.921630859375, -0.33056640625, 0.260498046875, 0.8515625, 1.442626953125, 2.03369140625, 2.624755859375, 3.2158203125, 3.806884765625, 4.39794921875, 4.989013671875, 5.580078125, 6.171142578125, 6.76220703125, 7.353271484375, 7.9443359375, 8.535400390625, 9.12646484375, 9.717529296875, 10.30859375, 10.899658203125, 11.49072265625, 12.081787109375, 12.6728515625, 13.263916015625, 13.85498046875, 14.446044921875, 15.037109375, 15.628173828125, 16.21923828125, 16.810302734375, 17.4013671875, 17.992431640625, 18.58349609375, 19.174560546875, 19.765625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 8.0, 17.0, 13.0, 28.0, 54.0, 85.0, 134.0, 182.0, 303.0, 454.0, 668.0, 1161.0, 1775.0, 2617.0, 4319.0, 6726.0, 10388.0, 16219.0, 24589.0, 37115.0, 53781.0, 74780.0, 96389.0, 114943.0, 124073.0, 118559.0, 101358.0, 79891.0, 58806.0, 40870.0, 27500.0, 18329.0, 11803.0, 7417.0, 4834.0, 3027.0, 1919.0, 1193.0, 818.0, 514.0, 336.0, 210.0, 130.0, 75.0, 59.0, 31.0, 25.0, 14.0, 7.0, 10.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.6328125, -14.184326171875, -13.73583984375, -13.287353515625, -12.8388671875, -12.390380859375, -11.94189453125, -11.493408203125, -11.044921875, -10.596435546875, -10.14794921875, -9.699462890625, -9.2509765625, -8.802490234375, -8.35400390625, -7.905517578125, -7.45703125, -7.008544921875, -6.56005859375, -6.111572265625, -5.6630859375, -5.214599609375, -4.76611328125, -4.317626953125, -3.869140625, -3.420654296875, -2.97216796875, -2.523681640625, -2.0751953125, -1.626708984375, -1.17822265625, -0.729736328125, -0.28125, 0.167236328125, 0.61572265625, 1.064208984375, 1.5126953125, 1.961181640625, 2.40966796875, 2.858154296875, 3.306640625, 3.755126953125, 4.20361328125, 4.652099609375, 5.1005859375, 5.549072265625, 5.99755859375, 6.446044921875, 6.89453125, 7.343017578125, 7.79150390625, 8.239990234375, 8.6884765625, 9.136962890625, 9.58544921875, 10.033935546875, 10.482421875, 10.930908203125, 11.37939453125, 11.827880859375, 12.2763671875, 12.724853515625, 13.17333984375, 13.621826171875, 14.0703125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 9.0, 2.0, 6.0, 6.0, 5.0, 4.0, 9.0, 12.0, 23.0, 24.0, 22.0, 23.0, 32.0, 21.0, 35.0, 32.0, 36.0, 34.0, 49.0, 49.0, 37.0, 46.0, 50.0, 29.0, 38.0, 37.0, 31.0, 16.0, 38.0, 34.0, 34.0, 28.0, 22.0, 22.0, 24.0, 16.0, 19.0, 11.0, 8.0, 5.0, 6.0, 8.0, 2.0, 6.0, 1.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1328125, -8.7822265625, -8.431640625, -8.0810546875, -7.73046875, -7.3798828125, -7.029296875, -6.6787109375, -6.328125, -5.9775390625, -5.626953125, -5.2763671875, -4.92578125, -4.5751953125, -4.224609375, -3.8740234375, -3.5234375, -3.1728515625, -2.822265625, -2.4716796875, -2.12109375, -1.7705078125, -1.419921875, -1.0693359375, -0.71875, -0.3681640625, -0.017578125, 0.3330078125, 0.68359375, 1.0341796875, 1.384765625, 1.7353515625, 2.0859375, 2.4365234375, 2.787109375, 3.1376953125, 3.48828125, 3.8388671875, 4.189453125, 4.5400390625, 4.890625, 5.2412109375, 5.591796875, 5.9423828125, 6.29296875, 6.6435546875, 6.994140625, 7.3447265625, 7.6953125, 8.0458984375, 8.396484375, 8.7470703125, 9.09765625, 9.4482421875, 9.798828125, 10.1494140625, 10.5, 10.8505859375, 11.201171875, 11.5517578125, 11.90234375, 12.2529296875, 12.603515625, 12.9541015625, 13.3046875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 4.0, 5.0, 6.0, 12.0, 10.0, 21.0, 24.0, 49.0, 59.0, 76.0, 129.0, 196.0, 277.0, 397.0, 710.0, 1136.0, 1761.0, 3056.0, 5278.0, 9286.0, 17232.0, 32105.0, 59815.0, 103925.0, 158256.0, 192492.0, 174621.0, 123906.0, 73664.0, 40363.0, 21854.0, 11657.0, 6584.0, 3730.0, 2178.0, 1342.0, 809.0, 518.0, 328.0, 230.0, 135.0, 105.0, 71.0, 44.0, 33.0, 23.0, 19.0, 13.0, 7.0, 3.0, 6.0, 2.0, 3.0, 2.0], "bins": [-12.21875, -11.8763427734375, -11.533935546875, -11.1915283203125, -10.84912109375, -10.5067138671875, -10.164306640625, -9.8218994140625, -9.4794921875, -9.1370849609375, -8.794677734375, -8.4522705078125, -8.10986328125, -7.7674560546875, -7.425048828125, -7.0826416015625, -6.740234375, -6.3978271484375, -6.055419921875, -5.7130126953125, -5.37060546875, -5.0281982421875, -4.685791015625, -4.3433837890625, -4.0009765625, -3.6585693359375, -3.316162109375, -2.9737548828125, -2.63134765625, -2.2889404296875, -1.946533203125, -1.6041259765625, -1.26171875, -0.9193115234375, -0.576904296875, -0.2344970703125, 0.10791015625, 0.4503173828125, 0.792724609375, 1.1351318359375, 1.4775390625, 1.8199462890625, 2.162353515625, 2.5047607421875, 2.84716796875, 3.1895751953125, 3.531982421875, 3.8743896484375, 4.216796875, 4.5592041015625, 4.901611328125, 5.2440185546875, 5.58642578125, 5.9288330078125, 6.271240234375, 6.6136474609375, 6.9560546875, 7.2984619140625, 7.640869140625, 7.9832763671875, 8.32568359375, 8.6680908203125, 9.010498046875, 9.3529052734375, 9.6953125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 5.0, 0.0, 4.0, 2.0, 4.0, 9.0, 5.0, 5.0, 13.0, 6.0, 13.0, 18.0, 23.0, 15.0, 22.0, 36.0, 23.0, 32.0, 36.0, 48.0, 54.0, 50.0, 43.0, 40.0, 47.0, 47.0, 43.0, 45.0, 34.0, 35.0, 34.0, 27.0, 32.0, 27.0, 23.0, 17.0, 15.0, 10.0, 11.0, 7.0, 6.0, 9.0, 5.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0007491111755371094, -0.0007250681519508362, -0.000701025128364563, -0.0006769821047782898, -0.0006529390811920166, -0.0006288960576057434, -0.0006048530340194702, -0.000580810010433197, -0.0005567669868469238, -0.0005327239632606506, -0.0005086809396743774, -0.00048463791608810425, -0.00046059489250183105, -0.00043655186891555786, -0.00041250884532928467, -0.0003884658217430115, -0.0003644227981567383, -0.0003403797745704651, -0.0003163367509841919, -0.0002922937273979187, -0.0002682507038116455, -0.0002442076802253723, -0.00022016465663909912, -0.00019612163305282593, -0.00017207860946655273, -0.00014803558588027954, -0.00012399256229400635, -9.994953870773315e-05, -7.590651512145996e-05, -5.186349153518677e-05, -2.7820467948913574e-05, -3.777444362640381e-06, 2.0265579223632812e-05, 4.4308602809906006e-05, 6.83516263961792e-05, 9.239464998245239e-05, 0.00011643767356872559, 0.00014048069715499878, 0.00016452372074127197, 0.00018856674432754517, 0.00021260976791381836, 0.00023665279150009155, 0.00026069581508636475, 0.00028473883867263794, 0.00030878186225891113, 0.0003328248858451843, 0.0003568679094314575, 0.0003809109330177307, 0.0004049539566040039, 0.0004289969801902771, 0.0004530400037765503, 0.0004770830273628235, 0.0005011260509490967, 0.0005251690745353699, 0.0005492120981216431, 0.0005732551217079163, 0.0005972981452941895, 0.0006213411688804626, 0.0006453841924667358, 0.000669427216053009, 0.0006934702396392822, 0.0007175132632255554, 0.0007415562868118286, 0.0007655993103981018, 0.000789642333984375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 8.0, 10.0, 12.0, 21.0, 28.0, 28.0, 39.0, 70.0, 120.0, 146.0, 269.0, 422.0, 737.0, 1266.0, 2592.0, 5940.0, 15599.0, 43730.0, 122001.0, 261405.0, 306287.0, 177899.0, 69271.0, 24065.0, 8879.0, 3637.0, 1714.0, 924.0, 509.0, 319.0, 206.0, 137.0, 82.0, 56.0, 40.0, 26.0, 25.0, 16.0, 8.0, 9.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.984375, -17.38916015625, -16.7939453125, -16.19873046875, -15.603515625, -15.00830078125, -14.4130859375, -13.81787109375, -13.22265625, -12.62744140625, -12.0322265625, -11.43701171875, -10.841796875, -10.24658203125, -9.6513671875, -9.05615234375, -8.4609375, -7.86572265625, -7.2705078125, -6.67529296875, -6.080078125, -5.48486328125, -4.8896484375, -4.29443359375, -3.69921875, -3.10400390625, -2.5087890625, -1.91357421875, -1.318359375, -0.72314453125, -0.1279296875, 0.46728515625, 1.0625, 1.65771484375, 2.2529296875, 2.84814453125, 3.443359375, 4.03857421875, 4.6337890625, 5.22900390625, 5.82421875, 6.41943359375, 7.0146484375, 7.60986328125, 8.205078125, 8.80029296875, 9.3955078125, 9.99072265625, 10.5859375, 11.18115234375, 11.7763671875, 12.37158203125, 12.966796875, 13.56201171875, 14.1572265625, 14.75244140625, 15.34765625, 15.94287109375, 16.5380859375, 17.13330078125, 17.728515625, 18.32373046875, 18.9189453125, 19.51416015625, 20.109375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 13.0, 13.0, 19.0, 15.0, 31.0, 27.0, 39.0, 43.0, 60.0, 59.0, 50.0, 68.0, 72.0, 62.0, 69.0, 45.0, 56.0, 49.0, 28.0, 26.0, 35.0, 28.0, 22.0, 16.0, 12.0, 6.0, 4.0, 5.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.90625, -3.78173828125, -3.6572265625, -3.53271484375, -3.408203125, -3.28369140625, -3.1591796875, -3.03466796875, -2.91015625, -2.78564453125, -2.6611328125, -2.53662109375, -2.412109375, -2.28759765625, -2.1630859375, -2.03857421875, -1.9140625, -1.78955078125, -1.6650390625, -1.54052734375, -1.416015625, -1.29150390625, -1.1669921875, -1.04248046875, -0.91796875, -0.79345703125, -0.6689453125, -0.54443359375, -0.419921875, -0.29541015625, -0.1708984375, -0.04638671875, 0.078125, 0.20263671875, 0.3271484375, 0.45166015625, 0.576171875, 0.70068359375, 0.8251953125, 0.94970703125, 1.07421875, 1.19873046875, 1.3232421875, 1.44775390625, 1.572265625, 1.69677734375, 1.8212890625, 1.94580078125, 2.0703125, 2.19482421875, 2.3193359375, 2.44384765625, 2.568359375, 2.69287109375, 2.8173828125, 2.94189453125, 3.06640625, 3.19091796875, 3.3154296875, 3.43994140625, 3.564453125, 3.68896484375, 3.8134765625, 3.93798828125, 4.0625]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 9.0, 8.0, 7.0, 16.0, 9.0, 11.0, 20.0, 22.0, 32.0, 38.0, 40.0, 51.0, 61.0, 70.0, 69.0, 62.0, 66.0, 67.0, 50.0, 51.0, 61.0, 36.0, 33.0, 33.0, 20.0, 16.0, 10.0, 14.0, 7.0, 2.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.203081130981445, -23.262569427490234, -22.322057723999023, -21.381546020507812, -20.4410343170166, -19.50052261352539, -18.560012817382812, -17.61949920654297, -16.67898941040039, -15.73847770690918, -14.797966003417969, -13.857454299926758, -12.916942596435547, -11.976430892944336, -11.035920143127441, -10.09540843963623, -9.154895782470703, -8.214384078979492, -7.273872375488281, -6.3333611488342285, -5.392849445343018, -4.452337741851807, -3.511826515197754, -2.571314811706543, -1.630803108215332, -0.6902915239334106, 0.25022006034851074, 1.1907315254211426, 2.1312432289123535, 3.0717549324035645, 4.012266159057617, 4.952777862548828, 5.893291473388672, 6.833803176879883, 7.774314880371094, 8.714826583862305, 9.655338287353516, 10.595849990844727, 11.536360740661621, 12.476872444152832, 13.417384147644043, 14.357895851135254, 15.298407554626465, 16.23891830444336, 17.17943000793457, 18.11994171142578, 19.060453414916992, 20.000965118408203, 20.941476821899414, 21.881988525390625, 22.822500228881836, 23.763011932373047, 24.703523635864258, 25.64403533935547, 26.584545135498047, 27.52505874633789, 28.46556854248047, 29.40608024597168, 30.34659194946289, 31.2871036529541, 32.22761535644531, 33.16812515258789, 34.108638763427734, 35.04914855957031, 35.989662170410156]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 3.0, 7.0, 3.0, 8.0, 5.0, 11.0, 10.0, 14.0, 9.0, 19.0, 18.0, 21.0, 23.0, 28.0, 32.0, 26.0, 38.0, 42.0, 36.0, 40.0, 42.0, 42.0, 40.0, 38.0, 40.0, 43.0, 49.0, 33.0, 33.0, 38.0, 27.0, 18.0, 28.0, 22.0, 18.0, 13.0, 18.0, 8.0, 9.0, 7.0, 12.0, 9.0, 6.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-17.0711669921875, -16.55986213684082, -16.048559188842773, -15.53725528717041, -15.025951385498047, -14.514646530151367, -14.003342628479004, -13.49203872680664, -12.980734825134277, -12.469430923461914, -11.95812702178955, -11.446823120117188, -10.935518264770508, -10.424215316772461, -9.912910461425781, -9.401606559753418, -8.890302658081055, -8.378998756408691, -7.867694854736328, -7.356390476226807, -6.845086574554443, -6.33378267288208, -5.822478294372559, -5.311174392700195, -4.799870491027832, -4.288566589355469, -3.7772624492645264, -3.265958309173584, -2.7546544075012207, -2.2433505058288574, -1.732046365737915, -1.2207422256469727, -0.7094402313232422, -0.19813621044158936, 0.3131678104400635, 0.8244718313217163, 1.3357758522033691, 1.8470797538757324, 2.358383893966675, 2.869688034057617, 3.3809919357299805, 3.8922958374023438, 4.403599739074707, 4.9149041175842285, 5.426208019256592, 5.937511920928955, 6.448816299438477, 6.96012020111084, 7.471424102783203, 7.982728004455566, 8.49403190612793, 9.005335807800293, 9.516639709472656, 10.027944564819336, 10.5392484664917, 11.050552368164062, 11.561856269836426, 12.073160171508789, 12.584464073181152, 13.095767974853516, 13.607072830200195, 14.118375778198242, 14.629680633544922, 15.140984535217285, 15.652288436889648]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 8.0, 9.0, 7.0, 11.0, 31.0, 44.0, 53.0, 97.0, 140.0, 212.0, 348.0, 537.0, 927.0, 1606.0, 2640.0, 4635.0, 8550.0, 15619.0, 30449.0, 61422.0, 128583.0, 274104.0, 549928.0, 893863.0, 950438.0, 637087.0, 327392.0, 153976.0, 73643.0, 36199.0, 18462.0, 9972.0, 5561.0, 3082.0, 1791.0, 1074.0, 648.0, 387.0, 254.0, 165.0, 123.0, 71.0, 44.0, 31.0, 21.0, 14.0, 12.0, 3.0, 8.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-29.90625, -28.97509765625, -28.0439453125, -27.11279296875, -26.181640625, -25.25048828125, -24.3193359375, -23.38818359375, -22.45703125, -21.52587890625, -20.5947265625, -19.66357421875, -18.732421875, -17.80126953125, -16.8701171875, -15.93896484375, -15.0078125, -14.07666015625, -13.1455078125, -12.21435546875, -11.283203125, -10.35205078125, -9.4208984375, -8.48974609375, -7.55859375, -6.62744140625, -5.6962890625, -4.76513671875, -3.833984375, -2.90283203125, -1.9716796875, -1.04052734375, -0.109375, 0.82177734375, 1.7529296875, 2.68408203125, 3.615234375, 4.54638671875, 5.4775390625, 6.40869140625, 7.33984375, 8.27099609375, 9.2021484375, 10.13330078125, 11.064453125, 11.99560546875, 12.9267578125, 13.85791015625, 14.7890625, 15.72021484375, 16.6513671875, 17.58251953125, 18.513671875, 19.44482421875, 20.3759765625, 21.30712890625, 22.23828125, 23.16943359375, 24.1005859375, 25.03173828125, 25.962890625, 26.89404296875, 27.8251953125, 28.75634765625, 29.6875]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 8.0, 10.0, 12.0, 11.0, 20.0, 10.0, 22.0, 23.0, 27.0, 32.0, 30.0, 35.0, 33.0, 43.0, 44.0, 42.0, 51.0, 38.0, 48.0, 45.0, 43.0, 55.0, 43.0, 30.0, 30.0, 30.0, 26.0, 22.0, 21.0, 23.0, 17.0, 8.0, 15.0, 8.0, 7.0, 6.0, 6.0, 4.0, 2.0, 6.0, 1.0, 5.0, 1.0, 1.0, 1.0], "bins": [-18.03125, -17.537353515625, -17.04345703125, -16.549560546875, -16.0556640625, -15.561767578125, -15.06787109375, -14.573974609375, -14.080078125, -13.586181640625, -13.09228515625, -12.598388671875, -12.1044921875, -11.610595703125, -11.11669921875, -10.622802734375, -10.12890625, -9.635009765625, -9.14111328125, -8.647216796875, -8.1533203125, -7.659423828125, -7.16552734375, -6.671630859375, -6.177734375, -5.683837890625, -5.18994140625, -4.696044921875, -4.2021484375, -3.708251953125, -3.21435546875, -2.720458984375, -2.2265625, -1.732666015625, -1.23876953125, -0.744873046875, -0.2509765625, 0.242919921875, 0.73681640625, 1.230712890625, 1.724609375, 2.218505859375, 2.71240234375, 3.206298828125, 3.7001953125, 4.194091796875, 4.68798828125, 5.181884765625, 5.67578125, 6.169677734375, 6.66357421875, 7.157470703125, 7.6513671875, 8.145263671875, 8.63916015625, 9.133056640625, 9.626953125, 10.120849609375, 10.61474609375, 11.108642578125, 11.6025390625, 12.096435546875, 12.59033203125, 13.084228515625, 13.578125]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 8.0, 4.0, 10.0, 22.0, 38.0, 51.0, 87.0, 117.0, 192.0, 373.0, 578.0, 1061.0, 1982.0, 3758.0, 7386.0, 14883.0, 29579.0, 60667.0, 125907.0, 255598.0, 491933.0, 803007.0, 925365.0, 690466.0, 392592.0, 198412.0, 96609.0, 46935.0, 22980.0, 11403.0, 5664.0, 3023.0, 1580.0, 873.0, 450.0, 251.0, 170.0, 97.0, 67.0, 42.0, 27.0, 13.0, 11.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.5625, -35.43115234375, -34.2998046875, -33.16845703125, -32.037109375, -30.90576171875, -29.7744140625, -28.64306640625, -27.51171875, -26.38037109375, -25.2490234375, -24.11767578125, -22.986328125, -21.85498046875, -20.7236328125, -19.59228515625, -18.4609375, -17.32958984375, -16.1982421875, -15.06689453125, -13.935546875, -12.80419921875, -11.6728515625, -10.54150390625, -9.41015625, -8.27880859375, -7.1474609375, -6.01611328125, -4.884765625, -3.75341796875, -2.6220703125, -1.49072265625, -0.359375, 0.77197265625, 1.9033203125, 3.03466796875, 4.166015625, 5.29736328125, 6.4287109375, 7.56005859375, 8.69140625, 9.82275390625, 10.9541015625, 12.08544921875, 13.216796875, 14.34814453125, 15.4794921875, 16.61083984375, 17.7421875, 18.87353515625, 20.0048828125, 21.13623046875, 22.267578125, 23.39892578125, 24.5302734375, 25.66162109375, 26.79296875, 27.92431640625, 29.0556640625, 30.18701171875, 31.318359375, 32.44970703125, 33.5810546875, 34.71240234375, 35.84375]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 2.0, 3.0, 4.0, 4.0, 6.0, 10.0, 28.0, 25.0, 42.0, 51.0, 50.0, 74.0, 100.0, 120.0, 155.0, 186.0, 237.0, 238.0, 272.0, 304.0, 293.0, 310.0, 266.0, 249.0, 243.0, 179.0, 146.0, 118.0, 96.0, 63.0, 57.0, 42.0, 22.0, 22.0, 23.0, 7.0, 5.0, 8.0, 7.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.703125, -11.33837890625, -10.9736328125, -10.60888671875, -10.244140625, -9.87939453125, -9.5146484375, -9.14990234375, -8.78515625, -8.42041015625, -8.0556640625, -7.69091796875, -7.326171875, -6.96142578125, -6.5966796875, -6.23193359375, -5.8671875, -5.50244140625, -5.1376953125, -4.77294921875, -4.408203125, -4.04345703125, -3.6787109375, -3.31396484375, -2.94921875, -2.58447265625, -2.2197265625, -1.85498046875, -1.490234375, -1.12548828125, -0.7607421875, -0.39599609375, -0.03125, 0.33349609375, 0.6982421875, 1.06298828125, 1.427734375, 1.79248046875, 2.1572265625, 2.52197265625, 2.88671875, 3.25146484375, 3.6162109375, 3.98095703125, 4.345703125, 4.71044921875, 5.0751953125, 5.43994140625, 5.8046875, 6.16943359375, 6.5341796875, 6.89892578125, 7.263671875, 7.62841796875, 7.9931640625, 8.35791015625, 8.72265625, 9.08740234375, 9.4521484375, 9.81689453125, 10.181640625, 10.54638671875, 10.9111328125, 11.27587890625, 11.640625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 6.0, 10.0, 11.0, 13.0, 6.0, 18.0, 20.0, 27.0, 25.0, 27.0, 38.0, 47.0, 46.0, 38.0, 48.0, 55.0, 61.0, 56.0, 49.0, 60.0, 56.0, 38.0, 33.0, 37.0, 26.0, 28.0, 16.0, 14.0, 9.0, 12.0, 20.0, 6.0, 8.0, 5.0, 2.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.080623626708984, -26.166078567504883, -25.25153350830078, -24.33698844909668, -23.422443389892578, -22.507898330688477, -21.593353271484375, -20.67880630493164, -19.764263153076172, -18.84971809387207, -17.93517303466797, -17.020627975463867, -16.106082916259766, -15.191537857055664, -14.276991844177246, -13.362446784973145, -12.447900772094727, -11.533355712890625, -10.618810653686523, -9.704265594482422, -8.78972053527832, -7.8751749992370605, -6.960629463195801, -6.046084403991699, -5.131539344787598, -4.216994285583496, -3.3024489879608154, -2.3879036903381348, -1.4733586311340332, -0.5588135719299316, 0.3557319641113281, 1.2702770233154297, 2.1848201751708984, 3.099365234375, 4.013910293579102, 4.928455829620361, 5.843000888824463, 6.7575459480285645, 7.672091484069824, 8.586636543273926, 9.501181602478027, 10.415726661682129, 11.33027172088623, 12.244817733764648, 13.15936279296875, 14.073907852172852, 14.988452911376953, 15.902997970581055, 16.817543029785156, 17.732088088989258, 18.64663314819336, 19.56117820739746, 20.475723266601562, 21.390268325805664, 22.304813385009766, 23.2193603515625, 24.13390350341797, 25.04844856262207, 25.962993621826172, 26.877538681030273, 27.792083740234375, 28.706628799438477, 29.621173858642578, 30.535720825195312, 31.450265884399414]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 1.0, 4.0, 5.0, 6.0, 8.0, 4.0, 10.0, 18.0, 15.0, 20.0, 15.0, 25.0, 32.0, 32.0, 25.0, 28.0, 30.0, 52.0, 45.0, 40.0, 57.0, 48.0, 39.0, 42.0, 40.0, 36.0, 40.0, 31.0, 32.0, 29.0, 34.0, 32.0, 19.0, 20.0, 11.0, 15.0, 10.0, 13.0, 7.0, 7.0, 3.0, 8.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-22.500263214111328, -21.853761672973633, -21.207260131835938, -20.560758590698242, -19.914257049560547, -19.26775360107422, -18.621253967285156, -17.974750518798828, -17.328248977661133, -16.681747436523438, -16.035245895385742, -15.388744354248047, -14.742241859436035, -14.09574031829834, -13.449238777160645, -12.802736282348633, -12.156235694885254, -11.509734153747559, -10.863232612609863, -10.216730117797852, -9.570228576660156, -8.923727035522461, -8.277225494384766, -7.630723476409912, -6.984221935272217, -6.3377203941345215, -5.691218376159668, -5.044716835021973, -4.398215293884277, -3.751713275909424, -3.1052117347717285, -2.458709716796875, -1.8122081756591797, -1.1657063961029053, -0.5192047357559204, 0.12729692459106445, 0.7737987041473389, 1.4203004837036133, 2.0668020248413086, 2.713304042816162, 3.3598055839538574, 4.006307125091553, 4.652809143066406, 5.299310684204102, 5.945812225341797, 6.59231424331665, 7.238815784454346, 7.885317802429199, 8.531819343566895, 9.17832088470459, 9.824822425842285, 10.471324920654297, 11.117826461791992, 11.764328002929688, 12.410829544067383, 13.057331085205078, 13.703832626342773, 14.350334167480469, 14.996835708618164, 15.64333724975586, 16.289838790893555, 16.93634033203125, 17.582843780517578, 18.229345321655273, 18.87584686279297]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 7.0, 15.0, 13.0, 23.0, 34.0, 59.0, 77.0, 124.0, 182.0, 273.0, 487.0, 762.0, 1263.0, 1941.0, 3361.0, 5564.0, 9288.0, 15048.0, 25128.0, 41087.0, 64799.0, 95254.0, 128589.0, 150086.0, 146116.0, 120975.0, 87661.0, 57174.0, 36576.0, 22419.0, 13740.0, 8113.0, 4797.0, 2929.0, 1733.0, 1088.0, 641.0, 387.0, 272.0, 156.0, 105.0, 60.0, 62.0, 32.0, 24.0, 14.0, 4.0, 3.0, 5.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.4375, -14.9375, -14.4375, -13.9375, -13.4375, -12.9375, -12.4375, -11.9375, -11.4375, -10.9375, -10.4375, -9.9375, -9.4375, -8.9375, -8.4375, -7.9375, -7.4375, -6.9375, -6.4375, -5.9375, -5.4375, -4.9375, -4.4375, -3.9375, -3.4375, -2.9375, -2.4375, -1.9375, -1.4375, -0.9375, -0.4375, 0.0625, 0.5625, 1.0625, 1.5625, 2.0625, 2.5625, 3.0625, 3.5625, 4.0625, 4.5625, 5.0625, 5.5625, 6.0625, 6.5625, 7.0625, 7.5625, 8.0625, 8.5625, 9.0625, 9.5625, 10.0625, 10.5625, 11.0625, 11.5625, 12.0625, 12.5625, 13.0625, 13.5625, 14.0625, 14.5625, 15.0625, 15.5625, 16.0625, 16.5625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 8.0, 4.0, 2.0, 8.0, 7.0, 13.0, 11.0, 15.0, 28.0, 31.0, 20.0, 32.0, 22.0, 35.0, 40.0, 50.0, 55.0, 44.0, 54.0, 52.0, 53.0, 44.0, 45.0, 51.0, 44.0, 34.0, 32.0, 30.0, 28.0, 20.0, 14.0, 13.0, 15.0, 9.0, 8.0, 9.0, 9.0, 5.0, 1.0, 0.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.5, -25.705810546875, -24.91162109375, -24.117431640625, -23.3232421875, -22.529052734375, -21.73486328125, -20.940673828125, -20.146484375, -19.352294921875, -18.55810546875, -17.763916015625, -16.9697265625, -16.175537109375, -15.38134765625, -14.587158203125, -13.79296875, -12.998779296875, -12.20458984375, -11.410400390625, -10.6162109375, -9.822021484375, -9.02783203125, -8.233642578125, -7.439453125, -6.645263671875, -5.85107421875, -5.056884765625, -4.2626953125, -3.468505859375, -2.67431640625, -1.880126953125, -1.0859375, -0.291748046875, 0.50244140625, 1.296630859375, 2.0908203125, 2.885009765625, 3.67919921875, 4.473388671875, 5.267578125, 6.061767578125, 6.85595703125, 7.650146484375, 8.4443359375, 9.238525390625, 10.03271484375, 10.826904296875, 11.62109375, 12.415283203125, 13.20947265625, 14.003662109375, 14.7978515625, 15.592041015625, 16.38623046875, 17.180419921875, 17.974609375, 18.768798828125, 19.56298828125, 20.357177734375, 21.1513671875, 21.945556640625, 22.73974609375, 23.533935546875, 24.328125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 8.0, 9.0, 10.0, 9.0, 15.0, 22.0, 28.0, 53.0, 47.0, 70.0, 99.0, 161.0, 246.0, 447.0, 677.0, 1131.0, 1933.0, 3272.0, 5892.0, 11204.0, 21913.0, 44281.0, 89082.0, 165483.0, 241287.0, 210223.0, 122755.0, 63017.0, 30997.0, 15545.0, 7959.0, 4331.0, 2493.0, 1419.0, 851.0, 538.0, 360.0, 208.0, 146.0, 94.0, 66.0, 42.0, 23.0, 21.0, 23.0, 14.0, 10.0, 10.0, 6.0, 5.0, 5.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0], "bins": [-27.21875, -26.361328125, -25.50390625, -24.646484375, -23.7890625, -22.931640625, -22.07421875, -21.216796875, -20.359375, -19.501953125, -18.64453125, -17.787109375, -16.9296875, -16.072265625, -15.21484375, -14.357421875, -13.5, -12.642578125, -11.78515625, -10.927734375, -10.0703125, -9.212890625, -8.35546875, -7.498046875, -6.640625, -5.783203125, -4.92578125, -4.068359375, -3.2109375, -2.353515625, -1.49609375, -0.638671875, 0.21875, 1.076171875, 1.93359375, 2.791015625, 3.6484375, 4.505859375, 5.36328125, 6.220703125, 7.078125, 7.935546875, 8.79296875, 9.650390625, 10.5078125, 11.365234375, 12.22265625, 13.080078125, 13.9375, 14.794921875, 15.65234375, 16.509765625, 17.3671875, 18.224609375, 19.08203125, 19.939453125, 20.796875, 21.654296875, 22.51171875, 23.369140625, 24.2265625, 25.083984375, 25.94140625, 26.798828125, 27.65625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 8.0, 7.0, 4.0, 8.0, 4.0, 13.0, 10.0, 12.0, 13.0, 20.0, 14.0, 18.0, 24.0, 25.0, 22.0, 26.0, 39.0, 32.0, 26.0, 42.0, 33.0, 44.0, 49.0, 36.0, 43.0, 39.0, 34.0, 36.0, 40.0, 34.0, 33.0, 27.0, 24.0, 20.0, 20.0, 21.0, 13.0, 15.0, 18.0, 11.0, 7.0, 9.0, 12.0, 11.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.6953125, -11.3287353515625, -10.962158203125, -10.5955810546875, -10.22900390625, -9.8624267578125, -9.495849609375, -9.1292724609375, -8.7626953125, -8.3961181640625, -8.029541015625, -7.6629638671875, -7.29638671875, -6.9298095703125, -6.563232421875, -6.1966552734375, -5.830078125, -5.4635009765625, -5.096923828125, -4.7303466796875, -4.36376953125, -3.9971923828125, -3.630615234375, -3.2640380859375, -2.8974609375, -2.5308837890625, -2.164306640625, -1.7977294921875, -1.43115234375, -1.0645751953125, -0.697998046875, -0.3314208984375, 0.03515625, 0.4017333984375, 0.768310546875, 1.1348876953125, 1.50146484375, 1.8680419921875, 2.234619140625, 2.6011962890625, 2.9677734375, 3.3343505859375, 3.700927734375, 4.0675048828125, 4.43408203125, 4.8006591796875, 5.167236328125, 5.5338134765625, 5.900390625, 6.2669677734375, 6.633544921875, 7.0001220703125, 7.36669921875, 7.7332763671875, 8.099853515625, 8.4664306640625, 8.8330078125, 9.1995849609375, 9.566162109375, 9.9327392578125, 10.29931640625, 10.6658935546875, 11.032470703125, 11.3990478515625, 11.765625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 8.0, 11.0, 16.0, 19.0, 40.0, 56.0, 60.0, 110.0, 149.0, 206.0, 307.0, 438.0, 639.0, 993.0, 1509.0, 2303.0, 3631.0, 5509.0, 9055.0, 15051.0, 25021.0, 42697.0, 72637.0, 119276.0, 175729.0, 193388.0, 147759.0, 93262.0, 55786.0, 32657.0, 18930.0, 11430.0, 7014.0, 4479.0, 2794.0, 1780.0, 1247.0, 790.0, 535.0, 379.0, 263.0, 184.0, 115.0, 82.0, 70.0, 44.0, 19.0, 24.0, 14.0, 14.0, 13.0, 4.0, 4.0, 4.0, 1.0, 2.0], "bins": [-13.7109375, -13.298583984375, -12.88623046875, -12.473876953125, -12.0615234375, -11.649169921875, -11.23681640625, -10.824462890625, -10.412109375, -9.999755859375, -9.58740234375, -9.175048828125, -8.7626953125, -8.350341796875, -7.93798828125, -7.525634765625, -7.11328125, -6.700927734375, -6.28857421875, -5.876220703125, -5.4638671875, -5.051513671875, -4.63916015625, -4.226806640625, -3.814453125, -3.402099609375, -2.98974609375, -2.577392578125, -2.1650390625, -1.752685546875, -1.34033203125, -0.927978515625, -0.515625, -0.103271484375, 0.30908203125, 0.721435546875, 1.1337890625, 1.546142578125, 1.95849609375, 2.370849609375, 2.783203125, 3.195556640625, 3.60791015625, 4.020263671875, 4.4326171875, 4.844970703125, 5.25732421875, 5.669677734375, 6.08203125, 6.494384765625, 6.90673828125, 7.319091796875, 7.7314453125, 8.143798828125, 8.55615234375, 8.968505859375, 9.380859375, 9.793212890625, 10.20556640625, 10.617919921875, 11.0302734375, 11.442626953125, 11.85498046875, 12.267333984375, 12.6796875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 0.0, 10.0, 8.0, 12.0, 6.0, 8.0, 18.0, 18.0, 20.0, 38.0, 24.0, 32.0, 45.0, 36.0, 40.0, 27.0, 43.0, 49.0, 59.0, 52.0, 38.0, 51.0, 47.0, 37.0, 42.0, 28.0, 31.0, 32.0, 20.0, 22.0, 13.0, 20.0, 5.0, 4.0, 7.0, 14.0, 9.0, 5.0, 8.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0004608631134033203, -0.00044594332575798035, -0.0004310235381126404, -0.0004161037504673004, -0.00040118396282196045, -0.0003862641751766205, -0.0003713443875312805, -0.00035642459988594055, -0.0003415048122406006, -0.0003265850245952606, -0.00031166523694992065, -0.0002967454493045807, -0.0002818256616592407, -0.00026690587401390076, -0.0002519860863685608, -0.00023706629872322083, -0.00022214651107788086, -0.0002072267234325409, -0.00019230693578720093, -0.00017738714814186096, -0.000162467360496521, -0.00014754757285118103, -0.00013262778520584106, -0.0001177079975605011, -0.00010278820991516113, -8.786842226982117e-05, -7.29486346244812e-05, -5.8028846979141235e-05, -4.310905933380127e-05, -2.8189271688461304e-05, -1.3269484043121338e-05, 1.650303602218628e-06, 1.6570091247558594e-05, 3.148987889289856e-05, 4.6409666538238525e-05, 6.132945418357849e-05, 7.624924182891846e-05, 9.116902947425842e-05, 0.00010608881711959839, 0.00012100860476493835, 0.00013592839241027832, 0.00015084818005561829, 0.00016576796770095825, 0.00018068775534629822, 0.00019560754299163818, 0.00021052733063697815, 0.00022544711828231812, 0.00024036690592765808, 0.00025528669357299805, 0.000270206481218338, 0.000285126268863678, 0.00030004605650901794, 0.0003149658441543579, 0.0003298856317996979, 0.00034480541944503784, 0.0003597252070903778, 0.0003746449947357178, 0.00038956478238105774, 0.0004044845700263977, 0.00041940435767173767, 0.00043432414531707764, 0.0004492439329624176, 0.00046416372060775757, 0.00047908350825309753, 0.0004940032958984375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 5.0, 4.0, 4.0, 4.0, 9.0, 10.0, 22.0, 17.0, 39.0, 60.0, 73.0, 122.0, 167.0, 281.0, 407.0, 646.0, 967.0, 1549.0, 2317.0, 3609.0, 5952.0, 9654.0, 15679.0, 25219.0, 41017.0, 64428.0, 96241.0, 130339.0, 152058.0, 147127.0, 118588.0, 84410.0, 55458.0, 34641.0, 21764.0, 13241.0, 8290.0, 5194.0, 3175.0, 2062.0, 1260.0, 840.0, 544.0, 355.0, 254.0, 151.0, 102.0, 66.0, 42.0, 32.0, 21.0, 18.0, 11.0, 8.0, 8.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-13.1796875, -12.765625, -12.3515625, -11.9375, -11.5234375, -11.109375, -10.6953125, -10.28125, -9.8671875, -9.453125, -9.0390625, -8.625, -8.2109375, -7.796875, -7.3828125, -6.96875, -6.5546875, -6.140625, -5.7265625, -5.3125, -4.8984375, -4.484375, -4.0703125, -3.65625, -3.2421875, -2.828125, -2.4140625, -2.0, -1.5859375, -1.171875, -0.7578125, -0.34375, 0.0703125, 0.484375, 0.8984375, 1.3125, 1.7265625, 2.140625, 2.5546875, 2.96875, 3.3828125, 3.796875, 4.2109375, 4.625, 5.0390625, 5.453125, 5.8671875, 6.28125, 6.6953125, 7.109375, 7.5234375, 7.9375, 8.3515625, 8.765625, 9.1796875, 9.59375, 10.0078125, 10.421875, 10.8359375, 11.25, 11.6640625, 12.078125, 12.4921875, 12.90625, 13.3203125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 8.0, 1.0, 9.0, 8.0, 5.0, 9.0, 15.0, 15.0, 28.0, 23.0, 34.0, 35.0, 35.0, 54.0, 51.0, 67.0, 52.0, 52.0, 65.0, 48.0, 51.0, 64.0, 30.0, 37.0, 32.0, 33.0, 29.0, 16.0, 20.0, 13.0, 14.0, 14.0, 10.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.96875, -4.82220458984375, -4.6756591796875, -4.52911376953125, -4.382568359375, -4.23602294921875, -4.0894775390625, -3.94293212890625, -3.79638671875, -3.64984130859375, -3.5032958984375, -3.35675048828125, -3.210205078125, -3.06365966796875, -2.9171142578125, -2.77056884765625, -2.6240234375, -2.47747802734375, -2.3309326171875, -2.18438720703125, -2.037841796875, -1.89129638671875, -1.7447509765625, -1.59820556640625, -1.45166015625, -1.30511474609375, -1.1585693359375, -1.01202392578125, -0.865478515625, -0.71893310546875, -0.5723876953125, -0.42584228515625, -0.279296875, -0.13275146484375, 0.0137939453125, 0.16033935546875, 0.306884765625, 0.45343017578125, 0.5999755859375, 0.74652099609375, 0.89306640625, 1.03961181640625, 1.1861572265625, 1.33270263671875, 1.479248046875, 1.62579345703125, 1.7723388671875, 1.91888427734375, 2.0654296875, 2.21197509765625, 2.3585205078125, 2.50506591796875, 2.651611328125, 2.79815673828125, 2.9447021484375, 3.09124755859375, 3.23779296875, 3.38433837890625, 3.5308837890625, 3.67742919921875, 3.823974609375, 3.97052001953125, 4.1170654296875, 4.26361083984375, 4.41015625]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 8.0, 4.0, 9.0, 7.0, 12.0, 10.0, 15.0, 12.0, 23.0, 24.0, 28.0, 35.0, 31.0, 55.0, 52.0, 48.0, 40.0, 44.0, 61.0, 56.0, 50.0, 57.0, 55.0, 30.0, 40.0, 33.0, 28.0, 16.0, 16.0, 21.0, 13.0, 14.0, 14.0, 7.0, 8.0, 3.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.911890029907227, -25.99489402770996, -25.077896118164062, -24.160900115966797, -23.24390411376953, -22.326908111572266, -21.409912109375, -20.4929141998291, -19.575918197631836, -18.65892219543457, -17.741924285888672, -16.824928283691406, -15.90793228149414, -14.990936279296875, -14.073939323425293, -13.156942367553711, -12.239946365356445, -11.32295036315918, -10.405953407287598, -9.488956451416016, -8.57196044921875, -7.654963970184326, -6.737967491149902, -5.8209710121154785, -4.903974533081055, -3.986978054046631, -3.069981575012207, -2.152985095977783, -1.2359886169433594, -0.31899213790893555, 0.5980043411254883, 1.515000820159912, 2.431997299194336, 3.3489937782287598, 4.265990257263184, 5.182986736297607, 6.099983215332031, 7.016979694366455, 7.933976173400879, 8.850973129272461, 9.767969131469727, 10.684965133666992, 11.601962089538574, 12.518959045410156, 13.435955047607422, 14.352951049804688, 15.26994800567627, 16.18694496154785, 17.103940963745117, 18.020936965942383, 18.93793487548828, 19.854930877685547, 20.771926879882812, 21.688922882080078, 22.605918884277344, 23.522916793823242, 24.439912796020508, 25.356908798217773, 26.273906707763672, 27.190902709960938, 28.107898712158203, 29.02489471435547, 29.941890716552734, 30.858888626098633, 31.7758846282959]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 5.0, 3.0, 3.0, 8.0, 3.0, 16.0, 13.0, 9.0, 12.0, 21.0, 24.0, 25.0, 37.0, 30.0, 32.0, 32.0, 36.0, 42.0, 46.0, 44.0, 47.0, 45.0, 37.0, 38.0, 38.0, 44.0, 35.0, 34.0, 33.0, 32.0, 28.0, 25.0, 21.0, 18.0, 19.0, 12.0, 11.0, 7.0, 7.0, 4.0, 6.0, 6.0, 3.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-22.62870216369629, -21.98770523071289, -21.34670639038086, -20.70570945739746, -20.064712524414062, -19.42371368408203, -18.782716751098633, -18.141719818115234, -17.500720977783203, -16.859724044799805, -16.218725204467773, -15.577728271484375, -14.936731338500977, -14.295733451843262, -13.654735565185547, -13.013738632202148, -12.37274169921875, -11.731743812561035, -11.090746879577637, -10.449748992919922, -9.808752059936523, -9.167754173278809, -8.526756286621094, -7.885758876800537, -7.2447614669799805, -6.603764057159424, -5.962766647338867, -5.321768760681152, -4.680771350860596, -4.039773941040039, -3.3987762928009033, -2.7577786445617676, -2.116781234741211, -1.4757837057113647, -0.8347861766815186, -0.19378864765167236, 0.44720888137817383, 1.0882062911987305, 1.7292039394378662, 2.370201587677002, 3.0111989974975586, 3.6521964073181152, 4.293193817138672, 4.934191703796387, 5.575189113616943, 6.2161865234375, 6.857184410095215, 7.4981818199157715, 8.139179229736328, 8.780177116394043, 9.421174049377441, 10.062171936035156, 10.703168869018555, 11.34416675567627, 11.985164642333984, 12.626161575317383, 13.267159461975098, 13.908157348632812, 14.549154281616211, 15.190152168273926, 15.83115005493164, 16.47214698791504, 17.113143920898438, 17.75414276123047, 18.395139694213867]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 10.0, 9.0, 17.0, 23.0, 25.0, 37.0, 60.0, 72.0, 116.0, 149.0, 295.0, 411.0, 655.0, 1029.0, 1525.0, 2357.0, 3675.0, 5678.0, 8490.0, 13218.0, 20352.0, 30561.0, 44547.0, 63298.0, 85558.0, 105655.0, 120881.0, 121861.0, 111085.0, 90417.0, 68678.0, 49218.0, 33461.0, 22466.0, 14869.0, 9735.0, 6374.0, 4036.0, 2761.0, 1669.0, 1139.0, 721.0, 473.0, 321.0, 204.0, 134.0, 81.0, 59.0, 33.0, 25.0, 17.0, 8.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0], "bins": [-16.296875, -15.804931640625, -15.31298828125, -14.821044921875, -14.3291015625, -13.837158203125, -13.34521484375, -12.853271484375, -12.361328125, -11.869384765625, -11.37744140625, -10.885498046875, -10.3935546875, -9.901611328125, -9.40966796875, -8.917724609375, -8.42578125, -7.933837890625, -7.44189453125, -6.949951171875, -6.4580078125, -5.966064453125, -5.47412109375, -4.982177734375, -4.490234375, -3.998291015625, -3.50634765625, -3.014404296875, -2.5224609375, -2.030517578125, -1.53857421875, -1.046630859375, -0.5546875, -0.062744140625, 0.42919921875, 0.921142578125, 1.4130859375, 1.905029296875, 2.39697265625, 2.888916015625, 3.380859375, 3.872802734375, 4.36474609375, 4.856689453125, 5.3486328125, 5.840576171875, 6.33251953125, 6.824462890625, 7.31640625, 7.808349609375, 8.30029296875, 8.792236328125, 9.2841796875, 9.776123046875, 10.26806640625, 10.760009765625, 11.251953125, 11.743896484375, 12.23583984375, 12.727783203125, 13.2197265625, 13.711669921875, 14.20361328125, 14.695556640625, 15.1875]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 2.0, 4.0, 5.0, 4.0, 10.0, 6.0, 10.0, 7.0, 14.0, 11.0, 20.0, 23.0, 31.0, 36.0, 28.0, 37.0, 40.0, 42.0, 47.0, 58.0, 47.0, 50.0, 60.0, 49.0, 42.0, 35.0, 38.0, 29.0, 36.0, 30.0, 26.0, 23.0, 11.0, 19.0, 15.0, 13.0, 9.0, 7.0, 9.0, 4.0, 3.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.34375, -20.591064453125, -19.83837890625, -19.085693359375, -18.3330078125, -17.580322265625, -16.82763671875, -16.074951171875, -15.322265625, -14.569580078125, -13.81689453125, -13.064208984375, -12.3115234375, -11.558837890625, -10.80615234375, -10.053466796875, -9.30078125, -8.548095703125, -7.79541015625, -7.042724609375, -6.2900390625, -5.537353515625, -4.78466796875, -4.031982421875, -3.279296875, -2.526611328125, -1.77392578125, -1.021240234375, -0.2685546875, 0.484130859375, 1.23681640625, 1.989501953125, 2.7421875, 3.494873046875, 4.24755859375, 5.000244140625, 5.7529296875, 6.505615234375, 7.25830078125, 8.010986328125, 8.763671875, 9.516357421875, 10.26904296875, 11.021728515625, 11.7744140625, 12.527099609375, 13.27978515625, 14.032470703125, 14.78515625, 15.537841796875, 16.29052734375, 17.043212890625, 17.7958984375, 18.548583984375, 19.30126953125, 20.053955078125, 20.806640625, 21.559326171875, 22.31201171875, 23.064697265625, 23.8173828125, 24.570068359375, 25.32275390625, 26.075439453125, 26.828125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 9.0, 13.0, 8.0, 26.0, 34.0, 49.0, 91.0, 146.0, 232.0, 331.0, 561.0, 995.0, 1712.0, 2935.0, 4738.0, 7697.0, 12620.0, 20362.0, 32117.0, 49470.0, 72639.0, 98912.0, 121853.0, 134723.0, 129206.0, 109725.0, 83667.0, 59351.0, 39579.0, 25039.0, 15588.0, 9508.0, 5809.0, 3483.0, 2087.0, 1280.0, 770.0, 474.0, 268.0, 179.0, 115.0, 49.0, 31.0, 31.0, 23.0, 13.0, 5.0, 5.0, 5.0, 6.0, 0.0, 1.0], "bins": [-22.125, -21.505615234375, -20.88623046875, -20.266845703125, -19.6474609375, -19.028076171875, -18.40869140625, -17.789306640625, -17.169921875, -16.550537109375, -15.93115234375, -15.311767578125, -14.6923828125, -14.072998046875, -13.45361328125, -12.834228515625, -12.21484375, -11.595458984375, -10.97607421875, -10.356689453125, -9.7373046875, -9.117919921875, -8.49853515625, -7.879150390625, -7.259765625, -6.640380859375, -6.02099609375, -5.401611328125, -4.7822265625, -4.162841796875, -3.54345703125, -2.924072265625, -2.3046875, -1.685302734375, -1.06591796875, -0.446533203125, 0.1728515625, 0.792236328125, 1.41162109375, 2.031005859375, 2.650390625, 3.269775390625, 3.88916015625, 4.508544921875, 5.1279296875, 5.747314453125, 6.36669921875, 6.986083984375, 7.60546875, 8.224853515625, 8.84423828125, 9.463623046875, 10.0830078125, 10.702392578125, 11.32177734375, 11.941162109375, 12.560546875, 13.179931640625, 13.79931640625, 14.418701171875, 15.0380859375, 15.657470703125, 16.27685546875, 16.896240234375, 17.515625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 6.0, 7.0, 16.0, 8.0, 11.0, 19.0, 18.0, 20.0, 20.0, 27.0, 30.0, 34.0, 33.0, 38.0, 35.0, 38.0, 43.0, 41.0, 41.0, 38.0, 35.0, 32.0, 46.0, 37.0, 25.0, 40.0, 38.0, 44.0, 21.0, 21.0, 17.0, 18.0, 17.0, 18.0, 13.0, 13.0, 9.0, 13.0, 3.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-14.7421875, -14.2867431640625, -13.831298828125, -13.3758544921875, -12.92041015625, -12.4649658203125, -12.009521484375, -11.5540771484375, -11.0986328125, -10.6431884765625, -10.187744140625, -9.7322998046875, -9.27685546875, -8.8214111328125, -8.365966796875, -7.9105224609375, -7.455078125, -6.9996337890625, -6.544189453125, -6.0887451171875, -5.63330078125, -5.1778564453125, -4.722412109375, -4.2669677734375, -3.8115234375, -3.3560791015625, -2.900634765625, -2.4451904296875, -1.98974609375, -1.5343017578125, -1.078857421875, -0.6234130859375, -0.16796875, 0.2874755859375, 0.742919921875, 1.1983642578125, 1.65380859375, 2.1092529296875, 2.564697265625, 3.0201416015625, 3.4755859375, 3.9310302734375, 4.386474609375, 4.8419189453125, 5.29736328125, 5.7528076171875, 6.208251953125, 6.6636962890625, 7.119140625, 7.5745849609375, 8.030029296875, 8.4854736328125, 8.94091796875, 9.3963623046875, 9.851806640625, 10.3072509765625, 10.7626953125, 11.2181396484375, 11.673583984375, 12.1290283203125, 12.58447265625, 13.0399169921875, 13.495361328125, 13.9508056640625, 14.40625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 12.0, 11.0, 17.0, 24.0, 32.0, 51.0, 87.0, 121.0, 189.0, 323.0, 585.0, 932.0, 1593.0, 2826.0, 5643.0, 12174.0, 28910.0, 74286.0, 180980.0, 301271.0, 246349.0, 112992.0, 44623.0, 17607.0, 7921.0, 3991.0, 2026.0, 1061.0, 717.0, 446.0, 258.0, 157.0, 111.0, 65.0, 44.0, 40.0, 19.0, 26.0, 9.0, 9.0, 1.0, 5.0, 1.0, 4.0, 1.0, 2.0], "bins": [-28.40625, -27.6533203125, -26.900390625, -26.1474609375, -25.39453125, -24.6416015625, -23.888671875, -23.1357421875, -22.3828125, -21.6298828125, -20.876953125, -20.1240234375, -19.37109375, -18.6181640625, -17.865234375, -17.1123046875, -16.359375, -15.6064453125, -14.853515625, -14.1005859375, -13.34765625, -12.5947265625, -11.841796875, -11.0888671875, -10.3359375, -9.5830078125, -8.830078125, -8.0771484375, -7.32421875, -6.5712890625, -5.818359375, -5.0654296875, -4.3125, -3.5595703125, -2.806640625, -2.0537109375, -1.30078125, -0.5478515625, 0.205078125, 0.9580078125, 1.7109375, 2.4638671875, 3.216796875, 3.9697265625, 4.72265625, 5.4755859375, 6.228515625, 6.9814453125, 7.734375, 8.4873046875, 9.240234375, 9.9931640625, 10.74609375, 11.4990234375, 12.251953125, 13.0048828125, 13.7578125, 14.5107421875, 15.263671875, 16.0166015625, 16.76953125, 17.5224609375, 18.275390625, 19.0283203125, 19.78125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 5.0, 6.0, 1.0, 12.0, 10.0, 18.0, 21.0, 29.0, 37.0, 54.0, 77.0, 84.0, 79.0, 98.0, 74.0, 76.0, 64.0, 62.0, 44.0, 28.0, 34.0, 27.0, 13.0, 13.0, 10.0, 4.0, 3.0, 9.0, 2.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015993118286132812, -0.0015435665845870972, -0.001487821340560913, -0.001432076096534729, -0.001376330852508545, -0.0013205856084823608, -0.0012648403644561768, -0.0012090951204299927, -0.0011533498764038086, -0.0010976046323776245, -0.0010418593883514404, -0.0009861141443252563, -0.0009303689002990723, -0.0008746236562728882, -0.0008188784122467041, -0.00076313316822052, -0.0007073879241943359, -0.0006516426801681519, -0.0005958974361419678, -0.0005401521921157837, -0.0004844069480895996, -0.00042866170406341553, -0.00037291646003723145, -0.00031717121601104736, -0.0002614259719848633, -0.0002056807279586792, -0.00014993548393249512, -9.419023990631104e-05, -3.844499588012695e-05, 1.730024814605713e-05, 7.304549217224121e-05, 0.0001287907361984253, 0.00018453598022460938, 0.00024028122425079346, 0.00029602646827697754, 0.0003517717123031616, 0.0004075169563293457, 0.0004632622003555298, 0.0005190074443817139, 0.000574752688407898, 0.000630497932434082, 0.0006862431764602661, 0.0007419884204864502, 0.0007977336645126343, 0.0008534789085388184, 0.0009092241525650024, 0.0009649693965911865, 0.0010207146406173706, 0.0010764598846435547, 0.0011322051286697388, 0.0011879503726959229, 0.001243695616722107, 0.001299440860748291, 0.001355186104774475, 0.0014109313488006592, 0.0014666765928268433, 0.0015224218368530273, 0.0015781670808792114, 0.0016339123249053955, 0.0016896575689315796, 0.0017454028129577637, 0.0018011480569839478, 0.0018568933010101318, 0.001912638545036316, 0.0019683837890625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 14.0, 16.0, 18.0, 31.0, 46.0, 73.0, 91.0, 133.0, 182.0, 210.0, 306.0, 487.0, 637.0, 1005.0, 1532.0, 2451.0, 3919.0, 6651.0, 11370.0, 20602.0, 38271.0, 70800.0, 122983.0, 179367.0, 198224.0, 160730.0, 100995.0, 56560.0, 30463.0, 16360.0, 9231.0, 5365.0, 3235.0, 2036.0, 1282.0, 869.0, 621.0, 395.0, 304.0, 196.0, 143.0, 101.0, 83.0, 47.0, 33.0, 27.0, 17.0, 11.0, 5.0, 8.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-16.0, -15.489013671875, -14.97802734375, -14.467041015625, -13.9560546875, -13.445068359375, -12.93408203125, -12.423095703125, -11.912109375, -11.401123046875, -10.89013671875, -10.379150390625, -9.8681640625, -9.357177734375, -8.84619140625, -8.335205078125, -7.82421875, -7.313232421875, -6.80224609375, -6.291259765625, -5.7802734375, -5.269287109375, -4.75830078125, -4.247314453125, -3.736328125, -3.225341796875, -2.71435546875, -2.203369140625, -1.6923828125, -1.181396484375, -0.67041015625, -0.159423828125, 0.3515625, 0.862548828125, 1.37353515625, 1.884521484375, 2.3955078125, 2.906494140625, 3.41748046875, 3.928466796875, 4.439453125, 4.950439453125, 5.46142578125, 5.972412109375, 6.4833984375, 6.994384765625, 7.50537109375, 8.016357421875, 8.52734375, 9.038330078125, 9.54931640625, 10.060302734375, 10.5712890625, 11.082275390625, 11.59326171875, 12.104248046875, 12.615234375, 13.126220703125, 13.63720703125, 14.148193359375, 14.6591796875, 15.170166015625, 15.68115234375, 16.192138671875, 16.703125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 7.0, 5.0, 11.0, 8.0, 11.0, 9.0, 18.0, 18.0, 19.0, 24.0, 29.0, 25.0, 37.0, 40.0, 51.0, 49.0, 47.0, 58.0, 68.0, 46.0, 68.0, 55.0, 57.0, 28.0, 48.0, 21.0, 17.0, 28.0, 16.0, 12.0, 15.0, 4.0, 10.0, 5.0, 10.0, 3.0, 5.0, 4.0, 2.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-5.71484375, -5.55792236328125, -5.4010009765625, -5.24407958984375, -5.087158203125, -4.93023681640625, -4.7733154296875, -4.61639404296875, -4.45947265625, -4.30255126953125, -4.1456298828125, -3.98870849609375, -3.831787109375, -3.67486572265625, -3.5179443359375, -3.36102294921875, -3.2041015625, -3.04718017578125, -2.8902587890625, -2.73333740234375, -2.576416015625, -2.41949462890625, -2.2625732421875, -2.10565185546875, -1.94873046875, -1.79180908203125, -1.6348876953125, -1.47796630859375, -1.321044921875, -1.16412353515625, -1.0072021484375, -0.85028076171875, -0.693359375, -0.53643798828125, -0.3795166015625, -0.22259521484375, -0.065673828125, 0.09124755859375, 0.2481689453125, 0.40509033203125, 0.56201171875, 0.71893310546875, 0.8758544921875, 1.03277587890625, 1.189697265625, 1.34661865234375, 1.5035400390625, 1.66046142578125, 1.8173828125, 1.97430419921875, 2.1312255859375, 2.28814697265625, 2.445068359375, 2.60198974609375, 2.7589111328125, 2.91583251953125, 3.07275390625, 3.22967529296875, 3.3865966796875, 3.54351806640625, 3.700439453125, 3.85736083984375, 4.0142822265625, 4.17120361328125, 4.328125]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 9.0, 4.0, 11.0, 8.0, 9.0, 8.0, 12.0, 18.0, 25.0, 26.0, 31.0, 37.0, 36.0, 36.0, 48.0, 49.0, 61.0, 59.0, 65.0, 61.0, 56.0, 52.0, 59.0, 41.0, 25.0, 18.0, 22.0, 20.0, 25.0, 17.0, 13.0, 8.0, 11.0, 6.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.86786460876465, -30.837194442749023, -29.8065242767334, -28.775854110717773, -27.745182037353516, -26.71451187133789, -25.683841705322266, -24.65317153930664, -23.622501373291016, -22.59183120727539, -21.561161041259766, -20.53049087524414, -19.499820709228516, -18.46915054321289, -17.438478469848633, -16.407808303833008, -15.377138137817383, -14.346467971801758, -13.315797805786133, -12.285126686096191, -11.254456520080566, -10.223786354064941, -9.193115234375, -8.162445068359375, -7.13177490234375, -6.101104736328125, -5.070434093475342, -4.039763450622559, -3.0090932846069336, -1.9784231185913086, -0.9477524757385254, 0.08291816711425781, 1.11358642578125, 2.144256830215454, 3.174927234649658, 4.205597877502441, 5.236268043518066, 6.266938209533691, 7.297608852386475, 8.328279495239258, 9.358949661254883, 10.389619827270508, 11.420289993286133, 12.450961112976074, 13.4816312789917, 14.512301445007324, 15.542972564697266, 16.57364273071289, 17.604312896728516, 18.63498306274414, 19.665653228759766, 20.69632339477539, 21.726993560791016, 22.75766372680664, 23.7883358001709, 24.819005966186523, 25.84967613220215, 26.880346298217773, 27.9110164642334, 28.941686630249023, 29.97235870361328, 31.003028869628906, 32.03369903564453, 33.064369201660156, 34.09503936767578]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 1.0, 5.0, 5.0, 6.0, 8.0, 8.0, 12.0, 7.0, 9.0, 13.0, 19.0, 19.0, 18.0, 20.0, 24.0, 24.0, 22.0, 29.0, 28.0, 41.0, 33.0, 36.0, 43.0, 35.0, 41.0, 33.0, 43.0, 35.0, 34.0, 26.0, 45.0, 31.0, 30.0, 21.0, 28.0, 18.0, 14.0, 23.0, 18.0, 18.0, 15.0, 10.0, 11.0, 10.0, 8.0, 4.0, 4.0, 6.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-18.195226669311523, -17.602327346801758, -17.009428024291992, -16.416528701782227, -15.823630332946777, -15.230731010437012, -14.637832641601562, -14.044933319091797, -13.452033996582031, -12.859134674072266, -12.2662353515625, -11.67333698272705, -11.080437660217285, -10.48753833770752, -9.89463996887207, -9.301740646362305, -8.708841323852539, -8.115942001342773, -7.523043155670166, -6.930144309997559, -6.337244987487793, -5.744345664978027, -5.15144681930542, -4.5585479736328125, -3.965648651123047, -3.3727495670318604, -2.779850482940674, -2.1869513988494873, -1.5940523147583008, -1.0011532306671143, -0.40825414657592773, 0.1846446990966797, 0.7775421142578125, 1.370441198348999, 1.9633402824401855, 2.556239366531372, 3.1491384506225586, 3.742037534713745, 4.334936618804932, 4.927835464477539, 5.520734786987305, 6.11363410949707, 6.706532955169678, 7.299431800842285, 7.892331123352051, 8.485230445861816, 9.078128814697266, 9.671028137207031, 10.263927459716797, 10.856826782226562, 11.449726104736328, 12.042624473571777, 12.635523796081543, 13.228423118591309, 13.821321487426758, 14.414220809936523, 15.007120132446289, 15.600019454956055, 16.19291877746582, 16.785818099975586, 17.37871551513672, 17.971614837646484, 18.56451416015625, 19.157413482666016, 19.75031280517578]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 15.0, 14.0, 24.0, 36.0, 72.0, 120.0, 212.0, 327.0, 619.0, 1020.0, 1913.0, 3403.0, 6571.0, 12677.0, 25033.0, 51337.0, 106052.0, 221711.0, 443756.0, 768107.0, 952362.0, 752088.0, 429892.0, 213219.0, 102074.0, 49184.0, 24282.0, 12371.0, 6616.0, 3675.0, 2118.0, 1237.0, 760.0, 446.0, 336.0, 208.0, 116.0, 86.0, 63.0, 35.0, 30.0, 17.0, 16.0, 14.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.28125, -33.15625, -32.03125, -30.90625, -29.78125, -28.65625, -27.53125, -26.40625, -25.28125, -24.15625, -23.03125, -21.90625, -20.78125, -19.65625, -18.53125, -17.40625, -16.28125, -15.15625, -14.03125, -12.90625, -11.78125, -10.65625, -9.53125, -8.40625, -7.28125, -6.15625, -5.03125, -3.90625, -2.78125, -1.65625, -0.53125, 0.59375, 1.71875, 2.84375, 3.96875, 5.09375, 6.21875, 7.34375, 8.46875, 9.59375, 10.71875, 11.84375, 12.96875, 14.09375, 15.21875, 16.34375, 17.46875, 18.59375, 19.71875, 20.84375, 21.96875, 23.09375, 24.21875, 25.34375, 26.46875, 27.59375, 28.71875, 29.84375, 30.96875, 32.09375, 33.21875, 34.34375, 35.46875, 36.59375, 37.71875]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 7.0, 5.0, 5.0, 9.0, 9.0, 4.0, 10.0, 11.0, 14.0, 26.0, 22.0, 18.0, 34.0, 26.0, 42.0, 27.0, 35.0, 43.0, 38.0, 41.0, 45.0, 43.0, 44.0, 42.0, 44.0, 32.0, 47.0, 33.0, 36.0, 25.0, 30.0, 28.0, 19.0, 17.0, 16.0, 18.0, 7.0, 20.0, 7.0, 5.0, 6.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.203125, -16.57861328125, -15.9541015625, -15.32958984375, -14.705078125, -14.08056640625, -13.4560546875, -12.83154296875, -12.20703125, -11.58251953125, -10.9580078125, -10.33349609375, -9.708984375, -9.08447265625, -8.4599609375, -7.83544921875, -7.2109375, -6.58642578125, -5.9619140625, -5.33740234375, -4.712890625, -4.08837890625, -3.4638671875, -2.83935546875, -2.21484375, -1.59033203125, -0.9658203125, -0.34130859375, 0.283203125, 0.90771484375, 1.5322265625, 2.15673828125, 2.78125, 3.40576171875, 4.0302734375, 4.65478515625, 5.279296875, 5.90380859375, 6.5283203125, 7.15283203125, 7.77734375, 8.40185546875, 9.0263671875, 9.65087890625, 10.275390625, 10.89990234375, 11.5244140625, 12.14892578125, 12.7734375, 13.39794921875, 14.0224609375, 14.64697265625, 15.271484375, 15.89599609375, 16.5205078125, 17.14501953125, 17.76953125, 18.39404296875, 19.0185546875, 19.64306640625, 20.267578125, 20.89208984375, 21.5166015625, 22.14111328125, 22.765625]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 8.0, 13.0, 22.0, 37.0, 56.0, 87.0, 139.0, 248.0, 415.0, 716.0, 1306.0, 2202.0, 3941.0, 7495.0, 14466.0, 27980.0, 55203.0, 109322.0, 215476.0, 406620.0, 673930.0, 864530.0, 761815.0, 494214.0, 270312.0, 139035.0, 70454.0, 35428.0, 18101.0, 9477.0, 4997.0, 2705.0, 1512.0, 808.0, 501.0, 257.0, 164.0, 125.0, 44.0, 51.0, 24.0, 19.0, 10.0, 8.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-40.65625, -39.2861328125, -37.916015625, -36.5458984375, -35.17578125, -33.8056640625, -32.435546875, -31.0654296875, -29.6953125, -28.3251953125, -26.955078125, -25.5849609375, -24.21484375, -22.8447265625, -21.474609375, -20.1044921875, -18.734375, -17.3642578125, -15.994140625, -14.6240234375, -13.25390625, -11.8837890625, -10.513671875, -9.1435546875, -7.7734375, -6.4033203125, -5.033203125, -3.6630859375, -2.29296875, -0.9228515625, 0.447265625, 1.8173828125, 3.1875, 4.5576171875, 5.927734375, 7.2978515625, 8.66796875, 10.0380859375, 11.408203125, 12.7783203125, 14.1484375, 15.5185546875, 16.888671875, 18.2587890625, 19.62890625, 20.9990234375, 22.369140625, 23.7392578125, 25.109375, 26.4794921875, 27.849609375, 29.2197265625, 30.58984375, 31.9599609375, 33.330078125, 34.7001953125, 36.0703125, 37.4404296875, 38.810546875, 40.1806640625, 41.55078125, 42.9208984375, 44.291015625, 45.6611328125, 47.03125]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 1.0, 3.0, 4.0, 3.0, 5.0, 11.0, 5.0, 15.0, 20.0, 19.0, 31.0, 49.0, 70.0, 85.0, 98.0, 110.0, 142.0, 193.0, 209.0, 243.0, 278.0, 295.0, 309.0, 240.0, 253.0, 263.0, 211.0, 203.0, 177.0, 129.0, 99.0, 92.0, 55.0, 52.0, 35.0, 19.0, 14.0, 9.0, 11.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.234375, -12.7841796875, -12.333984375, -11.8837890625, -11.43359375, -10.9833984375, -10.533203125, -10.0830078125, -9.6328125, -9.1826171875, -8.732421875, -8.2822265625, -7.83203125, -7.3818359375, -6.931640625, -6.4814453125, -6.03125, -5.5810546875, -5.130859375, -4.6806640625, -4.23046875, -3.7802734375, -3.330078125, -2.8798828125, -2.4296875, -1.9794921875, -1.529296875, -1.0791015625, -0.62890625, -0.1787109375, 0.271484375, 0.7216796875, 1.171875, 1.6220703125, 2.072265625, 2.5224609375, 2.97265625, 3.4228515625, 3.873046875, 4.3232421875, 4.7734375, 5.2236328125, 5.673828125, 6.1240234375, 6.57421875, 7.0244140625, 7.474609375, 7.9248046875, 8.375, 8.8251953125, 9.275390625, 9.7255859375, 10.17578125, 10.6259765625, 11.076171875, 11.5263671875, 11.9765625, 12.4267578125, 12.876953125, 13.3271484375, 13.77734375, 14.2275390625, 14.677734375, 15.1279296875, 15.578125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 7.0, 6.0, 11.0, 9.0, 7.0, 8.0, 12.0, 14.0, 22.0, 23.0, 39.0, 33.0, 39.0, 48.0, 52.0, 54.0, 59.0, 51.0, 61.0, 57.0, 50.0, 45.0, 50.0, 37.0, 41.0, 28.0, 24.0, 27.0, 16.0, 15.0, 15.0, 8.0, 8.0, 10.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.26799011230469, -38.92879867553711, -37.58960723876953, -36.25041580200195, -34.911224365234375, -33.5720329284668, -32.23284149169922, -30.893648147583008, -29.55445671081543, -28.21526527404785, -26.876073837280273, -25.536880493164062, -24.197689056396484, -22.858497619628906, -21.519306182861328, -20.18011474609375, -18.840923309326172, -17.501731872558594, -16.162540435791016, -14.823348045349121, -13.484156608581543, -12.144965171813965, -10.80577278137207, -9.466581344604492, -8.127389907836914, -6.788198471069336, -5.4490065574646, -4.109814643859863, -2.770623207092285, -1.431431770324707, -0.0922393798828125, 1.2469520568847656, 2.5861473083496094, 3.9253389835357666, 5.264530658721924, 6.60372257232666, 7.942914009094238, 9.282105445861816, 10.621297836303711, 11.960489273071289, 13.299680709838867, 14.638872146606445, 15.978063583374023, 17.317256927490234, 18.656448364257812, 19.99563980102539, 21.33483123779297, 22.674022674560547, 24.013214111328125, 25.352405548095703, 26.69159698486328, 28.03078842163086, 29.369979858398438, 30.709171295166016, 32.048362731933594, 33.38755798339844, 34.72674560546875, 36.06593704223633, 37.405128479003906, 38.744319915771484, 40.08351135253906, 41.42270278930664, 42.76189422607422, 44.10108947753906, 45.44028091430664]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 6.0, 6.0, 7.0, 8.0, 11.0, 12.0, 11.0, 10.0, 11.0, 13.0, 19.0, 22.0, 20.0, 32.0, 29.0, 25.0, 34.0, 30.0, 43.0, 37.0, 44.0, 30.0, 42.0, 49.0, 37.0, 47.0, 42.0, 32.0, 33.0, 38.0, 35.0, 21.0, 30.0, 15.0, 25.0, 17.0, 16.0, 15.0, 9.0, 10.0, 8.0, 3.0, 2.0, 5.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.071855545043945, -23.28384017944336, -22.495824813842773, -21.707809448242188, -20.919795989990234, -20.13178062438965, -19.343765258789062, -18.555749893188477, -17.76773452758789, -16.979719161987305, -16.19170379638672, -15.40368938446045, -14.61567497253418, -13.827659606933594, -13.039644241333008, -12.251628875732422, -11.463615417480469, -10.675600051879883, -9.887585639953613, -9.099570274353027, -8.311555862426758, -7.523540496826172, -6.735525131225586, -5.947510242462158, -5.1594953536987305, -4.371480464935303, -3.583465337753296, -2.795450210571289, -2.0074353218078613, -1.2194204330444336, -0.43140506744384766, 0.3566098213195801, 1.1446247100830078, 1.932639718055725, 2.7206547260284424, 3.508669853210449, 4.296684741973877, 5.084699630737305, 5.872714996337891, 6.660729885101318, 7.448744773864746, 8.236760139465332, 9.024774551391602, 9.812789916992188, 10.600805282592773, 11.388819694519043, 12.176835060119629, 12.964849472045898, 13.752864837646484, 14.54088020324707, 15.32889461517334, 16.11690902709961, 16.904924392700195, 17.69293975830078, 18.480955123901367, 19.268970489501953, 20.056983947753906, 20.844999313354492, 21.633014678955078, 22.42102813720703, 23.209043502807617, 23.997058868408203, 24.78507423400879, 25.573089599609375, 26.36110496520996]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 6.0, 9.0, 25.0, 35.0, 52.0, 79.0, 125.0, 227.0, 359.0, 534.0, 880.0, 1439.0, 2376.0, 4033.0, 6682.0, 11290.0, 18888.0, 31628.0, 51661.0, 79990.0, 114212.0, 144557.0, 154445.0, 137468.0, 104078.0, 70747.0, 44858.0, 27375.0, 15999.0, 9703.0, 5937.0, 3390.0, 2083.0, 1340.0, 749.0, 491.0, 293.0, 182.0, 118.0, 64.0, 56.0, 33.0, 19.0, 15.0, 13.0, 11.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.765625, -19.09228515625, -18.4189453125, -17.74560546875, -17.072265625, -16.39892578125, -15.7255859375, -15.05224609375, -14.37890625, -13.70556640625, -13.0322265625, -12.35888671875, -11.685546875, -11.01220703125, -10.3388671875, -9.66552734375, -8.9921875, -8.31884765625, -7.6455078125, -6.97216796875, -6.298828125, -5.62548828125, -4.9521484375, -4.27880859375, -3.60546875, -2.93212890625, -2.2587890625, -1.58544921875, -0.912109375, -0.23876953125, 0.4345703125, 1.10791015625, 1.78125, 2.45458984375, 3.1279296875, 3.80126953125, 4.474609375, 5.14794921875, 5.8212890625, 6.49462890625, 7.16796875, 7.84130859375, 8.5146484375, 9.18798828125, 9.861328125, 10.53466796875, 11.2080078125, 11.88134765625, 12.5546875, 13.22802734375, 13.9013671875, 14.57470703125, 15.248046875, 15.92138671875, 16.5947265625, 17.26806640625, 17.94140625, 18.61474609375, 19.2880859375, 19.96142578125, 20.634765625, 21.30810546875, 21.9814453125, 22.65478515625, 23.328125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 10.0, 3.0, 6.0, 13.0, 11.0, 14.0, 15.0, 22.0, 22.0, 15.0, 32.0, 41.0, 29.0, 34.0, 35.0, 39.0, 40.0, 34.0, 44.0, 42.0, 40.0, 45.0, 34.0, 41.0, 41.0, 28.0, 35.0, 23.0, 37.0, 18.0, 22.0, 19.0, 18.0, 19.0, 17.0, 11.0, 7.0, 6.0, 6.0, 7.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 0.0, 0.0, 2.0], "bins": [-28.265625, -27.398193359375, -26.53076171875, -25.663330078125, -24.7958984375, -23.928466796875, -23.06103515625, -22.193603515625, -21.326171875, -20.458740234375, -19.59130859375, -18.723876953125, -17.8564453125, -16.989013671875, -16.12158203125, -15.254150390625, -14.38671875, -13.519287109375, -12.65185546875, -11.784423828125, -10.9169921875, -10.049560546875, -9.18212890625, -8.314697265625, -7.447265625, -6.579833984375, -5.71240234375, -4.844970703125, -3.9775390625, -3.110107421875, -2.24267578125, -1.375244140625, -0.5078125, 0.359619140625, 1.22705078125, 2.094482421875, 2.9619140625, 3.829345703125, 4.69677734375, 5.564208984375, 6.431640625, 7.299072265625, 8.16650390625, 9.033935546875, 9.9013671875, 10.768798828125, 11.63623046875, 12.503662109375, 13.37109375, 14.238525390625, 15.10595703125, 15.973388671875, 16.8408203125, 17.708251953125, 18.57568359375, 19.443115234375, 20.310546875, 21.177978515625, 22.04541015625, 22.912841796875, 23.7802734375, 24.647705078125, 25.51513671875, 26.382568359375, 27.25]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 10.0, 11.0, 15.0, 35.0, 33.0, 54.0, 81.0, 123.0, 181.0, 274.0, 428.0, 658.0, 1081.0, 1672.0, 2774.0, 4861.0, 8562.0, 15882.0, 30241.0, 58614.0, 110490.0, 186474.0, 229798.0, 177056.0, 102331.0, 54406.0, 27931.0, 14834.0, 8158.0, 4529.0, 2571.0, 1550.0, 979.0, 642.0, 401.0, 257.0, 164.0, 115.0, 76.0, 66.0, 54.0, 33.0, 15.0, 12.0, 9.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.875, -31.794921875, -30.71484375, -29.634765625, -28.5546875, -27.474609375, -26.39453125, -25.314453125, -24.234375, -23.154296875, -22.07421875, -20.994140625, -19.9140625, -18.833984375, -17.75390625, -16.673828125, -15.59375, -14.513671875, -13.43359375, -12.353515625, -11.2734375, -10.193359375, -9.11328125, -8.033203125, -6.953125, -5.873046875, -4.79296875, -3.712890625, -2.6328125, -1.552734375, -0.47265625, 0.607421875, 1.6875, 2.767578125, 3.84765625, 4.927734375, 6.0078125, 7.087890625, 8.16796875, 9.248046875, 10.328125, 11.408203125, 12.48828125, 13.568359375, 14.6484375, 15.728515625, 16.80859375, 17.888671875, 18.96875, 20.048828125, 21.12890625, 22.208984375, 23.2890625, 24.369140625, 25.44921875, 26.529296875, 27.609375, 28.689453125, 29.76953125, 30.849609375, 31.9296875, 33.009765625, 34.08984375, 35.169921875, 36.25]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 7.0, 5.0, 10.0, 9.0, 11.0, 15.0, 13.0, 14.0, 16.0, 24.0, 23.0, 16.0, 27.0, 28.0, 39.0, 31.0, 41.0, 29.0, 48.0, 48.0, 49.0, 47.0, 41.0, 51.0, 31.0, 42.0, 39.0, 37.0, 28.0, 26.0, 15.0, 19.0, 32.0, 11.0, 13.0, 13.0, 14.0, 7.0, 7.0, 9.0, 0.0, 6.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-17.46875, -16.929931640625, -16.39111328125, -15.852294921875, -15.3134765625, -14.774658203125, -14.23583984375, -13.697021484375, -13.158203125, -12.619384765625, -12.08056640625, -11.541748046875, -11.0029296875, -10.464111328125, -9.92529296875, -9.386474609375, -8.84765625, -8.308837890625, -7.77001953125, -7.231201171875, -6.6923828125, -6.153564453125, -5.61474609375, -5.075927734375, -4.537109375, -3.998291015625, -3.45947265625, -2.920654296875, -2.3818359375, -1.843017578125, -1.30419921875, -0.765380859375, -0.2265625, 0.312255859375, 0.85107421875, 1.389892578125, 1.9287109375, 2.467529296875, 3.00634765625, 3.545166015625, 4.083984375, 4.622802734375, 5.16162109375, 5.700439453125, 6.2392578125, 6.778076171875, 7.31689453125, 7.855712890625, 8.39453125, 8.933349609375, 9.47216796875, 10.010986328125, 10.5498046875, 11.088623046875, 11.62744140625, 12.166259765625, 12.705078125, 13.243896484375, 13.78271484375, 14.321533203125, 14.8603515625, 15.399169921875, 15.93798828125, 16.476806640625, 17.015625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 9.0, 8.0, 11.0, 10.0, 13.0, 28.0, 46.0, 67.0, 91.0, 146.0, 195.0, 375.0, 573.0, 935.0, 1529.0, 2706.0, 4745.0, 8600.0, 16291.0, 32633.0, 65234.0, 127644.0, 218743.0, 242848.0, 157330.0, 81963.0, 40701.0, 20393.0, 10815.0, 5775.0, 3324.0, 1873.0, 1093.0, 642.0, 413.0, 273.0, 169.0, 110.0, 64.0, 54.0, 32.0, 18.0, 15.0, 10.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.296875, -20.566650390625, -19.83642578125, -19.106201171875, -18.3759765625, -17.645751953125, -16.91552734375, -16.185302734375, -15.455078125, -14.724853515625, -13.99462890625, -13.264404296875, -12.5341796875, -11.803955078125, -11.07373046875, -10.343505859375, -9.61328125, -8.883056640625, -8.15283203125, -7.422607421875, -6.6923828125, -5.962158203125, -5.23193359375, -4.501708984375, -3.771484375, -3.041259765625, -2.31103515625, -1.580810546875, -0.8505859375, -0.120361328125, 0.60986328125, 1.340087890625, 2.0703125, 2.800537109375, 3.53076171875, 4.260986328125, 4.9912109375, 5.721435546875, 6.45166015625, 7.181884765625, 7.912109375, 8.642333984375, 9.37255859375, 10.102783203125, 10.8330078125, 11.563232421875, 12.29345703125, 13.023681640625, 13.75390625, 14.484130859375, 15.21435546875, 15.944580078125, 16.6748046875, 17.405029296875, 18.13525390625, 18.865478515625, 19.595703125, 20.325927734375, 21.05615234375, 21.786376953125, 22.5166015625, 23.246826171875, 23.97705078125, 24.707275390625, 25.4375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 3.0, 7.0, 12.0, 11.0, 18.0, 12.0, 22.0, 18.0, 29.0, 27.0, 43.0, 45.0, 47.0, 52.0, 66.0, 69.0, 65.0, 59.0, 60.0, 56.0, 48.0, 47.0, 28.0, 33.0, 24.0, 27.0, 15.0, 7.0, 9.0, 8.0, 7.0, 7.0, 7.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.000919342041015625, -0.0008916258811950684, -0.0008639097213745117, -0.0008361935615539551, -0.0008084774017333984, -0.0007807612419128418, -0.0007530450820922852, -0.0007253289222717285, -0.0006976127624511719, -0.0006698966026306152, -0.0006421804428100586, -0.000614464282989502, -0.0005867481231689453, -0.0005590319633483887, -0.000531315803527832, -0.0005035996437072754, -0.00047588348388671875, -0.0004481673240661621, -0.00042045116424560547, -0.00039273500442504883, -0.0003650188446044922, -0.00033730268478393555, -0.0003095865249633789, -0.00028187036514282227, -0.0002541542053222656, -0.00022643804550170898, -0.00019872188568115234, -0.0001710057258605957, -0.00014328956604003906, -0.00011557340621948242, -8.785724639892578e-05, -6.014108657836914e-05, -3.24249267578125e-05, -4.708766937255859e-06, 2.300739288330078e-05, 5.072355270385742e-05, 7.843971252441406e-05, 0.0001061558723449707, 0.00013387203216552734, 0.00016158819198608398, 0.00018930435180664062, 0.00021702051162719727, 0.0002447366714477539, 0.00027245283126831055, 0.0003001689910888672, 0.00032788515090942383, 0.00035560131072998047, 0.0003833174705505371, 0.00041103363037109375, 0.0004387497901916504, 0.00046646595001220703, 0.0004941821098327637, 0.0005218982696533203, 0.000549614429473877, 0.0005773305892944336, 0.0006050467491149902, 0.0006327629089355469, 0.0006604790687561035, 0.0006881952285766602, 0.0007159113883972168, 0.0007436275482177734, 0.0007713437080383301, 0.0007990598678588867, 0.0008267760276794434, 0.0008544921875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 2.0, 4.0, 4.0, 8.0, 3.0, 9.0, 15.0, 13.0, 25.0, 40.0, 54.0, 71.0, 104.0, 145.0, 208.0, 268.0, 500.0, 751.0, 1223.0, 2105.0, 3688.0, 6581.0, 12563.0, 24403.0, 46640.0, 88175.0, 149480.0, 205669.0, 198857.0, 138578.0, 79202.0, 41827.0, 21578.0, 11246.0, 6073.0, 3257.0, 1875.0, 1145.0, 744.0, 486.0, 308.0, 162.0, 139.0, 94.0, 60.0, 40.0, 47.0, 27.0, 24.0, 10.0, 12.0, 6.0, 8.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.609375, -24.781005859375, -23.95263671875, -23.124267578125, -22.2958984375, -21.467529296875, -20.63916015625, -19.810791015625, -18.982421875, -18.154052734375, -17.32568359375, -16.497314453125, -15.6689453125, -14.840576171875, -14.01220703125, -13.183837890625, -12.35546875, -11.527099609375, -10.69873046875, -9.870361328125, -9.0419921875, -8.213623046875, -7.38525390625, -6.556884765625, -5.728515625, -4.900146484375, -4.07177734375, -3.243408203125, -2.4150390625, -1.586669921875, -0.75830078125, 0.070068359375, 0.8984375, 1.726806640625, 2.55517578125, 3.383544921875, 4.2119140625, 5.040283203125, 5.86865234375, 6.697021484375, 7.525390625, 8.353759765625, 9.18212890625, 10.010498046875, 10.8388671875, 11.667236328125, 12.49560546875, 13.323974609375, 14.15234375, 14.980712890625, 15.80908203125, 16.637451171875, 17.4658203125, 18.294189453125, 19.12255859375, 19.950927734375, 20.779296875, 21.607666015625, 22.43603515625, 23.264404296875, 24.0927734375, 24.921142578125, 25.74951171875, 26.577880859375, 27.40625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 3.0, 2.0, 4.0, 7.0, 9.0, 6.0, 17.0, 12.0, 18.0, 21.0, 30.0, 44.0, 21.0, 37.0, 44.0, 50.0, 53.0, 41.0, 56.0, 53.0, 58.0, 62.0, 63.0, 57.0, 37.0, 32.0, 24.0, 31.0, 19.0, 15.0, 13.0, 14.0, 7.0, 9.0, 10.0, 4.0, 3.0, 2.0, 3.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.390625, -7.19158935546875, -6.9925537109375, -6.79351806640625, -6.594482421875, -6.39544677734375, -6.1964111328125, -5.99737548828125, -5.79833984375, -5.59930419921875, -5.4002685546875, -5.20123291015625, -5.002197265625, -4.80316162109375, -4.6041259765625, -4.40509033203125, -4.2060546875, -4.00701904296875, -3.8079833984375, -3.60894775390625, -3.409912109375, -3.21087646484375, -3.0118408203125, -2.81280517578125, -2.61376953125, -2.41473388671875, -2.2156982421875, -2.01666259765625, -1.817626953125, -1.61859130859375, -1.4195556640625, -1.22052001953125, -1.021484375, -0.82244873046875, -0.6234130859375, -0.42437744140625, -0.225341796875, -0.02630615234375, 0.1727294921875, 0.37176513671875, 0.57080078125, 0.76983642578125, 0.9688720703125, 1.16790771484375, 1.366943359375, 1.56597900390625, 1.7650146484375, 1.96405029296875, 2.1630859375, 2.36212158203125, 2.5611572265625, 2.76019287109375, 2.959228515625, 3.15826416015625, 3.3572998046875, 3.55633544921875, 3.75537109375, 3.95440673828125, 4.1534423828125, 4.35247802734375, 4.551513671875, 4.75054931640625, 4.9495849609375, 5.14862060546875, 5.34765625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 8.0, 8.0, 7.0, 9.0, 11.0, 10.0, 13.0, 18.0, 29.0, 30.0, 26.0, 39.0, 51.0, 45.0, 61.0, 44.0, 60.0, 61.0, 57.0, 47.0, 48.0, 51.0, 43.0, 44.0, 32.0, 28.0, 25.0, 17.0, 17.0, 13.0, 8.0, 12.0, 8.0, 6.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.21493148803711, -39.865421295166016, -38.515907287597656, -37.16639709472656, -35.81688690185547, -34.467376708984375, -33.11786651611328, -31.768352508544922, -30.418842315673828, -29.069332122802734, -27.719820022583008, -26.37030792236328, -25.020797729492188, -23.671287536621094, -22.321775436401367, -20.97226333618164, -19.622753143310547, -18.273242950439453, -16.923730850219727, -15.574219703674316, -14.224708557128906, -12.875197410583496, -11.525686264038086, -10.176175117492676, -8.826663970947266, -7.4771528244018555, -6.127641677856445, -4.778130531311035, -3.428619384765625, -2.079108238220215, -0.7295970916748047, 0.6199140548706055, 1.9694252014160156, 3.318936347961426, 4.668447494506836, 6.017958641052246, 7.367469787597656, 8.716980934143066, 10.066492080688477, 11.416003227233887, 12.765514373779297, 14.115025520324707, 15.464536666870117, 16.814048767089844, 18.163558959960938, 19.51306915283203, 20.862581253051758, 22.212093353271484, 23.561603546142578, 24.911113739013672, 26.2606258392334, 27.610137939453125, 28.95964813232422, 30.309158325195312, 31.65867042541504, 33.008182525634766, 34.35769271850586, 35.70720291137695, 37.05671691894531, 38.406227111816406, 39.7557373046875, 41.105247497558594, 42.45475769042969, 43.80427169799805, 45.15378189086914]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 6.0, 4.0, 7.0, 7.0, 17.0, 9.0, 13.0, 8.0, 15.0, 18.0, 20.0, 25.0, 20.0, 29.0, 27.0, 33.0, 33.0, 34.0, 38.0, 44.0, 40.0, 32.0, 49.0, 48.0, 45.0, 47.0, 38.0, 32.0, 22.0, 44.0, 23.0, 25.0, 20.0, 17.0, 23.0, 13.0, 19.0, 10.0, 9.0, 9.0, 8.0, 6.0, 4.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-25.21017074584961, -24.417564392089844, -23.624958038330078, -22.832353591918945, -22.03974723815918, -21.247140884399414, -20.45453643798828, -19.661930084228516, -18.86932373046875, -18.076717376708984, -17.28411102294922, -16.491506576538086, -15.69890022277832, -14.906293869018555, -14.113688468933105, -13.321083068847656, -12.52847671508789, -11.735870361328125, -10.943264961242676, -10.150659561157227, -9.358053207397461, -8.565446853637695, -7.772841453552246, -6.980235576629639, -6.187629699707031, -5.395023822784424, -4.602417945861816, -3.809812068939209, -3.0172061920166016, -2.224600315093994, -1.4319944381713867, -0.6393885612487793, 0.1532154083251953, 0.9458212852478027, 1.7384271621704102, 2.5310330390930176, 3.323638916015625, 4.116244792938232, 4.90885066986084, 5.701456546783447, 6.494062423706055, 7.286668300628662, 8.07927417755127, 8.871879577636719, 9.664485931396484, 10.45709228515625, 11.2496976852417, 12.042303085327148, 12.834909439086914, 13.62751579284668, 14.420121192932129, 15.212726593017578, 16.005332946777344, 16.79793930053711, 17.590545654296875, 18.383150100708008, 19.175756454467773, 19.96836280822754, 20.760967254638672, 21.553573608398438, 22.346179962158203, 23.13878631591797, 23.931392669677734, 24.723997116088867, 25.516603469848633]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 16.0, 13.0, 23.0, 43.0, 52.0, 89.0, 136.0, 229.0, 320.0, 545.0, 808.0, 1269.0, 2064.0, 3129.0, 5350.0, 8854.0, 14758.0, 24836.0, 39970.0, 63968.0, 94843.0, 128732.0, 149965.0, 147091.0, 122194.0, 88413.0, 58215.0, 36580.0, 21975.0, 13349.0, 7909.0, 4832.0, 2998.0, 1826.0, 1162.0, 742.0, 445.0, 279.0, 187.0, 117.0, 81.0, 44.0, 33.0, 23.0, 16.0, 8.0, 11.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.25, -24.405517578125, -23.56103515625, -22.716552734375, -21.8720703125, -21.027587890625, -20.18310546875, -19.338623046875, -18.494140625, -17.649658203125, -16.80517578125, -15.960693359375, -15.1162109375, -14.271728515625, -13.42724609375, -12.582763671875, -11.73828125, -10.893798828125, -10.04931640625, -9.204833984375, -8.3603515625, -7.515869140625, -6.67138671875, -5.826904296875, -4.982421875, -4.137939453125, -3.29345703125, -2.448974609375, -1.6044921875, -0.760009765625, 0.08447265625, 0.928955078125, 1.7734375, 2.617919921875, 3.46240234375, 4.306884765625, 5.1513671875, 5.995849609375, 6.84033203125, 7.684814453125, 8.529296875, 9.373779296875, 10.21826171875, 11.062744140625, 11.9072265625, 12.751708984375, 13.59619140625, 14.440673828125, 15.28515625, 16.129638671875, 16.97412109375, 17.818603515625, 18.6630859375, 19.507568359375, 20.35205078125, 21.196533203125, 22.041015625, 22.885498046875, 23.72998046875, 24.574462890625, 25.4189453125, 26.263427734375, 27.10791015625, 27.952392578125, 28.796875]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 8.0, 11.0, 9.0, 15.0, 20.0, 22.0, 19.0, 12.0, 20.0, 16.0, 44.0, 30.0, 46.0, 33.0, 49.0, 51.0, 57.0, 65.0, 55.0, 42.0, 53.0, 46.0, 43.0, 34.0, 41.0, 31.0, 19.0, 24.0, 13.0, 18.0, 15.0, 11.0, 10.0, 4.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.203125, -29.169189453125, -28.13525390625, -27.101318359375, -26.0673828125, -25.033447265625, -23.99951171875, -22.965576171875, -21.931640625, -20.897705078125, -19.86376953125, -18.829833984375, -17.7958984375, -16.761962890625, -15.72802734375, -14.694091796875, -13.66015625, -12.626220703125, -11.59228515625, -10.558349609375, -9.5244140625, -8.490478515625, -7.45654296875, -6.422607421875, -5.388671875, -4.354736328125, -3.32080078125, -2.286865234375, -1.2529296875, -0.218994140625, 0.81494140625, 1.848876953125, 2.8828125, 3.916748046875, 4.95068359375, 5.984619140625, 7.0185546875, 8.052490234375, 9.08642578125, 10.120361328125, 11.154296875, 12.188232421875, 13.22216796875, 14.256103515625, 15.2900390625, 16.323974609375, 17.35791015625, 18.391845703125, 19.42578125, 20.459716796875, 21.49365234375, 22.527587890625, 23.5615234375, 24.595458984375, 25.62939453125, 26.663330078125, 27.697265625, 28.731201171875, 29.76513671875, 30.799072265625, 31.8330078125, 32.866943359375, 33.90087890625, 34.934814453125, 35.96875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 0.0, 3.0, 3.0, 6.0, 6.0, 13.0, 18.0, 33.0, 33.0, 52.0, 72.0, 91.0, 167.0, 219.0, 323.0, 453.0, 710.0, 1186.0, 1961.0, 3251.0, 5777.0, 11110.0, 21896.0, 45688.0, 93532.0, 166494.0, 224217.0, 205476.0, 130613.0, 67702.0, 32429.0, 15839.0, 8157.0, 4205.0, 2551.0, 1484.0, 925.0, 619.0, 390.0, 249.0, 180.0, 112.0, 91.0, 82.0, 43.0, 24.0, 21.0, 19.0, 10.0, 3.0, 9.0, 3.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-46.40625, -44.89794921875, -43.3896484375, -41.88134765625, -40.373046875, -38.86474609375, -37.3564453125, -35.84814453125, -34.33984375, -32.83154296875, -31.3232421875, -29.81494140625, -28.306640625, -26.79833984375, -25.2900390625, -23.78173828125, -22.2734375, -20.76513671875, -19.2568359375, -17.74853515625, -16.240234375, -14.73193359375, -13.2236328125, -11.71533203125, -10.20703125, -8.69873046875, -7.1904296875, -5.68212890625, -4.173828125, -2.66552734375, -1.1572265625, 0.35107421875, 1.859375, 3.36767578125, 4.8759765625, 6.38427734375, 7.892578125, 9.40087890625, 10.9091796875, 12.41748046875, 13.92578125, 15.43408203125, 16.9423828125, 18.45068359375, 19.958984375, 21.46728515625, 22.9755859375, 24.48388671875, 25.9921875, 27.50048828125, 29.0087890625, 30.51708984375, 32.025390625, 33.53369140625, 35.0419921875, 36.55029296875, 38.05859375, 39.56689453125, 41.0751953125, 42.58349609375, 44.091796875, 45.60009765625, 47.1083984375, 48.61669921875, 50.125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 6.0, 4.0, 5.0, 11.0, 8.0, 10.0, 12.0, 10.0, 23.0, 11.0, 21.0, 35.0, 25.0, 28.0, 39.0, 34.0, 35.0, 46.0, 38.0, 42.0, 45.0, 38.0, 35.0, 31.0, 46.0, 43.0, 38.0, 29.0, 24.0, 41.0, 31.0, 23.0, 21.0, 19.0, 22.0, 16.0, 14.0, 7.0, 9.0, 10.0, 2.0, 5.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-21.015625, -20.408203125, -19.80078125, -19.193359375, -18.5859375, -17.978515625, -17.37109375, -16.763671875, -16.15625, -15.548828125, -14.94140625, -14.333984375, -13.7265625, -13.119140625, -12.51171875, -11.904296875, -11.296875, -10.689453125, -10.08203125, -9.474609375, -8.8671875, -8.259765625, -7.65234375, -7.044921875, -6.4375, -5.830078125, -5.22265625, -4.615234375, -4.0078125, -3.400390625, -2.79296875, -2.185546875, -1.578125, -0.970703125, -0.36328125, 0.244140625, 0.8515625, 1.458984375, 2.06640625, 2.673828125, 3.28125, 3.888671875, 4.49609375, 5.103515625, 5.7109375, 6.318359375, 6.92578125, 7.533203125, 8.140625, 8.748046875, 9.35546875, 9.962890625, 10.5703125, 11.177734375, 11.78515625, 12.392578125, 13.0, 13.607421875, 14.21484375, 14.822265625, 15.4296875, 16.037109375, 16.64453125, 17.251953125, 17.859375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 11.0, 16.0, 10.0, 21.0, 39.0, 55.0, 67.0, 95.0, 149.0, 180.0, 260.0, 336.0, 540.0, 869.0, 1378.0, 2185.0, 3661.0, 6296.0, 11546.0, 20937.0, 39877.0, 74570.0, 133868.0, 199478.0, 209265.0, 151496.0, 88069.0, 46782.0, 24714.0, 13176.0, 7542.0, 4186.0, 2471.0, 1505.0, 965.0, 587.0, 379.0, 265.0, 209.0, 153.0, 95.0, 74.0, 57.0, 36.0, 31.0, 20.0, 13.0, 13.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-26.4375, -25.662841796875, -24.88818359375, -24.113525390625, -23.3388671875, -22.564208984375, -21.78955078125, -21.014892578125, -20.240234375, -19.465576171875, -18.69091796875, -17.916259765625, -17.1416015625, -16.366943359375, -15.59228515625, -14.817626953125, -14.04296875, -13.268310546875, -12.49365234375, -11.718994140625, -10.9443359375, -10.169677734375, -9.39501953125, -8.620361328125, -7.845703125, -7.071044921875, -6.29638671875, -5.521728515625, -4.7470703125, -3.972412109375, -3.19775390625, -2.423095703125, -1.6484375, -0.873779296875, -0.09912109375, 0.675537109375, 1.4501953125, 2.224853515625, 2.99951171875, 3.774169921875, 4.548828125, 5.323486328125, 6.09814453125, 6.872802734375, 7.6474609375, 8.422119140625, 9.19677734375, 9.971435546875, 10.74609375, 11.520751953125, 12.29541015625, 13.070068359375, 13.8447265625, 14.619384765625, 15.39404296875, 16.168701171875, 16.943359375, 17.718017578125, 18.49267578125, 19.267333984375, 20.0419921875, 20.816650390625, 21.59130859375, 22.365966796875, 23.140625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 4.0, 0.0, 4.0, 3.0, 7.0, 8.0, 11.0, 11.0, 20.0, 29.0, 44.0, 67.0, 81.0, 95.0, 125.0, 119.0, 95.0, 81.0, 69.0, 47.0, 27.0, 21.0, 12.0, 9.0, 8.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0032787322998046875, -0.0031517446041107178, -0.003024756908416748, -0.0028977692127227783, -0.0027707815170288086, -0.002643793821334839, -0.002516806125640869, -0.0023898184299468994, -0.0022628307342529297, -0.00213584303855896, -0.0020088553428649902, -0.0018818676471710205, -0.0017548799514770508, -0.001627892255783081, -0.0015009045600891113, -0.0013739168643951416, -0.0012469291687011719, -0.0011199414730072021, -0.0009929537773132324, -0.0008659660816192627, -0.000738978385925293, -0.0006119906902313232, -0.0004850029945373535, -0.0003580152988433838, -0.00023102760314941406, -0.00010403990745544434, 2.294778823852539e-05, 0.00014993548393249512, 0.00027692317962646484, 0.00040391087532043457, 0.0005308985710144043, 0.000657886266708374, 0.0007848739624023438, 0.0009118616580963135, 0.0010388493537902832, 0.001165837049484253, 0.0012928247451782227, 0.0014198124408721924, 0.0015468001365661621, 0.0016737878322601318, 0.0018007755279541016, 0.0019277632236480713, 0.002054750919342041, 0.0021817386150360107, 0.0023087263107299805, 0.00243571400642395, 0.00256270170211792, 0.0026896893978118896, 0.0028166770935058594, 0.002943664789199829, 0.003070652484893799, 0.0031976401805877686, 0.0033246278762817383, 0.003451615571975708, 0.0035786032676696777, 0.0037055909633636475, 0.003832578659057617, 0.003959566354751587, 0.004086554050445557, 0.004213541746139526, 0.004340529441833496, 0.004467517137527466, 0.0045945048332214355, 0.004721492528915405, 0.004848480224609375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 7.0, 11.0, 15.0, 16.0, 24.0, 47.0, 53.0, 80.0, 115.0, 178.0, 276.0, 424.0, 601.0, 951.0, 1412.0, 2361.0, 3652.0, 6230.0, 10685.0, 19082.0, 34887.0, 65306.0, 116803.0, 181193.0, 207424.0, 166589.0, 103035.0, 56502.0, 30140.0, 16533.0, 9468.0, 5475.0, 3268.0, 2042.0, 1250.0, 795.0, 534.0, 334.0, 237.0, 153.0, 113.0, 79.0, 54.0, 33.0, 31.0, 23.0, 9.0, 14.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-24.53125, -23.74951171875, -22.9677734375, -22.18603515625, -21.404296875, -20.62255859375, -19.8408203125, -19.05908203125, -18.27734375, -17.49560546875, -16.7138671875, -15.93212890625, -15.150390625, -14.36865234375, -13.5869140625, -12.80517578125, -12.0234375, -11.24169921875, -10.4599609375, -9.67822265625, -8.896484375, -8.11474609375, -7.3330078125, -6.55126953125, -5.76953125, -4.98779296875, -4.2060546875, -3.42431640625, -2.642578125, -1.86083984375, -1.0791015625, -0.29736328125, 0.484375, 1.26611328125, 2.0478515625, 2.82958984375, 3.611328125, 4.39306640625, 5.1748046875, 5.95654296875, 6.73828125, 7.52001953125, 8.3017578125, 9.08349609375, 9.865234375, 10.64697265625, 11.4287109375, 12.21044921875, 12.9921875, 13.77392578125, 14.5556640625, 15.33740234375, 16.119140625, 16.90087890625, 17.6826171875, 18.46435546875, 19.24609375, 20.02783203125, 20.8095703125, 21.59130859375, 22.373046875, 23.15478515625, 23.9365234375, 24.71826171875, 25.5]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 5.0, 4.0, 4.0, 7.0, 7.0, 7.0, 16.0, 12.0, 20.0, 31.0, 30.0, 38.0, 44.0, 67.0, 65.0, 63.0, 93.0, 68.0, 74.0, 75.0, 65.0, 51.0, 26.0, 24.0, 22.0, 27.0, 10.0, 12.0, 8.0, 9.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.171875, -7.9005126953125, -7.629150390625, -7.3577880859375, -7.08642578125, -6.8150634765625, -6.543701171875, -6.2723388671875, -6.0009765625, -5.7296142578125, -5.458251953125, -5.1868896484375, -4.91552734375, -4.6441650390625, -4.372802734375, -4.1014404296875, -3.830078125, -3.5587158203125, -3.287353515625, -3.0159912109375, -2.74462890625, -2.4732666015625, -2.201904296875, -1.9305419921875, -1.6591796875, -1.3878173828125, -1.116455078125, -0.8450927734375, -0.57373046875, -0.3023681640625, -0.031005859375, 0.2403564453125, 0.51171875, 0.7830810546875, 1.054443359375, 1.3258056640625, 1.59716796875, 1.8685302734375, 2.139892578125, 2.4112548828125, 2.6826171875, 2.9539794921875, 3.225341796875, 3.4967041015625, 3.76806640625, 4.0394287109375, 4.310791015625, 4.5821533203125, 4.853515625, 5.1248779296875, 5.396240234375, 5.6676025390625, 5.93896484375, 6.2103271484375, 6.481689453125, 6.7530517578125, 7.0244140625, 7.2957763671875, 7.567138671875, 7.8385009765625, 8.10986328125, 8.3812255859375, 8.652587890625, 8.9239501953125, 9.1953125]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 4.0, 8.0, 4.0, 12.0, 8.0, 11.0, 12.0, 17.0, 26.0, 20.0, 20.0, 46.0, 37.0, 41.0, 50.0, 45.0, 45.0, 48.0, 38.0, 48.0, 47.0, 50.0, 43.0, 48.0, 41.0, 28.0, 37.0, 29.0, 19.0, 22.0, 21.0, 17.0, 10.0, 11.0, 9.0, 6.0, 7.0, 2.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.419578552246094, -34.14214324951172, -32.864707946777344, -31.58727264404297, -30.309837341308594, -29.03240203857422, -27.754966735839844, -26.47753143310547, -25.200096130371094, -23.92266082763672, -22.645225524902344, -21.36779022216797, -20.090354919433594, -18.81291961669922, -17.535484313964844, -16.25804901123047, -14.980615615844727, -13.703180313110352, -12.425745010375977, -11.148309707641602, -9.870874404907227, -8.593439102172852, -7.316004753112793, -6.038569450378418, -4.761134147644043, -3.483698844909668, -2.206263780593872, -0.9288287162780762, 0.34860658645629883, 1.6260418891906738, 2.9034767150878906, 4.180912017822266, 5.458347320556641, 6.735782623291016, 8.01321792602539, 9.290653228759766, 10.56808853149414, 11.845523834228516, 13.122958183288574, 14.40039348602295, 15.677828788757324, 16.955263137817383, 18.232698440551758, 19.510133743286133, 20.787569046020508, 22.065004348754883, 23.342439651489258, 24.619874954223633, 25.897310256958008, 27.174745559692383, 28.452180862426758, 29.729616165161133, 31.007051467895508, 32.28448486328125, 33.561920166015625, 34.83935546875, 36.116790771484375, 37.39422607421875, 38.671661376953125, 39.9490966796875, 41.226531982421875, 42.50396728515625, 43.781402587890625, 45.058837890625, 46.336273193359375]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 9.0, 6.0, 7.0, 12.0, 11.0, 13.0, 6.0, 28.0, 8.0, 24.0, 29.0, 24.0, 25.0, 33.0, 42.0, 38.0, 45.0, 35.0, 43.0, 49.0, 45.0, 52.0, 43.0, 31.0, 37.0, 34.0, 38.0, 29.0, 29.0, 30.0, 16.0, 29.0, 17.0, 14.0, 12.0, 15.0, 5.0, 5.0, 13.0, 12.0, 5.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-33.991695404052734, -33.017005920410156, -32.042320251464844, -31.0676326751709, -30.092945098876953, -29.118255615234375, -28.14356803894043, -27.168880462646484, -26.19419288635254, -25.219505310058594, -24.24481773376465, -23.270130157470703, -22.295440673828125, -21.320755004882812, -20.346065521240234, -19.37137794494629, -18.396690368652344, -17.4220027923584, -16.447315216064453, -15.472626686096191, -14.497939109802246, -13.5232515335083, -12.548563003540039, -11.573875427246094, -10.599187850952148, -9.624500274658203, -8.649812698364258, -7.675124168395996, -6.700436592102051, -5.7257490158081055, -4.751060962677002, -3.7763729095458984, -2.801685333251953, -1.8269975185394287, -0.8523097038269043, 0.12237811088562012, 1.0970659255981445, 2.07175350189209, 3.0464415550231934, 4.021129608154297, 4.995817184448242, 5.9705047607421875, 6.945192813873291, 7.9198808670043945, 8.89456844329834, 9.869256019592285, 10.843944549560547, 11.818632125854492, 12.793319702148438, 13.768007278442383, 14.742694854736328, 15.71738338470459, 16.69207000732422, 17.666759490966797, 18.641447067260742, 19.616134643554688, 20.590822219848633, 21.565509796142578, 22.540197372436523, 23.51488494873047, 24.489574432373047, 25.46426010131836, 26.438949584960938, 27.413637161254883, 28.388324737548828]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 7.0, 7.0, 16.0, 14.0, 26.0, 50.0, 71.0, 116.0, 205.0, 337.0, 550.0, 1012.0, 1772.0, 3163.0, 5632.0, 10130.0, 18898.0, 35827.0, 69036.0, 135464.0, 268491.0, 501172.0, 789335.0, 886923.0, 670110.0, 385608.0, 198975.0, 100430.0, 51500.0, 26948.0, 14265.0, 7760.0, 4379.0, 2432.0, 1421.0, 811.0, 505.0, 297.0, 206.0, 129.0, 82.0, 73.0, 38.0, 18.0, 15.0, 14.0, 10.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-43.53125, -42.1396484375, -40.748046875, -39.3564453125, -37.96484375, -36.5732421875, -35.181640625, -33.7900390625, -32.3984375, -31.0068359375, -29.615234375, -28.2236328125, -26.83203125, -25.4404296875, -24.048828125, -22.6572265625, -21.265625, -19.8740234375, -18.482421875, -17.0908203125, -15.69921875, -14.3076171875, -12.916015625, -11.5244140625, -10.1328125, -8.7412109375, -7.349609375, -5.9580078125, -4.56640625, -3.1748046875, -1.783203125, -0.3916015625, 1.0, 2.3916015625, 3.783203125, 5.1748046875, 6.56640625, 7.9580078125, 9.349609375, 10.7412109375, 12.1328125, 13.5244140625, 14.916015625, 16.3076171875, 17.69921875, 19.0908203125, 20.482421875, 21.8740234375, 23.265625, 24.6572265625, 26.048828125, 27.4404296875, 28.83203125, 30.2236328125, 31.615234375, 33.0068359375, 34.3984375, 35.7900390625, 37.181640625, 38.5732421875, 39.96484375, 41.3564453125, 42.748046875, 44.1396484375, 45.53125]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 9.0, 9.0, 5.0, 20.0, 14.0, 12.0, 14.0, 20.0, 17.0, 24.0, 22.0, 32.0, 36.0, 30.0, 42.0, 31.0, 39.0, 37.0, 42.0, 46.0, 46.0, 45.0, 42.0, 33.0, 36.0, 39.0, 41.0, 33.0, 32.0, 17.0, 22.0, 13.0, 12.0, 21.0, 15.0, 10.0, 8.0, 10.0, 8.0, 8.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-29.6875, -28.724609375, -27.76171875, -26.798828125, -25.8359375, -24.873046875, -23.91015625, -22.947265625, -21.984375, -21.021484375, -20.05859375, -19.095703125, -18.1328125, -17.169921875, -16.20703125, -15.244140625, -14.28125, -13.318359375, -12.35546875, -11.392578125, -10.4296875, -9.466796875, -8.50390625, -7.541015625, -6.578125, -5.615234375, -4.65234375, -3.689453125, -2.7265625, -1.763671875, -0.80078125, 0.162109375, 1.125, 2.087890625, 3.05078125, 4.013671875, 4.9765625, 5.939453125, 6.90234375, 7.865234375, 8.828125, 9.791015625, 10.75390625, 11.716796875, 12.6796875, 13.642578125, 14.60546875, 15.568359375, 16.53125, 17.494140625, 18.45703125, 19.419921875, 20.3828125, 21.345703125, 22.30859375, 23.271484375, 24.234375, 25.197265625, 26.16015625, 27.123046875, 28.0859375, 29.048828125, 30.01171875, 30.974609375, 31.9375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 0.0, 7.0, 10.0, 11.0, 17.0, 29.0, 50.0, 58.0, 108.0, 136.0, 244.0, 362.0, 610.0, 965.0, 1613.0, 2535.0, 4119.0, 6812.0, 11763.0, 19568.0, 34178.0, 58718.0, 102402.0, 177157.0, 301787.0, 483858.0, 677016.0, 737788.0, 599140.0, 399391.0, 241594.0, 139803.0, 80501.0, 46005.0, 26826.0, 15665.0, 9264.0, 5455.0, 3309.0, 2007.0, 1260.0, 792.0, 501.0, 292.0, 223.0, 122.0, 91.0, 47.0, 32.0, 18.0, 19.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-49.34375, -47.71435546875, -46.0849609375, -44.45556640625, -42.826171875, -41.19677734375, -39.5673828125, -37.93798828125, -36.30859375, -34.67919921875, -33.0498046875, -31.42041015625, -29.791015625, -28.16162109375, -26.5322265625, -24.90283203125, -23.2734375, -21.64404296875, -20.0146484375, -18.38525390625, -16.755859375, -15.12646484375, -13.4970703125, -11.86767578125, -10.23828125, -8.60888671875, -6.9794921875, -5.35009765625, -3.720703125, -2.09130859375, -0.4619140625, 1.16748046875, 2.796875, 4.42626953125, 6.0556640625, 7.68505859375, 9.314453125, 10.94384765625, 12.5732421875, 14.20263671875, 15.83203125, 17.46142578125, 19.0908203125, 20.72021484375, 22.349609375, 23.97900390625, 25.6083984375, 27.23779296875, 28.8671875, 30.49658203125, 32.1259765625, 33.75537109375, 35.384765625, 37.01416015625, 38.6435546875, 40.27294921875, 41.90234375, 43.53173828125, 45.1611328125, 46.79052734375, 48.419921875, 50.04931640625, 51.6787109375, 53.30810546875, 54.9375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 6.0, 17.0, 13.0, 17.0, 31.0, 35.0, 29.0, 49.0, 56.0, 82.0, 90.0, 121.0, 160.0, 169.0, 203.0, 218.0, 257.0, 274.0, 258.0, 272.0, 233.0, 270.0, 239.0, 196.0, 158.0, 116.0, 94.0, 91.0, 65.0, 60.0, 51.0, 31.0, 32.0, 22.0, 15.0, 12.0, 10.0, 6.0, 10.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.796875, -19.17333984375, -18.5498046875, -17.92626953125, -17.302734375, -16.67919921875, -16.0556640625, -15.43212890625, -14.80859375, -14.18505859375, -13.5615234375, -12.93798828125, -12.314453125, -11.69091796875, -11.0673828125, -10.44384765625, -9.8203125, -9.19677734375, -8.5732421875, -7.94970703125, -7.326171875, -6.70263671875, -6.0791015625, -5.45556640625, -4.83203125, -4.20849609375, -3.5849609375, -2.96142578125, -2.337890625, -1.71435546875, -1.0908203125, -0.46728515625, 0.15625, 0.77978515625, 1.4033203125, 2.02685546875, 2.650390625, 3.27392578125, 3.8974609375, 4.52099609375, 5.14453125, 5.76806640625, 6.3916015625, 7.01513671875, 7.638671875, 8.26220703125, 8.8857421875, 9.50927734375, 10.1328125, 10.75634765625, 11.3798828125, 12.00341796875, 12.626953125, 13.25048828125, 13.8740234375, 14.49755859375, 15.12109375, 15.74462890625, 16.3681640625, 16.99169921875, 17.615234375, 18.23876953125, 18.8623046875, 19.48583984375, 20.109375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 9.0, 7.0, 6.0, 15.0, 11.0, 14.0, 15.0, 30.0, 29.0, 34.0, 30.0, 40.0, 42.0, 49.0, 44.0, 41.0, 54.0, 58.0, 46.0, 55.0, 54.0, 45.0, 43.0, 21.0, 38.0, 27.0, 23.0, 23.0, 23.0, 16.0, 6.0, 11.0, 10.0, 12.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-54.776466369628906, -52.83802032470703, -50.89957046508789, -48.961124420166016, -47.022674560546875, -45.084228515625, -43.145782470703125, -41.207332611083984, -39.268882751464844, -37.33043670654297, -35.39198684692383, -33.45354080200195, -31.515090942382812, -29.576644897460938, -27.63819694519043, -25.699748992919922, -23.761302947998047, -21.82285499572754, -19.88440704345703, -17.945960998535156, -16.007511138916016, -14.069064140319824, -12.130617141723633, -10.192169189453125, -8.253721237182617, -6.315273284912109, -4.37682580947876, -2.43837833404541, -0.49993038177490234, 1.4385175704956055, 3.376964569091797, 5.315412521362305, 7.2538604736328125, 9.19230842590332, 11.130756378173828, 13.06920337677002, 15.007651329040527, 16.94609832763672, 18.884546279907227, 20.822994232177734, 22.761442184448242, 24.69989013671875, 26.638338088989258, 28.576786041259766, 30.51523208618164, 32.45368194580078, 34.392127990722656, 36.33057403564453, 38.26902389526367, 40.20746994018555, 42.14591979980469, 44.08436584472656, 46.0228157043457, 47.96126174926758, 49.89971160888672, 51.838157653808594, 53.77660369873047, 55.715049743652344, 57.653499603271484, 59.59194564819336, 61.5303955078125, 63.468841552734375, 65.40728759765625, 67.34573364257812, 69.28418731689453]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 8.0, 12.0, 6.0, 9.0, 9.0, 10.0, 18.0, 20.0, 21.0, 26.0, 22.0, 30.0, 29.0, 38.0, 31.0, 42.0, 34.0, 41.0, 48.0, 37.0, 41.0, 32.0, 34.0, 37.0, 31.0, 37.0, 45.0, 29.0, 35.0, 26.0, 23.0, 22.0, 12.0, 15.0, 13.0, 12.0, 13.0, 12.0, 14.0, 4.0, 7.0, 8.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-45.55194854736328, -44.18765640258789, -42.8233642578125, -41.459068298339844, -40.09477615356445, -38.73048400878906, -37.36619186401367, -36.00189971923828, -34.637603759765625, -33.273311614990234, -31.90901756286621, -30.54472541809082, -29.180431365966797, -27.816139221191406, -26.451847076416016, -25.087554931640625, -23.723262786865234, -22.358970642089844, -20.99467658996582, -19.63038444519043, -18.266090393066406, -16.901798248291016, -15.537506103515625, -14.173213005065918, -12.808919906616211, -11.444626808166504, -10.080333709716797, -8.716041564941406, -7.351748466491699, -5.987455368041992, -4.623163223266602, -3.2588701248168945, -1.8945770263671875, -0.5302841663360596, 0.8340086936950684, 2.198301315307617, 3.562594413757324, 4.926887512207031, 6.291179656982422, 7.655472755432129, 9.019765853881836, 10.384058952331543, 11.74835205078125, 13.11264419555664, 14.476937294006348, 15.841230392456055, 17.205522537231445, 18.56981658935547, 19.93410873413086, 21.29840087890625, 22.662694931030273, 24.026987075805664, 25.391281127929688, 26.755573272705078, 28.11986541748047, 29.48415756225586, 30.848451614379883, 32.212745666503906, 33.5770378112793, 34.94132995605469, 36.30562210083008, 37.66991424560547, 39.034210205078125, 40.398502349853516, 41.762794494628906]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 5.0, 12.0, 18.0, 34.0, 40.0, 57.0, 98.0, 132.0, 228.0, 314.0, 426.0, 689.0, 1040.0, 1622.0, 2529.0, 3679.0, 5609.0, 8628.0, 13261.0, 20639.0, 32014.0, 47661.0, 70233.0, 97913.0, 123687.0, 137379.0, 130417.0, 107484.0, 80126.0, 55740.0, 37235.0, 24151.0, 15835.0, 10360.0, 6558.0, 4394.0, 2851.0, 1958.0, 1177.0, 774.0, 559.0, 334.0, 182.0, 166.0, 104.0, 71.0, 65.0, 24.0, 19.0, 14.0, 8.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0], "bins": [-25.25, -24.453125, -23.65625, -22.859375, -22.0625, -21.265625, -20.46875, -19.671875, -18.875, -18.078125, -17.28125, -16.484375, -15.6875, -14.890625, -14.09375, -13.296875, -12.5, -11.703125, -10.90625, -10.109375, -9.3125, -8.515625, -7.71875, -6.921875, -6.125, -5.328125, -4.53125, -3.734375, -2.9375, -2.140625, -1.34375, -0.546875, 0.25, 1.046875, 1.84375, 2.640625, 3.4375, 4.234375, 5.03125, 5.828125, 6.625, 7.421875, 8.21875, 9.015625, 9.8125, 10.609375, 11.40625, 12.203125, 13.0, 13.796875, 14.59375, 15.390625, 16.1875, 16.984375, 17.78125, 18.578125, 19.375, 20.171875, 20.96875, 21.765625, 22.5625, 23.359375, 24.15625, 24.953125, 25.75]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 6.0, 8.0, 9.0, 14.0, 9.0, 12.0, 25.0, 22.0, 21.0, 28.0, 30.0, 34.0, 47.0, 28.0, 39.0, 38.0, 36.0, 54.0, 40.0, 45.0, 32.0, 33.0, 47.0, 39.0, 41.0, 39.0, 34.0, 30.0, 26.0, 23.0, 12.0, 13.0, 10.0, 15.0, 14.0, 9.0, 6.0, 8.0, 6.0, 3.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.53125, -46.95654296875, -45.3818359375, -43.80712890625, -42.232421875, -40.65771484375, -39.0830078125, -37.50830078125, -35.93359375, -34.35888671875, -32.7841796875, -31.20947265625, -29.634765625, -28.06005859375, -26.4853515625, -24.91064453125, -23.3359375, -21.76123046875, -20.1865234375, -18.61181640625, -17.037109375, -15.46240234375, -13.8876953125, -12.31298828125, -10.73828125, -9.16357421875, -7.5888671875, -6.01416015625, -4.439453125, -2.86474609375, -1.2900390625, 0.28466796875, 1.859375, 3.43408203125, 5.0087890625, 6.58349609375, 8.158203125, 9.73291015625, 11.3076171875, 12.88232421875, 14.45703125, 16.03173828125, 17.6064453125, 19.18115234375, 20.755859375, 22.33056640625, 23.9052734375, 25.47998046875, 27.0546875, 28.62939453125, 30.2041015625, 31.77880859375, 33.353515625, 34.92822265625, 36.5029296875, 38.07763671875, 39.65234375, 41.22705078125, 42.8017578125, 44.37646484375, 45.951171875, 47.52587890625, 49.1005859375, 50.67529296875, 52.25]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 9.0, 9.0, 16.0, 14.0, 36.0, 56.0, 69.0, 93.0, 177.0, 264.0, 466.0, 659.0, 1133.0, 1787.0, 2996.0, 5131.0, 9326.0, 16460.0, 29720.0, 54483.0, 97210.0, 158343.0, 207225.0, 184016.0, 121621.0, 69980.0, 38395.0, 21172.0, 11760.0, 6390.0, 3687.0, 2291.0, 1339.0, 798.0, 485.0, 344.0, 202.0, 132.0, 85.0, 60.0, 46.0, 23.0, 28.0, 6.0, 8.0, 5.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.21875, -36.8876953125, -35.556640625, -34.2255859375, -32.89453125, -31.5634765625, -30.232421875, -28.9013671875, -27.5703125, -26.2392578125, -24.908203125, -23.5771484375, -22.24609375, -20.9150390625, -19.583984375, -18.2529296875, -16.921875, -15.5908203125, -14.259765625, -12.9287109375, -11.59765625, -10.2666015625, -8.935546875, -7.6044921875, -6.2734375, -4.9423828125, -3.611328125, -2.2802734375, -0.94921875, 0.3818359375, 1.712890625, 3.0439453125, 4.375, 5.7060546875, 7.037109375, 8.3681640625, 9.69921875, 11.0302734375, 12.361328125, 13.6923828125, 15.0234375, 16.3544921875, 17.685546875, 19.0166015625, 20.34765625, 21.6787109375, 23.009765625, 24.3408203125, 25.671875, 27.0029296875, 28.333984375, 29.6650390625, 30.99609375, 32.3271484375, 33.658203125, 34.9892578125, 36.3203125, 37.6513671875, 38.982421875, 40.3134765625, 41.64453125, 42.9755859375, 44.306640625, 45.6376953125, 46.96875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 3.0, 6.0, 9.0, 4.0, 7.0, 12.0, 11.0, 19.0, 20.0, 19.0, 35.0, 25.0, 24.0, 33.0, 32.0, 38.0, 32.0, 58.0, 57.0, 47.0, 42.0, 36.0, 36.0, 32.0, 39.0, 33.0, 40.0, 35.0, 35.0, 33.0, 27.0, 24.0, 19.0, 21.0, 15.0, 7.0, 9.0, 5.0, 11.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.3125, -24.433349609375, -23.55419921875, -22.675048828125, -21.7958984375, -20.916748046875, -20.03759765625, -19.158447265625, -18.279296875, -17.400146484375, -16.52099609375, -15.641845703125, -14.7626953125, -13.883544921875, -13.00439453125, -12.125244140625, -11.24609375, -10.366943359375, -9.48779296875, -8.608642578125, -7.7294921875, -6.850341796875, -5.97119140625, -5.092041015625, -4.212890625, -3.333740234375, -2.45458984375, -1.575439453125, -0.6962890625, 0.182861328125, 1.06201171875, 1.941162109375, 2.8203125, 3.699462890625, 4.57861328125, 5.457763671875, 6.3369140625, 7.216064453125, 8.09521484375, 8.974365234375, 9.853515625, 10.732666015625, 11.61181640625, 12.490966796875, 13.3701171875, 14.249267578125, 15.12841796875, 16.007568359375, 16.88671875, 17.765869140625, 18.64501953125, 19.524169921875, 20.4033203125, 21.282470703125, 22.16162109375, 23.040771484375, 23.919921875, 24.799072265625, 25.67822265625, 26.557373046875, 27.4365234375, 28.315673828125, 29.19482421875, 30.073974609375, 30.953125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 9.0, 15.0, 16.0, 19.0, 39.0, 43.0, 72.0, 113.0, 189.0, 291.0, 444.0, 794.0, 1286.0, 2282.0, 3925.0, 7162.0, 12988.0, 24749.0, 47365.0, 88257.0, 157779.0, 225541.0, 203013.0, 126129.0, 68411.0, 35478.0, 18732.0, 10119.0, 5668.0, 3097.0, 1721.0, 1076.0, 630.0, 387.0, 254.0, 150.0, 107.0, 60.0, 40.0, 39.0, 21.0, 19.0, 9.0, 12.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.578125, -20.8017578125, -20.025390625, -19.2490234375, -18.47265625, -17.6962890625, -16.919921875, -16.1435546875, -15.3671875, -14.5908203125, -13.814453125, -13.0380859375, -12.26171875, -11.4853515625, -10.708984375, -9.9326171875, -9.15625, -8.3798828125, -7.603515625, -6.8271484375, -6.05078125, -5.2744140625, -4.498046875, -3.7216796875, -2.9453125, -2.1689453125, -1.392578125, -0.6162109375, 0.16015625, 0.9365234375, 1.712890625, 2.4892578125, 3.265625, 4.0419921875, 4.818359375, 5.5947265625, 6.37109375, 7.1474609375, 7.923828125, 8.7001953125, 9.4765625, 10.2529296875, 11.029296875, 11.8056640625, 12.58203125, 13.3583984375, 14.134765625, 14.9111328125, 15.6875, 16.4638671875, 17.240234375, 18.0166015625, 18.79296875, 19.5693359375, 20.345703125, 21.1220703125, 21.8984375, 22.6748046875, 23.451171875, 24.2275390625, 25.00390625, 25.7802734375, 26.556640625, 27.3330078125, 28.109375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 3.0, 6.0, 6.0, 5.0, 8.0, 14.0, 13.0, 18.0, 22.0, 23.0, 33.0, 33.0, 28.0, 51.0, 39.0, 39.0, 53.0, 52.0, 43.0, 48.0, 50.0, 46.0, 46.0, 40.0, 30.0, 29.0, 29.0, 27.0, 32.0, 16.0, 12.0, 18.0, 13.0, 15.0, 16.0, 12.0, 5.0, 4.0, 4.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008177757263183594, -0.0007904618978500366, -0.0007631480693817139, -0.0007358342409133911, -0.0007085204124450684, -0.0006812065839767456, -0.0006538927555084229, -0.0006265789270401001, -0.0005992650985717773, -0.0005719512701034546, -0.0005446374416351318, -0.0005173236131668091, -0.0004900097846984863, -0.0004626959562301636, -0.0004353821277618408, -0.00040806829929351807, -0.0003807544708251953, -0.00035344064235687256, -0.0003261268138885498, -0.00029881298542022705, -0.0002714991569519043, -0.00024418532848358154, -0.0002168715000152588, -0.00018955767154693604, -0.00016224384307861328, -0.00013493001461029053, -0.00010761618614196777, -8.030235767364502e-05, -5.2988529205322266e-05, -2.5674700736999512e-05, 1.6391277313232422e-06, 2.8952956199645996e-05, 5.626678466796875e-05, 8.35806131362915e-05, 0.00011089444160461426, 0.000138208270072937, 0.00016552209854125977, 0.00019283592700958252, 0.00022014975547790527, 0.00024746358394622803, 0.0002747774124145508, 0.00030209124088287354, 0.0003294050693511963, 0.00035671889781951904, 0.0003840327262878418, 0.00041134655475616455, 0.0004386603832244873, 0.00046597421169281006, 0.0004932880401611328, 0.0005206018686294556, 0.0005479156970977783, 0.0005752295255661011, 0.0006025433540344238, 0.0006298571825027466, 0.0006571710109710693, 0.0006844848394393921, 0.0007117986679077148, 0.0007391124963760376, 0.0007664263248443604, 0.0007937401533126831, 0.0008210539817810059, 0.0008483678102493286, 0.0008756816387176514, 0.0009029954671859741, 0.0009303092956542969]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 6.0, 4.0, 6.0, 5.0, 14.0, 15.0, 22.0, 29.0, 41.0, 75.0, 85.0, 159.0, 224.0, 280.0, 500.0, 732.0, 1141.0, 1849.0, 2863.0, 4708.0, 8049.0, 14632.0, 26361.0, 48814.0, 86490.0, 139372.0, 188151.0, 186947.0, 139789.0, 86278.0, 48794.0, 26455.0, 14807.0, 8248.0, 4646.0, 2837.0, 1817.0, 1141.0, 742.0, 443.0, 306.0, 197.0, 165.0, 109.0, 56.0, 51.0, 36.0, 30.0, 16.0, 9.0, 7.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.375, -23.5625, -22.75, -21.9375, -21.125, -20.3125, -19.5, -18.6875, -17.875, -17.0625, -16.25, -15.4375, -14.625, -13.8125, -13.0, -12.1875, -11.375, -10.5625, -9.75, -8.9375, -8.125, -7.3125, -6.5, -5.6875, -4.875, -4.0625, -3.25, -2.4375, -1.625, -0.8125, 0.0, 0.8125, 1.625, 2.4375, 3.25, 4.0625, 4.875, 5.6875, 6.5, 7.3125, 8.125, 8.9375, 9.75, 10.5625, 11.375, 12.1875, 13.0, 13.8125, 14.625, 15.4375, 16.25, 17.0625, 17.875, 18.6875, 19.5, 20.3125, 21.125, 21.9375, 22.75, 23.5625, 24.375, 25.1875, 26.0, 26.8125, 27.625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 7.0, 4.0, 7.0, 9.0, 7.0, 15.0, 17.0, 14.0, 15.0, 18.0, 25.0, 33.0, 33.0, 27.0, 41.0, 39.0, 50.0, 59.0, 52.0, 46.0, 39.0, 56.0, 57.0, 48.0, 43.0, 40.0, 31.0, 27.0, 19.0, 17.0, 17.0, 18.0, 11.0, 9.0, 13.0, 5.0, 10.0, 2.0, 6.0, 3.0, 7.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-7.03125, -6.82421875, -6.6171875, -6.41015625, -6.203125, -5.99609375, -5.7890625, -5.58203125, -5.375, -5.16796875, -4.9609375, -4.75390625, -4.546875, -4.33984375, -4.1328125, -3.92578125, -3.71875, -3.51171875, -3.3046875, -3.09765625, -2.890625, -2.68359375, -2.4765625, -2.26953125, -2.0625, -1.85546875, -1.6484375, -1.44140625, -1.234375, -1.02734375, -0.8203125, -0.61328125, -0.40625, -0.19921875, 0.0078125, 0.21484375, 0.421875, 0.62890625, 0.8359375, 1.04296875, 1.25, 1.45703125, 1.6640625, 1.87109375, 2.078125, 2.28515625, 2.4921875, 2.69921875, 2.90625, 3.11328125, 3.3203125, 3.52734375, 3.734375, 3.94140625, 4.1484375, 4.35546875, 4.5625, 4.76953125, 4.9765625, 5.18359375, 5.390625, 5.59765625, 5.8046875, 6.01171875, 6.21875]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 7.0, 6.0, 5.0, 4.0, 8.0, 10.0, 9.0, 12.0, 19.0, 21.0, 26.0, 34.0, 36.0, 34.0, 35.0, 41.0, 52.0, 39.0, 48.0, 53.0, 45.0, 43.0, 56.0, 43.0, 47.0, 39.0, 30.0, 36.0, 23.0, 22.0, 21.0, 20.0, 15.0, 13.0, 12.0, 15.0, 4.0, 6.0, 5.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.782806396484375, -50.89947509765625, -49.016143798828125, -47.132808685302734, -45.24947738647461, -43.366146087646484, -41.482810974121094, -39.59947967529297, -37.716148376464844, -35.83281707763672, -33.949485778808594, -32.0661506652832, -30.182819366455078, -28.299488067626953, -26.416154861450195, -24.532821655273438, -22.649490356445312, -20.766159057617188, -18.88282585144043, -16.999492645263672, -15.116161346435547, -13.232829093933105, -11.349496841430664, -9.466164588928223, -7.582832336425781, -5.69950008392334, -3.8161678314208984, -1.932835578918457, -0.049503326416015625, 1.8338289260864258, 3.717161178588867, 5.600493431091309, 7.48382568359375, 9.367157936096191, 11.250490188598633, 13.133822441101074, 15.017154693603516, 16.90048599243164, 18.7838191986084, 20.667152404785156, 22.55048370361328, 24.433815002441406, 26.317148208618164, 28.200481414794922, 30.083812713623047, 31.967144012451172, 33.85047912597656, 35.73381042480469, 37.61714172363281, 39.50047302246094, 41.38380432128906, 43.26713943481445, 45.15047073364258, 47.0338020324707, 48.917137145996094, 50.80046844482422, 52.683799743652344, 54.56713104248047, 56.450462341308594, 58.333797454833984, 60.21712875366211, 62.100460052490234, 63.983795166015625, 65.86712646484375, 67.75045776367188]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 7.0, 12.0, 5.0, 10.0, 11.0, 15.0, 16.0, 20.0, 26.0, 21.0, 30.0, 39.0, 29.0, 31.0, 37.0, 38.0, 40.0, 50.0, 44.0, 31.0, 35.0, 44.0, 29.0, 30.0, 41.0, 42.0, 29.0, 42.0, 27.0, 24.0, 19.0, 16.0, 14.0, 13.0, 10.0, 11.0, 16.0, 9.0, 11.0, 3.0, 7.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-46.820247650146484, -45.43103790283203, -44.04182815551758, -42.652618408203125, -41.263404846191406, -39.87419509887695, -38.4849853515625, -37.09577560424805, -35.706565856933594, -34.31735610961914, -32.92814636230469, -31.5389347076416, -30.149723052978516, -28.760513305664062, -27.37130355834961, -25.982093811035156, -24.592880249023438, -23.203670501708984, -21.8144588470459, -20.425249099731445, -19.03603744506836, -17.646827697753906, -16.257617950439453, -14.868407249450684, -13.479196548461914, -12.089985847473145, -10.700775146484375, -9.311565399169922, -7.922354698181152, -6.533143997192383, -5.14393424987793, -3.75472354888916, -2.3655128479003906, -0.9763023853302002, 0.41290807723999023, 1.8021183013916016, 3.191329002380371, 4.580539703369141, 5.969749450683594, 7.358960151672363, 8.748170852661133, 10.137381553649902, 11.526592254638672, 12.915802001953125, 14.305012702941895, 15.694223403930664, 17.083433151245117, 18.472644805908203, 19.861854553222656, 21.25106430053711, 22.640275955200195, 24.02948570251465, 25.418697357177734, 26.807907104492188, 28.19711685180664, 29.586326599121094, 30.97553825378418, 32.364749908447266, 33.75395965576172, 35.14316940307617, 36.532379150390625, 37.921592712402344, 39.31079864501953, 40.70001220703125, 42.0892219543457]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 5.0, 12.0, 12.0, 14.0, 31.0, 41.0, 64.0, 82.0, 111.0, 198.0, 290.0, 374.0, 592.0, 904.0, 1304.0, 2012.0, 2858.0, 4231.0, 6128.0, 9091.0, 13072.0, 19207.0, 27290.0, 38282.0, 52715.0, 69469.0, 87459.0, 102190.0, 109943.0, 107545.0, 96194.0, 79966.0, 62387.0, 46283.0, 33480.0, 23427.0, 16195.0, 11346.0, 7540.0, 5143.0, 3526.0, 2375.0, 1669.0, 1137.0, 797.0, 499.0, 327.0, 254.0, 170.0, 122.0, 66.0, 59.0, 25.0, 20.0, 12.0, 6.0, 8.0, 5.0, 1.0, 2.0], "bins": [-28.015625, -27.1611328125, -26.306640625, -25.4521484375, -24.59765625, -23.7431640625, -22.888671875, -22.0341796875, -21.1796875, -20.3251953125, -19.470703125, -18.6162109375, -17.76171875, -16.9072265625, -16.052734375, -15.1982421875, -14.34375, -13.4892578125, -12.634765625, -11.7802734375, -10.92578125, -10.0712890625, -9.216796875, -8.3623046875, -7.5078125, -6.6533203125, -5.798828125, -4.9443359375, -4.08984375, -3.2353515625, -2.380859375, -1.5263671875, -0.671875, 0.1826171875, 1.037109375, 1.8916015625, 2.74609375, 3.6005859375, 4.455078125, 5.3095703125, 6.1640625, 7.0185546875, 7.873046875, 8.7275390625, 9.58203125, 10.4365234375, 11.291015625, 12.1455078125, 13.0, 13.8544921875, 14.708984375, 15.5634765625, 16.41796875, 17.2724609375, 18.126953125, 18.9814453125, 19.8359375, 20.6904296875, 21.544921875, 22.3994140625, 23.25390625, 24.1083984375, 24.962890625, 25.8173828125, 26.671875]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 10.0, 5.0, 8.0, 11.0, 6.0, 7.0, 5.0, 17.0, 15.0, 19.0, 27.0, 30.0, 23.0, 32.0, 31.0, 35.0, 42.0, 34.0, 37.0, 39.0, 38.0, 42.0, 44.0, 30.0, 37.0, 34.0, 29.0, 34.0, 44.0, 44.0, 22.0, 28.0, 19.0, 22.0, 18.0, 14.0, 15.0, 6.0, 5.0, 11.0, 9.0, 4.0, 6.0, 3.0, 3.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.28125, -39.89208984375, -38.5029296875, -37.11376953125, -35.724609375, -34.33544921875, -32.9462890625, -31.55712890625, -30.16796875, -28.77880859375, -27.3896484375, -26.00048828125, -24.611328125, -23.22216796875, -21.8330078125, -20.44384765625, -19.0546875, -17.66552734375, -16.2763671875, -14.88720703125, -13.498046875, -12.10888671875, -10.7197265625, -9.33056640625, -7.94140625, -6.55224609375, -5.1630859375, -3.77392578125, -2.384765625, -0.99560546875, 0.3935546875, 1.78271484375, 3.171875, 4.56103515625, 5.9501953125, 7.33935546875, 8.728515625, 10.11767578125, 11.5068359375, 12.89599609375, 14.28515625, 15.67431640625, 17.0634765625, 18.45263671875, 19.841796875, 21.23095703125, 22.6201171875, 24.00927734375, 25.3984375, 26.78759765625, 28.1767578125, 29.56591796875, 30.955078125, 32.34423828125, 33.7333984375, 35.12255859375, 36.51171875, 37.90087890625, 39.2900390625, 40.67919921875, 42.068359375, 43.45751953125, 44.8466796875, 46.23583984375, 47.625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 8.0, 7.0, 6.0, 19.0, 27.0, 38.0, 62.0, 84.0, 113.0, 172.0, 287.0, 383.0, 620.0, 867.0, 1356.0, 2183.0, 3352.0, 5436.0, 8888.0, 14929.0, 25966.0, 45965.0, 82188.0, 138235.0, 193126.0, 192920.0, 138013.0, 82274.0, 46152.0, 26217.0, 14816.0, 8722.0, 5509.0, 3420.0, 2090.0, 1365.0, 909.0, 601.0, 407.0, 288.0, 156.0, 117.0, 86.0, 62.0, 36.0, 32.0, 23.0, 13.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-74.5625, -72.232421875, -69.90234375, -67.572265625, -65.2421875, -62.912109375, -60.58203125, -58.251953125, -55.921875, -53.591796875, -51.26171875, -48.931640625, -46.6015625, -44.271484375, -41.94140625, -39.611328125, -37.28125, -34.951171875, -32.62109375, -30.291015625, -27.9609375, -25.630859375, -23.30078125, -20.970703125, -18.640625, -16.310546875, -13.98046875, -11.650390625, -9.3203125, -6.990234375, -4.66015625, -2.330078125, 0.0, 2.330078125, 4.66015625, 6.990234375, 9.3203125, 11.650390625, 13.98046875, 16.310546875, 18.640625, 20.970703125, 23.30078125, 25.630859375, 27.9609375, 30.291015625, 32.62109375, 34.951171875, 37.28125, 39.611328125, 41.94140625, 44.271484375, 46.6015625, 48.931640625, 51.26171875, 53.591796875, 55.921875, 58.251953125, 60.58203125, 62.912109375, 65.2421875, 67.572265625, 69.90234375, 72.232421875, 74.5625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 7.0, 5.0, 13.0, 14.0, 14.0, 15.0, 20.0, 21.0, 15.0, 32.0, 28.0, 31.0, 34.0, 39.0, 46.0, 32.0, 45.0, 54.0, 58.0, 36.0, 34.0, 40.0, 50.0, 51.0, 31.0, 25.0, 29.0, 24.0, 20.0, 31.0, 16.0, 12.0, 11.0, 12.0, 16.0, 11.0, 5.0, 2.0, 2.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.8125, -34.59326171875, -33.3740234375, -32.15478515625, -30.935546875, -29.71630859375, -28.4970703125, -27.27783203125, -26.05859375, -24.83935546875, -23.6201171875, -22.40087890625, -21.181640625, -19.96240234375, -18.7431640625, -17.52392578125, -16.3046875, -15.08544921875, -13.8662109375, -12.64697265625, -11.427734375, -10.20849609375, -8.9892578125, -7.77001953125, -6.55078125, -5.33154296875, -4.1123046875, -2.89306640625, -1.673828125, -0.45458984375, 0.7646484375, 1.98388671875, 3.203125, 4.42236328125, 5.6416015625, 6.86083984375, 8.080078125, 9.29931640625, 10.5185546875, 11.73779296875, 12.95703125, 14.17626953125, 15.3955078125, 16.61474609375, 17.833984375, 19.05322265625, 20.2724609375, 21.49169921875, 22.7109375, 23.93017578125, 25.1494140625, 26.36865234375, 27.587890625, 28.80712890625, 30.0263671875, 31.24560546875, 32.46484375, 33.68408203125, 34.9033203125, 36.12255859375, 37.341796875, 38.56103515625, 39.7802734375, 40.99951171875, 42.21875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 7.0, 10.0, 16.0, 12.0, 17.0, 37.0, 42.0, 68.0, 118.0, 171.0, 285.0, 563.0, 875.0, 1615.0, 2933.0, 5321.0, 9907.0, 19371.0, 38934.0, 79463.0, 151829.0, 226254.0, 220710.0, 141216.0, 74297.0, 36163.0, 18177.0, 9163.0, 4863.0, 2606.0, 1448.0, 801.0, 484.0, 284.0, 176.0, 85.0, 68.0, 56.0, 34.0, 23.0, 17.0, 6.0, 13.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-52.15625, -50.61962890625, -49.0830078125, -47.54638671875, -46.009765625, -44.47314453125, -42.9365234375, -41.39990234375, -39.86328125, -38.32666015625, -36.7900390625, -35.25341796875, -33.716796875, -32.18017578125, -30.6435546875, -29.10693359375, -27.5703125, -26.03369140625, -24.4970703125, -22.96044921875, -21.423828125, -19.88720703125, -18.3505859375, -16.81396484375, -15.27734375, -13.74072265625, -12.2041015625, -10.66748046875, -9.130859375, -7.59423828125, -6.0576171875, -4.52099609375, -2.984375, -1.44775390625, 0.0888671875, 1.62548828125, 3.162109375, 4.69873046875, 6.2353515625, 7.77197265625, 9.30859375, 10.84521484375, 12.3818359375, 13.91845703125, 15.455078125, 16.99169921875, 18.5283203125, 20.06494140625, 21.6015625, 23.13818359375, 24.6748046875, 26.21142578125, 27.748046875, 29.28466796875, 30.8212890625, 32.35791015625, 33.89453125, 35.43115234375, 36.9677734375, 38.50439453125, 40.041015625, 41.57763671875, 43.1142578125, 44.65087890625, 46.1875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 4.0, 4.0, 11.0, 8.0, 10.0, 14.0, 6.0, 20.0, 33.0, 40.0, 48.0, 69.0, 75.0, 77.0, 76.0, 106.0, 82.0, 81.0, 58.0, 44.0, 28.0, 34.0, 15.0, 23.0, 6.0, 12.0, 3.0, 3.0, 3.0, 2.0, 7.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.005977630615234375, -0.00580209493637085, -0.005626559257507324, -0.005451023578643799, -0.0052754878997802734, -0.005099952220916748, -0.004924416542053223, -0.004748880863189697, -0.004573345184326172, -0.0043978095054626465, -0.004222273826599121, -0.004046738147735596, -0.0038712024688720703, -0.003695666790008545, -0.0035201311111450195, -0.003344595432281494, -0.0031690597534179688, -0.0029935240745544434, -0.002817988395690918, -0.0026424527168273926, -0.002466917037963867, -0.002291381359100342, -0.0021158456802368164, -0.001940310001373291, -0.0017647743225097656, -0.0015892386436462402, -0.0014137029647827148, -0.0012381672859191895, -0.001062631607055664, -0.0008870959281921387, -0.0007115602493286133, -0.0005360245704650879, -0.0003604888916015625, -0.0001849532127380371, -9.417533874511719e-06, 0.00016611814498901367, 0.00034165382385253906, 0.0005171895027160645, 0.0006927251815795898, 0.0008682608604431152, 0.0010437965393066406, 0.001219332218170166, 0.0013948678970336914, 0.0015704035758972168, 0.0017459392547607422, 0.0019214749336242676, 0.002097010612487793, 0.0022725462913513184, 0.0024480819702148438, 0.002623617649078369, 0.0027991533279418945, 0.00297468900680542, 0.0031502246856689453, 0.0033257603645324707, 0.003501296043395996, 0.0036768317222595215, 0.003852367401123047, 0.004027903079986572, 0.004203438758850098, 0.004378974437713623, 0.0045545101165771484, 0.004730045795440674, 0.004905581474304199, 0.005081117153167725, 0.00525665283203125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 4.0, 8.0, 11.0, 19.0, 22.0, 43.0, 49.0, 68.0, 105.0, 134.0, 222.0, 299.0, 457.0, 695.0, 966.0, 1394.0, 2072.0, 3061.0, 4621.0, 6828.0, 10779.0, 16496.0, 25635.0, 40094.0, 61495.0, 91021.0, 124157.0, 147225.0, 144287.0, 119075.0, 85025.0, 56928.0, 36932.0, 23699.0, 15457.0, 9870.0, 6257.0, 4237.0, 2757.0, 1950.0, 1310.0, 888.0, 587.0, 397.0, 289.0, 207.0, 129.0, 99.0, 70.0, 33.0, 29.0, 24.0, 22.0, 12.0, 6.0, 4.0, 1.0, 0.0, 2.0, 2.0, 4.0], "bins": [-26.75, -25.884521484375, -25.01904296875, -24.153564453125, -23.2880859375, -22.422607421875, -21.55712890625, -20.691650390625, -19.826171875, -18.960693359375, -18.09521484375, -17.229736328125, -16.3642578125, -15.498779296875, -14.63330078125, -13.767822265625, -12.90234375, -12.036865234375, -11.17138671875, -10.305908203125, -9.4404296875, -8.574951171875, -7.70947265625, -6.843994140625, -5.978515625, -5.113037109375, -4.24755859375, -3.382080078125, -2.5166015625, -1.651123046875, -0.78564453125, 0.079833984375, 0.9453125, 1.810791015625, 2.67626953125, 3.541748046875, 4.4072265625, 5.272705078125, 6.13818359375, 7.003662109375, 7.869140625, 8.734619140625, 9.60009765625, 10.465576171875, 11.3310546875, 12.196533203125, 13.06201171875, 13.927490234375, 14.79296875, 15.658447265625, 16.52392578125, 17.389404296875, 18.2548828125, 19.120361328125, 19.98583984375, 20.851318359375, 21.716796875, 22.582275390625, 23.44775390625, 24.313232421875, 25.1787109375, 26.044189453125, 26.90966796875, 27.775146484375, 28.640625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 1.0, 2.0, 4.0, 4.0, 2.0, 4.0, 3.0, 7.0, 11.0, 11.0, 16.0, 17.0, 21.0, 20.0, 30.0, 25.0, 38.0, 31.0, 41.0, 44.0, 55.0, 49.0, 52.0, 39.0, 54.0, 51.0, 46.0, 52.0, 43.0, 49.0, 30.0, 27.0, 22.0, 17.0, 11.0, 15.0, 13.0, 8.0, 7.0, 9.0, 4.0, 4.0, 7.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.0859375, -9.784423828125, -9.48291015625, -9.181396484375, -8.8798828125, -8.578369140625, -8.27685546875, -7.975341796875, -7.673828125, -7.372314453125, -7.07080078125, -6.769287109375, -6.4677734375, -6.166259765625, -5.86474609375, -5.563232421875, -5.26171875, -4.960205078125, -4.65869140625, -4.357177734375, -4.0556640625, -3.754150390625, -3.45263671875, -3.151123046875, -2.849609375, -2.548095703125, -2.24658203125, -1.945068359375, -1.6435546875, -1.342041015625, -1.04052734375, -0.739013671875, -0.4375, -0.135986328125, 0.16552734375, 0.467041015625, 0.7685546875, 1.070068359375, 1.37158203125, 1.673095703125, 1.974609375, 2.276123046875, 2.57763671875, 2.879150390625, 3.1806640625, 3.482177734375, 3.78369140625, 4.085205078125, 4.38671875, 4.688232421875, 4.98974609375, 5.291259765625, 5.5927734375, 5.894287109375, 6.19580078125, 6.497314453125, 6.798828125, 7.100341796875, 7.40185546875, 7.703369140625, 8.0048828125, 8.306396484375, 8.60791015625, 8.909423828125, 9.2109375]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 3.0, 2.0, 4.0, 3.0, 5.0, 13.0, 8.0, 10.0, 17.0, 29.0, 16.0, 27.0, 41.0, 26.0, 35.0, 40.0, 41.0, 45.0, 51.0, 49.0, 48.0, 47.0, 43.0, 38.0, 52.0, 39.0, 35.0, 31.0, 39.0, 32.0, 17.0, 26.0, 19.0, 17.0, 8.0, 9.0, 8.0, 7.0, 11.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-69.01078796386719, -66.85242462158203, -64.69405364990234, -62.53569030761719, -60.37732696533203, -58.21895980834961, -56.06059265136719, -53.90222930908203, -51.74386215209961, -49.58549499511719, -47.42713165283203, -45.26876449584961, -43.11039733886719, -40.95203399658203, -38.79366683959961, -36.63529968261719, -34.47693634033203, -32.31856918334961, -30.160205841064453, -28.00183868408203, -25.843473434448242, -23.685108184814453, -21.52674102783203, -19.368375778198242, -17.210010528564453, -15.051645278930664, -12.893279075622559, -10.734912872314453, -8.576547622680664, -6.418182373046875, -4.2598161697387695, -2.101449966430664, 0.05690765380859375, 2.215273380279541, 4.373639106750488, 6.5320048332214355, 8.690370559692383, 10.848735809326172, 13.007102012634277, 15.165468215942383, 17.323833465576172, 19.48219871520996, 21.64056396484375, 23.798931121826172, 25.95729637145996, 28.11566162109375, 30.274028778076172, 32.432395935058594, 34.59075927734375, 36.74912643432617, 38.90748977661133, 41.06585693359375, 43.224220275878906, 45.38258743286133, 47.54095458984375, 49.699317932128906, 51.85768508911133, 54.01605224609375, 56.174415588378906, 58.33278274536133, 60.49114990234375, 62.649513244628906, 64.80787658691406, 66.96624755859375, 69.1246109008789]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 3.0, 4.0, 7.0, 4.0, 11.0, 8.0, 18.0, 15.0, 12.0, 20.0, 24.0, 30.0, 28.0, 43.0, 32.0, 35.0, 37.0, 29.0, 39.0, 38.0, 47.0, 46.0, 40.0, 45.0, 39.0, 35.0, 33.0, 30.0, 35.0, 19.0, 23.0, 25.0, 27.0, 26.0, 17.0, 9.0, 13.0, 12.0, 6.0, 8.0, 8.0, 1.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.76392364501953, -62.54938888549805, -60.3348503112793, -58.12031555175781, -55.90577697753906, -53.69124221801758, -51.476707458496094, -49.262168884277344, -47.04763412475586, -44.833099365234375, -42.618560791015625, -40.40402603149414, -38.189491271972656, -35.974952697753906, -33.76041793823242, -31.545881271362305, -29.331344604492188, -27.11680793762207, -24.902271270751953, -22.68773651123047, -20.47319984436035, -18.258663177490234, -16.04412841796875, -13.829591751098633, -11.615055084228516, -9.400518417358398, -7.185982704162598, -4.971446514129639, -2.7569103240966797, -0.5423736572265625, 1.6721620559692383, 3.886697769165039, 6.101234436035156, 8.315771102905273, 10.530306816101074, 12.744842529296875, 14.959379196166992, 17.17391586303711, 19.388450622558594, 21.60298728942871, 23.817523956298828, 26.032060623168945, 28.246597290039062, 30.461132049560547, 32.67566680908203, 34.89020538330078, 37.104740142822266, 39.31927490234375, 41.5338134765625, 43.748348236083984, 45.962886810302734, 48.17742156982422, 50.39196014404297, 52.60649490356445, 54.82102966308594, 57.03556823730469, 59.25010299682617, 61.464637756347656, 63.679176330566406, 65.89371490478516, 68.10824584960938, 70.32278442382812, 72.53732299804688, 74.7518539428711, 76.96639251708984]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 7.0, 2.0, 9.0, 11.0, 11.0, 19.0, 25.0, 28.0, 40.0, 51.0, 74.0, 68.0, 133.0, 126.0, 171.0, 232.0, 293.0, 414.0, 537.0, 730.0, 940.0, 1402.0, 2411.0, 4144.0, 8885.0, 491303.0, 4284.0, 2432.0, 1420.0, 1011.0, 752.0, 568.0, 430.0, 311.0, 241.0, 183.0, 112.0, 118.0, 93.0, 54.0, 44.0, 33.0, 34.0, 21.0, 21.0, 13.0, 11.0, 10.0, 7.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-737.7885131835938, -713.224609375, -688.6607055664062, -664.0968017578125, -639.5328369140625, -614.9689331054688, -590.405029296875, -565.8411254882812, -541.2772216796875, -516.7133178710938, -492.1494140625, -467.5854797363281, -443.0215759277344, -418.4576721191406, -393.89373779296875, -369.329833984375, -344.76593017578125, -320.2020263671875, -295.63812255859375, -271.0741882324219, -246.51028442382812, -221.94638061523438, -197.38246154785156, -172.81854248046875, -148.254638671875, -123.69072723388672, -99.12681579589844, -74.56290435791016, -49.998992919921875, -25.435081481933594, -0.8711700439453125, 23.6927490234375, 48.25665283203125, 72.82056427001953, 97.38447570800781, 121.9483871459961, 146.51229858398438, 171.07620239257812, 195.64012145996094, 220.20404052734375, 244.7679443359375, 269.33184814453125, 293.895751953125, 318.4596862792969, 343.0235900878906, 367.5874938964844, 392.15142822265625, 416.71533203125, 441.27923583984375, 465.8431396484375, 490.40704345703125, 514.970947265625, 539.534912109375, 564.0988159179688, 588.6627197265625, 613.2266235351562, 637.79052734375, 662.3544311523438, 686.9183349609375, 711.4822387695312, 736.046142578125, 760.610107421875, 785.1740112304688, 809.7379150390625, 834.3018188476562]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 4.0, 4.0, 8.0, 3.0, 9.0, 10.0, 14.0, 21.0, 10.0, 21.0, 25.0, 29.0, 27.0, 45.0, 32.0, 30.0, 42.0, 28.0, 39.0, 48.0, 41.0, 1070.0, 36.0, 43.0, 45.0, 31.0, 32.0, 31.0, 33.0, 23.0, 22.0, 31.0, 23.0, 19.0, 22.0, 9.0, 10.0, 11.0, 11.0, 9.0, 5.0, 2.0, 4.0, 4.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2068.56884765625, -1997.9425048828125, -1927.316162109375, -1856.6898193359375, -1786.0634765625, -1715.43701171875, -1644.8106689453125, -1574.184326171875, -1503.5579833984375, -1432.931640625, -1362.3052978515625, -1291.678955078125, -1221.052490234375, -1150.42626953125, -1079.7998046875, -1009.1734619140625, -938.547119140625, -867.9207763671875, -797.29443359375, -726.6680297851562, -656.0416870117188, -585.4153442382812, -514.7889404296875, -444.16259765625, -373.5362548828125, -302.909912109375, -232.28353881835938, -161.6571807861328, -91.03082275390625, -20.40447998046875, 50.221893310546875, 120.8482666015625, 191.474853515625, 262.1011962890625, 332.7275695800781, 403.35394287109375, 473.98028564453125, 544.6066284179688, 615.2330322265625, 685.859375, 756.4857177734375, 827.112060546875, 897.7384033203125, 968.3648071289062, 1038.9912109375, 1109.617431640625, 1180.243896484375, 1250.8702392578125, 1321.49658203125, 1392.1229248046875, 1462.749267578125, 1533.3756103515625, 1604.001953125, 1674.62841796875, 1745.2547607421875, 1815.881103515625, 1886.5074462890625, 1957.1337890625, 2027.7601318359375, 2098.386474609375, 2169.012939453125, 2239.63916015625, 2310.265625, 2380.89208984375, 2451.518310546875]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 4.0, 3.0, 7.0, 4.0, 5.0, 7.0, 4.0, 11.0, 9.0, 13.0, 13.0, 11.0, 30.0, 35.0, 27.0, 37.0, 62.0, 74.0, 118.0, 154.0, 212.0, 311.0, 437.0, 569.0, 740.0, 925.0, 1237.0, 1614.0, 2117.0, 2660.0, 4093.0, 7531.0, 64020.0, 31128602.0, 15112.0, 9158.0, 7984.0, 3354.0, 1239.0, 732.0, 400.0, 227.0, 178.0, 123.0, 127.0, 86.0, 50.0, 30.0, 13.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2639.215087890625, -2579.439697265625, -2519.664306640625, -2459.88916015625, -2400.11376953125, -2340.33837890625, -2280.56298828125, -2220.78759765625, -2161.01220703125, -2101.23681640625, -2041.4615478515625, -1981.6861572265625, -1921.9107666015625, -1862.135498046875, -1802.360107421875, -1742.584716796875, -1682.8094482421875, -1623.0340576171875, -1563.2587890625, -1503.4833984375, -1443.7080078125, -1383.9326171875, -1324.1573486328125, -1264.3819580078125, -1204.606689453125, -1144.831298828125, -1085.0560302734375, -1025.2806396484375, -965.5052490234375, -905.7299194335938, -845.95458984375, -786.17919921875, -726.4039306640625, -666.6286010742188, -606.8532104492188, -547.077880859375, -487.3025207519531, -427.52716064453125, -367.7518310546875, -307.9764709472656, -248.20111083984375, -188.42575073242188, -128.65040588378906, -68.87506103515625, -9.099700927734375, 50.6756591796875, 110.45098876953125, 170.22634887695312, 230.001708984375, 289.7770690917969, 349.55242919921875, 409.3277587890625, 469.1031188964844, 528.8784790039062, 588.65380859375, 648.42919921875, 708.2045288085938, 767.9798583984375, 827.7552490234375, 887.5305786132812, 947.305908203125, 1007.081298828125, 1066.856689453125, 1126.6319580078125, 1186.4073486328125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 9.0, 7.0, 18.0, 20.0, 31.0, 34.0, 55.0, 95.0, 109.0, 173.0, 278.0, 396.0, 573.0, 834.0, 1389.0, 2150.0, 3548.0, 5633.0, 9535.0, 16273.0, 28471.0, 50647.0, 92299.0, 175690.0, 351865.0, 773437.0, 1821933.0, 1611281.0, 678234.0, 313769.0, 159150.0, 83891.0, 45874.0, 25861.0, 14927.0, 8935.0, 5198.0, 3242.0, 1960.0, 1257.0, 809.0, 540.0, 337.0, 196.0, 157.0, 117.0, 71.0, 41.0, 32.0, 25.0, 13.0, 6.0, 6.0, 10.0, 1.0, 2.0, 1.0, 1.0], "bins": [-199.375, -193.318359375, -187.26171875, -181.205078125, -175.1484375, -169.091796875, -163.03515625, -156.978515625, -150.921875, -144.865234375, -138.80859375, -132.751953125, -126.6953125, -120.638671875, -114.58203125, -108.525390625, -102.46875, -96.412109375, -90.35546875, -84.298828125, -78.2421875, -72.185546875, -66.12890625, -60.072265625, -54.015625, -47.958984375, -41.90234375, -35.845703125, -29.7890625, -23.732421875, -17.67578125, -11.619140625, -5.5625, 0.494140625, 6.55078125, 12.607421875, 18.6640625, 24.720703125, 30.77734375, 36.833984375, 42.890625, 48.947265625, 55.00390625, 61.060546875, 67.1171875, 73.173828125, 79.23046875, 85.287109375, 91.34375, 97.400390625, 103.45703125, 109.513671875, 115.5703125, 121.626953125, 127.68359375, 133.740234375, 139.796875, 145.853515625, 151.91015625, 157.966796875, 164.0234375, 170.080078125, 176.13671875, 182.193359375, 188.25]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 0.0, 1.0, 5.0, 9.0, 15.0, 14.0, 13.0, 17.0, 22.0, 28.0, 22.0, 44.0, 54.0, 54.0, 78.0, 83.0, 131.0, 136.0, 180.0, 214.0, 169.0, 157.0, 109.0, 92.0, 77.0, 57.0, 50.0, 37.0, 18.0, 31.0, 25.0, 15.0, 9.0, 10.0, 10.0, 5.0, 13.0, 5.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-82.5625, -80.03515625, -77.5078125, -74.98046875, -72.453125, -69.92578125, -67.3984375, -64.87109375, -62.34375, -59.81640625, -57.2890625, -54.76171875, -52.234375, -49.70703125, -47.1796875, -44.65234375, -42.125, -39.59765625, -37.0703125, -34.54296875, -32.015625, -29.48828125, -26.9609375, -24.43359375, -21.90625, -19.37890625, -16.8515625, -14.32421875, -11.796875, -9.26953125, -6.7421875, -4.21484375, -1.6875, 0.83984375, 3.3671875, 5.89453125, 8.421875, 10.94921875, 13.4765625, 16.00390625, 18.53125, 21.05859375, 23.5859375, 26.11328125, 28.640625, 31.16796875, 33.6953125, 36.22265625, 38.75, 41.27734375, 43.8046875, 46.33203125, 48.859375, 51.38671875, 53.9140625, 56.44140625, 58.96875, 61.49609375, 64.0234375, 66.55078125, 69.078125, 71.60546875, 74.1328125, 76.66015625, 79.1875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 17.0, 14.0, 22.0, 22.0, 28.0, 56.0, 91.0, 121.0, 179.0, 253.0, 348.0, 529.0, 783.0, 1270.0, 1888.0, 3057.0, 5135.0, 8548.0, 14640.0, 24624.0, 42670.0, 76094.0, 135727.0, 244195.0, 458225.0, 985853.0, 1969935.0, 1167544.0, 522490.0, 272559.0, 152026.0, 85714.0, 48255.0, 27702.0, 16098.0, 9451.0, 5497.0, 3511.0, 2064.0, 1428.0, 911.0, 585.0, 394.0, 292.0, 178.0, 123.0, 87.0, 55.0, 36.0, 36.0, 30.0, 22.0, 8.0, 5.0, 5.0, 8.0, 2.0, 3.0], "bins": [-98.625, -95.599609375, -92.57421875, -89.548828125, -86.5234375, -83.498046875, -80.47265625, -77.447265625, -74.421875, -71.396484375, -68.37109375, -65.345703125, -62.3203125, -59.294921875, -56.26953125, -53.244140625, -50.21875, -47.193359375, -44.16796875, -41.142578125, -38.1171875, -35.091796875, -32.06640625, -29.041015625, -26.015625, -22.990234375, -19.96484375, -16.939453125, -13.9140625, -10.888671875, -7.86328125, -4.837890625, -1.8125, 1.212890625, 4.23828125, 7.263671875, 10.2890625, 13.314453125, 16.33984375, 19.365234375, 22.390625, 25.416015625, 28.44140625, 31.466796875, 34.4921875, 37.517578125, 40.54296875, 43.568359375, 46.59375, 49.619140625, 52.64453125, 55.669921875, 58.6953125, 61.720703125, 64.74609375, 67.771484375, 70.796875, 73.822265625, 76.84765625, 79.873046875, 82.8984375, 85.923828125, 88.94921875, 91.974609375, 95.0]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 9.0, 11.0, 15.0, 12.0, 11.0, 22.0, 28.0, 38.0, 61.0, 73.0, 100.0, 150.0, 189.0, 273.0, 279.0, 229.0, 157.0, 90.0, 56.0, 45.0, 30.0, 37.0, 24.0, 18.0, 14.0, 7.0, 12.0, 10.0, 4.0, 5.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-157.375, -153.2744140625, -149.173828125, -145.0732421875, -140.97265625, -136.8720703125, -132.771484375, -128.6708984375, -124.5703125, -120.4697265625, -116.369140625, -112.2685546875, -108.16796875, -104.0673828125, -99.966796875, -95.8662109375, -91.765625, -87.6650390625, -83.564453125, -79.4638671875, -75.36328125, -71.2626953125, -67.162109375, -63.0615234375, -58.9609375, -54.8603515625, -50.759765625, -46.6591796875, -42.55859375, -38.4580078125, -34.357421875, -30.2568359375, -26.15625, -22.0556640625, -17.955078125, -13.8544921875, -9.75390625, -5.6533203125, -1.552734375, 2.5478515625, 6.6484375, 10.7490234375, 14.849609375, 18.9501953125, 23.05078125, 27.1513671875, 31.251953125, 35.3525390625, 39.453125, 43.5537109375, 47.654296875, 51.7548828125, 55.85546875, 59.9560546875, 64.056640625, 68.1572265625, 72.2578125, 76.3583984375, 80.458984375, 84.5595703125, 88.66015625, 92.7607421875, 96.861328125, 100.9619140625, 105.0625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 6.0, 10.0, 7.0, 26.0, 26.0, 35.0, 61.0, 79.0, 120.0, 217.0, 348.0, 555.0, 890.0, 1468.0, 2680.0, 5104.0, 9861.0, 20252.0, 43308.0, 109605.0, 5442987.0, 491098.0, 89461.0, 36893.0, 17436.0, 8740.0, 4535.0, 2354.0, 1261.0, 772.0, 439.0, 293.0, 193.0, 124.0, 85.0, 38.0, 24.0, 13.0, 13.0, 9.0, 7.0, 11.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-239.125, -229.119140625, -219.11328125, -209.107421875, -199.1015625, -189.095703125, -179.08984375, -169.083984375, -159.078125, -149.072265625, -139.06640625, -129.060546875, -119.0546875, -109.048828125, -99.04296875, -89.037109375, -79.03125, -69.025390625, -59.01953125, -49.013671875, -39.0078125, -29.001953125, -18.99609375, -8.990234375, 1.015625, 11.021484375, 21.02734375, 31.033203125, 41.0390625, 51.044921875, 61.05078125, 71.056640625, 81.0625, 91.068359375, 101.07421875, 111.080078125, 121.0859375, 131.091796875, 141.09765625, 151.103515625, 161.109375, 171.115234375, 181.12109375, 191.126953125, 201.1328125, 211.138671875, 221.14453125, 231.150390625, 241.15625, 251.162109375, 261.16796875, 271.173828125, 281.1796875, 291.185546875, 301.19140625, 311.197265625, 321.203125, 331.208984375, 341.21484375, 351.220703125, 361.2265625, 371.232421875, 381.23828125, 391.244140625, 401.25]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 2.0, 2.0, 8.0, 6.0, 9.0, 9.0, 13.0, 9.0, 18.0, 27.0, 35.0, 23.0, 42.0, 42.0, 42.0, 63.0, 71.0, 135.0, 235.0, 329.0, 260.0, 147.0, 87.0, 68.0, 56.0, 33.0, 36.0, 46.0, 29.0, 19.0, 19.0, 25.0, 13.0, 12.0, 9.0, 7.0, 7.0, 3.0, 4.0, 4.0, 6.0, 3.0, 1.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-152.5, -147.5546875, -142.609375, -137.6640625, -132.71875, -127.7734375, -122.828125, -117.8828125, -112.9375, -107.9921875, -103.046875, -98.1015625, -93.15625, -88.2109375, -83.265625, -78.3203125, -73.375, -68.4296875, -63.484375, -58.5390625, -53.59375, -48.6484375, -43.703125, -38.7578125, -33.8125, -28.8671875, -23.921875, -18.9765625, -14.03125, -9.0859375, -4.140625, 0.8046875, 5.75, 10.6953125, 15.640625, 20.5859375, 25.53125, 30.4765625, 35.421875, 40.3671875, 45.3125, 50.2578125, 55.203125, 60.1484375, 65.09375, 70.0390625, 74.984375, 79.9296875, 84.875, 89.8203125, 94.765625, 99.7109375, 104.65625, 109.6015625, 114.546875, 119.4921875, 124.4375, 129.3828125, 134.328125, 139.2734375, 144.21875, 149.1640625, 154.109375, 159.0546875, 164.0]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 9.0, 9.0, 7.0, 12.0, 15.0, 22.0, 30.0, 51.0, 45.0, 71.0, 105.0, 177.0, 142.0, 79.0, 56.0, 32.0, 41.0, 26.0, 19.0, 10.0, 13.0, 8.0, 8.0, 9.0, 4.0, 2.0, 0.0, 2.0, 3.0], "bins": [-8581.712890625, -8398.4638671875, -8215.2138671875, -8031.96484375, -7848.71533203125, -7665.4658203125, -7482.216796875, -7298.96728515625, -7115.7177734375, -6932.46826171875, -6749.21875, -6565.9697265625, -6382.72021484375, -6199.470703125, -6016.2216796875, -5832.97216796875, -5649.72265625, -5466.47314453125, -5283.2236328125, -5099.974609375, -4916.72509765625, -4733.4755859375, -4550.2265625, -4366.97705078125, -4183.7275390625, -4000.47802734375, -3817.228759765625, -3633.9794921875, -3450.72998046875, -3267.48046875, -3084.231201171875, -2900.98193359375, -2717.732421875, -2534.48291015625, -2351.233642578125, -2167.984375, -1984.73486328125, -1801.4854736328125, -1618.236083984375, -1434.9866943359375, -1251.7373046875, -1068.4879150390625, -885.238525390625, -701.9891357421875, -518.73974609375, -335.4903564453125, -152.240966796875, 31.0084228515625, 214.2578125, 397.5072021484375, 580.756591796875, 764.0059814453125, 947.25537109375, 1130.5047607421875, 1313.754150390625, 1497.0035400390625, 1680.2529296875, 1863.5023193359375, 2046.751708984375, 2230.0009765625, 2413.25048828125, 2596.5, 2779.749267578125, 2962.99853515625, 3146.248046875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 4.0, 3.0, 4.0, 7.0, 12.0, 12.0, 19.0, 8.0, 21.0, 18.0, 14.0, 18.0, 25.0, 21.0, 23.0, 47.0, 70.0, 117.0, 149.0, 85.0, 45.0, 44.0, 31.0, 35.0, 19.0, 24.0, 16.0, 19.0, 12.0, 8.0, 9.0, 6.0, 13.0, 8.0, 6.0, 5.0, 7.0, 2.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4715.66064453125, -4569.54931640625, -4423.4375, -4277.326171875, -4131.21484375, -3985.10302734375, -3838.99169921875, -3692.880126953125, -3546.7685546875, -3400.656982421875, -3254.54541015625, -3108.43408203125, -2962.322509765625, -2816.2109375, -2670.099609375, -2523.988037109375, -2377.87646484375, -2231.764892578125, -2085.6533203125, -1939.5419921875, -1793.430419921875, -1647.31884765625, -1501.2073974609375, -1355.095947265625, -1208.984375, -1062.872802734375, -916.7613525390625, -770.6498413085938, -624.538330078125, -478.42681884765625, -332.3153076171875, -186.20379638671875, -40.091796875, 106.01971435546875, 252.1312255859375, 398.24273681640625, 544.354248046875, 690.4657592773438, 836.5772705078125, 982.6887817382812, 1128.80029296875, 1274.911865234375, 1421.0233154296875, 1567.134765625, 1713.246337890625, 1859.35791015625, 2005.4693603515625, 2151.580810546875, 2297.6923828125, 2443.803955078125, 2589.91552734375, 2736.02685546875, 2882.138427734375, 3028.25, 3174.361328125, 3320.472900390625, 3466.58447265625, 3612.696044921875, 3758.8076171875, 3904.9189453125, 4051.030517578125, 4197.14208984375, 4343.25341796875, 4489.365234375, 4635.4765625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 10.0, 7.0, 12.0, 26.0, 14.0, 30.0, 46.0, 59.0, 64.0, 81.0, 151.0, 204.0, 268.0, 395.0, 476.0, 745.0, 1093.0, 1601.0, 2294.0, 3450.0, 5307.0, 8338.0, 13599.0, 23310.0, 44932.0, 106009.0, 375449.0, 2779088.0, 575042.0, 140608.0, 52859.0, 25093.0, 13445.0, 7697.0, 4513.0, 2911.0, 1859.0, 1200.0, 707.0, 433.0, 314.0, 200.0, 135.0, 80.0, 55.0, 32.0, 17.0, 9.0, 8.0, 6.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-42.71875, -41.5185546875, -40.318359375, -39.1181640625, -37.91796875, -36.7177734375, -35.517578125, -34.3173828125, -33.1171875, -31.9169921875, -30.716796875, -29.5166015625, -28.31640625, -27.1162109375, -25.916015625, -24.7158203125, -23.515625, -22.3154296875, -21.115234375, -19.9150390625, -18.71484375, -17.5146484375, -16.314453125, -15.1142578125, -13.9140625, -12.7138671875, -11.513671875, -10.3134765625, -9.11328125, -7.9130859375, -6.712890625, -5.5126953125, -4.3125, -3.1123046875, -1.912109375, -0.7119140625, 0.48828125, 1.6884765625, 2.888671875, 4.0888671875, 5.2890625, 6.4892578125, 7.689453125, 8.8896484375, 10.08984375, 11.2900390625, 12.490234375, 13.6904296875, 14.890625, 16.0908203125, 17.291015625, 18.4912109375, 19.69140625, 20.8916015625, 22.091796875, 23.2919921875, 24.4921875, 25.6923828125, 26.892578125, 28.0927734375, 29.29296875, 30.4931640625, 31.693359375, 32.8935546875, 34.09375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 6.0, 2.0, 4.0, 2.0, 12.0, 3.0, 4.0, 13.0, 9.0, 14.0, 23.0, 24.0, 42.0, 41.0, 59.0, 93.0, 125.0, 134.0, 82.0, 78.0, 62.0, 40.0, 30.0, 19.0, 18.0, 12.0, 12.0, 7.0, 8.0, 3.0, 3.0, 3.0, 3.0, 5.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.703125, -4.575531005859375, -4.44793701171875, -4.320343017578125, -4.1927490234375, -4.065155029296875, -3.93756103515625, -3.809967041015625, -3.682373046875, -3.554779052734375, -3.42718505859375, -3.299591064453125, -3.1719970703125, -3.044403076171875, -2.91680908203125, -2.789215087890625, -2.66162109375, -2.534027099609375, -2.40643310546875, -2.278839111328125, -2.1512451171875, -2.023651123046875, -1.89605712890625, -1.768463134765625, -1.640869140625, -1.513275146484375, -1.38568115234375, -1.258087158203125, -1.1304931640625, -1.002899169921875, -0.87530517578125, -0.747711181640625, -0.6201171875, -0.492523193359375, -0.36492919921875, -0.237335205078125, -0.1097412109375, 0.017852783203125, 0.14544677734375, 0.273040771484375, 0.400634765625, 0.528228759765625, 0.65582275390625, 0.783416748046875, 0.9110107421875, 1.038604736328125, 1.16619873046875, 1.293792724609375, 1.42138671875, 1.548980712890625, 1.67657470703125, 1.804168701171875, 1.9317626953125, 2.059356689453125, 2.18695068359375, 2.314544677734375, 2.442138671875, 2.569732666015625, 2.69732666015625, 2.824920654296875, 2.9525146484375, 3.080108642578125, 3.20770263671875, 3.335296630859375, 3.462890625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 4.0, 10.0, 6.0, 8.0, 9.0, 37.0, 32.0, 44.0, 53.0, 112.0, 113.0, 187.0, 230.0, 375.0, 549.0, 887.0, 1491.0, 2552.0, 4864.0, 9771.0, 21848.0, 53910.0, 147571.0, 458985.0, 1856567.0, 1129297.0, 322730.0, 107213.0, 40508.0, 16963.0, 7803.0, 3891.0, 2129.0, 1177.0, 808.0, 467.0, 306.0, 217.0, 153.0, 126.0, 91.0, 57.0, 50.0, 27.0, 16.0, 14.0, 12.0, 8.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.84375, -36.53173828125, -35.2197265625, -33.90771484375, -32.595703125, -31.28369140625, -29.9716796875, -28.65966796875, -27.34765625, -26.03564453125, -24.7236328125, -23.41162109375, -22.099609375, -20.78759765625, -19.4755859375, -18.16357421875, -16.8515625, -15.53955078125, -14.2275390625, -12.91552734375, -11.603515625, -10.29150390625, -8.9794921875, -7.66748046875, -6.35546875, -5.04345703125, -3.7314453125, -2.41943359375, -1.107421875, 0.20458984375, 1.5166015625, 2.82861328125, 4.140625, 5.45263671875, 6.7646484375, 8.07666015625, 9.388671875, 10.70068359375, 12.0126953125, 13.32470703125, 14.63671875, 15.94873046875, 17.2607421875, 18.57275390625, 19.884765625, 21.19677734375, 22.5087890625, 23.82080078125, 25.1328125, 26.44482421875, 27.7568359375, 29.06884765625, 30.380859375, 31.69287109375, 33.0048828125, 34.31689453125, 35.62890625, 36.94091796875, 38.2529296875, 39.56494140625, 40.876953125, 42.18896484375, 43.5009765625, 44.81298828125, 46.125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 12.0, 17.0, 14.0, 18.0, 12.0, 30.0, 28.0, 32.0, 43.0, 67.0, 66.0, 90.0, 115.0, 145.0, 168.0, 237.0, 266.0, 407.0, 543.0, 343.0, 266.0, 229.0, 183.0, 145.0, 115.0, 87.0, 85.0, 64.0, 48.0, 55.0, 34.0, 27.0, 17.0, 12.0, 12.0, 9.0, 10.0, 8.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-14.59375, -14.2027587890625, -13.811767578125, -13.4207763671875, -13.02978515625, -12.6387939453125, -12.247802734375, -11.8568115234375, -11.4658203125, -11.0748291015625, -10.683837890625, -10.2928466796875, -9.90185546875, -9.5108642578125, -9.119873046875, -8.7288818359375, -8.337890625, -7.9468994140625, -7.555908203125, -7.1649169921875, -6.77392578125, -6.3829345703125, -5.991943359375, -5.6009521484375, -5.2099609375, -4.8189697265625, -4.427978515625, -4.0369873046875, -3.64599609375, -3.2550048828125, -2.864013671875, -2.4730224609375, -2.08203125, -1.6910400390625, -1.300048828125, -0.9090576171875, -0.51806640625, -0.1270751953125, 0.263916015625, 0.6549072265625, 1.0458984375, 1.4368896484375, 1.827880859375, 2.2188720703125, 2.60986328125, 3.0008544921875, 3.391845703125, 3.7828369140625, 4.173828125, 4.5648193359375, 4.955810546875, 5.3468017578125, 5.73779296875, 6.1287841796875, 6.519775390625, 6.9107666015625, 7.3017578125, 7.6927490234375, 8.083740234375, 8.4747314453125, 8.86572265625, 9.2567138671875, 9.647705078125, 10.0386962890625, 10.4296875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 8.0, 12.0, 27.0, 61.0, 108.0, 163.0, 184.0, 184.0, 121.0, 54.0, 33.0, 16.0, 16.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-214.38536071777344, -205.2847442626953, -196.18414306640625, -187.08352661132812, -177.98291015625, -168.88229370117188, -159.78167724609375, -150.6810760498047, -141.58045959472656, -132.47984313964844, -123.37923431396484, -114.27862548828125, -105.17800903320312, -96.077392578125, -86.9767837524414, -77.87617492675781, -68.77555847167969, -59.67494583129883, -50.57433319091797, -41.47372055053711, -32.37310791015625, -23.27249526977539, -14.171882629394531, -5.071269989013672, 4.0293426513671875, 13.129955291748047, 22.230567932128906, 31.331180572509766, 40.431793212890625, 49.532405853271484, 58.633018493652344, 67.73362731933594, 76.83425903320312, 85.93487548828125, 95.03548431396484, 104.13609313964844, 113.23670959472656, 122.33732604980469, 131.43792724609375, 140.53854370117188, 149.63916015625, 158.73977661132812, 167.84039306640625, 176.9409942626953, 186.04161071777344, 195.14222717285156, 204.24282836914062, 213.34344482421875, 222.44406127929688, 231.544677734375, 240.64529418945312, 249.7458953857422, 258.84649658203125, 267.9471130371094, 277.0477294921875, 286.1483459472656, 295.24896240234375, 304.3495788574219, 313.4501953125, 322.5508117675781, 331.65142822265625, 340.75201416015625, 349.8526306152344, 358.9532470703125, 368.0538635253906]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 4.0, 8.0, 13.0, 11.0, 17.0, 17.0, 28.0, 30.0, 51.0, 56.0, 63.0, 61.0, 58.0, 67.0, 78.0, 66.0, 58.0, 49.0, 43.0, 32.0, 47.0, 42.0, 23.0, 23.0, 19.0, 10.0, 6.0, 7.0, 1.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-166.04632568359375, -161.99449157714844, -157.9426727294922, -153.89083862304688, -149.83900451660156, -145.7871856689453, -141.7353515625, -137.6835174560547, -133.63169860839844, -129.57986450195312, -125.52803802490234, -121.47621154785156, -117.42438507080078, -113.37255859375, -109.32072448730469, -105.2688980102539, -101.2170639038086, -97.16523742675781, -93.1134033203125, -89.06157684326172, -85.00975036621094, -80.95791625976562, -76.90608978271484, -72.85426330566406, -68.80242919921875, -64.75060272216797, -60.69877243041992, -56.646942138671875, -52.595115661621094, -48.54328536987305, -44.491455078125, -40.43962860107422, -36.38780975341797, -32.33597946166992, -28.28415298461914, -24.232322692871094, -20.18049430847168, -16.128665924072266, -12.076835632324219, -8.025007247924805, -3.9731788635253906, 0.07864999771118164, 4.130478858947754, 8.182308197021484, 12.234136581420898, 16.285964965820312, 20.33779525756836, 24.389623641967773, 28.441452026367188, 32.493282318115234, 36.545108795166016, 40.59693908691406, 44.648765563964844, 48.70059585571289, 52.75242614746094, 56.80425262451172, 60.856082916259766, 64.90791320800781, 68.9597396850586, 73.01156616210938, 77.06340026855469, 81.11522674560547, 85.16705322265625, 89.21888732910156, 93.27071380615234]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 11.0, 9.0, 20.0, 26.0, 30.0, 52.0, 56.0, 97.0, 128.0, 187.0, 332.0, 521.0, 887.0, 1623.0, 3110.0, 6346.0, 14290.0, 37738.0, 128521.0, 508949.0, 244197.0, 61756.0, 21614.0, 8815.0, 4263.0, 2144.0, 1179.0, 602.0, 363.0, 227.0, 149.0, 94.0, 68.0, 39.0, 26.0, 27.0, 6.0, 7.0, 8.0, 14.0, 2.0, 6.0, 1.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-30.171875, -29.156494140625, -28.14111328125, -27.125732421875, -26.1103515625, -25.094970703125, -24.07958984375, -23.064208984375, -22.048828125, -21.033447265625, -20.01806640625, -19.002685546875, -17.9873046875, -16.971923828125, -15.95654296875, -14.941162109375, -13.92578125, -12.910400390625, -11.89501953125, -10.879638671875, -9.8642578125, -8.848876953125, -7.83349609375, -6.818115234375, -5.802734375, -4.787353515625, -3.77197265625, -2.756591796875, -1.7412109375, -0.725830078125, 0.28955078125, 1.304931640625, 2.3203125, 3.335693359375, 4.35107421875, 5.366455078125, 6.3818359375, 7.397216796875, 8.41259765625, 9.427978515625, 10.443359375, 11.458740234375, 12.47412109375, 13.489501953125, 14.5048828125, 15.520263671875, 16.53564453125, 17.551025390625, 18.56640625, 19.581787109375, 20.59716796875, 21.612548828125, 22.6279296875, 23.643310546875, 24.65869140625, 25.674072265625, 26.689453125, 27.704833984375, 28.72021484375, 29.735595703125, 30.7509765625, 31.766357421875, 32.78173828125, 33.797119140625, 34.8125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 5.0, 4.0, 4.0, 6.0, 4.0, 14.0, 20.0, 22.0, 14.0, 30.0, 56.0, 60.0, 69.0, 73.0, 81.0, 95.0, 70.0, 73.0, 60.0, 54.0, 39.0, 45.0, 22.0, 24.0, 15.0, 9.0, 7.0, 3.0, 2.0, 10.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6875, -6.521270751953125, -6.35504150390625, -6.188812255859375, -6.0225830078125, -5.856353759765625, -5.69012451171875, -5.523895263671875, -5.357666015625, -5.191436767578125, -5.02520751953125, -4.858978271484375, -4.6927490234375, -4.526519775390625, -4.36029052734375, -4.194061279296875, -4.02783203125, -3.861602783203125, -3.69537353515625, -3.529144287109375, -3.3629150390625, -3.196685791015625, -3.03045654296875, -2.864227294921875, -2.697998046875, -2.531768798828125, -2.36553955078125, -2.199310302734375, -2.0330810546875, -1.866851806640625, -1.70062255859375, -1.534393310546875, -1.3681640625, -1.201934814453125, -1.03570556640625, -0.869476318359375, -0.7032470703125, -0.537017822265625, -0.37078857421875, -0.204559326171875, -0.038330078125, 0.127899169921875, 0.29412841796875, 0.460357666015625, 0.6265869140625, 0.792816162109375, 0.95904541015625, 1.125274658203125, 1.29150390625, 1.457733154296875, 1.62396240234375, 1.790191650390625, 1.9564208984375, 2.122650146484375, 2.28887939453125, 2.455108642578125, 2.621337890625, 2.787567138671875, 2.95379638671875, 3.120025634765625, 3.2862548828125, 3.452484130859375, 3.61871337890625, 3.784942626953125, 3.951171875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 3.0, 8.0, 13.0, 23.0, 16.0, 24.0, 28.0, 66.0, 74.0, 101.0, 167.0, 239.0, 320.0, 458.0, 668.0, 1048.0, 1637.0, 2550.0, 4313.0, 7460.0, 13358.0, 27019.0, 59782.0, 160152.0, 389516.0, 225741.0, 79581.0, 34456.0, 16812.0, 8995.0, 5077.0, 3102.0, 1940.0, 1238.0, 790.0, 513.0, 359.0, 263.0, 175.0, 142.0, 102.0, 61.0, 48.0, 35.0, 22.0, 24.0, 11.0, 6.0, 11.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.59375, -17.9873046875, -17.380859375, -16.7744140625, -16.16796875, -15.5615234375, -14.955078125, -14.3486328125, -13.7421875, -13.1357421875, -12.529296875, -11.9228515625, -11.31640625, -10.7099609375, -10.103515625, -9.4970703125, -8.890625, -8.2841796875, -7.677734375, -7.0712890625, -6.46484375, -5.8583984375, -5.251953125, -4.6455078125, -4.0390625, -3.4326171875, -2.826171875, -2.2197265625, -1.61328125, -1.0068359375, -0.400390625, 0.2060546875, 0.8125, 1.4189453125, 2.025390625, 2.6318359375, 3.23828125, 3.8447265625, 4.451171875, 5.0576171875, 5.6640625, 6.2705078125, 6.876953125, 7.4833984375, 8.08984375, 8.6962890625, 9.302734375, 9.9091796875, 10.515625, 11.1220703125, 11.728515625, 12.3349609375, 12.94140625, 13.5478515625, 14.154296875, 14.7607421875, 15.3671875, 15.9736328125, 16.580078125, 17.1865234375, 17.79296875, 18.3994140625, 19.005859375, 19.6123046875, 20.21875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 7.0, 2.0, 8.0, 11.0, 17.0, 11.0, 8.0, 9.0, 15.0, 18.0, 18.0, 23.0, 29.0, 37.0, 43.0, 43.0, 41.0, 41.0, 40.0, 38.0, 38.0, 45.0, 38.0, 30.0, 35.0, 42.0, 33.0, 29.0, 33.0, 29.0, 22.0, 23.0, 16.0, 20.0, 13.0, 19.0, 11.0, 16.0, 9.0, 11.0, 5.0, 4.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.28125, -18.6494140625, -18.017578125, -17.3857421875, -16.75390625, -16.1220703125, -15.490234375, -14.8583984375, -14.2265625, -13.5947265625, -12.962890625, -12.3310546875, -11.69921875, -11.0673828125, -10.435546875, -9.8037109375, -9.171875, -8.5400390625, -7.908203125, -7.2763671875, -6.64453125, -6.0126953125, -5.380859375, -4.7490234375, -4.1171875, -3.4853515625, -2.853515625, -2.2216796875, -1.58984375, -0.9580078125, -0.326171875, 0.3056640625, 0.9375, 1.5693359375, 2.201171875, 2.8330078125, 3.46484375, 4.0966796875, 4.728515625, 5.3603515625, 5.9921875, 6.6240234375, 7.255859375, 7.8876953125, 8.51953125, 9.1513671875, 9.783203125, 10.4150390625, 11.046875, 11.6787109375, 12.310546875, 12.9423828125, 13.57421875, 14.2060546875, 14.837890625, 15.4697265625, 16.1015625, 16.7333984375, 17.365234375, 17.9970703125, 18.62890625, 19.2607421875, 19.892578125, 20.5244140625, 21.15625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 5.0, 5.0, 3.0, 14.0, 10.0, 15.0, 39.0, 37.0, 48.0, 94.0, 161.0, 224.0, 406.0, 777.0, 1673.0, 3737.0, 9575.0, 30202.0, 135528.0, 534336.0, 256426.0, 50755.0, 14511.0, 5301.0, 2272.0, 1074.0, 554.0, 301.0, 185.0, 108.0, 71.0, 26.0, 24.0, 17.0, 10.0, 13.0, 8.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.890625, -19.262939453125, -18.63525390625, -18.007568359375, -17.3798828125, -16.752197265625, -16.12451171875, -15.496826171875, -14.869140625, -14.241455078125, -13.61376953125, -12.986083984375, -12.3583984375, -11.730712890625, -11.10302734375, -10.475341796875, -9.84765625, -9.219970703125, -8.59228515625, -7.964599609375, -7.3369140625, -6.709228515625, -6.08154296875, -5.453857421875, -4.826171875, -4.198486328125, -3.57080078125, -2.943115234375, -2.3154296875, -1.687744140625, -1.06005859375, -0.432373046875, 0.1953125, 0.822998046875, 1.45068359375, 2.078369140625, 2.7060546875, 3.333740234375, 3.96142578125, 4.589111328125, 5.216796875, 5.844482421875, 6.47216796875, 7.099853515625, 7.7275390625, 8.355224609375, 8.98291015625, 9.610595703125, 10.23828125, 10.865966796875, 11.49365234375, 12.121337890625, 12.7490234375, 13.376708984375, 14.00439453125, 14.632080078125, 15.259765625, 15.887451171875, 16.51513671875, 17.142822265625, 17.7705078125, 18.398193359375, 19.02587890625, 19.653564453125, 20.28125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 10.0, 9.0, 13.0, 18.0, 24.0, 27.0, 32.0, 37.0, 47.0, 45.0, 56.0, 64.0, 58.0, 63.0, 69.0, 61.0, 59.0, 54.0, 40.0, 40.0, 26.0, 21.0, 23.0, 21.0, 17.0, 11.0, 2.0, 8.0, 11.0, 5.0, 3.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.0005445480346679688, -0.00052623450756073, -0.0005079209804534912, -0.0004896074533462524, -0.00047129392623901367, -0.0004529803991317749, -0.00043466687202453613, -0.00041635334491729736, -0.0003980398178100586, -0.0003797262907028198, -0.00036141276359558105, -0.0003430992364883423, -0.0003247857093811035, -0.00030647218227386475, -0.000288158655166626, -0.0002698451280593872, -0.00025153160095214844, -0.00023321807384490967, -0.0002149045467376709, -0.00019659101963043213, -0.00017827749252319336, -0.0001599639654159546, -0.00014165043830871582, -0.00012333691120147705, -0.00010502338409423828, -8.670985698699951e-05, -6.839632987976074e-05, -5.008280277252197e-05, -3.17692756652832e-05, -1.3455748558044434e-05, 4.857778549194336e-06, 2.3171305656433105e-05, 4.1484832763671875e-05, 5.9798359870910645e-05, 7.811188697814941e-05, 9.642541408538818e-05, 0.00011473894119262695, 0.00013305246829986572, 0.0001513659954071045, 0.00016967952251434326, 0.00018799304962158203, 0.0002063065767288208, 0.00022462010383605957, 0.00024293363094329834, 0.0002612471580505371, 0.0002795606851577759, 0.00029787421226501465, 0.0003161877393722534, 0.0003345012664794922, 0.00035281479358673096, 0.0003711283206939697, 0.0003894418478012085, 0.00040775537490844727, 0.00042606890201568604, 0.0004443824291229248, 0.0004626959562301636, 0.00048100948333740234, 0.0004993230104446411, 0.0005176365375518799, 0.0005359500646591187, 0.0005542635917663574, 0.0005725771188735962, 0.000590890645980835, 0.0006092041730880737, 0.0006275177001953125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 4.0, 6.0, 10.0, 13.0, 30.0, 36.0, 91.0, 177.0, 345.0, 803.0, 1680.0, 4594.0, 13809.0, 54738.0, 298340.0, 525958.0, 112286.0, 23695.0, 7155.0, 2590.0, 1089.0, 523.0, 270.0, 127.0, 84.0, 33.0, 21.0, 14.0, 10.0, 6.0, 5.0, 8.0, 1.0, 3.0, 2.0], "bins": [-31.015625, -30.314208984375, -29.61279296875, -28.911376953125, -28.2099609375, -27.508544921875, -26.80712890625, -26.105712890625, -25.404296875, -24.702880859375, -24.00146484375, -23.300048828125, -22.5986328125, -21.897216796875, -21.19580078125, -20.494384765625, -19.79296875, -19.091552734375, -18.39013671875, -17.688720703125, -16.9873046875, -16.285888671875, -15.58447265625, -14.883056640625, -14.181640625, -13.480224609375, -12.77880859375, -12.077392578125, -11.3759765625, -10.674560546875, -9.97314453125, -9.271728515625, -8.5703125, -7.868896484375, -7.16748046875, -6.466064453125, -5.7646484375, -5.063232421875, -4.36181640625, -3.660400390625, -2.958984375, -2.257568359375, -1.55615234375, -0.854736328125, -0.1533203125, 0.548095703125, 1.24951171875, 1.950927734375, 2.65234375, 3.353759765625, 4.05517578125, 4.756591796875, 5.4580078125, 6.159423828125, 6.86083984375, 7.562255859375, 8.263671875, 8.965087890625, 9.66650390625, 10.367919921875, 11.0693359375, 11.770751953125, 12.47216796875, 13.173583984375, 13.875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 8.0, 10.0, 6.0, 11.0, 15.0, 18.0, 25.0, 23.0, 24.0, 32.0, 36.0, 37.0, 45.0, 52.0, 52.0, 50.0, 72.0, 46.0, 62.0, 59.0, 42.0, 31.0, 44.0, 36.0, 22.0, 21.0, 22.0, 20.0, 14.0, 13.0, 9.0, 7.0, 9.0, 3.0, 2.0, 6.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.6484375, -8.39825439453125, -8.1480712890625, -7.89788818359375, -7.647705078125, -7.39752197265625, -7.1473388671875, -6.89715576171875, -6.64697265625, -6.39678955078125, -6.1466064453125, -5.89642333984375, -5.646240234375, -5.39605712890625, -5.1458740234375, -4.89569091796875, -4.6455078125, -4.39532470703125, -4.1451416015625, -3.89495849609375, -3.644775390625, -3.39459228515625, -3.1444091796875, -2.89422607421875, -2.64404296875, -2.39385986328125, -2.1436767578125, -1.89349365234375, -1.643310546875, -1.39312744140625, -1.1429443359375, -0.89276123046875, -0.642578125, -0.39239501953125, -0.1422119140625, 0.10797119140625, 0.358154296875, 0.60833740234375, 0.8585205078125, 1.10870361328125, 1.35888671875, 1.60906982421875, 1.8592529296875, 2.10943603515625, 2.359619140625, 2.60980224609375, 2.8599853515625, 3.11016845703125, 3.3603515625, 3.61053466796875, 3.8607177734375, 4.11090087890625, 4.361083984375, 4.61126708984375, 4.8614501953125, 5.11163330078125, 5.36181640625, 5.61199951171875, 5.8621826171875, 6.11236572265625, 6.362548828125, 6.61273193359375, 6.8629150390625, 7.11309814453125, 7.36328125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 7.0, 4.0, 5.0, 8.0, 11.0, 17.0, 26.0, 36.0, 94.0, 197.0, 215.0, 191.0, 85.0, 46.0, 24.0, 12.0, 6.0, 8.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-288.68634033203125, -279.2657470703125, -269.84515380859375, -260.4245300292969, -251.00393676757812, -241.58334350585938, -232.16273498535156, -222.74212646484375, -213.321533203125, -203.90093994140625, -194.48033142089844, -185.05972290039062, -175.63912963867188, -166.21853637695312, -156.7979278564453, -147.3773193359375, -137.95672607421875, -128.5361328125, -119.11552429199219, -109.6949234008789, -100.27432250976562, -90.85372161865234, -81.43312072753906, -72.01251983642578, -62.5919189453125, -53.17131805419922, -43.75071716308594, -34.330116271972656, -24.909515380859375, -15.488914489746094, -6.0683135986328125, 3.3522872924804688, 12.772918701171875, 22.193519592285156, 31.614120483398438, 41.03472137451172, 50.455322265625, 59.87592315673828, 69.29652404785156, 78.71712493896484, 88.13772583007812, 97.5583267211914, 106.97892761230469, 116.39952850341797, 125.82012939453125, 135.24072265625, 144.6613311767578, 154.08193969726562, 163.50253295898438, 172.92312622070312, 182.34373474121094, 191.76434326171875, 201.1849365234375, 210.60552978515625, 220.02613830566406, 229.44674682617188, 238.86734008789062, 248.28793334960938, 257.70855712890625, 267.129150390625, 276.54974365234375, 285.9703369140625, 295.39093017578125, 304.8115539550781, 314.2321472167969]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 2.0, 9.0, 9.0, 12.0, 12.0, 29.0, 61.0, 88.0, 131.0, 188.0, 139.0, 113.0, 64.0, 40.0, 22.0, 17.0, 6.0, 7.0, 7.0, 6.0, 2.0, 7.0, 2.0, 0.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-279.038818359375, -266.829345703125, -254.61988830566406, -242.41043090820312, -230.20095825195312, -217.99148559570312, -205.7820281982422, -193.57257080078125, -181.36309814453125, -169.15362548828125, -156.9441680908203, -144.73471069335938, -132.52523803710938, -120.3157730102539, -108.10630798339844, -95.89684295654297, -83.6873779296875, -71.47791290283203, -59.26844787597656, -47.058982849121094, -34.849517822265625, -22.640052795410156, -10.430587768554688, 1.7788772583007812, 13.98834228515625, 26.19780731201172, 38.40727233886719, 50.616737365722656, 62.826202392578125, 75.0356674194336, 87.24513244628906, 99.45459747314453, 111.6640625, 123.87352752685547, 136.08299255371094, 148.29244995117188, 160.50192260742188, 172.71139526367188, 184.9208526611328, 197.13031005859375, 209.33978271484375, 221.54925537109375, 233.7587127685547, 245.96817016601562, 258.1776428222656, 270.3871154785156, 282.5965576171875, 294.8060302734375, 307.0155029296875, 319.2249755859375, 331.4344482421875, 343.6438903808594, 355.8533630371094, 368.0628356933594, 380.27227783203125, 392.48175048828125, 404.69122314453125, 416.90069580078125, 429.11016845703125, 441.3196105957031, 453.5290832519531, 465.7385559082031, 477.947998046875, 490.157470703125, 502.366943359375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 8.0, 6.0, 15.0, 17.0, 21.0, 18.0, 55.0, 62.0, 110.0, 208.0, 378.0, 621.0, 1238.0, 2439.0, 5633.0, 14450.0, 48726.0, 295348.0, 3568143.0, 195194.0, 38937.0, 12427.0, 5016.0, 2356.0, 1126.0, 619.0, 405.0, 229.0, 152.0, 94.0, 62.0, 49.0, 28.0, 19.0, 24.0, 16.0, 14.0, 4.0, 6.0, 2.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-92.1875, -89.15625, -86.125, -83.09375, -80.0625, -77.03125, -74.0, -70.96875, -67.9375, -64.90625, -61.875, -58.84375, -55.8125, -52.78125, -49.75, -46.71875, -43.6875, -40.65625, -37.625, -34.59375, -31.5625, -28.53125, -25.5, -22.46875, -19.4375, -16.40625, -13.375, -10.34375, -7.3125, -4.28125, -1.25, 1.78125, 4.8125, 7.84375, 10.875, 13.90625, 16.9375, 19.96875, 23.0, 26.03125, 29.0625, 32.09375, 35.125, 38.15625, 41.1875, 44.21875, 47.25, 50.28125, 53.3125, 56.34375, 59.375, 62.40625, 65.4375, 68.46875, 71.5, 74.53125, 77.5625, 80.59375, 83.625, 86.65625, 89.6875, 92.71875, 95.75, 98.78125, 101.8125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 8.0, 5.0, 6.0, 6.0, 15.0, 14.0, 19.0, 21.0, 30.0, 48.0, 71.0, 77.0, 86.0, 88.0, 71.0, 94.0, 77.0, 61.0, 50.0, 40.0, 34.0, 20.0, 19.0, 4.0, 10.0, 4.0, 4.0, 6.0, 2.0, 3.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.96875, -5.77081298828125, -5.5728759765625, -5.37493896484375, -5.177001953125, -4.97906494140625, -4.7811279296875, -4.58319091796875, -4.38525390625, -4.18731689453125, -3.9893798828125, -3.79144287109375, -3.593505859375, -3.39556884765625, -3.1976318359375, -2.99969482421875, -2.8017578125, -2.60382080078125, -2.4058837890625, -2.20794677734375, -2.010009765625, -1.81207275390625, -1.6141357421875, -1.41619873046875, -1.21826171875, -1.02032470703125, -0.8223876953125, -0.62445068359375, -0.426513671875, -0.22857666015625, -0.0306396484375, 0.16729736328125, 0.365234375, 0.56317138671875, 0.7611083984375, 0.95904541015625, 1.156982421875, 1.35491943359375, 1.5528564453125, 1.75079345703125, 1.94873046875, 2.14666748046875, 2.3446044921875, 2.54254150390625, 2.740478515625, 2.93841552734375, 3.1363525390625, 3.33428955078125, 3.5322265625, 3.73016357421875, 3.9281005859375, 4.12603759765625, 4.323974609375, 4.52191162109375, 4.7198486328125, 4.91778564453125, 5.11572265625, 5.31365966796875, 5.5115966796875, 5.70953369140625, 5.907470703125, 6.10540771484375, 6.3033447265625, 6.50128173828125, 6.69921875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 8.0, 8.0, 13.0, 15.0, 26.0, 41.0, 40.0, 58.0, 84.0, 123.0, 172.0, 260.0, 379.0, 613.0, 877.0, 1471.0, 2372.0, 4150.0, 7323.0, 13225.0, 26512.0, 55798.0, 131504.0, 384781.0, 2517491.0, 699401.0, 194664.0, 77385.0, 35555.0, 17452.0, 9329.0, 5139.0, 2973.0, 1786.0, 1107.0, 708.0, 427.0, 300.0, 214.0, 136.0, 115.0, 73.0, 50.0, 37.0, 26.0, 16.0, 11.0, 11.0, 8.0, 2.0, 7.0, 3.0, 5.0, 3.0, 2.0, 1.0], "bins": [-52.1875, -50.591796875, -48.99609375, -47.400390625, -45.8046875, -44.208984375, -42.61328125, -41.017578125, -39.421875, -37.826171875, -36.23046875, -34.634765625, -33.0390625, -31.443359375, -29.84765625, -28.251953125, -26.65625, -25.060546875, -23.46484375, -21.869140625, -20.2734375, -18.677734375, -17.08203125, -15.486328125, -13.890625, -12.294921875, -10.69921875, -9.103515625, -7.5078125, -5.912109375, -4.31640625, -2.720703125, -1.125, 0.470703125, 2.06640625, 3.662109375, 5.2578125, 6.853515625, 8.44921875, 10.044921875, 11.640625, 13.236328125, 14.83203125, 16.427734375, 18.0234375, 19.619140625, 21.21484375, 22.810546875, 24.40625, 26.001953125, 27.59765625, 29.193359375, 30.7890625, 32.384765625, 33.98046875, 35.576171875, 37.171875, 38.767578125, 40.36328125, 41.958984375, 43.5546875, 45.150390625, 46.74609375, 48.341796875, 49.9375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 7.0, 7.0, 8.0, 11.0, 9.0, 22.0, 23.0, 24.0, 29.0, 49.0, 61.0, 84.0, 82.0, 133.0, 182.0, 289.0, 551.0, 1281.0, 407.0, 216.0, 161.0, 106.0, 70.0, 66.0, 40.0, 33.0, 25.0, 19.0, 10.0, 10.0, 13.0, 8.0, 5.0, 6.0, 5.0, 2.0, 3.0, 6.0, 4.0, 1.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.484375, -9.1490478515625, -8.813720703125, -8.4783935546875, -8.14306640625, -7.8077392578125, -7.472412109375, -7.1370849609375, -6.8017578125, -6.4664306640625, -6.131103515625, -5.7957763671875, -5.46044921875, -5.1251220703125, -4.789794921875, -4.4544677734375, -4.119140625, -3.7838134765625, -3.448486328125, -3.1131591796875, -2.77783203125, -2.4425048828125, -2.107177734375, -1.7718505859375, -1.4365234375, -1.1011962890625, -0.765869140625, -0.4305419921875, -0.09521484375, 0.2401123046875, 0.575439453125, 0.9107666015625, 1.24609375, 1.5814208984375, 1.916748046875, 2.2520751953125, 2.58740234375, 2.9227294921875, 3.258056640625, 3.5933837890625, 3.9287109375, 4.2640380859375, 4.599365234375, 4.9346923828125, 5.27001953125, 5.6053466796875, 5.940673828125, 6.2760009765625, 6.611328125, 6.9466552734375, 7.281982421875, 7.6173095703125, 7.95263671875, 8.2879638671875, 8.623291015625, 8.9586181640625, 9.2939453125, 9.6292724609375, 9.964599609375, 10.2999267578125, 10.63525390625, 10.9705810546875, 11.305908203125, 11.6412353515625, 11.9765625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 16.0, 9.0, 21.0, 45.0, 70.0, 117.0, 183.0, 184.0, 135.0, 104.0, 52.0, 36.0, 17.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.76976013183594, -143.60548400878906, -139.44122314453125, -135.27694702148438, -131.11268615722656, -126.94841766357422, -122.78414916992188, -118.619873046875, -114.45561218261719, -110.29134368896484, -106.1270751953125, -101.96280670166016, -97.79853820800781, -93.63426971435547, -89.47000122070312, -85.30572509765625, -81.1414566040039, -76.97718811035156, -72.81291961669922, -68.64865112304688, -64.48438262939453, -60.32011413574219, -56.15584182739258, -51.991573333740234, -47.82730484008789, -43.66303634643555, -39.4987678527832, -35.334495544433594, -31.170228958129883, -27.00596046447754, -22.841690063476562, -18.67742156982422, -14.513153076171875, -10.348884582519531, -6.184615135192871, -2.020345687866211, 2.143922805786133, 6.308191299438477, 10.472461700439453, 14.636730194091797, 18.80099868774414, 22.965267181396484, 27.129535675048828, 31.293806076049805, 35.45807647705078, 39.622344970703125, 43.78661346435547, 47.95088195800781, 52.115150451660156, 56.2794189453125, 60.443687438964844, 64.60795593261719, 68.77222442626953, 72.93649291992188, 77.10076904296875, 81.26502990722656, 85.42930603027344, 89.59357452392578, 93.75784301757812, 97.92211151123047, 102.08638000488281, 106.25064849853516, 110.4149169921875, 114.57919311523438, 118.74345397949219]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 11.0, 17.0, 16.0, 17.0, 26.0, 31.0, 34.0, 47.0, 49.0, 67.0, 54.0, 77.0, 74.0, 78.0, 78.0, 59.0, 45.0, 46.0, 41.0, 28.0, 28.0, 15.0, 17.0, 8.0, 6.0, 7.0, 5.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.56741333007812, -62.397796630859375, -60.228179931640625, -58.05856704711914, -55.88895034790039, -53.71933364868164, -51.549720764160156, -49.380104064941406, -47.210487365722656, -45.040870666503906, -42.871253967285156, -40.70164108276367, -38.53202438354492, -36.36240768432617, -34.19279479980469, -32.02317810058594, -29.853561401367188, -27.683944702148438, -25.51432991027832, -23.344715118408203, -21.175098419189453, -19.005481719970703, -16.835866928100586, -14.666251182556152, -12.496635437011719, -10.327019691467285, -8.157403945922852, -5.987788200378418, -3.8181724548339844, -1.6485567092895508, 0.5210590362548828, 2.6906747817993164, 4.86029052734375, 7.029906272888184, 9.199522018432617, 11.36913776397705, 13.538753509521484, 15.708369255065918, 17.87798500061035, 20.04759979248047, 22.21721649169922, 24.38683319091797, 26.556447982788086, 28.726062774658203, 30.895679473876953, 33.0652961730957, 35.23490905761719, 37.40452575683594, 39.57414245605469, 41.74375915527344, 43.91337585449219, 46.08298873901367, 48.25260543823242, 50.42222213745117, 52.591835021972656, 54.761451721191406, 56.931068420410156, 59.100685119628906, 61.270301818847656, 63.43991470336914, 65.60952758789062, 67.77914428710938, 69.94876098632812, 72.11837768554688, 74.28799438476562]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 11.0, 9.0, 13.0, 18.0, 26.0, 30.0, 38.0, 65.0, 112.0, 129.0, 210.0, 337.0, 510.0, 737.0, 1320.0, 2262.0, 4081.0, 7763.0, 15312.0, 34157.0, 88838.0, 294557.0, 389424.0, 123975.0, 44444.0, 19061.0, 9352.0, 4948.0, 2720.0, 1541.0, 882.0, 585.0, 337.0, 238.0, 160.0, 106.0, 78.0, 42.0, 31.0, 27.0, 16.0, 17.0, 13.0, 9.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-46.25, -44.93408203125, -43.6181640625, -42.30224609375, -40.986328125, -39.67041015625, -38.3544921875, -37.03857421875, -35.72265625, -34.40673828125, -33.0908203125, -31.77490234375, -30.458984375, -29.14306640625, -27.8271484375, -26.51123046875, -25.1953125, -23.87939453125, -22.5634765625, -21.24755859375, -19.931640625, -18.61572265625, -17.2998046875, -15.98388671875, -14.66796875, -13.35205078125, -12.0361328125, -10.72021484375, -9.404296875, -8.08837890625, -6.7724609375, -5.45654296875, -4.140625, -2.82470703125, -1.5087890625, -0.19287109375, 1.123046875, 2.43896484375, 3.7548828125, 5.07080078125, 6.38671875, 7.70263671875, 9.0185546875, 10.33447265625, 11.650390625, 12.96630859375, 14.2822265625, 15.59814453125, 16.9140625, 18.22998046875, 19.5458984375, 20.86181640625, 22.177734375, 23.49365234375, 24.8095703125, 26.12548828125, 27.44140625, 28.75732421875, 30.0732421875, 31.38916015625, 32.705078125, 34.02099609375, 35.3369140625, 36.65283203125, 37.96875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 5.0, 3.0, 3.0, 4.0, 4.0, 6.0, 10.0, 8.0, 12.0, 16.0, 13.0, 21.0, 28.0, 32.0, 31.0, 34.0, 39.0, 58.0, 53.0, 53.0, 51.0, 62.0, 46.0, 53.0, 52.0, 48.0, 46.0, 43.0, 24.0, 26.0, 13.0, 15.0, 18.0, 22.0, 10.0, 8.0, 8.0, 5.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3203125, -3.18487548828125, -3.0494384765625, -2.91400146484375, -2.778564453125, -2.64312744140625, -2.5076904296875, -2.37225341796875, -2.23681640625, -2.10137939453125, -1.9659423828125, -1.83050537109375, -1.695068359375, -1.55963134765625, -1.4241943359375, -1.28875732421875, -1.1533203125, -1.01788330078125, -0.8824462890625, -0.74700927734375, -0.611572265625, -0.47613525390625, -0.3406982421875, -0.20526123046875, -0.06982421875, 0.06561279296875, 0.2010498046875, 0.33648681640625, 0.471923828125, 0.60736083984375, 0.7427978515625, 0.87823486328125, 1.013671875, 1.14910888671875, 1.2845458984375, 1.41998291015625, 1.555419921875, 1.69085693359375, 1.8262939453125, 1.96173095703125, 2.09716796875, 2.23260498046875, 2.3680419921875, 2.50347900390625, 2.638916015625, 2.77435302734375, 2.9097900390625, 3.04522705078125, 3.1806640625, 3.31610107421875, 3.4515380859375, 3.58697509765625, 3.722412109375, 3.85784912109375, 3.9932861328125, 4.12872314453125, 4.26416015625, 4.39959716796875, 4.5350341796875, 4.67047119140625, 4.805908203125, 4.94134521484375, 5.0767822265625, 5.21221923828125, 5.34765625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 7.0, 11.0, 15.0, 13.0, 12.0, 34.0, 64.0, 95.0, 169.0, 252.0, 422.0, 702.0, 1296.0, 2318.0, 4736.0, 10787.0, 30130.0, 119837.0, 538181.0, 257745.0, 51965.0, 16193.0, 6687.0, 3114.0, 1611.0, 893.0, 447.0, 301.0, 191.0, 110.0, 75.0, 49.0, 36.0, 30.0, 11.0, 8.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.09375, -55.5390625, -53.984375, -52.4296875, -50.875, -49.3203125, -47.765625, -46.2109375, -44.65625, -43.1015625, -41.546875, -39.9921875, -38.4375, -36.8828125, -35.328125, -33.7734375, -32.21875, -30.6640625, -29.109375, -27.5546875, -26.0, -24.4453125, -22.890625, -21.3359375, -19.78125, -18.2265625, -16.671875, -15.1171875, -13.5625, -12.0078125, -10.453125, -8.8984375, -7.34375, -5.7890625, -4.234375, -2.6796875, -1.125, 0.4296875, 1.984375, 3.5390625, 5.09375, 6.6484375, 8.203125, 9.7578125, 11.3125, 12.8671875, 14.421875, 15.9765625, 17.53125, 19.0859375, 20.640625, 22.1953125, 23.75, 25.3046875, 26.859375, 28.4140625, 29.96875, 31.5234375, 33.078125, 34.6328125, 36.1875, 37.7421875, 39.296875, 40.8515625, 42.40625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 2.0, 4.0, 6.0, 6.0, 10.0, 4.0, 13.0, 10.0, 25.0, 25.0, 28.0, 29.0, 38.0, 45.0, 45.0, 47.0, 55.0, 67.0, 67.0, 45.0, 52.0, 56.0, 49.0, 54.0, 37.0, 37.0, 24.0, 23.0, 24.0, 18.0, 9.0, 14.0, 5.0, 4.0, 2.0, 4.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-27.546875, -26.780517578125, -26.01416015625, -25.247802734375, -24.4814453125, -23.715087890625, -22.94873046875, -22.182373046875, -21.416015625, -20.649658203125, -19.88330078125, -19.116943359375, -18.3505859375, -17.584228515625, -16.81787109375, -16.051513671875, -15.28515625, -14.518798828125, -13.75244140625, -12.986083984375, -12.2197265625, -11.453369140625, -10.68701171875, -9.920654296875, -9.154296875, -8.387939453125, -7.62158203125, -6.855224609375, -6.0888671875, -5.322509765625, -4.55615234375, -3.789794921875, -3.0234375, -2.257080078125, -1.49072265625, -0.724365234375, 0.0419921875, 0.808349609375, 1.57470703125, 2.341064453125, 3.107421875, 3.873779296875, 4.64013671875, 5.406494140625, 6.1728515625, 6.939208984375, 7.70556640625, 8.471923828125, 9.23828125, 10.004638671875, 10.77099609375, 11.537353515625, 12.3037109375, 13.070068359375, 13.83642578125, 14.602783203125, 15.369140625, 16.135498046875, 16.90185546875, 17.668212890625, 18.4345703125, 19.200927734375, 19.96728515625, 20.733642578125, 21.5]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 10.0, 12.0, 16.0, 30.0, 39.0, 51.0, 86.0, 143.0, 234.0, 347.0, 689.0, 1214.0, 2421.0, 5014.0, 11318.0, 27354.0, 73868.0, 205429.0, 368866.0, 219371.0, 79557.0, 29517.0, 11961.0, 5357.0, 2623.0, 1280.0, 675.0, 403.0, 226.0, 136.0, 85.0, 86.0, 37.0, 26.0, 22.0, 15.0, 6.0, 9.0, 9.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-28.71875, -27.88720703125, -27.0556640625, -26.22412109375, -25.392578125, -24.56103515625, -23.7294921875, -22.89794921875, -22.06640625, -21.23486328125, -20.4033203125, -19.57177734375, -18.740234375, -17.90869140625, -17.0771484375, -16.24560546875, -15.4140625, -14.58251953125, -13.7509765625, -12.91943359375, -12.087890625, -11.25634765625, -10.4248046875, -9.59326171875, -8.76171875, -7.93017578125, -7.0986328125, -6.26708984375, -5.435546875, -4.60400390625, -3.7724609375, -2.94091796875, -2.109375, -1.27783203125, -0.4462890625, 0.38525390625, 1.216796875, 2.04833984375, 2.8798828125, 3.71142578125, 4.54296875, 5.37451171875, 6.2060546875, 7.03759765625, 7.869140625, 8.70068359375, 9.5322265625, 10.36376953125, 11.1953125, 12.02685546875, 12.8583984375, 13.68994140625, 14.521484375, 15.35302734375, 16.1845703125, 17.01611328125, 17.84765625, 18.67919921875, 19.5107421875, 20.34228515625, 21.173828125, 22.00537109375, 22.8369140625, 23.66845703125, 24.5]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 6.0, 0.0, 5.0, 4.0, 4.0, 5.0, 9.0, 18.0, 27.0, 62.0, 94.0, 139.0, 167.0, 197.0, 101.0, 75.0, 31.0, 11.0, 8.0, 6.0, 3.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0028076171875, -0.0027156472206115723, -0.0026236772537231445, -0.002531707286834717, -0.002439737319946289, -0.0023477673530578613, -0.0022557973861694336, -0.002163827419281006, -0.002071857452392578, -0.0019798874855041504, -0.0018879175186157227, -0.001795947551727295, -0.0017039775848388672, -0.0016120076179504395, -0.0015200376510620117, -0.001428067684173584, -0.0013360977172851562, -0.0012441277503967285, -0.0011521577835083008, -0.001060187816619873, -0.0009682178497314453, -0.0008762478828430176, -0.0007842779159545898, -0.0006923079490661621, -0.0006003379821777344, -0.0005083680152893066, -0.0004163980484008789, -0.00032442808151245117, -0.00023245811462402344, -0.0001404881477355957, -4.851818084716797e-05, 4.3451786041259766e-05, 0.0001354217529296875, 0.00022739171981811523, 0.00031936168670654297, 0.0004113316535949707, 0.0005033016204833984, 0.0005952715873718262, 0.0006872415542602539, 0.0007792115211486816, 0.0008711814880371094, 0.0009631514549255371, 0.0010551214218139648, 0.0011470913887023926, 0.0012390613555908203, 0.001331031322479248, 0.0014230012893676758, 0.0015149712562561035, 0.0016069412231445312, 0.001698911190032959, 0.0017908811569213867, 0.0018828511238098145, 0.001974821090698242, 0.00206679105758667, 0.0021587610244750977, 0.0022507309913635254, 0.002342700958251953, 0.002434670925140381, 0.0025266408920288086, 0.0026186108589172363, 0.002710580825805664, 0.002802550792694092, 0.0028945207595825195, 0.0029864907264709473, 0.003078460693359375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 7.0, 3.0, 6.0, 5.0, 11.0, 20.0, 29.0, 62.0, 132.0, 215.0, 475.0, 1170.0, 2880.0, 7611.0, 25205.0, 99677.0, 385549.0, 387426.0, 100677.0, 24881.0, 7545.0, 2783.0, 1108.0, 500.0, 276.0, 129.0, 78.0, 36.0, 19.0, 14.0, 7.0, 6.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-49.125, -47.865478515625, -46.60595703125, -45.346435546875, -44.0869140625, -42.827392578125, -41.56787109375, -40.308349609375, -39.048828125, -37.789306640625, -36.52978515625, -35.270263671875, -34.0107421875, -32.751220703125, -31.49169921875, -30.232177734375, -28.97265625, -27.713134765625, -26.45361328125, -25.194091796875, -23.9345703125, -22.675048828125, -21.41552734375, -20.156005859375, -18.896484375, -17.636962890625, -16.37744140625, -15.117919921875, -13.8583984375, -12.598876953125, -11.33935546875, -10.079833984375, -8.8203125, -7.560791015625, -6.30126953125, -5.041748046875, -3.7822265625, -2.522705078125, -1.26318359375, -0.003662109375, 1.255859375, 2.515380859375, 3.77490234375, 5.034423828125, 6.2939453125, 7.553466796875, 8.81298828125, 10.072509765625, 11.33203125, 12.591552734375, 13.85107421875, 15.110595703125, 16.3701171875, 17.629638671875, 18.88916015625, 20.148681640625, 21.408203125, 22.667724609375, 23.92724609375, 25.186767578125, 26.4462890625, 27.705810546875, 28.96533203125, 30.224853515625, 31.484375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 1.0, 4.0, 3.0, 6.0, 10.0, 7.0, 7.0, 17.0, 14.0, 17.0, 29.0, 25.0, 33.0, 48.0, 64.0, 63.0, 61.0, 63.0, 62.0, 84.0, 69.0, 59.0, 60.0, 35.0, 39.0, 25.0, 29.0, 21.0, 9.0, 4.0, 9.0, 13.0, 6.0, 6.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.65625, -11.177978515625, -10.69970703125, -10.221435546875, -9.7431640625, -9.264892578125, -8.78662109375, -8.308349609375, -7.830078125, -7.351806640625, -6.87353515625, -6.395263671875, -5.9169921875, -5.438720703125, -4.96044921875, -4.482177734375, -4.00390625, -3.525634765625, -3.04736328125, -2.569091796875, -2.0908203125, -1.612548828125, -1.13427734375, -0.656005859375, -0.177734375, 0.300537109375, 0.77880859375, 1.257080078125, 1.7353515625, 2.213623046875, 2.69189453125, 3.170166015625, 3.6484375, 4.126708984375, 4.60498046875, 5.083251953125, 5.5615234375, 6.039794921875, 6.51806640625, 6.996337890625, 7.474609375, 7.952880859375, 8.43115234375, 8.909423828125, 9.3876953125, 9.865966796875, 10.34423828125, 10.822509765625, 11.30078125, 11.779052734375, 12.25732421875, 12.735595703125, 13.2138671875, 13.692138671875, 14.17041015625, 14.648681640625, 15.126953125, 15.605224609375, 16.08349609375, 16.561767578125, 17.0400390625, 17.518310546875, 17.99658203125, 18.474853515625, 18.953125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 11.0, 7.0, 12.0, 18.0, 31.0, 77.0, 118.0, 150.0, 165.0, 146.0, 103.0, 71.0, 50.0, 21.0, 9.0, 8.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-177.26101684570312, -167.6498260498047, -158.03863525390625, -148.42745971679688, -138.81626892089844, -129.205078125, -119.59388732910156, -109.98270416259766, -100.37151336669922, -90.76032257080078, -81.14913940429688, -71.53794860839844, -61.926761627197266, -52.315574645996094, -42.704383850097656, -33.09320068359375, -23.482009887695312, -13.870821952819824, -4.259634017944336, 5.351554870605469, 14.96274185180664, 24.573928833007812, 34.18511962890625, 43.796302795410156, 53.407493591308594, 63.018680572509766, 72.62986755371094, 82.24105834960938, 91.85224914550781, 101.46343231201172, 111.07462310791016, 120.68580627441406, 130.2969970703125, 139.90818786621094, 149.51937866210938, 159.13055419921875, 168.7417449951172, 178.35293579101562, 187.96412658691406, 197.5753173828125, 207.18649291992188, 216.7976837158203, 226.40887451171875, 236.02005004882812, 245.63124084472656, 255.242431640625, 264.8536376953125, 274.4648132324219, 284.07598876953125, 293.6871643066406, 303.2983703613281, 312.9095458984375, 322.520751953125, 332.1319274902344, 341.74310302734375, 351.35430908203125, 360.96551513671875, 370.5766906738281, 380.1878967285156, 389.799072265625, 399.4102783203125, 409.0214538574219, 418.63262939453125, 428.24383544921875, 437.8550109863281]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 10.0, 3.0, 9.0, 9.0, 12.0, 11.0, 17.0, 21.0, 29.0, 35.0, 35.0, 51.0, 53.0, 58.0, 70.0, 52.0, 60.0, 52.0, 64.0, 45.0, 46.0, 45.0, 38.0, 35.0, 33.0, 23.0, 19.0, 14.0, 9.0, 10.0, 11.0, 6.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-159.87094116210938, -154.9088897705078, -149.94683837890625, -144.98477172851562, -140.02272033691406, -135.0606689453125, -130.09861755371094, -125.13656616210938, -120.17450714111328, -115.21245574951172, -110.25039672851562, -105.28834533691406, -100.3262939453125, -95.3642349243164, -90.40218353271484, -85.44012451171875, -80.47807312011719, -75.51602172851562, -70.55396270751953, -65.59191131591797, -60.62985610961914, -55.66780090332031, -50.70574951171875, -45.74369430541992, -40.781639099121094, -35.819583892822266, -30.85753059387207, -25.895477294921875, -20.933422088623047, -15.971366882324219, -11.009313583374023, -6.047260284423828, -1.085205078125, 3.8768491744995117, 8.838903427124023, 13.800957679748535, 18.763011932373047, 23.725067138671875, 28.68712043762207, 33.649173736572266, 38.611228942871094, 43.57328414916992, 48.53533935546875, 53.49739074707031, 58.45944595336914, 63.42150115966797, 68.38355255126953, 73.34561157226562, 78.30766296386719, 83.26971435546875, 88.23177337646484, 93.1938247680664, 98.1558837890625, 103.11793518066406, 108.07998657226562, 113.04203796386719, 118.00409698486328, 122.96614837646484, 127.92820739746094, 132.8902587890625, 137.85231018066406, 142.81436157226562, 147.77642822265625, 152.7384796142578, 157.70053100585938]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 4.0, 10.0, 20.0, 36.0, 47.0, 77.0, 123.0, 199.0, 352.0, 581.0, 1109.0, 2012.0, 3887.0, 8059.0, 18143.0, 47206.0, 182247.0, 3342556.0, 456421.0, 79857.0, 27346.0, 11726.0, 5552.0, 2849.0, 1561.0, 855.0, 497.0, 329.0, 198.0, 102.0, 96.0, 65.0, 38.0, 33.0, 20.0, 13.0, 15.0, 5.0, 4.0, 6.0, 8.0, 8.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-90.8125, -87.2822265625, -83.751953125, -80.2216796875, -76.69140625, -73.1611328125, -69.630859375, -66.1005859375, -62.5703125, -59.0400390625, -55.509765625, -51.9794921875, -48.44921875, -44.9189453125, -41.388671875, -37.8583984375, -34.328125, -30.7978515625, -27.267578125, -23.7373046875, -20.20703125, -16.6767578125, -13.146484375, -9.6162109375, -6.0859375, -2.5556640625, 0.974609375, 4.5048828125, 8.03515625, 11.5654296875, 15.095703125, 18.6259765625, 22.15625, 25.6865234375, 29.216796875, 32.7470703125, 36.27734375, 39.8076171875, 43.337890625, 46.8681640625, 50.3984375, 53.9287109375, 57.458984375, 60.9892578125, 64.51953125, 68.0498046875, 71.580078125, 75.1103515625, 78.640625, 82.1708984375, 85.701171875, 89.2314453125, 92.76171875, 96.2919921875, 99.822265625, 103.3525390625, 106.8828125, 110.4130859375, 113.943359375, 117.4736328125, 121.00390625, 124.5341796875, 128.064453125, 131.5947265625, 135.125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 6.0, 8.0, 14.0, 15.0, 20.0, 25.0, 33.0, 50.0, 48.0, 53.0, 61.0, 66.0, 72.0, 61.0, 83.0, 57.0, 60.0, 64.0, 48.0, 25.0, 21.0, 30.0, 18.0, 14.0, 15.0, 7.0, 10.0, 6.0, 5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.54296875, -4.35711669921875, -4.1712646484375, -3.98541259765625, -3.799560546875, -3.61370849609375, -3.4278564453125, -3.24200439453125, -3.05615234375, -2.87030029296875, -2.6844482421875, -2.49859619140625, -2.312744140625, -2.12689208984375, -1.9410400390625, -1.75518798828125, -1.5693359375, -1.38348388671875, -1.1976318359375, -1.01177978515625, -0.825927734375, -0.64007568359375, -0.4542236328125, -0.26837158203125, -0.08251953125, 0.10333251953125, 0.2891845703125, 0.47503662109375, 0.660888671875, 0.84674072265625, 1.0325927734375, 1.21844482421875, 1.404296875, 1.59014892578125, 1.7760009765625, 1.96185302734375, 2.147705078125, 2.33355712890625, 2.5194091796875, 2.70526123046875, 2.89111328125, 3.07696533203125, 3.2628173828125, 3.44866943359375, 3.634521484375, 3.82037353515625, 4.0062255859375, 4.19207763671875, 4.3779296875, 4.56378173828125, 4.7496337890625, 4.93548583984375, 5.121337890625, 5.30718994140625, 5.4930419921875, 5.67889404296875, 5.86474609375, 6.05059814453125, 6.2364501953125, 6.42230224609375, 6.608154296875, 6.79400634765625, 6.9798583984375, 7.16571044921875, 7.3515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 4.0, 4.0, 3.0, 9.0, 5.0, 14.0, 15.0, 21.0, 23.0, 29.0, 42.0, 62.0, 96.0, 194.0, 368.0, 907.0, 2926.0, 13667.0, 107921.0, 3468250.0, 550047.0, 40180.0, 6636.0, 1637.0, 536.0, 242.0, 117.0, 95.0, 61.0, 39.0, 21.0, 18.0, 16.0, 19.0, 5.0, 10.0, 6.0, 7.0, 4.0, 2.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-210.625, -203.306640625, -195.98828125, -188.669921875, -181.3515625, -174.033203125, -166.71484375, -159.396484375, -152.078125, -144.759765625, -137.44140625, -130.123046875, -122.8046875, -115.486328125, -108.16796875, -100.849609375, -93.53125, -86.212890625, -78.89453125, -71.576171875, -64.2578125, -56.939453125, -49.62109375, -42.302734375, -34.984375, -27.666015625, -20.34765625, -13.029296875, -5.7109375, 1.607421875, 8.92578125, 16.244140625, 23.5625, 30.880859375, 38.19921875, 45.517578125, 52.8359375, 60.154296875, 67.47265625, 74.791015625, 82.109375, 89.427734375, 96.74609375, 104.064453125, 111.3828125, 118.701171875, 126.01953125, 133.337890625, 140.65625, 147.974609375, 155.29296875, 162.611328125, 169.9296875, 177.248046875, 184.56640625, 191.884765625, 199.203125, 206.521484375, 213.83984375, 221.158203125, 228.4765625, 235.794921875, 243.11328125, 250.431640625, 257.75]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 1.0, 3.0, 3.0, 4.0, 8.0, 8.0, 6.0, 7.0, 6.0, 15.0, 23.0, 23.0, 33.0, 50.0, 51.0, 78.0, 94.0, 143.0, 237.0, 398.0, 1306.0, 596.0, 296.0, 187.0, 116.0, 95.0, 65.0, 51.0, 38.0, 27.0, 20.0, 16.0, 10.0, 13.0, 8.0, 12.0, 8.0, 4.0, 6.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.59375, -17.1153564453125, -16.636962890625, -16.1585693359375, -15.68017578125, -15.2017822265625, -14.723388671875, -14.2449951171875, -13.7666015625, -13.2882080078125, -12.809814453125, -12.3314208984375, -11.85302734375, -11.3746337890625, -10.896240234375, -10.4178466796875, -9.939453125, -9.4610595703125, -8.982666015625, -8.5042724609375, -8.02587890625, -7.5474853515625, -7.069091796875, -6.5906982421875, -6.1123046875, -5.6339111328125, -5.155517578125, -4.6771240234375, -4.19873046875, -3.7203369140625, -3.241943359375, -2.7635498046875, -2.28515625, -1.8067626953125, -1.328369140625, -0.8499755859375, -0.37158203125, 0.1068115234375, 0.585205078125, 1.0635986328125, 1.5419921875, 2.0203857421875, 2.498779296875, 2.9771728515625, 3.45556640625, 3.9339599609375, 4.412353515625, 4.8907470703125, 5.369140625, 5.8475341796875, 6.325927734375, 6.8043212890625, 7.28271484375, 7.7611083984375, 8.239501953125, 8.7178955078125, 9.1962890625, 9.6746826171875, 10.153076171875, 10.6314697265625, 11.10986328125, 11.5882568359375, 12.066650390625, 12.5450439453125, 13.0234375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 5.0, 9.0, 10.0, 20.0, 38.0, 52.0, 76.0, 101.0, 115.0, 146.0, 102.0, 112.0, 61.0, 55.0, 38.0, 26.0, 14.0, 8.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-200.0250701904297, -195.2325897216797, -190.4401092529297, -185.64764404296875, -180.85516357421875, -176.06268310546875, -171.27020263671875, -166.47772216796875, -161.6852569580078, -156.8927764892578, -152.1002960205078, -147.30783081054688, -142.51535034179688, -137.72286987304688, -132.93038940429688, -128.13790893554688, -123.3454360961914, -118.5529556274414, -113.76048278808594, -108.96800231933594, -104.17552947998047, -99.38304901123047, -94.590576171875, -89.798095703125, -85.005615234375, -80.213134765625, -75.42066192626953, -70.62818145751953, -65.83570861816406, -61.04322814941406, -56.25075149536133, -51.458274841308594, -46.665809631347656, -41.87333297729492, -37.08085632324219, -32.28837585449219, -27.495901107788086, -22.70342445373535, -17.910945892333984, -13.11846923828125, -8.325992584228516, -3.533515453338623, 1.2589616775512695, 6.05143928527832, 10.843915939331055, 15.636392593383789, 20.428871154785156, 25.22134780883789, 30.013824462890625, 34.80630111694336, 39.598777770996094, 44.391258239746094, 49.18373107910156, 53.97621154785156, 58.7686882019043, 63.56116485595703, 68.3536376953125, 73.1461181640625, 77.93859100341797, 82.73107147216797, 87.52354431152344, 92.31602478027344, 97.10850524902344, 101.9009780883789, 106.6934585571289]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 7.0, 3.0, 4.0, 5.0, 3.0, 4.0, 9.0, 17.0, 15.0, 15.0, 12.0, 19.0, 35.0, 25.0, 36.0, 31.0, 34.0, 36.0, 43.0, 47.0, 52.0, 38.0, 37.0, 51.0, 42.0, 39.0, 50.0, 44.0, 35.0, 29.0, 30.0, 38.0, 22.0, 17.0, 8.0, 9.0, 11.0, 10.0, 9.0, 14.0, 7.0, 7.0, 3.0, 8.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-70.94207000732422, -68.9043960571289, -66.8667221069336, -64.82904052734375, -62.79136657714844, -60.753692626953125, -58.71601867675781, -56.678340911865234, -54.640663146972656, -52.602989196777344, -50.565311431884766, -48.52763748168945, -46.489959716796875, -44.45228576660156, -42.41461181640625, -40.37693405151367, -38.33926010131836, -36.30158615112305, -34.26390838623047, -32.226234436035156, -30.188556671142578, -28.150882720947266, -26.11320686340332, -24.075531005859375, -22.03785514831543, -20.000179290771484, -17.96250343322754, -15.92482852935791, -13.887152671813965, -11.84947681427002, -9.81180191040039, -7.774126052856445, -5.7364501953125, -3.698774576187134, -1.6610989570617676, 0.37657642364501953, 2.414252281188965, 4.45192813873291, 6.489603042602539, 8.527278900146484, 10.56495475769043, 12.602630615234375, 14.64030647277832, 16.677982330322266, 18.715656280517578, 20.753334045410156, 22.79100799560547, 24.828683853149414, 26.86635971069336, 28.904035568237305, 30.94171142578125, 32.97938537597656, 35.01706314086914, 37.05473709106445, 39.09241485595703, 41.130088806152344, 43.167762756347656, 45.20543670654297, 47.24311447143555, 49.28078842163086, 51.31846618652344, 53.35614013671875, 55.39381408691406, 57.43149185180664, 59.46916961669922]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 10.0, 8.0, 8.0, 7.0, 14.0, 21.0, 37.0, 60.0, 73.0, 121.0, 125.0, 242.0, 326.0, 507.0, 749.0, 1133.0, 1744.0, 2723.0, 4102.0, 6512.0, 10437.0, 16182.0, 26064.0, 41075.0, 64266.0, 97296.0, 137524.0, 165767.0, 151517.0, 111916.0, 75525.0, 48805.0, 30911.0, 19095.0, 12086.0, 7444.0, 4882.0, 3132.0, 1997.0, 1361.0, 873.0, 572.0, 446.0, 265.0, 178.0, 138.0, 89.0, 85.0, 36.0, 21.0, 19.0, 11.0, 7.0, 8.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-30.765625, -29.762939453125, -28.76025390625, -27.757568359375, -26.7548828125, -25.752197265625, -24.74951171875, -23.746826171875, -22.744140625, -21.741455078125, -20.73876953125, -19.736083984375, -18.7333984375, -17.730712890625, -16.72802734375, -15.725341796875, -14.72265625, -13.719970703125, -12.71728515625, -11.714599609375, -10.7119140625, -9.709228515625, -8.70654296875, -7.703857421875, -6.701171875, -5.698486328125, -4.69580078125, -3.693115234375, -2.6904296875, -1.687744140625, -0.68505859375, 0.317626953125, 1.3203125, 2.322998046875, 3.32568359375, 4.328369140625, 5.3310546875, 6.333740234375, 7.33642578125, 8.339111328125, 9.341796875, 10.344482421875, 11.34716796875, 12.349853515625, 13.3525390625, 14.355224609375, 15.35791015625, 16.360595703125, 17.36328125, 18.365966796875, 19.36865234375, 20.371337890625, 21.3740234375, 22.376708984375, 23.37939453125, 24.382080078125, 25.384765625, 26.387451171875, 27.39013671875, 28.392822265625, 29.3955078125, 30.398193359375, 31.40087890625, 32.403564453125, 33.40625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 6.0, 5.0, 2.0, 6.0, 9.0, 14.0, 7.0, 17.0, 12.0, 15.0, 12.0, 24.0, 28.0, 37.0, 36.0, 37.0, 44.0, 47.0, 39.0, 48.0, 53.0, 47.0, 41.0, 43.0, 42.0, 41.0, 56.0, 41.0, 22.0, 21.0, 30.0, 23.0, 18.0, 19.0, 13.0, 10.0, 5.0, 5.0, 12.0, 7.0, 4.0, 2.0, 3.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.30078125, -4.15350341796875, -4.0062255859375, -3.85894775390625, -3.711669921875, -3.56439208984375, -3.4171142578125, -3.26983642578125, -3.12255859375, -2.97528076171875, -2.8280029296875, -2.68072509765625, -2.533447265625, -2.38616943359375, -2.2388916015625, -2.09161376953125, -1.9443359375, -1.79705810546875, -1.6497802734375, -1.50250244140625, -1.355224609375, -1.20794677734375, -1.0606689453125, -0.91339111328125, -0.76611328125, -0.61883544921875, -0.4715576171875, -0.32427978515625, -0.177001953125, -0.02972412109375, 0.1175537109375, 0.26483154296875, 0.412109375, 0.55938720703125, 0.7066650390625, 0.85394287109375, 1.001220703125, 1.14849853515625, 1.2957763671875, 1.44305419921875, 1.59033203125, 1.73760986328125, 1.8848876953125, 2.03216552734375, 2.179443359375, 2.32672119140625, 2.4739990234375, 2.62127685546875, 2.7685546875, 2.91583251953125, 3.0631103515625, 3.21038818359375, 3.357666015625, 3.50494384765625, 3.6522216796875, 3.79949951171875, 3.94677734375, 4.09405517578125, 4.2413330078125, 4.38861083984375, 4.535888671875, 4.68316650390625, 4.8304443359375, 4.97772216796875, 5.125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 10.0, 16.0, 21.0, 33.0, 37.0, 46.0, 87.0, 116.0, 193.0, 273.0, 409.0, 685.0, 1219.0, 2376.0, 4774.0, 11107.0, 27280.0, 71923.0, 181802.0, 336640.0, 242497.0, 101013.0, 38078.0, 14857.0, 6323.0, 2931.0, 1506.0, 836.0, 498.0, 321.0, 217.0, 161.0, 83.0, 56.0, 48.0, 27.0, 21.0, 13.0, 9.0, 8.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-78.6875, -76.279296875, -73.87109375, -71.462890625, -69.0546875, -66.646484375, -64.23828125, -61.830078125, -59.421875, -57.013671875, -54.60546875, -52.197265625, -49.7890625, -47.380859375, -44.97265625, -42.564453125, -40.15625, -37.748046875, -35.33984375, -32.931640625, -30.5234375, -28.115234375, -25.70703125, -23.298828125, -20.890625, -18.482421875, -16.07421875, -13.666015625, -11.2578125, -8.849609375, -6.44140625, -4.033203125, -1.625, 0.783203125, 3.19140625, 5.599609375, 8.0078125, 10.416015625, 12.82421875, 15.232421875, 17.640625, 20.048828125, 22.45703125, 24.865234375, 27.2734375, 29.681640625, 32.08984375, 34.498046875, 36.90625, 39.314453125, 41.72265625, 44.130859375, 46.5390625, 48.947265625, 51.35546875, 53.763671875, 56.171875, 58.580078125, 60.98828125, 63.396484375, 65.8046875, 68.212890625, 70.62109375, 73.029296875, 75.4375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 5.0, 6.0, 8.0, 7.0, 12.0, 11.0, 11.0, 10.0, 12.0, 25.0, 17.0, 22.0, 22.0, 31.0, 32.0, 35.0, 43.0, 49.0, 34.0, 30.0, 48.0, 53.0, 54.0, 48.0, 44.0, 40.0, 31.0, 38.0, 33.0, 33.0, 23.0, 26.0, 23.0, 18.0, 15.0, 12.0, 6.0, 10.0, 9.0, 6.0, 4.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.21875, -32.14990234375, -31.0810546875, -30.01220703125, -28.943359375, -27.87451171875, -26.8056640625, -25.73681640625, -24.66796875, -23.59912109375, -22.5302734375, -21.46142578125, -20.392578125, -19.32373046875, -18.2548828125, -17.18603515625, -16.1171875, -15.04833984375, -13.9794921875, -12.91064453125, -11.841796875, -10.77294921875, -9.7041015625, -8.63525390625, -7.56640625, -6.49755859375, -5.4287109375, -4.35986328125, -3.291015625, -2.22216796875, -1.1533203125, -0.08447265625, 0.984375, 2.05322265625, 3.1220703125, 4.19091796875, 5.259765625, 6.32861328125, 7.3974609375, 8.46630859375, 9.53515625, 10.60400390625, 11.6728515625, 12.74169921875, 13.810546875, 14.87939453125, 15.9482421875, 17.01708984375, 18.0859375, 19.15478515625, 20.2236328125, 21.29248046875, 22.361328125, 23.43017578125, 24.4990234375, 25.56787109375, 26.63671875, 27.70556640625, 28.7744140625, 29.84326171875, 30.912109375, 31.98095703125, 33.0498046875, 34.11865234375, 35.1875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 7.0, 8.0, 9.0, 18.0, 23.0, 41.0, 64.0, 90.0, 162.0, 306.0, 598.0, 1132.0, 2551.0, 5989.0, 16365.0, 51166.0, 174203.0, 389398.0, 275591.0, 88247.0, 26425.0, 9109.0, 3530.0, 1636.0, 856.0, 429.0, 227.0, 135.0, 84.0, 59.0, 21.0, 24.0, 16.0, 11.0, 13.0, 5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.59375, -51.84912109375, -50.1044921875, -48.35986328125, -46.615234375, -44.87060546875, -43.1259765625, -41.38134765625, -39.63671875, -37.89208984375, -36.1474609375, -34.40283203125, -32.658203125, -30.91357421875, -29.1689453125, -27.42431640625, -25.6796875, -23.93505859375, -22.1904296875, -20.44580078125, -18.701171875, -16.95654296875, -15.2119140625, -13.46728515625, -11.72265625, -9.97802734375, -8.2333984375, -6.48876953125, -4.744140625, -2.99951171875, -1.2548828125, 0.48974609375, 2.234375, 3.97900390625, 5.7236328125, 7.46826171875, 9.212890625, 10.95751953125, 12.7021484375, 14.44677734375, 16.19140625, 17.93603515625, 19.6806640625, 21.42529296875, 23.169921875, 24.91455078125, 26.6591796875, 28.40380859375, 30.1484375, 31.89306640625, 33.6376953125, 35.38232421875, 37.126953125, 38.87158203125, 40.6162109375, 42.36083984375, 44.10546875, 45.85009765625, 47.5947265625, 49.33935546875, 51.083984375, 52.82861328125, 54.5732421875, 56.31787109375, 58.0625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 3.0, 5.0, 7.0, 7.0, 8.0, 13.0, 21.0, 16.0, 38.0, 30.0, 42.0, 55.0, 56.0, 73.0, 94.0, 88.0, 82.0, 72.0, 63.0, 35.0, 34.0, 39.0, 23.0, 18.0, 16.0, 11.0, 8.0, 9.0, 5.0, 5.0, 5.0, 4.0, 4.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.006748199462890625, -0.006529808044433594, -0.0063114166259765625, -0.006093025207519531, -0.0058746337890625, -0.005656242370605469, -0.0054378509521484375, -0.005219459533691406, -0.005001068115234375, -0.004782676696777344, -0.0045642852783203125, -0.004345893859863281, -0.00412750244140625, -0.003909111022949219, -0.0036907196044921875, -0.0034723281860351562, -0.003253936767578125, -0.0030355453491210938, -0.0028171539306640625, -0.0025987625122070312, -0.00238037109375, -0.0021619796752929688, -0.0019435882568359375, -0.0017251968383789062, -0.001506805419921875, -0.0012884140014648438, -0.0010700225830078125, -0.0008516311645507812, -0.00063323974609375, -0.00041484832763671875, -0.0001964569091796875, 2.193450927734375e-05, 0.000240325927734375, 0.00045871734619140625, 0.0006771087646484375, 0.0008955001831054688, 0.0011138916015625, 0.0013322830200195312, 0.0015506744384765625, 0.0017690658569335938, 0.001987457275390625, 0.0022058486938476562, 0.0024242401123046875, 0.0026426315307617188, 0.00286102294921875, 0.0030794143676757812, 0.0032978057861328125, 0.0035161972045898438, 0.003734588623046875, 0.003952980041503906, 0.0041713714599609375, 0.004389762878417969, 0.004608154296875, 0.004826545715332031, 0.0050449371337890625, 0.005263328552246094, 0.005481719970703125, 0.005700111389160156, 0.0059185028076171875, 0.006136894226074219, 0.00635528564453125, 0.006573677062988281, 0.0067920684814453125, 0.007010459899902344, 0.007228851318359375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 5.0, 4.0, 12.0, 2.0, 20.0, 30.0, 38.0, 69.0, 159.0, 272.0, 550.0, 1392.0, 4003.0, 17021.0, 131228.0, 643140.0, 217183.0, 25020.0, 5258.0, 1725.0, 700.0, 338.0, 155.0, 85.0, 45.0, 31.0, 24.0, 14.0, 9.0, 9.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.625, -90.56640625, -87.5078125, -84.44921875, -81.390625, -78.33203125, -75.2734375, -72.21484375, -69.15625, -66.09765625, -63.0390625, -59.98046875, -56.921875, -53.86328125, -50.8046875, -47.74609375, -44.6875, -41.62890625, -38.5703125, -35.51171875, -32.453125, -29.39453125, -26.3359375, -23.27734375, -20.21875, -17.16015625, -14.1015625, -11.04296875, -7.984375, -4.92578125, -1.8671875, 1.19140625, 4.25, 7.30859375, 10.3671875, 13.42578125, 16.484375, 19.54296875, 22.6015625, 25.66015625, 28.71875, 31.77734375, 34.8359375, 37.89453125, 40.953125, 44.01171875, 47.0703125, 50.12890625, 53.1875, 56.24609375, 59.3046875, 62.36328125, 65.421875, 68.48046875, 71.5390625, 74.59765625, 77.65625, 80.71484375, 83.7734375, 86.83203125, 89.890625, 92.94921875, 96.0078125, 99.06640625, 102.125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 1.0, 3.0, 5.0, 11.0, 16.0, 19.0, 36.0, 46.0, 34.0, 68.0, 79.0, 98.0, 131.0, 97.0, 89.0, 76.0, 56.0, 58.0, 21.0, 26.0, 9.0, 6.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.359375, -25.141357421875, -23.92333984375, -22.705322265625, -21.4873046875, -20.269287109375, -19.05126953125, -17.833251953125, -16.615234375, -15.397216796875, -14.17919921875, -12.961181640625, -11.7431640625, -10.525146484375, -9.30712890625, -8.089111328125, -6.87109375, -5.653076171875, -4.43505859375, -3.217041015625, -1.9990234375, -0.781005859375, 0.43701171875, 1.655029296875, 2.873046875, 4.091064453125, 5.30908203125, 6.527099609375, 7.7451171875, 8.963134765625, 10.18115234375, 11.399169921875, 12.6171875, 13.835205078125, 15.05322265625, 16.271240234375, 17.4892578125, 18.707275390625, 19.92529296875, 21.143310546875, 22.361328125, 23.579345703125, 24.79736328125, 26.015380859375, 27.2333984375, 28.451416015625, 29.66943359375, 30.887451171875, 32.10546875, 33.323486328125, 34.54150390625, 35.759521484375, 36.9775390625, 38.195556640625, 39.41357421875, 40.631591796875, 41.849609375, 43.067626953125, 44.28564453125, 45.503662109375, 46.7216796875, 47.939697265625, 49.15771484375, 50.375732421875, 51.59375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 10.0, 17.0, 35.0, 104.0, 213.0, 250.0, 198.0, 100.0, 39.0, 21.0, 6.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-660.50146484375, -626.5277099609375, -592.553955078125, -558.5802001953125, -524.6065063476562, -490.63275146484375, -456.65899658203125, -422.68524169921875, -388.7115173339844, -354.7377624511719, -320.7640380859375, -286.790283203125, -252.81654357910156, -218.84280395507812, -184.86904907226562, -150.8953094482422, -116.92156982421875, -82.94783020019531, -48.974082946777344, -15.000335693359375, 18.973403930664062, 52.9471435546875, 86.9208984375, 120.89463806152344, 154.86837768554688, 188.8421173095703, 222.81585693359375, 256.78961181640625, 290.76336669921875, 324.7370910644531, 358.7108459472656, 392.6845703125, 426.6583251953125, 460.632080078125, 494.6058044433594, 528.57958984375, 562.5532836914062, 596.5270385742188, 630.5007934570312, 664.4745483398438, 698.4482421875, 732.4219970703125, 766.395751953125, 800.3695068359375, 834.3432006835938, 868.3169555664062, 902.2907104492188, 936.2644653320312, 970.2382202148438, 1004.2119750976562, 1038.1856689453125, 1072.159423828125, 1106.1331787109375, 1140.10693359375, 1174.0806884765625, 1208.054443359375, 1242.0281982421875, 1276.001953125, 1309.9757080078125, 1343.949462890625, 1377.9232177734375, 1411.89697265625, 1445.87060546875, 1479.8443603515625, 1513.818115234375]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 2.0, 5.0, 13.0, 7.0, 12.0, 24.0, 15.0, 28.0, 36.0, 50.0, 51.0, 59.0, 70.0, 67.0, 65.0, 79.0, 76.0, 71.0, 44.0, 43.0, 40.0, 31.0, 22.0, 21.0, 23.0, 13.0, 5.0, 11.0, 9.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-326.781982421875, -314.1104431152344, -301.4389343261719, -288.76739501953125, -276.0958557128906, -263.42431640625, -250.7528076171875, -238.08126831054688, -225.4097442626953, -212.73822021484375, -200.06668090820312, -187.39515686035156, -174.7236328125, -162.05209350585938, -149.3805694580078, -136.70904541015625, -124.03750610351562, -111.36597442626953, -98.69444274902344, -86.02291870117188, -73.35138702392578, -60.67985534667969, -48.008331298828125, -35.33679962158203, -22.665267944335938, -9.993738174438477, 2.6777915954589844, 15.349319458007812, 28.020851135253906, 40.6923828125, 53.36390686035156, 66.03543853759766, 78.70697021484375, 91.37850189208984, 104.05003356933594, 116.7215576171875, 129.39309692382812, 142.0646209716797, 154.73614501953125, 167.40768432617188, 180.07920837402344, 192.750732421875, 205.42227172851562, 218.0937957763672, 230.76531982421875, 243.43685913085938, 256.1083984375, 268.7799072265625, 281.4514465332031, 294.12298583984375, 306.79449462890625, 319.4660339355469, 332.1375732421875, 344.80908203125, 357.4806213378906, 370.15216064453125, 382.82366943359375, 395.4952087402344, 408.1667175292969, 420.8382568359375, 433.5097961425781, 446.18133544921875, 458.85284423828125, 471.5243835449219, 484.1959228515625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 9.0, 6.0, 3.0, 2.0, 11.0, 30.0, 31.0, 41.0, 71.0, 123.0, 334.0, 775.0, 2853.0, 15629.0, 195355.0, 3883129.0, 84709.0, 8657.0, 1557.0, 484.0, 188.0, 102.0, 69.0, 42.0, 25.0, 19.0, 10.0, 3.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-403.0, -390.546875, -378.09375, -365.640625, -353.1875, -340.734375, -328.28125, -315.828125, -303.375, -290.921875, -278.46875, -266.015625, -253.5625, -241.109375, -228.65625, -216.203125, -203.75, -191.296875, -178.84375, -166.390625, -153.9375, -141.484375, -129.03125, -116.578125, -104.125, -91.671875, -79.21875, -66.765625, -54.3125, -41.859375, -29.40625, -16.953125, -4.5, 7.953125, 20.40625, 32.859375, 45.3125, 57.765625, 70.21875, 82.671875, 95.125, 107.578125, 120.03125, 132.484375, 144.9375, 157.390625, 169.84375, 182.296875, 194.75, 207.203125, 219.65625, 232.109375, 244.5625, 257.015625, 269.46875, 281.921875, 294.375, 306.828125, 319.28125, 331.734375, 344.1875, 356.640625, 369.09375, 381.546875, 394.0]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 5.0, 2.0, 8.0, 13.0, 25.0, 26.0, 29.0, 26.0, 50.0, 40.0, 53.0, 65.0, 59.0, 77.0, 78.0, 72.0, 84.0, 59.0, 52.0, 26.0, 36.0, 34.0, 24.0, 14.0, 13.0, 2.0, 8.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.703125, -10.36767578125, -10.0322265625, -9.69677734375, -9.361328125, -9.02587890625, -8.6904296875, -8.35498046875, -8.01953125, -7.68408203125, -7.3486328125, -7.01318359375, -6.677734375, -6.34228515625, -6.0068359375, -5.67138671875, -5.3359375, -5.00048828125, -4.6650390625, -4.32958984375, -3.994140625, -3.65869140625, -3.3232421875, -2.98779296875, -2.65234375, -2.31689453125, -1.9814453125, -1.64599609375, -1.310546875, -0.97509765625, -0.6396484375, -0.30419921875, 0.03125, 0.36669921875, 0.7021484375, 1.03759765625, 1.373046875, 1.70849609375, 2.0439453125, 2.37939453125, 2.71484375, 3.05029296875, 3.3857421875, 3.72119140625, 4.056640625, 4.39208984375, 4.7275390625, 5.06298828125, 5.3984375, 5.73388671875, 6.0693359375, 6.40478515625, 6.740234375, 7.07568359375, 7.4111328125, 7.74658203125, 8.08203125, 8.41748046875, 8.7529296875, 9.08837890625, 9.423828125, 9.75927734375, 10.0947265625, 10.43017578125, 10.765625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 4.0, 8.0, 6.0, 16.0, 18.0, 19.0, 29.0, 28.0, 71.0, 108.0, 241.0, 688.0, 2519.0, 11104.0, 66845.0, 844334.0, 3128244.0, 117032.0, 17486.0, 3794.0, 998.0, 334.0, 147.0, 77.0, 45.0, 28.0, 21.0, 16.0, 11.0, 3.0, 7.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-265.5, -256.38671875, -247.2734375, -238.16015625, -229.046875, -219.93359375, -210.8203125, -201.70703125, -192.59375, -183.48046875, -174.3671875, -165.25390625, -156.140625, -147.02734375, -137.9140625, -128.80078125, -119.6875, -110.57421875, -101.4609375, -92.34765625, -83.234375, -74.12109375, -65.0078125, -55.89453125, -46.78125, -37.66796875, -28.5546875, -19.44140625, -10.328125, -1.21484375, 7.8984375, 17.01171875, 26.125, 35.23828125, 44.3515625, 53.46484375, 62.578125, 71.69140625, 80.8046875, 89.91796875, 99.03125, 108.14453125, 117.2578125, 126.37109375, 135.484375, 144.59765625, 153.7109375, 162.82421875, 171.9375, 181.05078125, 190.1640625, 199.27734375, 208.390625, 217.50390625, 226.6171875, 235.73046875, 244.84375, 253.95703125, 263.0703125, 272.18359375, 281.296875, 290.41015625, 299.5234375, 308.63671875, 317.75]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 9.0, 8.0, 14.0, 7.0, 13.0, 19.0, 31.0, 38.0, 46.0, 62.0, 65.0, 114.0, 161.0, 286.0, 615.0, 1377.0, 405.0, 238.0, 165.0, 95.0, 81.0, 49.0, 29.0, 31.0, 32.0, 18.0, 17.0, 17.0, 7.0, 5.0, 8.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-35.25, -34.30517578125, -33.3603515625, -32.41552734375, -31.470703125, -30.52587890625, -29.5810546875, -28.63623046875, -27.69140625, -26.74658203125, -25.8017578125, -24.85693359375, -23.912109375, -22.96728515625, -22.0224609375, -21.07763671875, -20.1328125, -19.18798828125, -18.2431640625, -17.29833984375, -16.353515625, -15.40869140625, -14.4638671875, -13.51904296875, -12.57421875, -11.62939453125, -10.6845703125, -9.73974609375, -8.794921875, -7.85009765625, -6.9052734375, -5.96044921875, -5.015625, -4.07080078125, -3.1259765625, -2.18115234375, -1.236328125, -0.29150390625, 0.6533203125, 1.59814453125, 2.54296875, 3.48779296875, 4.4326171875, 5.37744140625, 6.322265625, 7.26708984375, 8.2119140625, 9.15673828125, 10.1015625, 11.04638671875, 11.9912109375, 12.93603515625, 13.880859375, 14.82568359375, 15.7705078125, 16.71533203125, 17.66015625, 18.60498046875, 19.5498046875, 20.49462890625, 21.439453125, 22.38427734375, 23.3291015625, 24.27392578125, 25.21875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 12.0, 35.0, 32.0, 72.0, 127.0, 171.0, 172.0, 144.0, 106.0, 51.0, 31.0, 21.0, 8.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-263.3853759765625, -251.46664428710938, -239.54791259765625, -227.62918090820312, -215.71044921875, -203.79171752929688, -191.87298583984375, -179.95425415039062, -168.0355224609375, -156.11679077148438, -144.19805908203125, -132.27932739257812, -120.360595703125, -108.44186401367188, -96.52313232421875, -84.60440063476562, -72.6856689453125, -60.766937255859375, -48.84820556640625, -36.929473876953125, -25.0107421875, -13.092010498046875, -1.17327880859375, 10.745452880859375, 22.6641845703125, 34.582916259765625, 46.50164794921875, 58.420379638671875, 70.339111328125, 82.25784301757812, 94.17657470703125, 106.09530639648438, 118.0140380859375, 129.93276977539062, 141.85150146484375, 153.77023315429688, 165.68896484375, 177.60769653320312, 189.52642822265625, 201.44515991210938, 213.3638916015625, 225.28262329101562, 237.20135498046875, 249.12008666992188, 261.038818359375, 272.9575500488281, 284.87628173828125, 296.7950134277344, 308.7137451171875, 320.6324768066406, 332.55120849609375, 344.4699401855469, 356.388671875, 368.3074035644531, 380.22613525390625, 392.1448669433594, 404.0635986328125, 415.9823303222656, 427.90106201171875, 439.8197937011719, 451.738525390625, 463.6572570800781, 475.57598876953125, 487.4947204589844, 499.4134521484375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 5.0, 0.0, 5.0, 10.0, 5.0, 9.0, 4.0, 17.0, 14.0, 9.0, 12.0, 14.0, 22.0, 22.0, 27.0, 31.0, 23.0, 34.0, 36.0, 33.0, 42.0, 44.0, 40.0, 39.0, 46.0, 49.0, 40.0, 33.0, 48.0, 33.0, 26.0, 19.0, 22.0, 23.0, 26.0, 22.0, 17.0, 18.0, 9.0, 17.0, 9.0, 9.0, 8.0, 4.0, 9.0, 5.0, 9.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-131.38462829589844, -127.5765609741211, -123.76848602294922, -119.96041870117188, -116.15234375, -112.34427642822266, -108.53620910644531, -104.72813415527344, -100.92005920410156, -97.11199188232422, -93.30391693115234, -89.495849609375, -85.68777465820312, -81.87970733642578, -78.07164001464844, -74.26356506347656, -70.45549774169922, -66.64743041992188, -62.83935546875, -59.031288146972656, -55.22321319580078, -51.41514587402344, -47.60707473754883, -43.79900360107422, -39.99093246459961, -36.182861328125, -32.37479019165039, -28.566720962524414, -24.758649826049805, -20.950578689575195, -17.14250946044922, -13.33443832397461, -9.5263671875, -5.718296527862549, -1.9102258682250977, 1.8978443145751953, 5.705915451049805, 9.513986587524414, 13.32205581665039, 17.130126953125, 20.93819808959961, 24.74626922607422, 28.554340362548828, 32.36241149902344, 36.17047882080078, 39.978553771972656, 43.78662109375, 47.59469223022461, 51.40276336669922, 55.21083450317383, 59.01890563964844, 62.82697296142578, 66.63504791259766, 70.443115234375, 74.25119018554688, 78.05925750732422, 81.86732482910156, 85.6753921508789, 89.48346710205078, 93.29153442382812, 97.099609375, 100.90767669677734, 104.71574401855469, 108.52381896972656, 112.33189392089844]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 12.0, 13.0, 16.0, 22.0, 38.0, 46.0, 72.0, 114.0, 183.0, 277.0, 435.0, 750.0, 1193.0, 2356.0, 5194.0, 12774.0, 34988.0, 95807.0, 235310.0, 348744.0, 190333.0, 73998.0, 26785.0, 10112.0, 4205.0, 1957.0, 1076.0, 611.0, 374.0, 236.0, 148.0, 123.0, 83.0, 49.0, 40.0, 20.0, 13.0, 13.0, 10.0, 4.0, 8.0, 6.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-92.0, -89.2431640625, -86.486328125, -83.7294921875, -80.97265625, -78.2158203125, -75.458984375, -72.7021484375, -69.9453125, -67.1884765625, -64.431640625, -61.6748046875, -58.91796875, -56.1611328125, -53.404296875, -50.6474609375, -47.890625, -45.1337890625, -42.376953125, -39.6201171875, -36.86328125, -34.1064453125, -31.349609375, -28.5927734375, -25.8359375, -23.0791015625, -20.322265625, -17.5654296875, -14.80859375, -12.0517578125, -9.294921875, -6.5380859375, -3.78125, -1.0244140625, 1.732421875, 4.4892578125, 7.24609375, 10.0029296875, 12.759765625, 15.5166015625, 18.2734375, 21.0302734375, 23.787109375, 26.5439453125, 29.30078125, 32.0576171875, 34.814453125, 37.5712890625, 40.328125, 43.0849609375, 45.841796875, 48.5986328125, 51.35546875, 54.1123046875, 56.869140625, 59.6259765625, 62.3828125, 65.1396484375, 67.896484375, 70.6533203125, 73.41015625, 76.1669921875, 78.923828125, 81.6806640625, 84.4375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 7.0, 6.0, 12.0, 20.0, 33.0, 35.0, 48.0, 60.0, 59.0, 72.0, 68.0, 69.0, 76.0, 66.0, 59.0, 64.0, 63.0, 50.0, 35.0, 21.0, 25.0, 10.0, 13.0, 13.0, 4.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.3125, -12.897705078125, -12.48291015625, -12.068115234375, -11.6533203125, -11.238525390625, -10.82373046875, -10.408935546875, -9.994140625, -9.579345703125, -9.16455078125, -8.749755859375, -8.3349609375, -7.920166015625, -7.50537109375, -7.090576171875, -6.67578125, -6.260986328125, -5.84619140625, -5.431396484375, -5.0166015625, -4.601806640625, -4.18701171875, -3.772216796875, -3.357421875, -2.942626953125, -2.52783203125, -2.113037109375, -1.6982421875, -1.283447265625, -0.86865234375, -0.453857421875, -0.0390625, 0.375732421875, 0.79052734375, 1.205322265625, 1.6201171875, 2.034912109375, 2.44970703125, 2.864501953125, 3.279296875, 3.694091796875, 4.10888671875, 4.523681640625, 4.9384765625, 5.353271484375, 5.76806640625, 6.182861328125, 6.59765625, 7.012451171875, 7.42724609375, 7.842041015625, 8.2568359375, 8.671630859375, 9.08642578125, 9.501220703125, 9.916015625, 10.330810546875, 10.74560546875, 11.160400390625, 11.5751953125, 11.989990234375, 12.40478515625, 12.819580078125, 13.234375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 7.0, 7.0, 10.0, 9.0, 14.0, 21.0, 28.0, 36.0, 59.0, 77.0, 131.0, 203.0, 284.0, 457.0, 796.0, 1291.0, 2594.0, 5555.0, 13778.0, 40010.0, 128445.0, 364726.0, 325798.0, 108152.0, 34084.0, 11928.0, 4642.0, 2244.0, 1215.0, 696.0, 455.0, 260.0, 160.0, 120.0, 84.0, 44.0, 38.0, 30.0, 25.0, 12.0, 14.0, 9.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.6875, -107.326171875, -103.96484375, -100.603515625, -97.2421875, -93.880859375, -90.51953125, -87.158203125, -83.796875, -80.435546875, -77.07421875, -73.712890625, -70.3515625, -66.990234375, -63.62890625, -60.267578125, -56.90625, -53.544921875, -50.18359375, -46.822265625, -43.4609375, -40.099609375, -36.73828125, -33.376953125, -30.015625, -26.654296875, -23.29296875, -19.931640625, -16.5703125, -13.208984375, -9.84765625, -6.486328125, -3.125, 0.236328125, 3.59765625, 6.958984375, 10.3203125, 13.681640625, 17.04296875, 20.404296875, 23.765625, 27.126953125, 30.48828125, 33.849609375, 37.2109375, 40.572265625, 43.93359375, 47.294921875, 50.65625, 54.017578125, 57.37890625, 60.740234375, 64.1015625, 67.462890625, 70.82421875, 74.185546875, 77.546875, 80.908203125, 84.26953125, 87.630859375, 90.9921875, 94.353515625, 97.71484375, 101.076171875, 104.4375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 9.0, 11.0, 9.0, 12.0, 15.0, 25.0, 31.0, 31.0, 42.0, 46.0, 56.0, 69.0, 60.0, 62.0, 56.0, 80.0, 76.0, 55.0, 40.0, 43.0, 43.0, 31.0, 23.0, 18.0, 12.0, 8.0, 13.0, 7.0, 7.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.5625, -68.2412109375, -65.919921875, -63.5986328125, -61.27734375, -58.9560546875, -56.634765625, -54.3134765625, -51.9921875, -49.6708984375, -47.349609375, -45.0283203125, -42.70703125, -40.3857421875, -38.064453125, -35.7431640625, -33.421875, -31.1005859375, -28.779296875, -26.4580078125, -24.13671875, -21.8154296875, -19.494140625, -17.1728515625, -14.8515625, -12.5302734375, -10.208984375, -7.8876953125, -5.56640625, -3.2451171875, -0.923828125, 1.3974609375, 3.71875, 6.0400390625, 8.361328125, 10.6826171875, 13.00390625, 15.3251953125, 17.646484375, 19.9677734375, 22.2890625, 24.6103515625, 26.931640625, 29.2529296875, 31.57421875, 33.8955078125, 36.216796875, 38.5380859375, 40.859375, 43.1806640625, 45.501953125, 47.8232421875, 50.14453125, 52.4658203125, 54.787109375, 57.1083984375, 59.4296875, 61.7509765625, 64.072265625, 66.3935546875, 68.71484375, 71.0361328125, 73.357421875, 75.6787109375, 78.0]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 8.0, 14.0, 11.0, 22.0, 31.0, 38.0, 58.0, 99.0, 118.0, 235.0, 405.0, 817.0, 1786.0, 4739.0, 14709.0, 59008.0, 266596.0, 477273.0, 169412.0, 36898.0, 10028.0, 3339.0, 1326.0, 683.0, 369.0, 194.0, 127.0, 78.0, 42.0, 32.0, 20.0, 13.0, 7.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.375, -43.65234375, -41.9296875, -40.20703125, -38.484375, -36.76171875, -35.0390625, -33.31640625, -31.59375, -29.87109375, -28.1484375, -26.42578125, -24.703125, -22.98046875, -21.2578125, -19.53515625, -17.8125, -16.08984375, -14.3671875, -12.64453125, -10.921875, -9.19921875, -7.4765625, -5.75390625, -4.03125, -2.30859375, -0.5859375, 1.13671875, 2.859375, 4.58203125, 6.3046875, 8.02734375, 9.75, 11.47265625, 13.1953125, 14.91796875, 16.640625, 18.36328125, 20.0859375, 21.80859375, 23.53125, 25.25390625, 26.9765625, 28.69921875, 30.421875, 32.14453125, 33.8671875, 35.58984375, 37.3125, 39.03515625, 40.7578125, 42.48046875, 44.203125, 45.92578125, 47.6484375, 49.37109375, 51.09375, 52.81640625, 54.5390625, 56.26171875, 57.984375, 59.70703125, 61.4296875, 63.15234375, 64.875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 6.0, 7.0, 9.0, 13.0, 15.0, 22.0, 23.0, 21.0, 38.0, 48.0, 74.0, 64.0, 105.0, 100.0, 90.0, 84.0, 64.0, 41.0, 32.0, 32.0, 25.0, 19.0, 16.0, 14.0, 11.0, 12.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00801849365234375, -0.007793307304382324, -0.0075681209564208984, -0.007342934608459473, -0.007117748260498047, -0.006892561912536621, -0.006667375564575195, -0.0064421892166137695, -0.006217002868652344, -0.005991816520690918, -0.005766630172729492, -0.005541443824768066, -0.005316257476806641, -0.005091071128845215, -0.004865884780883789, -0.004640698432922363, -0.0044155120849609375, -0.004190325736999512, -0.003965139389038086, -0.00373995304107666, -0.0035147666931152344, -0.0032895803451538086, -0.003064393997192383, -0.002839207649230957, -0.0026140213012695312, -0.0023888349533081055, -0.0021636486053466797, -0.001938462257385254, -0.0017132759094238281, -0.0014880895614624023, -0.0012629032135009766, -0.0010377168655395508, -0.000812530517578125, -0.0005873441696166992, -0.00036215782165527344, -0.00013697147369384766, 8.821487426757812e-05, 0.0003134012222290039, 0.0005385875701904297, 0.0007637739181518555, 0.0009889602661132812, 0.001214146614074707, 0.0014393329620361328, 0.0016645193099975586, 0.0018897056579589844, 0.00211489200592041, 0.002340078353881836, 0.0025652647018432617, 0.0027904510498046875, 0.0030156373977661133, 0.003240823745727539, 0.003466010093688965, 0.0036911964416503906, 0.003916382789611816, 0.004141569137573242, 0.004366755485534668, 0.004591941833496094, 0.0048171281814575195, 0.005042314529418945, 0.005267500877380371, 0.005492687225341797, 0.005717873573303223, 0.0059430599212646484, 0.006168246269226074, 0.0063934326171875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 7.0, 7.0, 16.0, 12.0, 16.0, 25.0, 37.0, 39.0, 91.0, 130.0, 189.0, 306.0, 521.0, 930.0, 1814.0, 3896.0, 9715.0, 28770.0, 106251.0, 359589.0, 373067.0, 114101.0, 30543.0, 10177.0, 3995.0, 1884.0, 965.0, 545.0, 336.0, 196.0, 123.0, 82.0, 52.0, 34.0, 29.0, 21.0, 7.0, 10.0, 6.0, 7.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-53.90625, -52.3671875, -50.828125, -49.2890625, -47.75, -46.2109375, -44.671875, -43.1328125, -41.59375, -40.0546875, -38.515625, -36.9765625, -35.4375, -33.8984375, -32.359375, -30.8203125, -29.28125, -27.7421875, -26.203125, -24.6640625, -23.125, -21.5859375, -20.046875, -18.5078125, -16.96875, -15.4296875, -13.890625, -12.3515625, -10.8125, -9.2734375, -7.734375, -6.1953125, -4.65625, -3.1171875, -1.578125, -0.0390625, 1.5, 3.0390625, 4.578125, 6.1171875, 7.65625, 9.1953125, 10.734375, 12.2734375, 13.8125, 15.3515625, 16.890625, 18.4296875, 19.96875, 21.5078125, 23.046875, 24.5859375, 26.125, 27.6640625, 29.203125, 30.7421875, 32.28125, 33.8203125, 35.359375, 36.8984375, 38.4375, 39.9765625, 41.515625, 43.0546875, 44.59375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 3.0, 3.0, 7.0, 8.0, 6.0, 11.0, 5.0, 10.0, 19.0, 21.0, 31.0, 50.0, 44.0, 59.0, 66.0, 69.0, 70.0, 72.0, 76.0, 56.0, 54.0, 44.0, 53.0, 41.0, 19.0, 31.0, 25.0, 12.0, 10.0, 8.0, 8.0, 5.0, 2.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-30.5625, -29.804443359375, -29.04638671875, -28.288330078125, -27.5302734375, -26.772216796875, -26.01416015625, -25.256103515625, -24.498046875, -23.739990234375, -22.98193359375, -22.223876953125, -21.4658203125, -20.707763671875, -19.94970703125, -19.191650390625, -18.43359375, -17.675537109375, -16.91748046875, -16.159423828125, -15.4013671875, -14.643310546875, -13.88525390625, -13.127197265625, -12.369140625, -11.611083984375, -10.85302734375, -10.094970703125, -9.3369140625, -8.578857421875, -7.82080078125, -7.062744140625, -6.3046875, -5.546630859375, -4.78857421875, -4.030517578125, -3.2724609375, -2.514404296875, -1.75634765625, -0.998291015625, -0.240234375, 0.517822265625, 1.27587890625, 2.033935546875, 2.7919921875, 3.550048828125, 4.30810546875, 5.066162109375, 5.82421875, 6.582275390625, 7.34033203125, 8.098388671875, 8.8564453125, 9.614501953125, 10.37255859375, 11.130615234375, 11.888671875, 12.646728515625, 13.40478515625, 14.162841796875, 14.9208984375, 15.678955078125, 16.43701171875, 17.195068359375, 17.953125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 8.0, 14.0, 26.0, 51.0, 73.0, 96.0, 137.0, 141.0, 132.0, 109.0, 75.0, 44.0, 35.0, 21.0, 7.0, 9.0, 6.0, 0.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-641.4290161132812, -618.9644165039062, -596.4998168945312, -574.0352783203125, -551.5706787109375, -529.1060791015625, -506.6414794921875, -484.1768798828125, -461.7123107910156, -439.2477111816406, -416.78314208984375, -394.31854248046875, -371.85394287109375, -349.3893737792969, -326.9247741699219, -304.460205078125, -281.99560546875, -259.531005859375, -237.06643676757812, -214.60183715820312, -192.1372528076172, -169.67266845703125, -147.20806884765625, -124.74348449707031, -102.27890014648438, -79.81431579589844, -57.34972381591797, -34.8851318359375, -12.420547485351562, 10.044036865234375, 32.508636474609375, 54.97322082519531, 77.4378662109375, 99.90245056152344, 122.3670425415039, 144.83163452148438, 167.2962188720703, 189.76080322265625, 212.22540283203125, 234.6899871826172, 257.1545715332031, 279.6191711425781, 302.083740234375, 324.54833984375, 347.012939453125, 369.4775085449219, 391.9421081542969, 414.40667724609375, 436.87127685546875, 459.33587646484375, 481.8004455566406, 504.2650451660156, 526.7296142578125, 549.1942138671875, 571.6588134765625, 594.1234130859375, 616.5880126953125, 639.0526123046875, 661.5172119140625, 683.9818115234375, 706.4463500976562, 728.9109497070312, 751.3755493164062, 773.8401489257812, 796.3046875]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 9.0, 4.0, 8.0, 10.0, 10.0, 8.0, 10.0, 22.0, 20.0, 19.0, 26.0, 19.0, 21.0, 30.0, 30.0, 48.0, 36.0, 39.0, 44.0, 56.0, 49.0, 51.0, 56.0, 49.0, 36.0, 37.0, 29.0, 30.0, 41.0, 27.0, 25.0, 17.0, 19.0, 15.0, 10.0, 12.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-411.755126953125, -399.9296569824219, -388.1042175292969, -376.27874755859375, -364.4532775878906, -352.6278076171875, -340.8023681640625, -328.9768981933594, -317.15142822265625, -305.3259582519531, -293.5005187988281, -281.675048828125, -269.8495788574219, -258.02410888671875, -246.19866943359375, -234.37319946289062, -222.54774475097656, -210.7222900390625, -198.89682006835938, -187.0713653564453, -175.2458953857422, -163.42044067382812, -151.594970703125, -139.76951599121094, -127.94405364990234, -116.11859130859375, -104.29312896728516, -92.46766662597656, -80.6422119140625, -68.81674194335938, -56.99128723144531, -45.16582489013672, -33.340362548828125, -21.51490020751953, -9.68943977355957, 2.1360206604003906, 13.961483001708984, 25.786945343017578, 37.612403869628906, 49.4378662109375, 61.263328552246094, 73.08879089355469, 84.91425323486328, 96.73971557617188, 108.56517028808594, 120.39064025878906, 132.21609497070312, 144.04156494140625, 155.8670196533203, 167.69247436523438, 179.5179443359375, 191.34339904785156, 203.1688690185547, 214.99432373046875, 226.81979370117188, 238.64524841308594, 250.470703125, 262.2961730957031, 274.1216125488281, 285.94708251953125, 297.7725524902344, 309.5980224609375, 321.4234619140625, 333.2489318847656, 345.07440185546875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 9.0, 13.0, 28.0, 25.0, 64.0, 123.0, 283.0, 862.0, 3989.0, 32835.0, 3772369.0, 363993.0, 16077.0, 2495.0, 599.0, 216.0, 111.0, 63.0, 62.0, 27.0, 18.0, 10.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-338.75, -326.1328125, -313.515625, -300.8984375, -288.28125, -275.6640625, -263.046875, -250.4296875, -237.8125, -225.1953125, -212.578125, -199.9609375, -187.34375, -174.7265625, -162.109375, -149.4921875, -136.875, -124.2578125, -111.640625, -99.0234375, -86.40625, -73.7890625, -61.171875, -48.5546875, -35.9375, -23.3203125, -10.703125, 1.9140625, 14.53125, 27.1484375, 39.765625, 52.3828125, 65.0, 77.6171875, 90.234375, 102.8515625, 115.46875, 128.0859375, 140.703125, 153.3203125, 165.9375, 178.5546875, 191.171875, 203.7890625, 216.40625, 229.0234375, 241.640625, 254.2578125, 266.875, 279.4921875, 292.109375, 304.7265625, 317.34375, 329.9609375, 342.578125, 355.1953125, 367.8125, 380.4296875, 393.046875, 405.6640625, 418.28125, 430.8984375, 443.515625, 456.1328125, 468.75]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 7.0, 21.0, 18.0, 33.0, 59.0, 63.0, 71.0, 67.0, 103.0, 92.0, 95.0, 91.0, 73.0, 46.0, 47.0, 36.0, 34.0, 17.0, 10.0, 11.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.8125, -17.188232421875, -16.56396484375, -15.939697265625, -15.3154296875, -14.691162109375, -14.06689453125, -13.442626953125, -12.818359375, -12.194091796875, -11.56982421875, -10.945556640625, -10.3212890625, -9.697021484375, -9.07275390625, -8.448486328125, -7.82421875, -7.199951171875, -6.57568359375, -5.951416015625, -5.3271484375, -4.702880859375, -4.07861328125, -3.454345703125, -2.830078125, -2.205810546875, -1.58154296875, -0.957275390625, -0.3330078125, 0.291259765625, 0.91552734375, 1.539794921875, 2.1640625, 2.788330078125, 3.41259765625, 4.036865234375, 4.6611328125, 5.285400390625, 5.90966796875, 6.533935546875, 7.158203125, 7.782470703125, 8.40673828125, 9.031005859375, 9.6552734375, 10.279541015625, 10.90380859375, 11.528076171875, 12.15234375, 12.776611328125, 13.40087890625, 14.025146484375, 14.6494140625, 15.273681640625, 15.89794921875, 16.522216796875, 17.146484375, 17.770751953125, 18.39501953125, 19.019287109375, 19.6435546875, 20.267822265625, 20.89208984375, 21.516357421875, 22.140625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 6.0, 12.0, 10.0, 33.0, 55.0, 84.0, 125.0, 184.0, 432.0, 759.0, 1523.0, 3455.0, 8292.0, 22839.0, 79408.0, 486297.0, 3275479.0, 237576.0, 50505.0, 15829.0, 6071.0, 2624.0, 1245.0, 607.0, 340.0, 199.0, 117.0, 68.0, 38.0, 13.0, 17.0, 13.0, 9.0, 7.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-168.125, -163.228515625, -158.33203125, -153.435546875, -148.5390625, -143.642578125, -138.74609375, -133.849609375, -128.953125, -124.056640625, -119.16015625, -114.263671875, -109.3671875, -104.470703125, -99.57421875, -94.677734375, -89.78125, -84.884765625, -79.98828125, -75.091796875, -70.1953125, -65.298828125, -60.40234375, -55.505859375, -50.609375, -45.712890625, -40.81640625, -35.919921875, -31.0234375, -26.126953125, -21.23046875, -16.333984375, -11.4375, -6.541015625, -1.64453125, 3.251953125, 8.1484375, 13.044921875, 17.94140625, 22.837890625, 27.734375, 32.630859375, 37.52734375, 42.423828125, 47.3203125, 52.216796875, 57.11328125, 62.009765625, 66.90625, 71.802734375, 76.69921875, 81.595703125, 86.4921875, 91.388671875, 96.28515625, 101.181640625, 106.078125, 110.974609375, 115.87109375, 120.767578125, 125.6640625, 130.560546875, 135.45703125, 140.353515625, 145.25]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 8.0, 5.0, 14.0, 10.0, 15.0, 15.0, 31.0, 38.0, 48.0, 93.0, 129.0, 238.0, 540.0, 1729.0, 533.0, 245.0, 111.0, 91.0, 60.0, 22.0, 30.0, 25.0, 10.0, 4.0, 7.0, 6.0, 7.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.125, -31.91943359375, -30.7138671875, -29.50830078125, -28.302734375, -27.09716796875, -25.8916015625, -24.68603515625, -23.48046875, -22.27490234375, -21.0693359375, -19.86376953125, -18.658203125, -17.45263671875, -16.2470703125, -15.04150390625, -13.8359375, -12.63037109375, -11.4248046875, -10.21923828125, -9.013671875, -7.80810546875, -6.6025390625, -5.39697265625, -4.19140625, -2.98583984375, -1.7802734375, -0.57470703125, 0.630859375, 1.83642578125, 3.0419921875, 4.24755859375, 5.453125, 6.65869140625, 7.8642578125, 9.06982421875, 10.275390625, 11.48095703125, 12.6865234375, 13.89208984375, 15.09765625, 16.30322265625, 17.5087890625, 18.71435546875, 19.919921875, 21.12548828125, 22.3310546875, 23.53662109375, 24.7421875, 25.94775390625, 27.1533203125, 28.35888671875, 29.564453125, 30.77001953125, 31.9755859375, 33.18115234375, 34.38671875, 35.59228515625, 36.7978515625, 38.00341796875, 39.208984375, 40.41455078125, 41.6201171875, 42.82568359375, 44.03125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 11.0, 10.0, 8.0, 28.0, 51.0, 50.0, 72.0, 105.0, 127.0, 123.0, 114.0, 84.0, 81.0, 48.0, 31.0, 20.0, 16.0, 8.0, 2.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-250.4905548095703, -242.75283813476562, -235.01512145996094, -227.2773895263672, -219.5396728515625, -211.8019561767578, -204.06423950195312, -196.32650756835938, -188.5887908935547, -180.85107421875, -173.1133575439453, -165.37562561035156, -157.63790893554688, -149.9001922607422, -142.1624755859375, -134.42474365234375, -126.6870346069336, -118.9493179321289, -111.21159362792969, -103.473876953125, -95.73615264892578, -87.9984359741211, -80.26071166992188, -72.52299499511719, -64.7852783203125, -57.04755783081055, -49.309837341308594, -41.572120666503906, -33.83439636230469, -26.0966796875, -18.358959197998047, -10.621238708496094, -2.883514404296875, 4.85420560836792, 12.591925621032715, 20.32964515686035, 28.067365646362305, 35.805084228515625, 43.54280471801758, 51.28052520751953, 59.018245697021484, 66.75596618652344, 74.49368286132812, 82.23140716552734, 89.96912384033203, 97.70684814453125, 105.44456481933594, 113.18228149414062, 120.92000579833984, 128.65773010253906, 136.39544677734375, 144.13316345214844, 151.87088012695312, 159.60861206054688, 167.34632873535156, 175.08404541015625, 182.82176208496094, 190.55947875976562, 198.2971954345703, 206.03492736816406, 213.77264404296875, 221.51036071777344, 229.24807739257812, 236.98580932617188, 244.72352600097656]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 8.0, 8.0, 4.0, 12.0, 12.0, 19.0, 18.0, 27.0, 25.0, 23.0, 32.0, 33.0, 31.0, 40.0, 34.0, 36.0, 53.0, 35.0, 43.0, 49.0, 53.0, 51.0, 44.0, 45.0, 25.0, 26.0, 42.0, 30.0, 21.0, 15.0, 19.0, 18.0, 17.0, 7.0, 8.0, 6.0, 3.0, 5.0, 5.0, 1.0, 6.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-117.79442596435547, -114.21016693115234, -110.62590789794922, -107.04164123535156, -103.45738220214844, -99.87312316894531, -96.28886413574219, -92.70460510253906, -89.12034606933594, -85.53608703613281, -81.95182800292969, -78.36756896972656, -74.7833023071289, -71.19904327392578, -67.61478424072266, -64.03052520751953, -60.446258544921875, -56.86199951171875, -53.27773666381836, -49.693477630615234, -46.109214782714844, -42.52495574951172, -38.940696716308594, -35.35643768310547, -31.772174835205078, -28.18791389465332, -24.603652954101562, -21.019393920898438, -17.43513298034668, -13.850872039794922, -10.266613006591797, -6.682352066040039, -3.09808349609375, 0.4861769676208496, 4.070437431335449, 7.654697418212891, 11.238958358764648, 14.823219299316406, 18.40747833251953, 21.99173927307129, 25.576000213623047, 29.160261154174805, 32.74452209472656, 36.32878112792969, 39.91304016113281, 43.4973030090332, 47.08156204223633, 50.66582489013672, 54.250083923339844, 57.83434295654297, 61.41860580444336, 65.00286865234375, 68.58712768554688, 72.17138671875, 75.75564575195312, 79.33990478515625, 82.92416381835938, 86.5084228515625, 90.09268188476562, 93.67694091796875, 97.2612075805664, 100.84546661376953, 104.42972564697266, 108.01398468017578, 111.59825134277344]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 6.0, 8.0, 14.0, 8.0, 31.0, 30.0, 33.0, 58.0, 90.0, 134.0, 161.0, 246.0, 376.0, 660.0, 1294.0, 2781.0, 6857.0, 18072.0, 52629.0, 152276.0, 348539.0, 289434.0, 112594.0, 38482.0, 13726.0, 5066.0, 2257.0, 1068.0, 582.0, 332.0, 218.0, 157.0, 94.0, 79.0, 56.0, 33.0, 28.0, 11.0, 8.0, 11.0, 9.0, 9.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-96.3125, -93.69921875, -91.0859375, -88.47265625, -85.859375, -83.24609375, -80.6328125, -78.01953125, -75.40625, -72.79296875, -70.1796875, -67.56640625, -64.953125, -62.33984375, -59.7265625, -57.11328125, -54.5, -51.88671875, -49.2734375, -46.66015625, -44.046875, -41.43359375, -38.8203125, -36.20703125, -33.59375, -30.98046875, -28.3671875, -25.75390625, -23.140625, -20.52734375, -17.9140625, -15.30078125, -12.6875, -10.07421875, -7.4609375, -4.84765625, -2.234375, 0.37890625, 2.9921875, 5.60546875, 8.21875, 10.83203125, 13.4453125, 16.05859375, 18.671875, 21.28515625, 23.8984375, 26.51171875, 29.125, 31.73828125, 34.3515625, 36.96484375, 39.578125, 42.19140625, 44.8046875, 47.41796875, 50.03125, 52.64453125, 55.2578125, 57.87109375, 60.484375, 63.09765625, 65.7109375, 68.32421875, 70.9375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 9.0, 9.0, 20.0, 34.0, 37.0, 47.0, 62.0, 79.0, 83.0, 93.0, 102.0, 81.0, 88.0, 71.0, 52.0, 40.0, 39.0, 22.0, 17.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.75, -18.106201171875, -17.46240234375, -16.818603515625, -16.1748046875, -15.531005859375, -14.88720703125, -14.243408203125, -13.599609375, -12.955810546875, -12.31201171875, -11.668212890625, -11.0244140625, -10.380615234375, -9.73681640625, -9.093017578125, -8.44921875, -7.805419921875, -7.16162109375, -6.517822265625, -5.8740234375, -5.230224609375, -4.58642578125, -3.942626953125, -3.298828125, -2.655029296875, -2.01123046875, -1.367431640625, -0.7236328125, -0.079833984375, 0.56396484375, 1.207763671875, 1.8515625, 2.495361328125, 3.13916015625, 3.782958984375, 4.4267578125, 5.070556640625, 5.71435546875, 6.358154296875, 7.001953125, 7.645751953125, 8.28955078125, 8.933349609375, 9.5771484375, 10.220947265625, 10.86474609375, 11.508544921875, 12.15234375, 12.796142578125, 13.43994140625, 14.083740234375, 14.7275390625, 15.371337890625, 16.01513671875, 16.658935546875, 17.302734375, 17.946533203125, 18.59033203125, 19.234130859375, 19.8779296875, 20.521728515625, 21.16552734375, 21.809326171875, 22.453125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 7.0, 8.0, 19.0, 16.0, 23.0, 43.0, 41.0, 72.0, 96.0, 124.0, 189.0, 272.0, 375.0, 563.0, 918.0, 1517.0, 2758.0, 5592.0, 11818.0, 26876.0, 64444.0, 144554.0, 267322.0, 264700.0, 142444.0, 62914.0, 26653.0, 11604.0, 5506.0, 2762.0, 1543.0, 902.0, 560.0, 363.0, 307.0, 195.0, 137.0, 83.0, 74.0, 46.0, 34.0, 29.0, 18.0, 9.0, 9.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.34375, -50.5380859375, -48.732421875, -46.9267578125, -45.12109375, -43.3154296875, -41.509765625, -39.7041015625, -37.8984375, -36.0927734375, -34.287109375, -32.4814453125, -30.67578125, -28.8701171875, -27.064453125, -25.2587890625, -23.453125, -21.6474609375, -19.841796875, -18.0361328125, -16.23046875, -14.4248046875, -12.619140625, -10.8134765625, -9.0078125, -7.2021484375, -5.396484375, -3.5908203125, -1.78515625, 0.0205078125, 1.826171875, 3.6318359375, 5.4375, 7.2431640625, 9.048828125, 10.8544921875, 12.66015625, 14.4658203125, 16.271484375, 18.0771484375, 19.8828125, 21.6884765625, 23.494140625, 25.2998046875, 27.10546875, 28.9111328125, 30.716796875, 32.5224609375, 34.328125, 36.1337890625, 37.939453125, 39.7451171875, 41.55078125, 43.3564453125, 45.162109375, 46.9677734375, 48.7734375, 50.5791015625, 52.384765625, 54.1904296875, 55.99609375, 57.8017578125, 59.607421875, 61.4130859375, 63.21875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 6.0, 9.0, 8.0, 18.0, 7.0, 12.0, 15.0, 14.0, 23.0, 25.0, 35.0, 33.0, 45.0, 36.0, 52.0, 56.0, 46.0, 46.0, 36.0, 52.0, 50.0, 41.0, 53.0, 38.0, 40.0, 30.0, 34.0, 30.0, 22.0, 12.0, 13.0, 18.0, 12.0, 10.0, 6.0, 8.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.75, -50.013671875, -48.27734375, -46.541015625, -44.8046875, -43.068359375, -41.33203125, -39.595703125, -37.859375, -36.123046875, -34.38671875, -32.650390625, -30.9140625, -29.177734375, -27.44140625, -25.705078125, -23.96875, -22.232421875, -20.49609375, -18.759765625, -17.0234375, -15.287109375, -13.55078125, -11.814453125, -10.078125, -8.341796875, -6.60546875, -4.869140625, -3.1328125, -1.396484375, 0.33984375, 2.076171875, 3.8125, 5.548828125, 7.28515625, 9.021484375, 10.7578125, 12.494140625, 14.23046875, 15.966796875, 17.703125, 19.439453125, 21.17578125, 22.912109375, 24.6484375, 26.384765625, 28.12109375, 29.857421875, 31.59375, 33.330078125, 35.06640625, 36.802734375, 38.5390625, 40.275390625, 42.01171875, 43.748046875, 45.484375, 47.220703125, 48.95703125, 50.693359375, 52.4296875, 54.166015625, 55.90234375, 57.638671875, 59.375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 5.0, 8.0, 14.0, 16.0, 23.0, 27.0, 39.0, 41.0, 81.0, 123.0, 183.0, 306.0, 510.0, 1070.0, 2461.0, 6230.0, 20576.0, 85191.0, 336018.0, 423328.0, 128158.0, 29649.0, 8602.0, 2985.0, 1291.0, 664.0, 366.0, 187.0, 122.0, 73.0, 55.0, 40.0, 13.0, 19.0, 14.0, 16.0, 12.0, 9.0, 8.0, 3.0, 6.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.5, -34.35986328125, -33.2197265625, -32.07958984375, -30.939453125, -29.79931640625, -28.6591796875, -27.51904296875, -26.37890625, -25.23876953125, -24.0986328125, -22.95849609375, -21.818359375, -20.67822265625, -19.5380859375, -18.39794921875, -17.2578125, -16.11767578125, -14.9775390625, -13.83740234375, -12.697265625, -11.55712890625, -10.4169921875, -9.27685546875, -8.13671875, -6.99658203125, -5.8564453125, -4.71630859375, -3.576171875, -2.43603515625, -1.2958984375, -0.15576171875, 0.984375, 2.12451171875, 3.2646484375, 4.40478515625, 5.544921875, 6.68505859375, 7.8251953125, 8.96533203125, 10.10546875, 11.24560546875, 12.3857421875, 13.52587890625, 14.666015625, 15.80615234375, 16.9462890625, 18.08642578125, 19.2265625, 20.36669921875, 21.5068359375, 22.64697265625, 23.787109375, 24.92724609375, 26.0673828125, 27.20751953125, 28.34765625, 29.48779296875, 30.6279296875, 31.76806640625, 32.908203125, 34.04833984375, 35.1884765625, 36.32861328125, 37.46875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 6.0, 5.0, 9.0, 7.0, 5.0, 16.0, 18.0, 19.0, 32.0, 26.0, 26.0, 41.0, 47.0, 67.0, 100.0, 89.0, 92.0, 64.0, 50.0, 51.0, 45.0, 28.0, 35.0, 21.0, 21.0, 22.0, 9.0, 14.0, 10.0, 5.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.004543304443359375, -0.004396557807922363, -0.0042498111724853516, -0.00410306453704834, -0.003956317901611328, -0.0038095712661743164, -0.0036628246307373047, -0.003516077995300293, -0.0033693313598632812, -0.0032225847244262695, -0.003075838088989258, -0.002929091453552246, -0.0027823448181152344, -0.0026355981826782227, -0.002488851547241211, -0.0023421049118041992, -0.0021953582763671875, -0.0020486116409301758, -0.001901865005493164, -0.0017551183700561523, -0.0016083717346191406, -0.001461625099182129, -0.0013148784637451172, -0.0011681318283081055, -0.0010213851928710938, -0.000874638557434082, -0.0007278919219970703, -0.0005811452865600586, -0.0004343986511230469, -0.00028765201568603516, -0.00014090538024902344, 5.841255187988281e-06, 0.000152587890625, 0.0002993345260620117, 0.00044608116149902344, 0.0005928277969360352, 0.0007395744323730469, 0.0008863210678100586, 0.0010330677032470703, 0.001179814338684082, 0.0013265609741210938, 0.0014733076095581055, 0.0016200542449951172, 0.001766800880432129, 0.0019135475158691406, 0.0020602941513061523, 0.002207040786743164, 0.0023537874221801758, 0.0025005340576171875, 0.0026472806930541992, 0.002794027328491211, 0.0029407739639282227, 0.0030875205993652344, 0.003234267234802246, 0.003381013870239258, 0.0035277605056762695, 0.0036745071411132812, 0.003821253776550293, 0.003968000411987305, 0.004114747047424316, 0.004261493682861328, 0.00440824031829834, 0.0045549869537353516, 0.004701733589172363, 0.004848480224609375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 7.0, 11.0, 21.0, 23.0, 31.0, 54.0, 82.0, 123.0, 237.0, 382.0, 668.0, 1183.0, 2493.0, 5963.0, 17854.0, 75553.0, 349971.0, 442700.0, 112803.0, 24469.0, 7689.0, 2995.0, 1408.0, 737.0, 428.0, 247.0, 137.0, 96.0, 62.0, 36.0, 18.0, 14.0, 16.0, 7.0, 9.0, 6.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-40.59375, -39.3681640625, -38.142578125, -36.9169921875, -35.69140625, -34.4658203125, -33.240234375, -32.0146484375, -30.7890625, -29.5634765625, -28.337890625, -27.1123046875, -25.88671875, -24.6611328125, -23.435546875, -22.2099609375, -20.984375, -19.7587890625, -18.533203125, -17.3076171875, -16.08203125, -14.8564453125, -13.630859375, -12.4052734375, -11.1796875, -9.9541015625, -8.728515625, -7.5029296875, -6.27734375, -5.0517578125, -3.826171875, -2.6005859375, -1.375, -0.1494140625, 1.076171875, 2.3017578125, 3.52734375, 4.7529296875, 5.978515625, 7.2041015625, 8.4296875, 9.6552734375, 10.880859375, 12.1064453125, 13.33203125, 14.5576171875, 15.783203125, 17.0087890625, 18.234375, 19.4599609375, 20.685546875, 21.9111328125, 23.13671875, 24.3623046875, 25.587890625, 26.8134765625, 28.0390625, 29.2646484375, 30.490234375, 31.7158203125, 32.94140625, 34.1669921875, 35.392578125, 36.6181640625, 37.84375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 11.0, 14.0, 11.0, 17.0, 21.0, 23.0, 44.0, 48.0, 54.0, 58.0, 80.0, 92.0, 69.0, 78.0, 77.0, 52.0, 39.0, 48.0, 39.0, 27.0, 19.0, 16.0, 15.0, 8.0, 6.0, 10.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.453125, -21.758056640625, -21.06298828125, -20.367919921875, -19.6728515625, -18.977783203125, -18.28271484375, -17.587646484375, -16.892578125, -16.197509765625, -15.50244140625, -14.807373046875, -14.1123046875, -13.417236328125, -12.72216796875, -12.027099609375, -11.33203125, -10.636962890625, -9.94189453125, -9.246826171875, -8.5517578125, -7.856689453125, -7.16162109375, -6.466552734375, -5.771484375, -5.076416015625, -4.38134765625, -3.686279296875, -2.9912109375, -2.296142578125, -1.60107421875, -0.906005859375, -0.2109375, 0.484130859375, 1.17919921875, 1.874267578125, 2.5693359375, 3.264404296875, 3.95947265625, 4.654541015625, 5.349609375, 6.044677734375, 6.73974609375, 7.434814453125, 8.1298828125, 8.824951171875, 9.52001953125, 10.215087890625, 10.91015625, 11.605224609375, 12.30029296875, 12.995361328125, 13.6904296875, 14.385498046875, 15.08056640625, 15.775634765625, 16.470703125, 17.165771484375, 17.86083984375, 18.555908203125, 19.2509765625, 19.946044921875, 20.64111328125, 21.336181640625, 22.03125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 13.0, 18.0, 14.0, 37.0, 61.0, 68.0, 82.0, 96.0, 129.0, 96.0, 92.0, 75.0, 54.0, 47.0, 37.0, 22.0, 13.0, 11.0, 8.0, 7.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-502.29571533203125, -489.33551025390625, -476.37530517578125, -463.4150695800781, -450.4548645019531, -437.4946594238281, -424.5344543457031, -411.57421875, -398.614013671875, -385.65380859375, -372.693603515625, -359.7333679199219, -346.7731628417969, -333.8129577636719, -320.8527526855469, -307.89251708984375, -294.93231201171875, -281.97210693359375, -269.01190185546875, -256.0516662597656, -243.09146118164062, -230.13125610351562, -217.17105102539062, -204.21083068847656, -191.25064086914062, -178.29043579101562, -165.33021545410156, -152.37001037597656, -139.4097900390625, -126.4495849609375, -113.48937225341797, -100.52915954589844, -87.56893920898438, -74.60872650146484, -61.64851379394531, -48.68830490112305, -35.728092193603516, -22.76788330078125, -9.807670593261719, 3.1525421142578125, 16.112754821777344, 29.072967529296875, 42.033180236816406, 54.99338912963867, 67.95359802246094, 80.91381072998047, 93.8740234375, 106.83423614501953, 119.79444885253906, 132.75465393066406, 145.71487426757812, 158.67507934570312, 171.6352996826172, 184.5955047607422, 197.55572509765625, 210.51593017578125, 223.47613525390625, 236.43634033203125, 249.3965606689453, 262.3567810058594, 275.3169860839844, 288.2771911621094, 301.2373962402344, 314.1976318359375, 327.1578369140625]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 11.0, 4.0, 10.0, 17.0, 18.0, 15.0, 23.0, 28.0, 28.0, 46.0, 47.0, 34.0, 35.0, 58.0, 44.0, 49.0, 58.0, 57.0, 45.0, 39.0, 46.0, 43.0, 28.0, 44.0, 25.0, 36.0, 20.0, 14.0, 9.0, 18.0, 10.0, 5.0, 4.0, 11.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-290.86920166015625, -280.7148132324219, -270.5603942871094, -260.406005859375, -250.25161743164062, -240.0972137451172, -229.94281005859375, -219.78842163085938, -209.63401794433594, -199.4796142578125, -189.32522583007812, -179.1708221435547, -169.01641845703125, -158.86203002929688, -148.70762634277344, -138.55322265625, -128.39883422851562, -118.24443817138672, -108.09004211425781, -97.93563842773438, -87.78124237060547, -77.62684631347656, -67.47244262695312, -57.31804656982422, -47.16365051269531, -37.009254455566406, -26.854854583740234, -16.700456619262695, -6.546058654785156, 3.60833740234375, 13.762737274169922, 23.917137145996094, 34.071533203125, 44.225929260253906, 54.38032913208008, 64.53472900390625, 74.68912506103516, 84.84352111816406, 94.9979248046875, 105.1523208618164, 115.30671691894531, 125.46111297607422, 135.61550903320312, 145.76991271972656, 155.92431640625, 166.07870483398438, 176.2331085205078, 186.38751220703125, 196.54190063476562, 206.69630432128906, 216.85069274902344, 227.00509643554688, 237.15948486328125, 247.3138885498047, 257.4682922363281, 267.6226806640625, 277.777099609375, 287.9314880371094, 298.0859069824219, 308.24029541015625, 318.3946838378906, 328.549072265625, 338.7034912109375, 348.8578796386719, 359.01226806640625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 10.0, 10.0, 8.0, 20.0, 33.0, 48.0, 73.0, 102.0, 181.0, 329.0, 610.0, 1199.0, 2964.0, 8620.0, 33589.0, 353145.0, 3695411.0, 74827.0, 14901.0, 4668.0, 1747.0, 799.0, 416.0, 225.0, 125.0, 69.0, 49.0, 27.0, 24.0, 15.0, 6.0, 11.0, 3.0, 6.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-145.0, -139.861328125, -134.72265625, -129.583984375, -124.4453125, -119.306640625, -114.16796875, -109.029296875, -103.890625, -98.751953125, -93.61328125, -88.474609375, -83.3359375, -78.197265625, -73.05859375, -67.919921875, -62.78125, -57.642578125, -52.50390625, -47.365234375, -42.2265625, -37.087890625, -31.94921875, -26.810546875, -21.671875, -16.533203125, -11.39453125, -6.255859375, -1.1171875, 4.021484375, 9.16015625, 14.298828125, 19.4375, 24.576171875, 29.71484375, 34.853515625, 39.9921875, 45.130859375, 50.26953125, 55.408203125, 60.546875, 65.685546875, 70.82421875, 75.962890625, 81.1015625, 86.240234375, 91.37890625, 96.517578125, 101.65625, 106.794921875, 111.93359375, 117.072265625, 122.2109375, 127.349609375, 132.48828125, 137.626953125, 142.765625, 147.904296875, 153.04296875, 158.181640625, 163.3203125, 168.458984375, 173.59765625, 178.736328125, 183.875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 6.0, 14.0, 21.0, 20.0, 19.0, 32.0, 46.0, 60.0, 65.0, 69.0, 82.0, 81.0, 82.0, 68.0, 76.0, 50.0, 54.0, 31.0, 41.0, 27.0, 16.0, 15.0, 9.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5390625, -14.9981689453125, -14.457275390625, -13.9163818359375, -13.37548828125, -12.8345947265625, -12.293701171875, -11.7528076171875, -11.2119140625, -10.6710205078125, -10.130126953125, -9.5892333984375, -9.04833984375, -8.5074462890625, -7.966552734375, -7.4256591796875, -6.884765625, -6.3438720703125, -5.802978515625, -5.2620849609375, -4.72119140625, -4.1802978515625, -3.639404296875, -3.0985107421875, -2.5576171875, -2.0167236328125, -1.475830078125, -0.9349365234375, -0.39404296875, 0.1468505859375, 0.687744140625, 1.2286376953125, 1.76953125, 2.3104248046875, 2.851318359375, 3.3922119140625, 3.93310546875, 4.4739990234375, 5.014892578125, 5.5557861328125, 6.0966796875, 6.6375732421875, 7.178466796875, 7.7193603515625, 8.26025390625, 8.8011474609375, 9.342041015625, 9.8829345703125, 10.423828125, 10.9647216796875, 11.505615234375, 12.0465087890625, 12.58740234375, 13.1282958984375, 13.669189453125, 14.2100830078125, 14.7509765625, 15.2918701171875, 15.832763671875, 16.3736572265625, 16.91455078125, 17.4554443359375, 17.996337890625, 18.5372314453125, 19.078125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 6.0, 5.0, 7.0, 12.0, 12.0, 18.0, 28.0, 17.0, 27.0, 34.0, 36.0, 80.0, 101.0, 157.0, 327.0, 701.0, 1710.0, 4944.0, 16478.0, 69454.0, 576713.0, 3327656.0, 152370.0, 29879.0, 8311.0, 2920.0, 1191.0, 511.0, 217.0, 126.0, 61.0, 47.0, 33.0, 24.0, 16.0, 17.0, 8.0, 11.0, 7.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-122.3125, -118.5166015625, -114.720703125, -110.9248046875, -107.12890625, -103.3330078125, -99.537109375, -95.7412109375, -91.9453125, -88.1494140625, -84.353515625, -80.5576171875, -76.76171875, -72.9658203125, -69.169921875, -65.3740234375, -61.578125, -57.7822265625, -53.986328125, -50.1904296875, -46.39453125, -42.5986328125, -38.802734375, -35.0068359375, -31.2109375, -27.4150390625, -23.619140625, -19.8232421875, -16.02734375, -12.2314453125, -8.435546875, -4.6396484375, -0.84375, 2.9521484375, 6.748046875, 10.5439453125, 14.33984375, 18.1357421875, 21.931640625, 25.7275390625, 29.5234375, 33.3193359375, 37.115234375, 40.9111328125, 44.70703125, 48.5029296875, 52.298828125, 56.0947265625, 59.890625, 63.6865234375, 67.482421875, 71.2783203125, 75.07421875, 78.8701171875, 82.666015625, 86.4619140625, 90.2578125, 94.0537109375, 97.849609375, 101.6455078125, 105.44140625, 109.2373046875, 113.033203125, 116.8291015625, 120.625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 4.0, 3.0, 6.0, 20.0, 29.0, 42.0, 63.0, 113.0, 214.0, 604.0, 2060.0, 440.0, 210.0, 108.0, 50.0, 39.0, 21.0, 20.0, 10.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-54.9375, -53.75244140625, -52.5673828125, -51.38232421875, -50.197265625, -49.01220703125, -47.8271484375, -46.64208984375, -45.45703125, -44.27197265625, -43.0869140625, -41.90185546875, -40.716796875, -39.53173828125, -38.3466796875, -37.16162109375, -35.9765625, -34.79150390625, -33.6064453125, -32.42138671875, -31.236328125, -30.05126953125, -28.8662109375, -27.68115234375, -26.49609375, -25.31103515625, -24.1259765625, -22.94091796875, -21.755859375, -20.57080078125, -19.3857421875, -18.20068359375, -17.015625, -15.83056640625, -14.6455078125, -13.46044921875, -12.275390625, -11.09033203125, -9.9052734375, -8.72021484375, -7.53515625, -6.35009765625, -5.1650390625, -3.97998046875, -2.794921875, -1.60986328125, -0.4248046875, 0.76025390625, 1.9453125, 3.13037109375, 4.3154296875, 5.50048828125, 6.685546875, 7.87060546875, 9.0556640625, 10.24072265625, 11.42578125, 12.61083984375, 13.7958984375, 14.98095703125, 16.166015625, 17.35107421875, 18.5361328125, 19.72119140625, 20.90625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 5.0, 4.0, 11.0, 19.0, 18.0, 34.0, 46.0, 75.0, 133.0, 120.0, 143.0, 123.0, 89.0, 73.0, 35.0, 28.0, 17.0, 7.0, 8.0, 3.0, 6.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.0135269165039, -115.53886413574219, -110.06420135498047, -104.58953857421875, -99.11488342285156, -93.64021301269531, -88.16555786132812, -82.6908950805664, -77.21623229980469, -71.74156951904297, -66.26690673828125, -60.7922477722168, -55.31758499145508, -49.84292221069336, -44.368263244628906, -38.89360046386719, -33.41893768310547, -27.94427490234375, -22.469614028930664, -16.994953155517578, -11.52029037475586, -6.045627593994141, -0.5709686279296875, 4.903694152832031, 10.37835693359375, 15.853018760681152, 21.327680587768555, 26.80234146118164, 32.27700424194336, 37.75166702270508, 43.22632598876953, 48.70098876953125, 54.17564392089844, 59.650306701660156, 65.12496948242188, 70.59962463378906, 76.07429504394531, 81.5489501953125, 87.02361297607422, 92.49827575683594, 97.97293853759766, 103.44760131835938, 108.9222640991211, 114.39692687988281, 119.87158203125, 125.34625244140625, 130.82090759277344, 136.29556274414062, 141.77023315429688, 147.24488830566406, 152.7195587158203, 158.1942138671875, 163.66888427734375, 169.14353942871094, 174.61819458007812, 180.09286499023438, 185.56753540039062, 191.0421905517578, 196.51686096191406, 201.99151611328125, 207.4661865234375, 212.9408416748047, 218.41549682617188, 223.89016723632812, 229.3648223876953]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 6.0, 9.0, 12.0, 9.0, 13.0, 15.0, 19.0, 18.0, 24.0, 20.0, 31.0, 29.0, 34.0, 35.0, 29.0, 28.0, 51.0, 39.0, 38.0, 48.0, 47.0, 44.0, 42.0, 42.0, 37.0, 30.0, 29.0, 32.0, 27.0, 20.0, 15.0, 19.0, 13.0, 11.0, 13.0, 11.0, 9.0, 11.0, 11.0, 2.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0], "bins": [-86.27619934082031, -83.82474517822266, -81.373291015625, -78.92182922363281, -76.47037506103516, -74.0189208984375, -71.56746673583984, -69.11601257324219, -66.66455078125, -64.21309661865234, -61.76163864135742, -59.310184478759766, -56.858726501464844, -54.40727233886719, -51.95581817626953, -49.50436019897461, -47.05290603637695, -44.6014518737793, -42.149993896484375, -39.69853973388672, -37.2470817565918, -34.79562759399414, -32.34416961669922, -29.892715454101562, -27.441259384155273, -24.989803314208984, -22.538347244262695, -20.086891174316406, -17.63543701171875, -15.183979988098145, -12.732524871826172, -10.281068801879883, -7.829612731933594, -5.378156661987305, -2.926701068878174, -0.47524547576904297, 1.976210594177246, 4.427666664123535, 6.879121780395508, 9.330577850341797, 11.782033920288086, 14.233489990234375, 16.684946060180664, 19.136402130126953, 21.58785629272461, 24.03931427001953, 26.490768432617188, 28.942224502563477, 31.393680572509766, 33.84513473510742, 36.296592712402344, 38.748046875, 41.19950485229492, 43.65095901489258, 46.1024169921875, 48.553871154785156, 51.00532531738281, 53.45677947998047, 55.90823745727539, 58.35969161987305, 60.81114959716797, 63.262603759765625, 65.71405792236328, 68.16551208496094, 70.61697387695312]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 5.0, 6.0, 7.0, 12.0, 24.0, 40.0, 42.0, 70.0, 80.0, 197.0, 271.0, 484.0, 1001.0, 2147.0, 5643.0, 18128.0, 66668.0, 255361.0, 471452.0, 164830.0, 42863.0, 11817.0, 3981.0, 1622.0, 755.0, 416.0, 231.0, 126.0, 86.0, 52.0, 48.0, 30.0, 17.0, 6.0, 9.0, 7.0, 4.0, 4.0, 1.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.875, -92.6064453125, -89.337890625, -86.0693359375, -82.80078125, -79.5322265625, -76.263671875, -72.9951171875, -69.7265625, -66.4580078125, -63.189453125, -59.9208984375, -56.65234375, -53.3837890625, -50.115234375, -46.8466796875, -43.578125, -40.3095703125, -37.041015625, -33.7724609375, -30.50390625, -27.2353515625, -23.966796875, -20.6982421875, -17.4296875, -14.1611328125, -10.892578125, -7.6240234375, -4.35546875, -1.0869140625, 2.181640625, 5.4501953125, 8.71875, 11.9873046875, 15.255859375, 18.5244140625, 21.79296875, 25.0615234375, 28.330078125, 31.5986328125, 34.8671875, 38.1357421875, 41.404296875, 44.6728515625, 47.94140625, 51.2099609375, 54.478515625, 57.7470703125, 61.015625, 64.2841796875, 67.552734375, 70.8212890625, 74.08984375, 77.3583984375, 80.626953125, 83.8955078125, 87.1640625, 90.4326171875, 93.701171875, 96.9697265625, 100.23828125, 103.5068359375, 106.775390625, 110.0439453125, 113.3125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 7.0, 16.0, 12.0, 26.0, 22.0, 36.0, 46.0, 53.0, 72.0, 73.0, 101.0, 92.0, 75.0, 90.0, 67.0, 46.0, 46.0, 44.0, 25.0, 21.0, 11.0, 7.0, 8.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.71875, -15.12451171875, -14.5302734375, -13.93603515625, -13.341796875, -12.74755859375, -12.1533203125, -11.55908203125, -10.96484375, -10.37060546875, -9.7763671875, -9.18212890625, -8.587890625, -7.99365234375, -7.3994140625, -6.80517578125, -6.2109375, -5.61669921875, -5.0224609375, -4.42822265625, -3.833984375, -3.23974609375, -2.6455078125, -2.05126953125, -1.45703125, -0.86279296875, -0.2685546875, 0.32568359375, 0.919921875, 1.51416015625, 2.1083984375, 2.70263671875, 3.296875, 3.89111328125, 4.4853515625, 5.07958984375, 5.673828125, 6.26806640625, 6.8623046875, 7.45654296875, 8.05078125, 8.64501953125, 9.2392578125, 9.83349609375, 10.427734375, 11.02197265625, 11.6162109375, 12.21044921875, 12.8046875, 13.39892578125, 13.9931640625, 14.58740234375, 15.181640625, 15.77587890625, 16.3701171875, 16.96435546875, 17.55859375, 18.15283203125, 18.7470703125, 19.34130859375, 19.935546875, 20.52978515625, 21.1240234375, 21.71826171875, 22.3125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 3.0, 4.0, 5.0, 11.0, 14.0, 18.0, 28.0, 47.0, 61.0, 91.0, 97.0, 171.0, 214.0, 275.0, 466.0, 746.0, 1258.0, 2144.0, 4337.0, 9375.0, 21474.0, 54359.0, 133009.0, 275978.0, 293049.0, 145947.0, 60441.0, 24088.0, 10186.0, 4703.0, 2332.0, 1302.0, 776.0, 488.0, 328.0, 208.0, 140.0, 113.0, 71.0, 64.0, 44.0, 33.0, 14.0, 18.0, 10.0, 6.0, 3.0, 5.0, 6.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.375, -49.720703125, -48.06640625, -46.412109375, -44.7578125, -43.103515625, -41.44921875, -39.794921875, -38.140625, -36.486328125, -34.83203125, -33.177734375, -31.5234375, -29.869140625, -28.21484375, -26.560546875, -24.90625, -23.251953125, -21.59765625, -19.943359375, -18.2890625, -16.634765625, -14.98046875, -13.326171875, -11.671875, -10.017578125, -8.36328125, -6.708984375, -5.0546875, -3.400390625, -1.74609375, -0.091796875, 1.5625, 3.216796875, 4.87109375, 6.525390625, 8.1796875, 9.833984375, 11.48828125, 13.142578125, 14.796875, 16.451171875, 18.10546875, 19.759765625, 21.4140625, 23.068359375, 24.72265625, 26.376953125, 28.03125, 29.685546875, 31.33984375, 32.994140625, 34.6484375, 36.302734375, 37.95703125, 39.611328125, 41.265625, 42.919921875, 44.57421875, 46.228515625, 47.8828125, 49.537109375, 51.19140625, 52.845703125, 54.5]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 5.0, 6.0, 4.0, 13.0, 9.0, 14.0, 16.0, 14.0, 16.0, 24.0, 24.0, 27.0, 40.0, 32.0, 33.0, 43.0, 38.0, 50.0, 50.0, 60.0, 54.0, 45.0, 37.0, 50.0, 41.0, 44.0, 41.0, 30.0, 27.0, 15.0, 27.0, 17.0, 14.0, 9.0, 8.0, 11.0, 5.0, 2.0, 2.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.3125, -40.76171875, -39.2109375, -37.66015625, -36.109375, -34.55859375, -33.0078125, -31.45703125, -29.90625, -28.35546875, -26.8046875, -25.25390625, -23.703125, -22.15234375, -20.6015625, -19.05078125, -17.5, -15.94921875, -14.3984375, -12.84765625, -11.296875, -9.74609375, -8.1953125, -6.64453125, -5.09375, -3.54296875, -1.9921875, -0.44140625, 1.109375, 2.66015625, 4.2109375, 5.76171875, 7.3125, 8.86328125, 10.4140625, 11.96484375, 13.515625, 15.06640625, 16.6171875, 18.16796875, 19.71875, 21.26953125, 22.8203125, 24.37109375, 25.921875, 27.47265625, 29.0234375, 30.57421875, 32.125, 33.67578125, 35.2265625, 36.77734375, 38.328125, 39.87890625, 41.4296875, 42.98046875, 44.53125, 46.08203125, 47.6328125, 49.18359375, 50.734375, 52.28515625, 53.8359375, 55.38671875, 56.9375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 3.0, 4.0, 10.0, 17.0, 11.0, 29.0, 29.0, 48.0, 82.0, 128.0, 229.0, 472.0, 857.0, 1738.0, 3924.0, 11314.0, 45845.0, 279892.0, 552160.0, 117351.0, 22383.0, 6616.0, 2686.0, 1213.0, 655.0, 353.0, 202.0, 98.0, 68.0, 39.0, 27.0, 21.0, 9.0, 12.0, 7.0, 8.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.65625, -41.2919921875, -39.927734375, -38.5634765625, -37.19921875, -35.8349609375, -34.470703125, -33.1064453125, -31.7421875, -30.3779296875, -29.013671875, -27.6494140625, -26.28515625, -24.9208984375, -23.556640625, -22.1923828125, -20.828125, -19.4638671875, -18.099609375, -16.7353515625, -15.37109375, -14.0068359375, -12.642578125, -11.2783203125, -9.9140625, -8.5498046875, -7.185546875, -5.8212890625, -4.45703125, -3.0927734375, -1.728515625, -0.3642578125, 1.0, 2.3642578125, 3.728515625, 5.0927734375, 6.45703125, 7.8212890625, 9.185546875, 10.5498046875, 11.9140625, 13.2783203125, 14.642578125, 16.0068359375, 17.37109375, 18.7353515625, 20.099609375, 21.4638671875, 22.828125, 24.1923828125, 25.556640625, 26.9208984375, 28.28515625, 29.6494140625, 31.013671875, 32.3779296875, 33.7421875, 35.1064453125, 36.470703125, 37.8349609375, 39.19921875, 40.5634765625, 41.927734375, 43.2919921875, 44.65625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 4.0, 6.0, 7.0, 10.0, 10.0, 13.0, 14.0, 22.0, 37.0, 41.0, 66.0, 82.0, 130.0, 145.0, 107.0, 81.0, 58.0, 38.0, 34.0, 29.0, 17.0, 9.0, 10.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00690460205078125, -0.006703615188598633, -0.006502628326416016, -0.0063016414642333984, -0.006100654602050781, -0.005899667739868164, -0.005698680877685547, -0.00549769401550293, -0.0052967071533203125, -0.005095720291137695, -0.004894733428955078, -0.004693746566772461, -0.004492759704589844, -0.0042917728424072266, -0.004090785980224609, -0.003889799118041992, -0.003688812255859375, -0.003487825393676758, -0.0032868385314941406, -0.0030858516693115234, -0.0028848648071289062, -0.002683877944946289, -0.002482891082763672, -0.0022819042205810547, -0.0020809173583984375, -0.0018799304962158203, -0.0016789436340332031, -0.001477956771850586, -0.0012769699096679688, -0.0010759830474853516, -0.0008749961853027344, -0.0006740093231201172, -0.0004730224609375, -0.0002720355987548828, -7.104873657226562e-05, 0.00012993812561035156, 0.00033092498779296875, 0.0005319118499755859, 0.0007328987121582031, 0.0009338855743408203, 0.0011348724365234375, 0.0013358592987060547, 0.0015368461608886719, 0.001737833023071289, 0.0019388198852539062, 0.0021398067474365234, 0.0023407936096191406, 0.002541780471801758, 0.002742767333984375, 0.002943754196166992, 0.0031447410583496094, 0.0033457279205322266, 0.0035467147827148438, 0.003747701644897461, 0.003948688507080078, 0.004149675369262695, 0.0043506622314453125, 0.00455164909362793, 0.004752635955810547, 0.004953622817993164, 0.005154609680175781, 0.0053555965423583984, 0.005556583404541016, 0.005757570266723633, 0.00595855712890625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 1.0, 6.0, 0.0, 3.0, 6.0, 2.0, 7.0, 6.0, 10.0, 24.0, 21.0, 28.0, 46.0, 77.0, 134.0, 200.0, 372.0, 728.0, 1535.0, 3540.0, 9782.0, 38165.0, 302387.0, 588049.0, 78453.0, 15701.0, 5084.0, 1994.0, 954.0, 486.0, 279.0, 173.0, 93.0, 62.0, 40.0, 36.0, 15.0, 15.0, 9.0, 6.0, 7.0, 9.0, 5.0, 7.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.1875, -54.54443359375, -52.9013671875, -51.25830078125, -49.615234375, -47.97216796875, -46.3291015625, -44.68603515625, -43.04296875, -41.39990234375, -39.7568359375, -38.11376953125, -36.470703125, -34.82763671875, -33.1845703125, -31.54150390625, -29.8984375, -28.25537109375, -26.6123046875, -24.96923828125, -23.326171875, -21.68310546875, -20.0400390625, -18.39697265625, -16.75390625, -15.11083984375, -13.4677734375, -11.82470703125, -10.181640625, -8.53857421875, -6.8955078125, -5.25244140625, -3.609375, -1.96630859375, -0.3232421875, 1.31982421875, 2.962890625, 4.60595703125, 6.2490234375, 7.89208984375, 9.53515625, 11.17822265625, 12.8212890625, 14.46435546875, 16.107421875, 17.75048828125, 19.3935546875, 21.03662109375, 22.6796875, 24.32275390625, 25.9658203125, 27.60888671875, 29.251953125, 30.89501953125, 32.5380859375, 34.18115234375, 35.82421875, 37.46728515625, 39.1103515625, 40.75341796875, 42.396484375, 44.03955078125, 45.6826171875, 47.32568359375, 48.96875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 6.0, 2.0, 6.0, 4.0, 7.0, 9.0, 8.0, 8.0, 21.0, 28.0, 26.0, 44.0, 61.0, 69.0, 80.0, 81.0, 104.0, 101.0, 85.0, 62.0, 46.0, 40.0, 32.0, 17.0, 16.0, 7.0, 9.0, 4.0, 7.0, 6.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-32.65625, -31.82421875, -30.9921875, -30.16015625, -29.328125, -28.49609375, -27.6640625, -26.83203125, -26.0, -25.16796875, -24.3359375, -23.50390625, -22.671875, -21.83984375, -21.0078125, -20.17578125, -19.34375, -18.51171875, -17.6796875, -16.84765625, -16.015625, -15.18359375, -14.3515625, -13.51953125, -12.6875, -11.85546875, -11.0234375, -10.19140625, -9.359375, -8.52734375, -7.6953125, -6.86328125, -6.03125, -5.19921875, -4.3671875, -3.53515625, -2.703125, -1.87109375, -1.0390625, -0.20703125, 0.625, 1.45703125, 2.2890625, 3.12109375, 3.953125, 4.78515625, 5.6171875, 6.44921875, 7.28125, 8.11328125, 8.9453125, 9.77734375, 10.609375, 11.44140625, 12.2734375, 13.10546875, 13.9375, 14.76953125, 15.6015625, 16.43359375, 17.265625, 18.09765625, 18.9296875, 19.76171875, 20.59375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 9.0, 7.0, 9.0, 6.0, 19.0, 19.0, 29.0, 51.0, 59.0, 100.0, 92.0, 110.0, 121.0, 84.0, 90.0, 68.0, 39.0, 29.0, 21.0, 12.0, 10.0, 11.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0], "bins": [-573.565673828125, -561.1333618164062, -548.7010498046875, -536.268798828125, -523.8364868164062, -511.4041748046875, -498.97186279296875, -486.53955078125, -474.10723876953125, -461.6749267578125, -449.2426452636719, -436.8103332519531, -424.3780212402344, -411.94573974609375, -399.513427734375, -387.08111572265625, -374.6488342285156, -362.2165222167969, -349.78424072265625, -337.3519287109375, -324.91961669921875, -312.4873046875, -300.0550231933594, -287.6227111816406, -275.1904296875, -262.75811767578125, -250.32582092285156, -237.89352416992188, -225.46121215820312, -213.02891540527344, -200.59661865234375, -188.164306640625, -175.73202514648438, -163.2997283935547, -150.86741638183594, -138.43511962890625, -126.00281524658203, -113.57051086425781, -101.13821411132812, -88.7059097290039, -76.27360534667969, -63.84130096435547, -51.409000396728516, -38.97669982910156, -26.544395446777344, -14.112091064453125, -1.6797943115234375, 10.752510070800781, 23.184814453125, 35.61711883544922, 48.04941940307617, 60.481719970703125, 72.91402435302734, 85.34632873535156, 97.77862548828125, 110.21092987060547, 122.64323425292969, 135.07553100585938, 147.50784301757812, 159.9401397705078, 172.3724365234375, 184.80474853515625, 197.23704528808594, 209.66934204101562, 222.10165405273438]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 5.0, 6.0, 10.0, 11.0, 14.0, 11.0, 18.0, 29.0, 30.0, 35.0, 40.0, 49.0, 32.0, 40.0, 52.0, 42.0, 35.0, 46.0, 58.0, 51.0, 51.0, 49.0, 48.0, 29.0, 39.0, 35.0, 26.0, 23.0, 12.0, 19.0, 26.0, 2.0, 5.0, 4.0, 8.0, 2.0, 3.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-315.7646179199219, -306.2895202636719, -296.8144226074219, -287.3393249511719, -277.8642272949219, -268.3891296386719, -258.9140319824219, -249.4389190673828, -239.9638214111328, -230.4887237548828, -221.0136260986328, -211.5385284423828, -202.06341552734375, -192.58831787109375, -183.11322021484375, -173.63812255859375, -164.16302490234375, -154.68792724609375, -145.21282958984375, -135.73773193359375, -126.26262664794922, -116.78752899169922, -107.31242370605469, -97.83732604980469, -88.36222839355469, -78.88713073730469, -69.41203308105469, -59.936927795410156, -50.461830139160156, -40.986732482910156, -31.51163101196289, -22.036529541015625, -12.56146240234375, -3.086362838745117, 6.388736724853516, 15.863836288452148, 25.33893585205078, 34.81403350830078, 44.28913497924805, 53.76423645019531, 63.23933410644531, 72.71443176269531, 82.18952941894531, 91.66463470458984, 101.13973236083984, 110.61483001708984, 120.08993530273438, 129.56503295898438, 139.04013061523438, 148.51522827148438, 157.99032592773438, 167.46542358398438, 176.94052124023438, 186.41561889648438, 195.89073181152344, 205.36582946777344, 214.84092712402344, 224.31602478027344, 233.79112243652344, 243.26622009277344, 252.7413330078125, 262.2164306640625, 271.6915283203125, 281.1666259765625, 290.6417236328125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 6.0, 11.0, 8.0, 26.0, 38.0, 49.0, 64.0, 121.0, 238.0, 481.0, 916.0, 2287.0, 6420.0, 22276.0, 122367.0, 3535504.0, 438003.0, 47545.0, 11231.0, 3589.0, 1463.0, 688.0, 352.0, 192.0, 127.0, 62.0, 40.0, 38.0, 33.0, 21.0, 17.0, 18.0, 14.0, 7.0, 5.0, 6.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-129.25, -124.591796875, -119.93359375, -115.275390625, -110.6171875, -105.958984375, -101.30078125, -96.642578125, -91.984375, -87.326171875, -82.66796875, -78.009765625, -73.3515625, -68.693359375, -64.03515625, -59.376953125, -54.71875, -50.060546875, -45.40234375, -40.744140625, -36.0859375, -31.427734375, -26.76953125, -22.111328125, -17.453125, -12.794921875, -8.13671875, -3.478515625, 1.1796875, 5.837890625, 10.49609375, 15.154296875, 19.8125, 24.470703125, 29.12890625, 33.787109375, 38.4453125, 43.103515625, 47.76171875, 52.419921875, 57.078125, 61.736328125, 66.39453125, 71.052734375, 75.7109375, 80.369140625, 85.02734375, 89.685546875, 94.34375, 99.001953125, 103.66015625, 108.318359375, 112.9765625, 117.634765625, 122.29296875, 126.951171875, 131.609375, 136.267578125, 140.92578125, 145.583984375, 150.2421875, 154.900390625, 159.55859375, 164.216796875, 168.875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 14.0, 20.0, 23.0, 31.0, 33.0, 58.0, 69.0, 96.0, 97.0, 84.0, 77.0, 74.0, 97.0, 60.0, 45.0, 40.0, 26.0, 17.0, 23.0, 5.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.109375, -17.501220703125, -16.89306640625, -16.284912109375, -15.6767578125, -15.068603515625, -14.46044921875, -13.852294921875, -13.244140625, -12.635986328125, -12.02783203125, -11.419677734375, -10.8115234375, -10.203369140625, -9.59521484375, -8.987060546875, -8.37890625, -7.770751953125, -7.16259765625, -6.554443359375, -5.9462890625, -5.338134765625, -4.72998046875, -4.121826171875, -3.513671875, -2.905517578125, -2.29736328125, -1.689208984375, -1.0810546875, -0.472900390625, 0.13525390625, 0.743408203125, 1.3515625, 1.959716796875, 2.56787109375, 3.176025390625, 3.7841796875, 4.392333984375, 5.00048828125, 5.608642578125, 6.216796875, 6.824951171875, 7.43310546875, 8.041259765625, 8.6494140625, 9.257568359375, 9.86572265625, 10.473876953125, 11.08203125, 11.690185546875, 12.29833984375, 12.906494140625, 13.5146484375, 14.122802734375, 14.73095703125, 15.339111328125, 15.947265625, 16.555419921875, 17.16357421875, 17.771728515625, 18.3798828125, 18.988037109375, 19.59619140625, 20.204345703125, 20.8125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 7.0, 8.0, 10.0, 13.0, 15.0, 28.0, 27.0, 60.0, 51.0, 69.0, 89.0, 119.0, 185.0, 234.0, 328.0, 493.0, 893.0, 1551.0, 3168.0, 8295.0, 27271.0, 135507.0, 2376303.0, 1485477.0, 115666.0, 24127.0, 7263.0, 2980.0, 1485.0, 856.0, 549.0, 361.0, 214.0, 149.0, 102.0, 81.0, 80.0, 42.0, 31.0, 26.0, 24.0, 14.0, 7.0, 11.0, 5.0, 6.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-109.0, -105.58984375, -102.1796875, -98.76953125, -95.359375, -91.94921875, -88.5390625, -85.12890625, -81.71875, -78.30859375, -74.8984375, -71.48828125, -68.078125, -64.66796875, -61.2578125, -57.84765625, -54.4375, -51.02734375, -47.6171875, -44.20703125, -40.796875, -37.38671875, -33.9765625, -30.56640625, -27.15625, -23.74609375, -20.3359375, -16.92578125, -13.515625, -10.10546875, -6.6953125, -3.28515625, 0.125, 3.53515625, 6.9453125, 10.35546875, 13.765625, 17.17578125, 20.5859375, 23.99609375, 27.40625, 30.81640625, 34.2265625, 37.63671875, 41.046875, 44.45703125, 47.8671875, 51.27734375, 54.6875, 58.09765625, 61.5078125, 64.91796875, 68.328125, 71.73828125, 75.1484375, 78.55859375, 81.96875, 85.37890625, 88.7890625, 92.19921875, 95.609375, 99.01953125, 102.4296875, 105.83984375, 109.25]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 6.0, 8.0, 5.0, 15.0, 25.0, 42.0, 63.0, 92.0, 167.0, 308.0, 709.0, 1652.0, 464.0, 236.0, 109.0, 69.0, 38.0, 27.0, 12.0, 10.0, 6.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.875, -54.376953125, -52.87890625, -51.380859375, -49.8828125, -48.384765625, -46.88671875, -45.388671875, -43.890625, -42.392578125, -40.89453125, -39.396484375, -37.8984375, -36.400390625, -34.90234375, -33.404296875, -31.90625, -30.408203125, -28.91015625, -27.412109375, -25.9140625, -24.416015625, -22.91796875, -21.419921875, -19.921875, -18.423828125, -16.92578125, -15.427734375, -13.9296875, -12.431640625, -10.93359375, -9.435546875, -7.9375, -6.439453125, -4.94140625, -3.443359375, -1.9453125, -0.447265625, 1.05078125, 2.548828125, 4.046875, 5.544921875, 7.04296875, 8.541015625, 10.0390625, 11.537109375, 13.03515625, 14.533203125, 16.03125, 17.529296875, 19.02734375, 20.525390625, 22.0234375, 23.521484375, 25.01953125, 26.517578125, 28.015625, 29.513671875, 31.01171875, 32.509765625, 34.0078125, 35.505859375, 37.00390625, 38.501953125, 40.0]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 9.0, 11.0, 20.0, 25.0, 53.0, 66.0, 103.0, 117.0, 133.0, 116.0, 105.0, 70.0, 57.0, 45.0, 28.0, 12.0, 15.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-364.1314392089844, -355.24560546875, -346.35980224609375, -337.4739990234375, -328.5881652832031, -319.70233154296875, -310.8165283203125, -301.93072509765625, -293.0448913574219, -284.1590576171875, -275.27325439453125, -266.387451171875, -257.5016174316406, -248.6157989501953, -239.72998046875, -230.8441619873047, -221.95834350585938, -213.07252502441406, -204.18670654296875, -195.30088806152344, -186.41506958007812, -177.5292510986328, -168.6434326171875, -159.7576141357422, -150.87179565429688, -141.98597717285156, -133.10015869140625, -124.21434020996094, -115.32852172851562, -106.44270324707031, -97.556884765625, -88.67106628417969, -79.78526306152344, -70.89944458007812, -62.01362609863281, -53.1278076171875, -44.24198913574219, -35.356170654296875, -26.470352172851562, -17.58453369140625, -8.698715209960938, 0.187103271484375, 9.072921752929688, 17.958740234375, 26.844558715820312, 35.730377197265625, 44.61619567871094, 53.50201416015625, 62.38783264160156, 71.27365112304688, 80.15946960449219, 89.0452880859375, 97.93110656738281, 106.81692504882812, 115.70274353027344, 124.58856201171875, 133.47438049316406, 142.36019897460938, 151.2460174560547, 160.1318359375, 169.0176544189453, 177.90347290039062, 186.78929138183594, 195.67510986328125, 204.56092834472656]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 1.0, 4.0, 4.0, 5.0, 4.0, 5.0, 10.0, 8.0, 12.0, 23.0, 24.0, 27.0, 30.0, 35.0, 36.0, 40.0, 42.0, 41.0, 41.0, 40.0, 57.0, 60.0, 60.0, 37.0, 45.0, 36.0, 32.0, 33.0, 29.0, 39.0, 33.0, 21.0, 11.0, 18.0, 10.0, 15.0, 9.0, 7.0, 5.0, 4.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.99546813964844, -129.6334686279297, -125.27147674560547, -120.90947723388672, -116.5474853515625, -112.18548583984375, -107.823486328125, -103.46148681640625, -99.09949493408203, -94.73749542236328, -90.37550354003906, -86.01350402832031, -81.65150451660156, -77.28951263427734, -72.9275131225586, -68.56552124023438, -64.20352172851562, -59.84152603149414, -55.479530334472656, -51.117530822753906, -46.75553512573242, -42.39353942871094, -38.03153991699219, -33.6695442199707, -29.30754852294922, -24.945552825927734, -20.583555221557617, -16.2215576171875, -11.859561920166016, -7.497566223144531, -3.135568618774414, 1.2264289855957031, 5.588409423828125, 9.950406074523926, 14.312402725219727, 18.674400329589844, 23.036396026611328, 27.398391723632812, 31.76038932800293, 36.12238693237305, 40.48438262939453, 44.846378326416016, 49.2083740234375, 53.57037353515625, 57.932369232177734, 62.29436492919922, 66.65636444091797, 71.01835632324219, 75.38035583496094, 79.74235534667969, 84.1043472290039, 88.46634674072266, 92.82833862304688, 97.19033813476562, 101.55233764648438, 105.91433715820312, 110.27632904052734, 114.6383285522461, 119.00032043457031, 123.36231994628906, 127.72431945800781, 132.0863037109375, 136.44830322265625, 140.810302734375, 145.17230224609375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 8.0, 16.0, 27.0, 41.0, 62.0, 97.0, 153.0, 273.0, 511.0, 1087.0, 3045.0, 14729.0, 116540.0, 698525.0, 184847.0, 21902.0, 3983.0, 1342.0, 625.0, 278.0, 177.0, 116.0, 69.0, 31.0, 25.0, 15.0, 15.0, 8.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-180.75, -174.84375, -168.9375, -163.03125, -157.125, -151.21875, -145.3125, -139.40625, -133.5, -127.59375, -121.6875, -115.78125, -109.875, -103.96875, -98.0625, -92.15625, -86.25, -80.34375, -74.4375, -68.53125, -62.625, -56.71875, -50.8125, -44.90625, -39.0, -33.09375, -27.1875, -21.28125, -15.375, -9.46875, -3.5625, 2.34375, 8.25, 14.15625, 20.0625, 25.96875, 31.875, 37.78125, 43.6875, 49.59375, 55.5, 61.40625, 67.3125, 73.21875, 79.125, 85.03125, 90.9375, 96.84375, 102.75, 108.65625, 114.5625, 120.46875, 126.375, 132.28125, 138.1875, 144.09375, 150.0, 155.90625, 161.8125, 167.71875, 173.625, 179.53125, 185.4375, 191.34375, 197.25]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 8.0, 12.0, 20.0, 31.0, 37.0, 54.0, 63.0, 74.0, 103.0, 83.0, 100.0, 87.0, 84.0, 75.0, 42.0, 30.0, 40.0, 23.0, 14.0, 8.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.25, -20.605712890625, -19.96142578125, -19.317138671875, -18.6728515625, -18.028564453125, -17.38427734375, -16.739990234375, -16.095703125, -15.451416015625, -14.80712890625, -14.162841796875, -13.5185546875, -12.874267578125, -12.22998046875, -11.585693359375, -10.94140625, -10.297119140625, -9.65283203125, -9.008544921875, -8.3642578125, -7.719970703125, -7.07568359375, -6.431396484375, -5.787109375, -5.142822265625, -4.49853515625, -3.854248046875, -3.2099609375, -2.565673828125, -1.92138671875, -1.277099609375, -0.6328125, 0.011474609375, 0.65576171875, 1.300048828125, 1.9443359375, 2.588623046875, 3.23291015625, 3.877197265625, 4.521484375, 5.165771484375, 5.81005859375, 6.454345703125, 7.0986328125, 7.742919921875, 8.38720703125, 9.031494140625, 9.67578125, 10.320068359375, 10.96435546875, 11.608642578125, 12.2529296875, 12.897216796875, 13.54150390625, 14.185791015625, 14.830078125, 15.474365234375, 16.11865234375, 16.762939453125, 17.4072265625, 18.051513671875, 18.69580078125, 19.340087890625, 19.984375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 2.0, 10.0, 11.0, 11.0, 28.0, 37.0, 50.0, 75.0, 111.0, 155.0, 232.0, 366.0, 613.0, 1001.0, 1790.0, 3260.0, 6647.0, 13941.0, 30622.0, 67388.0, 147768.0, 296934.0, 255283.0, 119736.0, 54674.0, 24461.0, 11394.0, 5398.0, 2745.0, 1552.0, 816.0, 504.0, 303.0, 241.0, 112.0, 91.0, 61.0, 37.0, 25.0, 25.0, 15.0, 11.0, 11.0, 7.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.65625, -46.2490234375, -44.841796875, -43.4345703125, -42.02734375, -40.6201171875, -39.212890625, -37.8056640625, -36.3984375, -34.9912109375, -33.583984375, -32.1767578125, -30.76953125, -29.3623046875, -27.955078125, -26.5478515625, -25.140625, -23.7333984375, -22.326171875, -20.9189453125, -19.51171875, -18.1044921875, -16.697265625, -15.2900390625, -13.8828125, -12.4755859375, -11.068359375, -9.6611328125, -8.25390625, -6.8466796875, -5.439453125, -4.0322265625, -2.625, -1.2177734375, 0.189453125, 1.5966796875, 3.00390625, 4.4111328125, 5.818359375, 7.2255859375, 8.6328125, 10.0400390625, 11.447265625, 12.8544921875, 14.26171875, 15.6689453125, 17.076171875, 18.4833984375, 19.890625, 21.2978515625, 22.705078125, 24.1123046875, 25.51953125, 26.9267578125, 28.333984375, 29.7412109375, 31.1484375, 32.5556640625, 33.962890625, 35.3701171875, 36.77734375, 38.1845703125, 39.591796875, 40.9990234375, 42.40625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 5.0, 10.0, 5.0, 9.0, 15.0, 14.0, 12.0, 15.0, 18.0, 33.0, 23.0, 32.0, 31.0, 36.0, 41.0, 45.0, 42.0, 46.0, 31.0, 50.0, 45.0, 49.0, 43.0, 27.0, 39.0, 32.0, 40.0, 33.0, 21.0, 17.0, 16.0, 24.0, 20.0, 20.0, 13.0, 12.0, 6.0, 10.0, 8.0, 5.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.03125, -38.72265625, -37.4140625, -36.10546875, -34.796875, -33.48828125, -32.1796875, -30.87109375, -29.5625, -28.25390625, -26.9453125, -25.63671875, -24.328125, -23.01953125, -21.7109375, -20.40234375, -19.09375, -17.78515625, -16.4765625, -15.16796875, -13.859375, -12.55078125, -11.2421875, -9.93359375, -8.625, -7.31640625, -6.0078125, -4.69921875, -3.390625, -2.08203125, -0.7734375, 0.53515625, 1.84375, 3.15234375, 4.4609375, 5.76953125, 7.078125, 8.38671875, 9.6953125, 11.00390625, 12.3125, 13.62109375, 14.9296875, 16.23828125, 17.546875, 18.85546875, 20.1640625, 21.47265625, 22.78125, 24.08984375, 25.3984375, 26.70703125, 28.015625, 29.32421875, 30.6328125, 31.94140625, 33.25, 34.55859375, 35.8671875, 37.17578125, 38.484375, 39.79296875, 41.1015625, 42.41015625, 43.71875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 4.0, 16.0, 24.0, 44.0, 72.0, 144.0, 319.0, 842.0, 2813.0, 13599.0, 111197.0, 660574.0, 228443.0, 24136.0, 4351.0, 1151.0, 428.0, 177.0, 91.0, 59.0, 22.0, 15.0, 11.0, 9.0, 9.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.21875, -42.5595703125, -40.900390625, -39.2412109375, -37.58203125, -35.9228515625, -34.263671875, -32.6044921875, -30.9453125, -29.2861328125, -27.626953125, -25.9677734375, -24.30859375, -22.6494140625, -20.990234375, -19.3310546875, -17.671875, -16.0126953125, -14.353515625, -12.6943359375, -11.03515625, -9.3759765625, -7.716796875, -6.0576171875, -4.3984375, -2.7392578125, -1.080078125, 0.5791015625, 2.23828125, 3.8974609375, 5.556640625, 7.2158203125, 8.875, 10.5341796875, 12.193359375, 13.8525390625, 15.51171875, 17.1708984375, 18.830078125, 20.4892578125, 22.1484375, 23.8076171875, 25.466796875, 27.1259765625, 28.78515625, 30.4443359375, 32.103515625, 33.7626953125, 35.421875, 37.0810546875, 38.740234375, 40.3994140625, 42.05859375, 43.7177734375, 45.376953125, 47.0361328125, 48.6953125, 50.3544921875, 52.013671875, 53.6728515625, 55.33203125, 56.9912109375, 58.650390625, 60.3095703125, 61.96875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 9.0, 7.0, 8.0, 14.0, 17.0, 20.0, 27.0, 35.0, 38.0, 56.0, 54.0, 124.0, 133.0, 130.0, 77.0, 53.0, 48.0, 32.0, 33.0, 18.0, 19.0, 13.0, 9.0, 6.0, 1.0, 10.0, 0.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00592803955078125, -0.005778014659881592, -0.005627989768981934, -0.005477964878082275, -0.005327939987182617, -0.005177915096282959, -0.005027890205383301, -0.004877865314483643, -0.004727840423583984, -0.004577815532684326, -0.004427790641784668, -0.00427776575088501, -0.0041277408599853516, -0.003977715969085693, -0.003827691078186035, -0.003677666187286377, -0.0035276412963867188, -0.0033776164054870605, -0.0032275915145874023, -0.003077566623687744, -0.002927541732788086, -0.0027775168418884277, -0.0026274919509887695, -0.0024774670600891113, -0.002327442169189453, -0.002177417278289795, -0.0020273923873901367, -0.0018773674964904785, -0.0017273426055908203, -0.0015773177146911621, -0.001427292823791504, -0.0012772679328918457, -0.0011272430419921875, -0.0009772181510925293, -0.0008271932601928711, -0.0006771683692932129, -0.0005271434783935547, -0.0003771185874938965, -0.00022709369659423828, -7.706880569458008e-05, 7.295608520507812e-05, 0.00022298097610473633, 0.00037300586700439453, 0.0005230307579040527, 0.0006730556488037109, 0.0008230805397033691, 0.0009731054306030273, 0.0011231303215026855, 0.0012731552124023438, 0.001423180103302002, 0.0015732049942016602, 0.0017232298851013184, 0.0018732547760009766, 0.0020232796669006348, 0.002173304557800293, 0.002323329448699951, 0.0024733543395996094, 0.0026233792304992676, 0.0027734041213989258, 0.002923429012298584, 0.003073453903198242, 0.0032234787940979004, 0.0033735036849975586, 0.003523528575897217, 0.003673553466796875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 11.0, 19.0, 23.0, 19.0, 38.0, 54.0, 102.0, 130.0, 229.0, 359.0, 595.0, 1108.0, 2135.0, 4265.0, 10270.0, 28062.0, 94719.0, 309473.0, 390105.0, 140609.0, 40766.0, 13994.0, 5667.0, 2640.0, 1301.0, 708.0, 431.0, 248.0, 158.0, 102.0, 68.0, 44.0, 18.0, 23.0, 18.0, 16.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-27.078125, -26.236083984375, -25.39404296875, -24.552001953125, -23.7099609375, -22.867919921875, -22.02587890625, -21.183837890625, -20.341796875, -19.499755859375, -18.65771484375, -17.815673828125, -16.9736328125, -16.131591796875, -15.28955078125, -14.447509765625, -13.60546875, -12.763427734375, -11.92138671875, -11.079345703125, -10.2373046875, -9.395263671875, -8.55322265625, -7.711181640625, -6.869140625, -6.027099609375, -5.18505859375, -4.343017578125, -3.5009765625, -2.658935546875, -1.81689453125, -0.974853515625, -0.1328125, 0.709228515625, 1.55126953125, 2.393310546875, 3.2353515625, 4.077392578125, 4.91943359375, 5.761474609375, 6.603515625, 7.445556640625, 8.28759765625, 9.129638671875, 9.9716796875, 10.813720703125, 11.65576171875, 12.497802734375, 13.33984375, 14.181884765625, 15.02392578125, 15.865966796875, 16.7080078125, 17.550048828125, 18.39208984375, 19.234130859375, 20.076171875, 20.918212890625, 21.76025390625, 22.602294921875, 23.4443359375, 24.286376953125, 25.12841796875, 25.970458984375, 26.8125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 5.0, 2.0, 2.0, 8.0, 8.0, 22.0, 18.0, 26.0, 30.0, 45.0, 46.0, 66.0, 80.0, 107.0, 97.0, 83.0, 83.0, 69.0, 41.0, 46.0, 24.0, 20.0, 23.0, 16.0, 11.0, 3.0, 6.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.296875, -21.564697265625, -20.83251953125, -20.100341796875, -19.3681640625, -18.635986328125, -17.90380859375, -17.171630859375, -16.439453125, -15.707275390625, -14.97509765625, -14.242919921875, -13.5107421875, -12.778564453125, -12.04638671875, -11.314208984375, -10.58203125, -9.849853515625, -9.11767578125, -8.385498046875, -7.6533203125, -6.921142578125, -6.18896484375, -5.456787109375, -4.724609375, -3.992431640625, -3.26025390625, -2.528076171875, -1.7958984375, -1.063720703125, -0.33154296875, 0.400634765625, 1.1328125, 1.864990234375, 2.59716796875, 3.329345703125, 4.0615234375, 4.793701171875, 5.52587890625, 6.258056640625, 6.990234375, 7.722412109375, 8.45458984375, 9.186767578125, 9.9189453125, 10.651123046875, 11.38330078125, 12.115478515625, 12.84765625, 13.579833984375, 14.31201171875, 15.044189453125, 15.7763671875, 16.508544921875, 17.24072265625, 17.972900390625, 18.705078125, 19.437255859375, 20.16943359375, 20.901611328125, 21.6337890625, 22.365966796875, 23.09814453125, 23.830322265625, 24.5625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 5.0, 2.0, 5.0, 8.0, 9.0, 15.0, 32.0, 33.0, 35.0, 49.0, 50.0, 68.0, 65.0, 84.0, 110.0, 67.0, 69.0, 65.0, 56.0, 41.0, 35.0, 25.0, 22.0, 16.0, 11.0, 4.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-231.17059326171875, -222.47744750976562, -213.7843017578125, -205.09115600585938, -196.39801025390625, -187.70486450195312, -179.01171875, -170.31857299804688, -161.62542724609375, -152.93228149414062, -144.2391357421875, -135.54598999023438, -126.85284423828125, -118.15969848632812, -109.46656036376953, -100.7734146118164, -92.08027648925781, -83.38713073730469, -74.69398498535156, -66.00083923339844, -57.30769729614258, -48.61455154418945, -39.921409606933594, -31.22826385498047, -22.535118103027344, -13.841973304748535, -5.148828506469727, 3.5443153381347656, 12.23746109008789, 20.930606842041016, 29.623748779296875, 38.31689453125, 47.010040283203125, 55.70318603515625, 64.39633178710938, 73.0894775390625, 81.78262329101562, 90.47576904296875, 99.16890716552734, 107.86205291748047, 116.5551986694336, 125.24834442138672, 133.9414825439453, 142.63462829589844, 151.32777404785156, 160.0209197998047, 168.7140655517578, 177.40721130371094, 186.10035705566406, 194.7935028076172, 203.4866485595703, 212.17979431152344, 220.87294006347656, 229.5660858154297, 238.25921630859375, 246.95236206054688, 255.6455078125, 264.3386535644531, 273.03179931640625, 281.7249450683594, 290.4180908203125, 299.1112365722656, 307.80438232421875, 316.4975280761719, 325.190673828125]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 9.0, 12.0, 10.0, 14.0, 14.0, 17.0, 19.0, 24.0, 21.0, 28.0, 27.0, 29.0, 44.0, 39.0, 50.0, 47.0, 49.0, 43.0, 42.0, 52.0, 39.0, 43.0, 44.0, 38.0, 25.0, 33.0, 23.0, 32.0, 15.0, 16.0, 18.0, 16.0, 11.0, 12.0, 11.0, 5.0, 6.0, 1.0, 4.0, 5.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-247.33224487304688, -239.5975799560547, -231.8629150390625, -224.1282501220703, -216.39358520507812, -208.65892028808594, -200.92425537109375, -193.18960571289062, -185.45492553710938, -177.7202606201172, -169.985595703125, -162.2509307861328, -154.51626586914062, -146.78160095214844, -139.04693603515625, -131.31228637695312, -123.57762145996094, -115.84295654296875, -108.10829162597656, -100.37362670898438, -92.63896179199219, -84.904296875, -77.16963958740234, -69.43497467041016, -61.70030975341797, -53.96564483642578, -46.230979919433594, -38.49631881713867, -30.761653900146484, -23.026988983154297, -15.292327880859375, -7.5576629638671875, 0.1770172119140625, 7.911681175231934, 15.646345138549805, 23.38100814819336, 31.115673065185547, 38.850337982177734, 46.584999084472656, 54.319664001464844, 62.05432891845703, 69.78899383544922, 77.5236587524414, 85.25831604003906, 92.99298095703125, 100.72764587402344, 108.46231079101562, 116.19697570800781, 123.931640625, 131.6663055419922, 139.40097045898438, 147.13563537597656, 154.87030029296875, 162.60496520996094, 170.33963012695312, 178.07427978515625, 185.8089599609375, 193.5436248779297, 201.27828979492188, 209.01295471191406, 216.74761962890625, 224.48228454589844, 232.21694946289062, 239.95159912109375, 247.68626403808594]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 3.0, 6.0, 13.0, 14.0, 27.0, 38.0, 61.0, 95.0, 156.0, 275.0, 603.0, 1429.0, 4248.0, 21747.0, 704500.0, 3425192.0, 27719.0, 5160.0, 1566.0, 645.0, 277.0, 181.0, 81.0, 71.0, 46.0, 41.0, 21.0, 12.0, 15.0, 4.0, 6.0, 11.0, 2.0, 5.0, 0.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-209.625, -202.154296875, -194.68359375, -187.212890625, -179.7421875, -172.271484375, -164.80078125, -157.330078125, -149.859375, -142.388671875, -134.91796875, -127.447265625, -119.9765625, -112.505859375, -105.03515625, -97.564453125, -90.09375, -82.623046875, -75.15234375, -67.681640625, -60.2109375, -52.740234375, -45.26953125, -37.798828125, -30.328125, -22.857421875, -15.38671875, -7.916015625, -0.4453125, 7.025390625, 14.49609375, 21.966796875, 29.4375, 36.908203125, 44.37890625, 51.849609375, 59.3203125, 66.791015625, 74.26171875, 81.732421875, 89.203125, 96.673828125, 104.14453125, 111.615234375, 119.0859375, 126.556640625, 134.02734375, 141.498046875, 148.96875, 156.439453125, 163.91015625, 171.380859375, 178.8515625, 186.322265625, 193.79296875, 201.263671875, 208.734375, 216.205078125, 223.67578125, 231.146484375, 238.6171875, 246.087890625, 253.55859375, 261.029296875, 268.5]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 14.0, 13.0, 32.0, 33.0, 43.0, 51.0, 69.0, 100.0, 81.0, 108.0, 94.0, 69.0, 67.0, 60.0, 43.0, 40.0, 25.0, 18.0, 12.0, 13.0, 1.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.5, -20.8583984375, -20.216796875, -19.5751953125, -18.93359375, -18.2919921875, -17.650390625, -17.0087890625, -16.3671875, -15.7255859375, -15.083984375, -14.4423828125, -13.80078125, -13.1591796875, -12.517578125, -11.8759765625, -11.234375, -10.5927734375, -9.951171875, -9.3095703125, -8.66796875, -8.0263671875, -7.384765625, -6.7431640625, -6.1015625, -5.4599609375, -4.818359375, -4.1767578125, -3.53515625, -2.8935546875, -2.251953125, -1.6103515625, -0.96875, -0.3271484375, 0.314453125, 0.9560546875, 1.59765625, 2.2392578125, 2.880859375, 3.5224609375, 4.1640625, 4.8056640625, 5.447265625, 6.0888671875, 6.73046875, 7.3720703125, 8.013671875, 8.6552734375, 9.296875, 9.9384765625, 10.580078125, 11.2216796875, 11.86328125, 12.5048828125, 13.146484375, 13.7880859375, 14.4296875, 15.0712890625, 15.712890625, 16.3544921875, 16.99609375, 17.6376953125, 18.279296875, 18.9208984375, 19.5625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 3.0, 2.0, 9.0, 6.0, 9.0, 19.0, 11.0, 13.0, 20.0, 30.0, 44.0, 76.0, 137.0, 245.0, 429.0, 869.0, 1857.0, 4501.0, 11988.0, 38718.0, 180997.0, 3156470.0, 673631.0, 87048.0, 22948.0, 8061.0, 3177.0, 1372.0, 712.0, 327.0, 200.0, 108.0, 75.0, 52.0, 38.0, 14.0, 12.0, 12.0, 6.0, 8.0, 7.0, 6.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-89.25, -86.52734375, -83.8046875, -81.08203125, -78.359375, -75.63671875, -72.9140625, -70.19140625, -67.46875, -64.74609375, -62.0234375, -59.30078125, -56.578125, -53.85546875, -51.1328125, -48.41015625, -45.6875, -42.96484375, -40.2421875, -37.51953125, -34.796875, -32.07421875, -29.3515625, -26.62890625, -23.90625, -21.18359375, -18.4609375, -15.73828125, -13.015625, -10.29296875, -7.5703125, -4.84765625, -2.125, 0.59765625, 3.3203125, 6.04296875, 8.765625, 11.48828125, 14.2109375, 16.93359375, 19.65625, 22.37890625, 25.1015625, 27.82421875, 30.546875, 33.26953125, 35.9921875, 38.71484375, 41.4375, 44.16015625, 46.8828125, 49.60546875, 52.328125, 55.05078125, 57.7734375, 60.49609375, 63.21875, 65.94140625, 68.6640625, 71.38671875, 74.109375, 76.83203125, 79.5546875, 82.27734375, 85.0]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 4.0, 6.0, 5.0, 11.0, 8.0, 9.0, 7.0, 16.0, 22.0, 35.0, 35.0, 60.0, 91.0, 131.0, 183.0, 346.0, 1027.0, 1036.0, 350.0, 206.0, 128.0, 90.0, 63.0, 41.0, 26.0, 27.0, 26.0, 19.0, 17.0, 9.0, 4.0, 7.0, 9.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.21875, -18.507080078125, -17.79541015625, -17.083740234375, -16.3720703125, -15.660400390625, -14.94873046875, -14.237060546875, -13.525390625, -12.813720703125, -12.10205078125, -11.390380859375, -10.6787109375, -9.967041015625, -9.25537109375, -8.543701171875, -7.83203125, -7.120361328125, -6.40869140625, -5.697021484375, -4.9853515625, -4.273681640625, -3.56201171875, -2.850341796875, -2.138671875, -1.427001953125, -0.71533203125, -0.003662109375, 0.7080078125, 1.419677734375, 2.13134765625, 2.843017578125, 3.5546875, 4.266357421875, 4.97802734375, 5.689697265625, 6.4013671875, 7.113037109375, 7.82470703125, 8.536376953125, 9.248046875, 9.959716796875, 10.67138671875, 11.383056640625, 12.0947265625, 12.806396484375, 13.51806640625, 14.229736328125, 14.94140625, 15.653076171875, 16.36474609375, 17.076416015625, 17.7880859375, 18.499755859375, 19.21142578125, 19.923095703125, 20.634765625, 21.346435546875, 22.05810546875, 22.769775390625, 23.4814453125, 24.193115234375, 24.90478515625, 25.616455078125, 26.328125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 15.0, 25.0, 45.0, 50.0, 79.0, 121.0, 123.0, 127.0, 92.0, 94.0, 65.0, 52.0, 30.0, 29.0, 10.0, 9.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-174.47479248046875, -167.94744873046875, -161.42010498046875, -154.8927459716797, -148.3654022216797, -141.8380584716797, -135.3107147216797, -128.78335571289062, -122.25601196289062, -115.72866821289062, -109.2013168334961, -102.6739730834961, -96.14662170410156, -89.61927795410156, -83.09193420410156, -76.56458282470703, -70.03723907470703, -63.509891510009766, -56.9825439453125, -50.4552001953125, -43.92784881591797, -37.40050506591797, -30.873157501220703, -24.345809936523438, -17.818462371826172, -11.291114807128906, -4.763768196105957, 1.7635784149169922, 8.290925979614258, 14.81827163696289, 21.345619201660156, 27.872966766357422, 34.40031433105469, 40.92766189575195, 47.45500946044922, 53.98235321044922, 60.50970458984375, 67.03704833984375, 73.56439208984375, 80.09174346923828, 86.61909484863281, 93.14643859863281, 99.67378997802734, 106.20113372802734, 112.72848510742188, 119.25582885742188, 125.78317260742188, 132.31051635742188, 138.83786010742188, 145.36520385742188, 151.89254760742188, 158.41990661621094, 164.94725036621094, 171.47459411621094, 178.00193786621094, 184.529296875, 191.056640625, 197.583984375, 204.111328125, 210.63868713378906, 217.16603088378906, 223.69337463378906, 230.22071838378906, 236.74807739257812, 243.27542114257812]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 6.0, 5.0, 9.0, 6.0, 9.0, 10.0, 19.0, 19.0, 24.0, 28.0, 28.0, 44.0, 31.0, 41.0, 46.0, 56.0, 61.0, 52.0, 43.0, 49.0, 45.0, 51.0, 33.0, 37.0, 36.0, 29.0, 29.0, 33.0, 25.0, 19.0, 17.0, 12.0, 15.0, 11.0, 7.0, 4.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-113.060546875, -109.63899230957031, -106.21743774414062, -102.79588317871094, -99.37432861328125, -95.95277404785156, -92.5312271118164, -89.10967254638672, -85.68811798095703, -82.26656341552734, -78.84500885009766, -75.42345428466797, -72.00190734863281, -68.58035278320312, -65.15879821777344, -61.73724365234375, -58.31568908691406, -54.894134521484375, -51.47257995605469, -48.051029205322266, -44.62947463989258, -41.20792007446289, -37.78636932373047, -34.36481475830078, -30.943260192871094, -27.521705627441406, -24.10015296936035, -20.678600311279297, -17.25704574584961, -13.835491180419922, -10.413938522338867, -6.9923858642578125, -3.570831298828125, -0.1492776870727539, 3.272275924682617, 6.693829536437988, 10.11538314819336, 13.536937713623047, 16.9584903717041, 20.380043029785156, 23.801597595214844, 27.22315216064453, 30.644704818725586, 34.06625747680664, 37.48781204223633, 40.909366607666016, 44.33091735839844, 47.752471923828125, 51.17402648925781, 54.5955810546875, 58.01713562011719, 61.43868637084961, 64.86024475097656, 68.28179931640625, 71.7033462524414, 75.1249008178711, 78.54645538330078, 81.96800994873047, 85.38956451416016, 88.81111907958984, 92.232666015625, 95.65422058105469, 99.07577514648438, 102.49732971191406, 105.91888427734375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 4.0, 5.0, 6.0, 12.0, 19.0, 13.0, 29.0, 33.0, 42.0, 49.0, 74.0, 109.0, 193.0, 281.0, 503.0, 973.0, 1964.0, 4976.0, 15934.0, 65921.0, 330861.0, 486440.0, 104416.0, 23462.0, 6903.0, 2573.0, 1154.0, 609.0, 331.0, 228.0, 130.0, 100.0, 51.0, 44.0, 33.0, 27.0, 15.0, 11.0, 5.0, 4.0, 7.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-134.75, -130.6845703125, -126.619140625, -122.5537109375, -118.48828125, -114.4228515625, -110.357421875, -106.2919921875, -102.2265625, -98.1611328125, -94.095703125, -90.0302734375, -85.96484375, -81.8994140625, -77.833984375, -73.7685546875, -69.703125, -65.6376953125, -61.572265625, -57.5068359375, -53.44140625, -49.3759765625, -45.310546875, -41.2451171875, -37.1796875, -33.1142578125, -29.048828125, -24.9833984375, -20.91796875, -16.8525390625, -12.787109375, -8.7216796875, -4.65625, -0.5908203125, 3.474609375, 7.5400390625, 11.60546875, 15.6708984375, 19.736328125, 23.8017578125, 27.8671875, 31.9326171875, 35.998046875, 40.0634765625, 44.12890625, 48.1943359375, 52.259765625, 56.3251953125, 60.390625, 64.4560546875, 68.521484375, 72.5869140625, 76.65234375, 80.7177734375, 84.783203125, 88.8486328125, 92.9140625, 96.9794921875, 101.044921875, 105.1103515625, 109.17578125, 113.2412109375, 117.306640625, 121.3720703125, 125.4375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 13.0, 14.0, 17.0, 25.0, 30.0, 31.0, 53.0, 72.0, 88.0, 80.0, 89.0, 86.0, 102.0, 76.0, 61.0, 41.0, 36.0, 21.0, 29.0, 14.0, 10.0, 4.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.796875, -21.151123046875, -20.50537109375, -19.859619140625, -19.2138671875, -18.568115234375, -17.92236328125, -17.276611328125, -16.630859375, -15.985107421875, -15.33935546875, -14.693603515625, -14.0478515625, -13.402099609375, -12.75634765625, -12.110595703125, -11.46484375, -10.819091796875, -10.17333984375, -9.527587890625, -8.8818359375, -8.236083984375, -7.59033203125, -6.944580078125, -6.298828125, -5.653076171875, -5.00732421875, -4.361572265625, -3.7158203125, -3.070068359375, -2.42431640625, -1.778564453125, -1.1328125, -0.487060546875, 0.15869140625, 0.804443359375, 1.4501953125, 2.095947265625, 2.74169921875, 3.387451171875, 4.033203125, 4.678955078125, 5.32470703125, 5.970458984375, 6.6162109375, 7.261962890625, 7.90771484375, 8.553466796875, 9.19921875, 9.844970703125, 10.49072265625, 11.136474609375, 11.7822265625, 12.427978515625, 13.07373046875, 13.719482421875, 14.365234375, 15.010986328125, 15.65673828125, 16.302490234375, 16.9482421875, 17.593994140625, 18.23974609375, 18.885498046875, 19.53125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 6.0, 7.0, 15.0, 14.0, 17.0, 23.0, 32.0, 47.0, 53.0, 50.0, 91.0, 119.0, 157.0, 198.0, 300.0, 488.0, 679.0, 1117.0, 1952.0, 3620.0, 7470.0, 15955.0, 35230.0, 81191.0, 184184.0, 327392.0, 214350.0, 95256.0, 41452.0, 18349.0, 8520.0, 4206.0, 2262.0, 1226.0, 802.0, 471.0, 352.0, 232.0, 163.0, 129.0, 108.0, 59.0, 53.0, 43.0, 23.0, 22.0, 18.0, 20.0, 14.0, 5.0, 7.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-43.96875, -42.5771484375, -41.185546875, -39.7939453125, -38.40234375, -37.0107421875, -35.619140625, -34.2275390625, -32.8359375, -31.4443359375, -30.052734375, -28.6611328125, -27.26953125, -25.8779296875, -24.486328125, -23.0947265625, -21.703125, -20.3115234375, -18.919921875, -17.5283203125, -16.13671875, -14.7451171875, -13.353515625, -11.9619140625, -10.5703125, -9.1787109375, -7.787109375, -6.3955078125, -5.00390625, -3.6123046875, -2.220703125, -0.8291015625, 0.5625, 1.9541015625, 3.345703125, 4.7373046875, 6.12890625, 7.5205078125, 8.912109375, 10.3037109375, 11.6953125, 13.0869140625, 14.478515625, 15.8701171875, 17.26171875, 18.6533203125, 20.044921875, 21.4365234375, 22.828125, 24.2197265625, 25.611328125, 27.0029296875, 28.39453125, 29.7861328125, 31.177734375, 32.5693359375, 33.9609375, 35.3525390625, 36.744140625, 38.1357421875, 39.52734375, 40.9189453125, 42.310546875, 43.7021484375, 45.09375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 9.0, 13.0, 6.0, 9.0, 12.0, 12.0, 20.0, 22.0, 22.0, 20.0, 24.0, 19.0, 35.0, 38.0, 37.0, 39.0, 44.0, 35.0, 62.0, 44.0, 37.0, 37.0, 35.0, 40.0, 27.0, 31.0, 36.0, 27.0, 27.0, 25.0, 29.0, 21.0, 14.0, 12.0, 15.0, 9.0, 9.0, 10.0, 10.0, 9.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0], "bins": [-43.6875, -42.39794921875, -41.1083984375, -39.81884765625, -38.529296875, -37.23974609375, -35.9501953125, -34.66064453125, -33.37109375, -32.08154296875, -30.7919921875, -29.50244140625, -28.212890625, -26.92333984375, -25.6337890625, -24.34423828125, -23.0546875, -21.76513671875, -20.4755859375, -19.18603515625, -17.896484375, -16.60693359375, -15.3173828125, -14.02783203125, -12.73828125, -11.44873046875, -10.1591796875, -8.86962890625, -7.580078125, -6.29052734375, -5.0009765625, -3.71142578125, -2.421875, -1.13232421875, 0.1572265625, 1.44677734375, 2.736328125, 4.02587890625, 5.3154296875, 6.60498046875, 7.89453125, 9.18408203125, 10.4736328125, 11.76318359375, 13.052734375, 14.34228515625, 15.6318359375, 16.92138671875, 18.2109375, 19.50048828125, 20.7900390625, 22.07958984375, 23.369140625, 24.65869140625, 25.9482421875, 27.23779296875, 28.52734375, 29.81689453125, 31.1064453125, 32.39599609375, 33.685546875, 34.97509765625, 36.2646484375, 37.55419921875, 38.84375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 4.0, 3.0, 5.0, 26.0, 28.0, 44.0, 69.0, 154.0, 262.0, 551.0, 1308.0, 3106.0, 8829.0, 29028.0, 115661.0, 416514.0, 348925.0, 88900.0, 23030.0, 7278.0, 2641.0, 1171.0, 477.0, 280.0, 117.0, 59.0, 34.0, 15.0, 14.0, 14.0, 4.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.34375, -25.36474609375, -24.3857421875, -23.40673828125, -22.427734375, -21.44873046875, -20.4697265625, -19.49072265625, -18.51171875, -17.53271484375, -16.5537109375, -15.57470703125, -14.595703125, -13.61669921875, -12.6376953125, -11.65869140625, -10.6796875, -9.70068359375, -8.7216796875, -7.74267578125, -6.763671875, -5.78466796875, -4.8056640625, -3.82666015625, -2.84765625, -1.86865234375, -0.8896484375, 0.08935546875, 1.068359375, 2.04736328125, 3.0263671875, 4.00537109375, 4.984375, 5.96337890625, 6.9423828125, 7.92138671875, 8.900390625, 9.87939453125, 10.8583984375, 11.83740234375, 12.81640625, 13.79541015625, 14.7744140625, 15.75341796875, 16.732421875, 17.71142578125, 18.6904296875, 19.66943359375, 20.6484375, 21.62744140625, 22.6064453125, 23.58544921875, 24.564453125, 25.54345703125, 26.5224609375, 27.50146484375, 28.48046875, 29.45947265625, 30.4384765625, 31.41748046875, 32.396484375, 33.37548828125, 34.3544921875, 35.33349609375, 36.3125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 6.0, 9.0, 11.0, 20.0, 15.0, 29.0, 31.0, 30.0, 64.0, 72.0, 141.0, 141.0, 119.0, 76.0, 53.0, 36.0, 29.0, 30.0, 15.0, 20.0, 12.0, 9.0, 7.0, 5.0, 4.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0042266845703125, -0.004067182540893555, -0.003907680511474609, -0.003748178482055664, -0.0035886764526367188, -0.0034291744232177734, -0.003269672393798828, -0.003110170364379883, -0.0029506683349609375, -0.002791166305541992, -0.002631664276123047, -0.0024721622467041016, -0.0023126602172851562, -0.002153158187866211, -0.0019936561584472656, -0.0018341541290283203, -0.001674652099609375, -0.0015151500701904297, -0.0013556480407714844, -0.001196146011352539, -0.0010366439819335938, -0.0008771419525146484, -0.0007176399230957031, -0.0005581378936767578, -0.0003986358642578125, -0.0002391338348388672, -7.963180541992188e-05, 7.987022399902344e-05, 0.00023937225341796875, 0.00039887428283691406, 0.0005583763122558594, 0.0007178783416748047, 0.00087738037109375, 0.0010368824005126953, 0.0011963844299316406, 0.001355886459350586, 0.0015153884887695312, 0.0016748905181884766, 0.0018343925476074219, 0.001993894577026367, 0.0021533966064453125, 0.002312898635864258, 0.002472400665283203, 0.0026319026947021484, 0.0027914047241210938, 0.002950906753540039, 0.0031104087829589844, 0.0032699108123779297, 0.003429412841796875, 0.0035889148712158203, 0.0037484169006347656, 0.003907918930053711, 0.004067420959472656, 0.0042269229888916016, 0.004386425018310547, 0.004545927047729492, 0.0047054290771484375, 0.004864931106567383, 0.005024433135986328, 0.0051839351654052734, 0.005343437194824219, 0.005502939224243164, 0.005662441253662109, 0.005821943283081055, 0.0059814453125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 7.0, 9.0, 14.0, 15.0, 33.0, 33.0, 71.0, 117.0, 208.0, 333.0, 684.0, 1467.0, 3719.0, 10385.0, 37095.0, 161655.0, 497249.0, 254508.0, 57148.0, 15175.0, 4819.0, 1873.0, 876.0, 461.0, 238.0, 128.0, 83.0, 56.0, 31.0, 30.0, 8.0, 14.0, 3.0, 9.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.3125, -35.32177734375, -34.3310546875, -33.34033203125, -32.349609375, -31.35888671875, -30.3681640625, -29.37744140625, -28.38671875, -27.39599609375, -26.4052734375, -25.41455078125, -24.423828125, -23.43310546875, -22.4423828125, -21.45166015625, -20.4609375, -19.47021484375, -18.4794921875, -17.48876953125, -16.498046875, -15.50732421875, -14.5166015625, -13.52587890625, -12.53515625, -11.54443359375, -10.5537109375, -9.56298828125, -8.572265625, -7.58154296875, -6.5908203125, -5.60009765625, -4.609375, -3.61865234375, -2.6279296875, -1.63720703125, -0.646484375, 0.34423828125, 1.3349609375, 2.32568359375, 3.31640625, 4.30712890625, 5.2978515625, 6.28857421875, 7.279296875, 8.27001953125, 9.2607421875, 10.25146484375, 11.2421875, 12.23291015625, 13.2236328125, 14.21435546875, 15.205078125, 16.19580078125, 17.1865234375, 18.17724609375, 19.16796875, 20.15869140625, 21.1494140625, 22.14013671875, 23.130859375, 24.12158203125, 25.1123046875, 26.10302734375, 27.09375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 4.0, 5.0, 8.0, 6.0, 8.0, 8.0, 15.0, 14.0, 23.0, 32.0, 34.0, 46.0, 44.0, 56.0, 55.0, 69.0, 67.0, 67.0, 59.0, 57.0, 57.0, 53.0, 49.0, 32.0, 26.0, 21.0, 14.0, 12.0, 11.0, 9.0, 5.0, 7.0, 7.0, 5.0, 6.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.03125, -18.471435546875, -17.91162109375, -17.351806640625, -16.7919921875, -16.232177734375, -15.67236328125, -15.112548828125, -14.552734375, -13.992919921875, -13.43310546875, -12.873291015625, -12.3134765625, -11.753662109375, -11.19384765625, -10.634033203125, -10.07421875, -9.514404296875, -8.95458984375, -8.394775390625, -7.8349609375, -7.275146484375, -6.71533203125, -6.155517578125, -5.595703125, -5.035888671875, -4.47607421875, -3.916259765625, -3.3564453125, -2.796630859375, -2.23681640625, -1.677001953125, -1.1171875, -0.557373046875, 0.00244140625, 0.562255859375, 1.1220703125, 1.681884765625, 2.24169921875, 2.801513671875, 3.361328125, 3.921142578125, 4.48095703125, 5.040771484375, 5.6005859375, 6.160400390625, 6.72021484375, 7.280029296875, 7.83984375, 8.399658203125, 8.95947265625, 9.519287109375, 10.0791015625, 10.638916015625, 11.19873046875, 11.758544921875, 12.318359375, 12.878173828125, 13.43798828125, 13.997802734375, 14.5576171875, 15.117431640625, 15.67724609375, 16.237060546875, 16.796875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 6.0, 9.0, 15.0, 32.0, 34.0, 53.0, 65.0, 92.0, 112.0, 103.0, 95.0, 112.0, 82.0, 62.0, 48.0, 24.0, 24.0, 18.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-505.0211181640625, -492.9909362792969, -480.96075439453125, -468.9305419921875, -456.9003601074219, -444.87017822265625, -432.8399963378906, -420.809814453125, -408.77960205078125, -396.7494201660156, -384.71923828125, -372.68902587890625, -360.6588439941406, -348.628662109375, -336.5984802246094, -324.56829833984375, -312.5380859375, -300.5079040527344, -288.47772216796875, -276.447509765625, -264.4173278808594, -252.38714599609375, -240.35696411132812, -228.32676696777344, -216.29660034179688, -204.26641845703125, -192.23622131347656, -180.20603942871094, -168.17584228515625, -156.14566040039062, -144.115478515625, -132.0852813720703, -120.05508422851562, -108.02489471435547, -95.99470520019531, -83.96452331542969, -71.934326171875, -59.90414047241211, -47.87395477294922, -35.84376525878906, -23.813575744628906, -11.783387184143066, 0.24680137634277344, 12.276988983154297, 24.307178497314453, 36.33736801147461, 48.3675537109375, 60.397743225097656, 72.42793273925781, 84.45812225341797, 96.48831176757812, 108.51849365234375, 120.54869079589844, 132.57887268066406, 144.60906982421875, 156.63925170898438, 168.66943359375, 180.69961547851562, 192.7298126220703, 204.75999450683594, 216.79019165039062, 228.82037353515625, 240.85055541992188, 252.88075256347656, 264.91094970703125]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 7.0, 2.0, 2.0, 8.0, 8.0, 6.0, 7.0, 13.0, 15.0, 16.0, 22.0, 23.0, 24.0, 28.0, 28.0, 49.0, 43.0, 40.0, 30.0, 46.0, 56.0, 36.0, 47.0, 52.0, 44.0, 48.0, 32.0, 34.0, 38.0, 37.0, 31.0, 25.0, 28.0, 20.0, 10.0, 14.0, 13.0, 12.0, 4.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.45175170898438, -184.69760131835938, -176.9434356689453, -169.1892852783203, -161.4351348876953, -153.68096923828125, -145.92681884765625, -138.17266845703125, -130.4185028076172, -122.66434478759766, -114.91019439697266, -107.15603637695312, -99.4018783569336, -91.64772033691406, -83.89356994628906, -76.13941192626953, -68.38526153564453, -60.631107330322266, -52.876949310302734, -45.12279510498047, -37.36863708496094, -29.614482879638672, -21.860328674316406, -14.106170654296875, -6.352016448974609, 1.4021391868591309, 9.156294822692871, 16.910449981689453, 24.66460609436035, 32.41876220703125, 40.172916412353516, 47.92707443237305, 55.68122863769531, 63.43538284301758, 71.18953704833984, 78.94369506835938, 86.6978530883789, 94.45201110839844, 102.20616149902344, 109.96031951904297, 117.7144775390625, 125.46863555908203, 133.22279357910156, 140.97694396972656, 148.73109436035156, 156.48526000976562, 164.23941040039062, 171.99356079101562, 179.74771118164062, 187.50186157226562, 195.2560272216797, 203.0101776123047, 210.7643280029297, 218.51849365234375, 226.27264404296875, 234.02679443359375, 241.7809600830078, 249.5351104736328, 257.2892761230469, 265.0434265136719, 272.7975769042969, 280.5517272949219, 288.305908203125, 296.06005859375, 303.814208984375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 3.0, 4.0, 12.0, 7.0, 16.0, 25.0, 33.0, 51.0, 74.0, 103.0, 194.0, 408.0, 809.0, 2000.0, 6021.0, 27694.0, 427985.0, 3652438.0, 61417.0, 9781.0, 2902.0, 1113.0, 507.0, 229.0, 167.0, 102.0, 54.0, 29.0, 21.0, 22.0, 10.0, 11.0, 7.0, 8.0, 7.0, 10.0, 5.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-169.125, -162.904296875, -156.68359375, -150.462890625, -144.2421875, -138.021484375, -131.80078125, -125.580078125, -119.359375, -113.138671875, -106.91796875, -100.697265625, -94.4765625, -88.255859375, -82.03515625, -75.814453125, -69.59375, -63.373046875, -57.15234375, -50.931640625, -44.7109375, -38.490234375, -32.26953125, -26.048828125, -19.828125, -13.607421875, -7.38671875, -1.166015625, 5.0546875, 11.275390625, 17.49609375, 23.716796875, 29.9375, 36.158203125, 42.37890625, 48.599609375, 54.8203125, 61.041015625, 67.26171875, 73.482421875, 79.703125, 85.923828125, 92.14453125, 98.365234375, 104.5859375, 110.806640625, 117.02734375, 123.248046875, 129.46875, 135.689453125, 141.91015625, 148.130859375, 154.3515625, 160.572265625, 166.79296875, 173.013671875, 179.234375, 185.455078125, 191.67578125, 197.896484375, 204.1171875, 210.337890625, 216.55859375, 222.779296875, 229.0]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 8.0, 7.0, 13.0, 19.0, 23.0, 27.0, 33.0, 53.0, 76.0, 78.0, 81.0, 93.0, 91.0, 70.0, 64.0, 73.0, 48.0, 42.0, 26.0, 32.0, 13.0, 16.0, 8.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.671875, -20.0439453125, -19.416015625, -18.7880859375, -18.16015625, -17.5322265625, -16.904296875, -16.2763671875, -15.6484375, -15.0205078125, -14.392578125, -13.7646484375, -13.13671875, -12.5087890625, -11.880859375, -11.2529296875, -10.625, -9.9970703125, -9.369140625, -8.7412109375, -8.11328125, -7.4853515625, -6.857421875, -6.2294921875, -5.6015625, -4.9736328125, -4.345703125, -3.7177734375, -3.08984375, -2.4619140625, -1.833984375, -1.2060546875, -0.578125, 0.0498046875, 0.677734375, 1.3056640625, 1.93359375, 2.5615234375, 3.189453125, 3.8173828125, 4.4453125, 5.0732421875, 5.701171875, 6.3291015625, 6.95703125, 7.5849609375, 8.212890625, 8.8408203125, 9.46875, 10.0966796875, 10.724609375, 11.3525390625, 11.98046875, 12.6083984375, 13.236328125, 13.8642578125, 14.4921875, 15.1201171875, 15.748046875, 16.3759765625, 17.00390625, 17.6318359375, 18.259765625, 18.8876953125, 19.515625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 3.0, 6.0, 9.0, 13.0, 11.0, 29.0, 27.0, 31.0, 52.0, 51.0, 88.0, 99.0, 172.0, 236.0, 404.0, 816.0, 1963.0, 6139.0, 27001.0, 221411.0, 3587066.0, 304115.0, 33067.0, 7202.0, 2117.0, 856.0, 411.0, 251.0, 158.0, 111.0, 93.0, 61.0, 56.0, 37.0, 31.0, 15.0, 15.0, 14.0, 15.0, 15.0, 1.0, 5.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-130.625, -126.732421875, -122.83984375, -118.947265625, -115.0546875, -111.162109375, -107.26953125, -103.376953125, -99.484375, -95.591796875, -91.69921875, -87.806640625, -83.9140625, -80.021484375, -76.12890625, -72.236328125, -68.34375, -64.451171875, -60.55859375, -56.666015625, -52.7734375, -48.880859375, -44.98828125, -41.095703125, -37.203125, -33.310546875, -29.41796875, -25.525390625, -21.6328125, -17.740234375, -13.84765625, -9.955078125, -6.0625, -2.169921875, 1.72265625, 5.615234375, 9.5078125, 13.400390625, 17.29296875, 21.185546875, 25.078125, 28.970703125, 32.86328125, 36.755859375, 40.6484375, 44.541015625, 48.43359375, 52.326171875, 56.21875, 60.111328125, 64.00390625, 67.896484375, 71.7890625, 75.681640625, 79.57421875, 83.466796875, 87.359375, 91.251953125, 95.14453125, 99.037109375, 102.9296875, 106.822265625, 110.71484375, 114.607421875, 118.5]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 5.0, 9.0, 1.0, 22.0, 24.0, 50.0, 76.0, 234.0, 792.0, 2004.0, 494.0, 177.0, 83.0, 53.0, 26.0, 15.0, 6.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.8125, -56.7373046875, -54.662109375, -52.5869140625, -50.51171875, -48.4365234375, -46.361328125, -44.2861328125, -42.2109375, -40.1357421875, -38.060546875, -35.9853515625, -33.91015625, -31.8349609375, -29.759765625, -27.6845703125, -25.609375, -23.5341796875, -21.458984375, -19.3837890625, -17.30859375, -15.2333984375, -13.158203125, -11.0830078125, -9.0078125, -6.9326171875, -4.857421875, -2.7822265625, -0.70703125, 1.3681640625, 3.443359375, 5.5185546875, 7.59375, 9.6689453125, 11.744140625, 13.8193359375, 15.89453125, 17.9697265625, 20.044921875, 22.1201171875, 24.1953125, 26.2705078125, 28.345703125, 30.4208984375, 32.49609375, 34.5712890625, 36.646484375, 38.7216796875, 40.796875, 42.8720703125, 44.947265625, 47.0224609375, 49.09765625, 51.1728515625, 53.248046875, 55.3232421875, 57.3984375, 59.4736328125, 61.548828125, 63.6240234375, 65.69921875, 67.7744140625, 69.849609375, 71.9248046875, 74.0]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 6.0, 6.0, 12.0, 22.0, 24.0, 42.0, 64.0, 89.0, 116.0, 114.0, 122.0, 106.0, 92.0, 67.0, 49.0, 34.0, 18.0, 6.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-282.52789306640625, -274.9053039550781, -267.28271484375, -259.6601257324219, -252.0375518798828, -244.4149627685547, -236.79237365722656, -229.16978454589844, -221.54721069335938, -213.92462158203125, -206.30203247070312, -198.679443359375, -191.05686950683594, -183.4342803955078, -175.8116912841797, -168.18910217285156, -160.56651306152344, -152.9439239501953, -145.3213348388672, -137.69876098632812, -130.076171875, -122.45358276367188, -114.83099365234375, -107.20840454101562, -99.58582305908203, -91.9632339477539, -84.34065246582031, -76.71806335449219, -69.09547424316406, -61.47289276123047, -53.850303649902344, -46.227718353271484, -38.60511779785156, -30.982532501220703, -23.35994529724121, -15.737358093261719, -8.11477279663086, -0.4921875, 7.130401611328125, 14.752986907958984, 22.375572204589844, 29.998157501220703, 37.62074279785156, 45.24333190917969, 52.86591720581055, 60.488502502441406, 68.11109161376953, 75.73367309570312, 83.35626220703125, 90.97885131835938, 98.60143280029297, 106.2240219116211, 113.84660339355469, 121.46919250488281, 129.09178161621094, 136.71437072753906, 144.33694458007812, 151.95953369140625, 159.58212280273438, 167.2047119140625, 174.82728576660156, 182.4498748779297, 190.0724639892578, 197.69505310058594, 205.31764221191406]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 6.0, 12.0, 14.0, 12.0, 20.0, 28.0, 30.0, 33.0, 39.0, 44.0, 52.0, 68.0, 54.0, 42.0, 60.0, 68.0, 54.0, 62.0, 50.0, 43.0, 45.0, 29.0, 25.0, 31.0, 19.0, 13.0, 16.0, 7.0, 9.0, 4.0, 3.0, 8.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.14976501464844, -134.23031616210938, -129.3108673095703, -124.39141845703125, -119.47196960449219, -114.55252075195312, -109.63307189941406, -104.713623046875, -99.79417419433594, -94.87472534179688, -89.95527648925781, -85.03582763671875, -80.11637878417969, -75.19692993164062, -70.27748107910156, -65.3580322265625, -60.43858337402344, -55.519134521484375, -50.59968566894531, -45.68023681640625, -40.76078796386719, -35.841339111328125, -30.921890258789062, -26.00244140625, -21.082992553710938, -16.163543701171875, -11.244094848632812, -6.32464599609375, -1.4051971435546875, 3.514251708984375, 8.433700561523438, 13.3531494140625, 18.2725830078125, 23.192031860351562, 28.111480712890625, 33.03092956542969, 37.95037841796875, 42.86982727050781, 47.789276123046875, 52.70872497558594, 57.628173828125, 62.54762268066406, 67.46707153320312, 72.38652038574219, 77.30596923828125, 82.22541809082031, 87.14486694335938, 92.06431579589844, 96.9837646484375, 101.90321350097656, 106.82266235351562, 111.74211120605469, 116.66156005859375, 121.58100891113281, 126.50045776367188, 131.41990661621094, 136.33935546875, 141.25880432128906, 146.17825317382812, 151.0977020263672, 156.01715087890625, 160.9365997314453, 165.85604858398438, 170.77549743652344, 175.6949462890625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 4.0, 2.0, 1.0, 7.0, 11.0, 7.0, 27.0, 35.0, 45.0, 61.0, 95.0, 156.0, 294.0, 534.0, 1260.0, 3314.0, 12827.0, 74864.0, 702069.0, 215996.0, 27249.0, 6035.0, 1869.0, 827.0, 397.0, 208.0, 135.0, 94.0, 33.0, 29.0, 24.0, 8.0, 6.0, 11.0, 6.0, 3.0, 4.0, 1.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-145.875, -140.615234375, -135.35546875, -130.095703125, -124.8359375, -119.576171875, -114.31640625, -109.056640625, -103.796875, -98.537109375, -93.27734375, -88.017578125, -82.7578125, -77.498046875, -72.23828125, -66.978515625, -61.71875, -56.458984375, -51.19921875, -45.939453125, -40.6796875, -35.419921875, -30.16015625, -24.900390625, -19.640625, -14.380859375, -9.12109375, -3.861328125, 1.3984375, 6.658203125, 11.91796875, 17.177734375, 22.4375, 27.697265625, 32.95703125, 38.216796875, 43.4765625, 48.736328125, 53.99609375, 59.255859375, 64.515625, 69.775390625, 75.03515625, 80.294921875, 85.5546875, 90.814453125, 96.07421875, 101.333984375, 106.59375, 111.853515625, 117.11328125, 122.373046875, 127.6328125, 132.892578125, 138.15234375, 143.412109375, 148.671875, 153.931640625, 159.19140625, 164.451171875, 169.7109375, 174.970703125, 180.23046875, 185.490234375, 190.75]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 7.0, 10.0, 6.0, 23.0, 25.0, 25.0, 56.0, 66.0, 91.0, 73.0, 84.0, 100.0, 91.0, 63.0, 72.0, 52.0, 53.0, 34.0, 24.0, 16.0, 14.0, 8.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.140625, -21.455078125, -20.76953125, -20.083984375, -19.3984375, -18.712890625, -18.02734375, -17.341796875, -16.65625, -15.970703125, -15.28515625, -14.599609375, -13.9140625, -13.228515625, -12.54296875, -11.857421875, -11.171875, -10.486328125, -9.80078125, -9.115234375, -8.4296875, -7.744140625, -7.05859375, -6.373046875, -5.6875, -5.001953125, -4.31640625, -3.630859375, -2.9453125, -2.259765625, -1.57421875, -0.888671875, -0.203125, 0.482421875, 1.16796875, 1.853515625, 2.5390625, 3.224609375, 3.91015625, 4.595703125, 5.28125, 5.966796875, 6.65234375, 7.337890625, 8.0234375, 8.708984375, 9.39453125, 10.080078125, 10.765625, 11.451171875, 12.13671875, 12.822265625, 13.5078125, 14.193359375, 14.87890625, 15.564453125, 16.25, 16.935546875, 17.62109375, 18.306640625, 18.9921875, 19.677734375, 20.36328125, 21.048828125, 21.734375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 2.0, 5.0, 9.0, 14.0, 12.0, 26.0, 29.0, 39.0, 52.0, 68.0, 130.0, 151.0, 201.0, 296.0, 488.0, 762.0, 1426.0, 3002.0, 7243.0, 19648.0, 56119.0, 176815.0, 492100.0, 193624.0, 60424.0, 20890.0, 7869.0, 3161.0, 1535.0, 895.0, 482.0, 303.0, 221.0, 137.0, 101.0, 68.0, 55.0, 44.0, 27.0, 19.0, 21.0, 17.0, 9.0, 2.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-60.8125, -58.943359375, -57.07421875, -55.205078125, -53.3359375, -51.466796875, -49.59765625, -47.728515625, -45.859375, -43.990234375, -42.12109375, -40.251953125, -38.3828125, -36.513671875, -34.64453125, -32.775390625, -30.90625, -29.037109375, -27.16796875, -25.298828125, -23.4296875, -21.560546875, -19.69140625, -17.822265625, -15.953125, -14.083984375, -12.21484375, -10.345703125, -8.4765625, -6.607421875, -4.73828125, -2.869140625, -1.0, 0.869140625, 2.73828125, 4.607421875, 6.4765625, 8.345703125, 10.21484375, 12.083984375, 13.953125, 15.822265625, 17.69140625, 19.560546875, 21.4296875, 23.298828125, 25.16796875, 27.037109375, 28.90625, 30.775390625, 32.64453125, 34.513671875, 36.3828125, 38.251953125, 40.12109375, 41.990234375, 43.859375, 45.728515625, 47.59765625, 49.466796875, 51.3359375, 53.205078125, 55.07421875, 56.943359375, 58.8125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 9.0, 10.0, 8.0, 13.0, 15.0, 11.0, 16.0, 26.0, 22.0, 19.0, 32.0, 32.0, 40.0, 49.0, 37.0, 53.0, 43.0, 45.0, 51.0, 45.0, 58.0, 43.0, 40.0, 34.0, 33.0, 28.0, 30.0, 25.0, 26.0, 25.0, 22.0, 20.0, 11.0, 8.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.125, -42.56982421875, -41.0146484375, -39.45947265625, -37.904296875, -36.34912109375, -34.7939453125, -33.23876953125, -31.68359375, -30.12841796875, -28.5732421875, -27.01806640625, -25.462890625, -23.90771484375, -22.3525390625, -20.79736328125, -19.2421875, -17.68701171875, -16.1318359375, -14.57666015625, -13.021484375, -11.46630859375, -9.9111328125, -8.35595703125, -6.80078125, -5.24560546875, -3.6904296875, -2.13525390625, -0.580078125, 0.97509765625, 2.5302734375, 4.08544921875, 5.640625, 7.19580078125, 8.7509765625, 10.30615234375, 11.861328125, 13.41650390625, 14.9716796875, 16.52685546875, 18.08203125, 19.63720703125, 21.1923828125, 22.74755859375, 24.302734375, 25.85791015625, 27.4130859375, 28.96826171875, 30.5234375, 32.07861328125, 33.6337890625, 35.18896484375, 36.744140625, 38.29931640625, 39.8544921875, 41.40966796875, 42.96484375, 44.52001953125, 46.0751953125, 47.63037109375, 49.185546875, 50.74072265625, 52.2958984375, 53.85107421875, 55.40625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 0.0, 8.0, 5.0, 12.0, 18.0, 32.0, 53.0, 79.0, 88.0, 188.0, 363.0, 808.0, 2150.0, 7335.0, 30634.0, 184535.0, 620785.0, 163534.0, 27562.0, 6629.0, 2052.0, 855.0, 368.0, 184.0, 98.0, 75.0, 32.0, 18.0, 14.0, 10.0, 9.0, 4.0, 8.0, 7.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.984375, -30.968017578125, -29.95166015625, -28.935302734375, -27.9189453125, -26.902587890625, -25.88623046875, -24.869873046875, -23.853515625, -22.837158203125, -21.82080078125, -20.804443359375, -19.7880859375, -18.771728515625, -17.75537109375, -16.739013671875, -15.72265625, -14.706298828125, -13.68994140625, -12.673583984375, -11.6572265625, -10.640869140625, -9.62451171875, -8.608154296875, -7.591796875, -6.575439453125, -5.55908203125, -4.542724609375, -3.5263671875, -2.510009765625, -1.49365234375, -0.477294921875, 0.5390625, 1.555419921875, 2.57177734375, 3.588134765625, 4.6044921875, 5.620849609375, 6.63720703125, 7.653564453125, 8.669921875, 9.686279296875, 10.70263671875, 11.718994140625, 12.7353515625, 13.751708984375, 14.76806640625, 15.784423828125, 16.80078125, 17.817138671875, 18.83349609375, 19.849853515625, 20.8662109375, 21.882568359375, 22.89892578125, 23.915283203125, 24.931640625, 25.947998046875, 26.96435546875, 27.980712890625, 28.9970703125, 30.013427734375, 31.02978515625, 32.046142578125, 33.0625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 7.0, 8.0, 3.0, 14.0, 6.0, 15.0, 18.0, 35.0, 31.0, 52.0, 114.0, 190.0, 201.0, 103.0, 62.0, 30.0, 30.0, 18.0, 13.0, 19.0, 5.0, 8.0, 6.0, 5.0, 4.0, 1.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0072479248046875, -0.007052063941955566, -0.006856203079223633, -0.006660342216491699, -0.006464481353759766, -0.006268620491027832, -0.0060727596282958984, -0.005876898765563965, -0.005681037902832031, -0.005485177040100098, -0.005289316177368164, -0.0050934553146362305, -0.004897594451904297, -0.004701733589172363, -0.00450587272644043, -0.004310011863708496, -0.0041141510009765625, -0.003918290138244629, -0.0037224292755126953, -0.0035265684127807617, -0.003330707550048828, -0.0031348466873168945, -0.002938985824584961, -0.0027431249618530273, -0.0025472640991210938, -0.00235140323638916, -0.0021555423736572266, -0.001959681510925293, -0.0017638206481933594, -0.0015679597854614258, -0.0013720989227294922, -0.0011762380599975586, -0.000980377197265625, -0.0007845163345336914, -0.0005886554718017578, -0.0003927946090698242, -0.00019693374633789062, -1.0728836059570312e-06, 0.00019478797912597656, 0.00039064884185791016, 0.0005865097045898438, 0.0007823705673217773, 0.000978231430053711, 0.0011740922927856445, 0.0013699531555175781, 0.0015658140182495117, 0.0017616748809814453, 0.001957535743713379, 0.0021533966064453125, 0.002349257469177246, 0.0025451183319091797, 0.0027409791946411133, 0.002936840057373047, 0.0031327009201049805, 0.003328561782836914, 0.0035244226455688477, 0.0037202835083007812, 0.003916144371032715, 0.0041120052337646484, 0.004307866096496582, 0.004503726959228516, 0.004699587821960449, 0.004895448684692383, 0.005091309547424316, 0.00528717041015625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 1.0, 3.0, 4.0, 5.0, 4.0, 7.0, 10.0, 14.0, 16.0, 34.0, 49.0, 70.0, 117.0, 216.0, 344.0, 659.0, 1608.0, 4758.0, 17521.0, 81292.0, 549930.0, 326745.0, 47988.0, 11262.0, 3221.0, 1338.0, 557.0, 318.0, 167.0, 105.0, 81.0, 36.0, 21.0, 13.0, 14.0, 7.0, 13.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-34.09375, -33.115234375, -32.13671875, -31.158203125, -30.1796875, -29.201171875, -28.22265625, -27.244140625, -26.265625, -25.287109375, -24.30859375, -23.330078125, -22.3515625, -21.373046875, -20.39453125, -19.416015625, -18.4375, -17.458984375, -16.48046875, -15.501953125, -14.5234375, -13.544921875, -12.56640625, -11.587890625, -10.609375, -9.630859375, -8.65234375, -7.673828125, -6.6953125, -5.716796875, -4.73828125, -3.759765625, -2.78125, -1.802734375, -0.82421875, 0.154296875, 1.1328125, 2.111328125, 3.08984375, 4.068359375, 5.046875, 6.025390625, 7.00390625, 7.982421875, 8.9609375, 9.939453125, 10.91796875, 11.896484375, 12.875, 13.853515625, 14.83203125, 15.810546875, 16.7890625, 17.767578125, 18.74609375, 19.724609375, 20.703125, 21.681640625, 22.66015625, 23.638671875, 24.6171875, 25.595703125, 26.57421875, 27.552734375, 28.53125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 7.0, 11.0, 5.0, 12.0, 12.0, 9.0, 19.0, 25.0, 42.0, 45.0, 73.0, 88.0, 144.0, 115.0, 107.0, 89.0, 45.0, 28.0, 35.0, 28.0, 12.0, 10.0, 15.0, 9.0, 9.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.40625, -18.760009765625, -18.11376953125, -17.467529296875, -16.8212890625, -16.175048828125, -15.52880859375, -14.882568359375, -14.236328125, -13.590087890625, -12.94384765625, -12.297607421875, -11.6513671875, -11.005126953125, -10.35888671875, -9.712646484375, -9.06640625, -8.420166015625, -7.77392578125, -7.127685546875, -6.4814453125, -5.835205078125, -5.18896484375, -4.542724609375, -3.896484375, -3.250244140625, -2.60400390625, -1.957763671875, -1.3115234375, -0.665283203125, -0.01904296875, 0.627197265625, 1.2734375, 1.919677734375, 2.56591796875, 3.212158203125, 3.8583984375, 4.504638671875, 5.15087890625, 5.797119140625, 6.443359375, 7.089599609375, 7.73583984375, 8.382080078125, 9.0283203125, 9.674560546875, 10.32080078125, 10.967041015625, 11.61328125, 12.259521484375, 12.90576171875, 13.552001953125, 14.1982421875, 14.844482421875, 15.49072265625, 16.136962890625, 16.783203125, 17.429443359375, 18.07568359375, 18.721923828125, 19.3681640625, 20.014404296875, 20.66064453125, 21.306884765625, 21.953125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 8.0, 7.0, 15.0, 36.0, 60.0, 105.0, 137.0, 187.0, 167.0, 100.0, 76.0, 56.0, 24.0, 17.0, 8.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-635.1976928710938, -617.8590698242188, -600.5204467773438, -583.1817626953125, -565.8431396484375, -548.5045166015625, -531.1658935546875, -513.8272705078125, -496.4886169433594, -479.1499938964844, -461.81134033203125, -444.47271728515625, -427.13409423828125, -409.7954406738281, -392.4568176269531, -375.1181640625, -357.779541015625, -340.44091796875, -323.1022644042969, -305.7636413574219, -288.42498779296875, -271.08636474609375, -253.74774169921875, -236.4091033935547, -219.07046508789062, -201.73182678222656, -184.3931884765625, -167.0545654296875, -149.71592712402344, -132.37728881835938, -115.03865814208984, -97.70002746582031, -80.36138916015625, -63.02275466918945, -45.684120178222656, -28.34548568725586, -11.006851196289062, 6.331787109375, 23.67041778564453, 41.00904846191406, 58.347686767578125, 75.68632507324219, 93.02495574951172, 110.36358642578125, 127.70222473144531, 145.04086303710938, 162.37948608398438, 179.71812438964844, 197.0567626953125, 214.39540100097656, 231.73403930664062, 249.07266235351562, 266.41131591796875, 283.74993896484375, 301.08856201171875, 318.42718505859375, 335.7658386230469, 353.1044616699219, 370.443115234375, 387.78173828125, 405.120361328125, 422.4590148925781, 439.7976379394531, 457.13629150390625, 474.47491455078125]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 11.0, 10.0, 11.0, 12.0, 13.0, 15.0, 22.0, 20.0, 23.0, 36.0, 24.0, 31.0, 23.0, 38.0, 35.0, 45.0, 47.0, 54.0, 32.0, 47.0, 37.0, 39.0, 47.0, 27.0, 38.0, 31.0, 28.0, 43.0, 18.0, 25.0, 13.0, 15.0, 15.0, 10.0, 14.0, 8.0, 10.0, 12.0, 4.0, 5.0, 8.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-199.2005615234375, -192.03567504882812, -184.8707733154297, -177.7058868408203, -170.54100036621094, -163.3760986328125, -156.21121215820312, -149.04632568359375, -141.88143920898438, -134.716552734375, -127.5516586303711, -120.38676452636719, -113.22187805175781, -106.0569839477539, -98.89208984375, -91.72720336914062, -84.56230163574219, -77.39740753173828, -70.2325210571289, -63.067626953125, -55.90273666381836, -48.73784637451172, -41.57295227050781, -34.40806198120117, -27.24317169189453, -20.07828140258789, -12.913389205932617, -5.748497009277344, 1.4163932800292969, 8.581283569335938, 15.746177673339844, 22.911067962646484, 30.075958251953125, 37.240848541259766, 44.405738830566406, 51.57063293457031, 58.73552322387695, 65.9004135131836, 73.0653076171875, 80.23019409179688, 87.39508819580078, 94.55998229980469, 101.72486877441406, 108.88976287841797, 116.05465698242188, 123.21954345703125, 130.38442993164062, 137.54933166503906, 144.71421813964844, 151.8791046142578, 159.04400634765625, 166.20889282226562, 173.373779296875, 180.53866577148438, 187.7035675048828, 194.8684539794922, 202.03335571289062, 209.1982421875, 216.36314392089844, 223.5280303955078, 230.6929168701172, 237.85781860351562, 245.022705078125, 252.18759155273438, 259.35247802734375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 7.0, 6.0, 8.0, 11.0, 15.0, 35.0, 33.0, 54.0, 68.0, 88.0, 124.0, 219.0, 334.0, 627.0, 1204.0, 2703.0, 6777.0, 23233.0, 149712.0, 3793906.0, 176830.0, 25322.0, 7334.0, 2770.0, 1312.0, 619.0, 335.0, 181.0, 116.0, 73.0, 50.0, 37.0, 17.0, 21.0, 10.0, 18.0, 13.0, 12.0, 8.0, 10.0, 3.0, 3.0, 3.0, 4.0, 1.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-143.375, -138.349609375, -133.32421875, -128.298828125, -123.2734375, -118.248046875, -113.22265625, -108.197265625, -103.171875, -98.146484375, -93.12109375, -88.095703125, -83.0703125, -78.044921875, -73.01953125, -67.994140625, -62.96875, -57.943359375, -52.91796875, -47.892578125, -42.8671875, -37.841796875, -32.81640625, -27.791015625, -22.765625, -17.740234375, -12.71484375, -7.689453125, -2.6640625, 2.361328125, 7.38671875, 12.412109375, 17.4375, 22.462890625, 27.48828125, 32.513671875, 37.5390625, 42.564453125, 47.58984375, 52.615234375, 57.640625, 62.666015625, 67.69140625, 72.716796875, 77.7421875, 82.767578125, 87.79296875, 92.818359375, 97.84375, 102.869140625, 107.89453125, 112.919921875, 117.9453125, 122.970703125, 127.99609375, 133.021484375, 138.046875, 143.072265625, 148.09765625, 153.123046875, 158.1484375, 163.173828125, 168.19921875, 173.224609375, 178.25]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 5.0, 3.0, 6.0, 15.0, 16.0, 18.0, 29.0, 44.0, 45.0, 87.0, 83.0, 65.0, 78.0, 73.0, 75.0, 79.0, 60.0, 59.0, 53.0, 36.0, 21.0, 18.0, 12.0, 14.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.265625, -20.600830078125, -19.93603515625, -19.271240234375, -18.6064453125, -17.941650390625, -17.27685546875, -16.612060546875, -15.947265625, -15.282470703125, -14.61767578125, -13.952880859375, -13.2880859375, -12.623291015625, -11.95849609375, -11.293701171875, -10.62890625, -9.964111328125, -9.29931640625, -8.634521484375, -7.9697265625, -7.304931640625, -6.64013671875, -5.975341796875, -5.310546875, -4.645751953125, -3.98095703125, -3.316162109375, -2.6513671875, -1.986572265625, -1.32177734375, -0.656982421875, 0.0078125, 0.672607421875, 1.33740234375, 2.002197265625, 2.6669921875, 3.331787109375, 3.99658203125, 4.661376953125, 5.326171875, 5.990966796875, 6.65576171875, 7.320556640625, 7.9853515625, 8.650146484375, 9.31494140625, 9.979736328125, 10.64453125, 11.309326171875, 11.97412109375, 12.638916015625, 13.3037109375, 13.968505859375, 14.63330078125, 15.298095703125, 15.962890625, 16.627685546875, 17.29248046875, 17.957275390625, 18.6220703125, 19.286865234375, 19.95166015625, 20.616455078125, 21.28125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 11.0, 9.0, 13.0, 19.0, 31.0, 43.0, 51.0, 72.0, 85.0, 136.0, 221.0, 393.0, 801.0, 1890.0, 5603.0, 19964.0, 111748.0, 3106144.0, 859358.0, 66486.0, 14073.0, 4086.0, 1467.0, 636.0, 349.0, 190.0, 113.0, 76.0, 49.0, 47.0, 27.0, 20.0, 10.0, 11.0, 11.0, 9.0, 6.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-114.125, -110.65234375, -107.1796875, -103.70703125, -100.234375, -96.76171875, -93.2890625, -89.81640625, -86.34375, -82.87109375, -79.3984375, -75.92578125, -72.453125, -68.98046875, -65.5078125, -62.03515625, -58.5625, -55.08984375, -51.6171875, -48.14453125, -44.671875, -41.19921875, -37.7265625, -34.25390625, -30.78125, -27.30859375, -23.8359375, -20.36328125, -16.890625, -13.41796875, -9.9453125, -6.47265625, -3.0, 0.47265625, 3.9453125, 7.41796875, 10.890625, 14.36328125, 17.8359375, 21.30859375, 24.78125, 28.25390625, 31.7265625, 35.19921875, 38.671875, 42.14453125, 45.6171875, 49.08984375, 52.5625, 56.03515625, 59.5078125, 62.98046875, 66.453125, 69.92578125, 73.3984375, 76.87109375, 80.34375, 83.81640625, 87.2890625, 90.76171875, 94.234375, 97.70703125, 101.1796875, 104.65234375, 108.125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 10.0, 21.0, 30.0, 57.0, 95.0, 251.0, 569.0, 1898.0, 640.0, 223.0, 113.0, 55.0, 43.0, 21.0, 19.0, 7.0, 8.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-63.8125, -62.3779296875, -60.943359375, -59.5087890625, -58.07421875, -56.6396484375, -55.205078125, -53.7705078125, -52.3359375, -50.9013671875, -49.466796875, -48.0322265625, -46.59765625, -45.1630859375, -43.728515625, -42.2939453125, -40.859375, -39.4248046875, -37.990234375, -36.5556640625, -35.12109375, -33.6865234375, -32.251953125, -30.8173828125, -29.3828125, -27.9482421875, -26.513671875, -25.0791015625, -23.64453125, -22.2099609375, -20.775390625, -19.3408203125, -17.90625, -16.4716796875, -15.037109375, -13.6025390625, -12.16796875, -10.7333984375, -9.298828125, -7.8642578125, -6.4296875, -4.9951171875, -3.560546875, -2.1259765625, -0.69140625, 0.7431640625, 2.177734375, 3.6123046875, 5.046875, 6.4814453125, 7.916015625, 9.3505859375, 10.78515625, 12.2197265625, 13.654296875, 15.0888671875, 16.5234375, 17.9580078125, 19.392578125, 20.8271484375, 22.26171875, 23.6962890625, 25.130859375, 26.5654296875, 28.0]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 8.0, 13.0, 24.0, 64.0, 97.0, 123.0, 143.0, 159.0, 120.0, 116.0, 55.0, 37.0, 13.0, 10.0, 5.0, 4.0, 0.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-215.8210906982422, -207.04991149902344, -198.2787322998047, -189.50753784179688, -180.73635864257812, -171.96517944335938, -163.19400024414062, -154.42282104492188, -145.65164184570312, -136.88046264648438, -128.10928344726562, -119.33809661865234, -110.56690979003906, -101.79573059082031, -93.02455139160156, -84.25337219238281, -75.482177734375, -66.71099853515625, -57.93981170654297, -49.16863250732422, -40.3974494934082, -31.626266479492188, -22.855087280273438, -14.083904266357422, -5.312721252441406, 3.458460807800293, 12.229642868041992, 21.000823974609375, 29.77200698852539, 38.543190002441406, 47.314369201660156, 56.08555221557617, 64.85671997070312, 73.62789916992188, 82.39908599853516, 91.1702651977539, 99.94145202636719, 108.71263122558594, 117.48381042480469, 126.25498962402344, 135.02618408203125, 143.79736328125, 152.56854248046875, 161.3397216796875, 170.1109161376953, 178.88209533691406, 187.6532745361328, 196.42445373535156, 205.1956329345703, 213.96681213378906, 222.7379913330078, 231.50918579101562, 240.28036499023438, 249.05154418945312, 257.8227233886719, 266.5939025878906, 275.3650817871094, 284.1362609863281, 292.9074401855469, 301.6786193847656, 310.4497985839844, 319.22100830078125, 327.9921875, 336.76336669921875, 345.5345458984375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 3.0, 6.0, 5.0, 15.0, 7.0, 10.0, 9.0, 24.0, 22.0, 21.0, 33.0, 46.0, 44.0, 41.0, 33.0, 52.0, 76.0, 60.0, 64.0, 52.0, 44.0, 45.0, 44.0, 50.0, 33.0, 21.0, 30.0, 22.0, 14.0, 19.0, 19.0, 10.0, 9.0, 7.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.55390167236328, -98.66016387939453, -94.76643371582031, -90.87269592285156, -86.97895812988281, -83.08522033691406, -79.19148254394531, -75.2977523803711, -71.40401458740234, -67.5102767944336, -63.61654281616211, -59.722808837890625, -55.829071044921875, -51.935333251953125, -48.04159927368164, -44.147865295410156, -40.254127502441406, -36.360389709472656, -32.46665573120117, -28.572919845581055, -24.679183959960938, -20.78544807434082, -16.891712188720703, -12.997976303100586, -9.104240417480469, -5.210504531860352, -1.3167686462402344, 2.576967239379883, 6.470703125, 10.364439010620117, 14.258174896240234, 18.15191078186035, 22.045639038085938, 25.939374923706055, 29.833110809326172, 33.726844787597656, 37.620582580566406, 41.514320373535156, 45.40805435180664, 49.301788330078125, 53.195526123046875, 57.089263916015625, 60.98299789428711, 64.8767318725586, 68.77046966552734, 72.6642074584961, 76.55793762207031, 80.45167541503906, 84.34541320800781, 88.23915100097656, 92.13288879394531, 96.02661895751953, 99.92035675048828, 103.81409454345703, 107.70782470703125, 111.6015625, 115.49530029296875, 119.3890380859375, 123.28277587890625, 127.17650604248047, 131.07025146484375, 134.96397399902344, 138.8577117919922, 142.75144958496094, 146.6451873779297]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 5.0, 6.0, 9.0, 15.0, 21.0, 27.0, 54.0, 74.0, 110.0, 190.0, 297.0, 537.0, 1198.0, 3490.0, 14604.0, 84429.0, 753049.0, 159015.0, 23053.0, 5140.0, 1603.0, 721.0, 345.0, 229.0, 107.0, 72.0, 41.0, 38.0, 18.0, 22.0, 12.0, 9.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-165.25, -160.1875, -155.125, -150.0625, -145.0, -139.9375, -134.875, -129.8125, -124.75, -119.6875, -114.625, -109.5625, -104.5, -99.4375, -94.375, -89.3125, -84.25, -79.1875, -74.125, -69.0625, -64.0, -58.9375, -53.875, -48.8125, -43.75, -38.6875, -33.625, -28.5625, -23.5, -18.4375, -13.375, -8.3125, -3.25, 1.8125, 6.875, 11.9375, 17.0, 22.0625, 27.125, 32.1875, 37.25, 42.3125, 47.375, 52.4375, 57.5, 62.5625, 67.625, 72.6875, 77.75, 82.8125, 87.875, 92.9375, 98.0, 103.0625, 108.125, 113.1875, 118.25, 123.3125, 128.375, 133.4375, 138.5, 143.5625, 148.625, 153.6875, 158.75]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 7.0, 4.0, 9.0, 13.0, 15.0, 18.0, 35.0, 33.0, 49.0, 57.0, 85.0, 60.0, 80.0, 80.0, 85.0, 85.0, 61.0, 60.0, 40.0, 40.0, 32.0, 17.0, 12.0, 11.0, 6.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.6875, -21.015625, -20.34375, -19.671875, -19.0, -18.328125, -17.65625, -16.984375, -16.3125, -15.640625, -14.96875, -14.296875, -13.625, -12.953125, -12.28125, -11.609375, -10.9375, -10.265625, -9.59375, -8.921875, -8.25, -7.578125, -6.90625, -6.234375, -5.5625, -4.890625, -4.21875, -3.546875, -2.875, -2.203125, -1.53125, -0.859375, -0.1875, 0.484375, 1.15625, 1.828125, 2.5, 3.171875, 3.84375, 4.515625, 5.1875, 5.859375, 6.53125, 7.203125, 7.875, 8.546875, 9.21875, 9.890625, 10.5625, 11.234375, 11.90625, 12.578125, 13.25, 13.921875, 14.59375, 15.265625, 15.9375, 16.609375, 17.28125, 17.953125, 18.625, 19.296875, 19.96875, 20.640625, 21.3125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 5.0, 7.0, 9.0, 9.0, 20.0, 29.0, 37.0, 36.0, 65.0, 112.0, 151.0, 238.0, 378.0, 711.0, 1383.0, 2453.0, 5165.0, 10667.0, 22252.0, 48791.0, 136323.0, 452824.0, 237394.0, 70368.0, 30780.0, 14046.0, 6909.0, 3387.0, 1748.0, 903.0, 513.0, 301.0, 160.0, 101.0, 77.0, 53.0, 41.0, 29.0, 26.0, 12.0, 11.0, 9.0, 4.0, 7.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.5, -48.03125, -46.5625, -45.09375, -43.625, -42.15625, -40.6875, -39.21875, -37.75, -36.28125, -34.8125, -33.34375, -31.875, -30.40625, -28.9375, -27.46875, -26.0, -24.53125, -23.0625, -21.59375, -20.125, -18.65625, -17.1875, -15.71875, -14.25, -12.78125, -11.3125, -9.84375, -8.375, -6.90625, -5.4375, -3.96875, -2.5, -1.03125, 0.4375, 1.90625, 3.375, 4.84375, 6.3125, 7.78125, 9.25, 10.71875, 12.1875, 13.65625, 15.125, 16.59375, 18.0625, 19.53125, 21.0, 22.46875, 23.9375, 25.40625, 26.875, 28.34375, 29.8125, 31.28125, 32.75, 34.21875, 35.6875, 37.15625, 38.625, 40.09375, 41.5625, 43.03125, 44.5]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 4.0, 1.0, 8.0, 8.0, 11.0, 14.0, 23.0, 13.0, 20.0, 33.0, 36.0, 35.0, 30.0, 38.0, 35.0, 40.0, 37.0, 41.0, 39.0, 47.0, 63.0, 41.0, 48.0, 44.0, 36.0, 44.0, 36.0, 31.0, 18.0, 25.0, 16.0, 13.0, 13.0, 13.0, 8.0, 6.0, 7.0, 3.0, 7.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.0, -45.478515625, -43.95703125, -42.435546875, -40.9140625, -39.392578125, -37.87109375, -36.349609375, -34.828125, -33.306640625, -31.78515625, -30.263671875, -28.7421875, -27.220703125, -25.69921875, -24.177734375, -22.65625, -21.134765625, -19.61328125, -18.091796875, -16.5703125, -15.048828125, -13.52734375, -12.005859375, -10.484375, -8.962890625, -7.44140625, -5.919921875, -4.3984375, -2.876953125, -1.35546875, 0.166015625, 1.6875, 3.208984375, 4.73046875, 6.251953125, 7.7734375, 9.294921875, 10.81640625, 12.337890625, 13.859375, 15.380859375, 16.90234375, 18.423828125, 19.9453125, 21.466796875, 22.98828125, 24.509765625, 26.03125, 27.552734375, 29.07421875, 30.595703125, 32.1171875, 33.638671875, 35.16015625, 36.681640625, 38.203125, 39.724609375, 41.24609375, 42.767578125, 44.2890625, 45.810546875, 47.33203125, 48.853515625, 50.375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 16.0, 22.0, 28.0, 39.0, 40.0, 100.0, 140.0, 293.0, 505.0, 986.0, 2528.0, 9193.0, 69883.0, 852383.0, 96106.0, 11124.0, 2806.0, 1097.0, 541.0, 286.0, 153.0, 76.0, 68.0, 34.0, 30.0, 16.0, 15.0, 8.0, 8.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.65625, -45.79150390625, -43.9267578125, -42.06201171875, -40.197265625, -38.33251953125, -36.4677734375, -34.60302734375, -32.73828125, -30.87353515625, -29.0087890625, -27.14404296875, -25.279296875, -23.41455078125, -21.5498046875, -19.68505859375, -17.8203125, -15.95556640625, -14.0908203125, -12.22607421875, -10.361328125, -8.49658203125, -6.6318359375, -4.76708984375, -2.90234375, -1.03759765625, 0.8271484375, 2.69189453125, 4.556640625, 6.42138671875, 8.2861328125, 10.15087890625, 12.015625, 13.88037109375, 15.7451171875, 17.60986328125, 19.474609375, 21.33935546875, 23.2041015625, 25.06884765625, 26.93359375, 28.79833984375, 30.6630859375, 32.52783203125, 34.392578125, 36.25732421875, 38.1220703125, 39.98681640625, 41.8515625, 43.71630859375, 45.5810546875, 47.44580078125, 49.310546875, 51.17529296875, 53.0400390625, 54.90478515625, 56.76953125, 58.63427734375, 60.4990234375, 62.36376953125, 64.228515625, 66.09326171875, 67.9580078125, 69.82275390625, 71.6875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 0.0, 4.0, 6.0, 6.0, 3.0, 3.0, 6.0, 13.0, 11.0, 26.0, 20.0, 43.0, 130.0, 320.0, 214.0, 73.0, 34.0, 25.0, 22.0, 12.0, 6.0, 6.0, 8.0, 6.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0111541748046875, -0.010910391807556152, -0.010666608810424805, -0.010422825813293457, -0.01017904281616211, -0.009935259819030762, -0.009691476821899414, -0.009447693824768066, -0.009203910827636719, -0.008960127830505371, -0.008716344833374023, -0.008472561836242676, -0.008228778839111328, -0.00798499584197998, -0.007741212844848633, -0.007497429847717285, -0.0072536468505859375, -0.00700986385345459, -0.006766080856323242, -0.0065222978591918945, -0.006278514862060547, -0.006034731864929199, -0.0057909488677978516, -0.005547165870666504, -0.005303382873535156, -0.005059599876403809, -0.004815816879272461, -0.004572033882141113, -0.004328250885009766, -0.004084467887878418, -0.0038406848907470703, -0.0035969018936157227, -0.003353118896484375, -0.0031093358993530273, -0.0028655529022216797, -0.002621769905090332, -0.0023779869079589844, -0.0021342039108276367, -0.001890420913696289, -0.0016466379165649414, -0.0014028549194335938, -0.001159071922302246, -0.0009152889251708984, -0.0006715059280395508, -0.0004277229309082031, -0.00018393993377685547, 5.984306335449219e-05, 0.00030362606048583984, 0.0005474090576171875, 0.0007911920547485352, 0.0010349750518798828, 0.0012787580490112305, 0.0015225410461425781, 0.0017663240432739258, 0.0020101070404052734, 0.002253890037536621, 0.0024976730346679688, 0.0027414560317993164, 0.002985239028930664, 0.0032290220260620117, 0.0034728050231933594, 0.003716588020324707, 0.003960371017456055, 0.004204154014587402, 0.00444793701171875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 5.0, 7.0, 13.0, 8.0, 19.0, 35.0, 38.0, 49.0, 105.0, 173.0, 391.0, 1013.0, 3470.0, 19026.0, 316753.0, 671832.0, 28719.0, 4662.0, 1244.0, 503.0, 195.0, 100.0, 66.0, 36.0, 22.0, 16.0, 14.0, 7.0, 10.0, 7.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.375, -57.40234375, -55.4296875, -53.45703125, -51.484375, -49.51171875, -47.5390625, -45.56640625, -43.59375, -41.62109375, -39.6484375, -37.67578125, -35.703125, -33.73046875, -31.7578125, -29.78515625, -27.8125, -25.83984375, -23.8671875, -21.89453125, -19.921875, -17.94921875, -15.9765625, -14.00390625, -12.03125, -10.05859375, -8.0859375, -6.11328125, -4.140625, -2.16796875, -0.1953125, 1.77734375, 3.75, 5.72265625, 7.6953125, 9.66796875, 11.640625, 13.61328125, 15.5859375, 17.55859375, 19.53125, 21.50390625, 23.4765625, 25.44921875, 27.421875, 29.39453125, 31.3671875, 33.33984375, 35.3125, 37.28515625, 39.2578125, 41.23046875, 43.203125, 45.17578125, 47.1484375, 49.12109375, 51.09375, 53.06640625, 55.0390625, 57.01171875, 58.984375, 60.95703125, 62.9296875, 64.90234375, 66.875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 6.0, 6.0, 10.0, 14.0, 19.0, 31.0, 42.0, 79.0, 180.0, 229.0, 157.0, 85.0, 38.0, 24.0, 15.0, 11.0, 11.0, 8.0, 9.0, 6.0, 4.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.5625, -34.5615234375, -33.560546875, -32.5595703125, -31.55859375, -30.5576171875, -29.556640625, -28.5556640625, -27.5546875, -26.5537109375, -25.552734375, -24.5517578125, -23.55078125, -22.5498046875, -21.548828125, -20.5478515625, -19.546875, -18.5458984375, -17.544921875, -16.5439453125, -15.54296875, -14.5419921875, -13.541015625, -12.5400390625, -11.5390625, -10.5380859375, -9.537109375, -8.5361328125, -7.53515625, -6.5341796875, -5.533203125, -4.5322265625, -3.53125, -2.5302734375, -1.529296875, -0.5283203125, 0.47265625, 1.4736328125, 2.474609375, 3.4755859375, 4.4765625, 5.4775390625, 6.478515625, 7.4794921875, 8.48046875, 9.4814453125, 10.482421875, 11.4833984375, 12.484375, 13.4853515625, 14.486328125, 15.4873046875, 16.48828125, 17.4892578125, 18.490234375, 19.4912109375, 20.4921875, 21.4931640625, 22.494140625, 23.4951171875, 24.49609375, 25.4970703125, 26.498046875, 27.4990234375, 28.5]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 15.0, 38.0, 41.0, 83.0, 140.0, 158.0, 162.0, 150.0, 97.0, 57.0, 42.0, 11.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-190.3349151611328, -172.87261962890625, -155.4103240966797, -137.94802856445312, -120.4857406616211, -103.02344512939453, -85.5611572265625, -68.09886169433594, -50.636566162109375, -33.17427062988281, -15.711978912353516, 1.7503128051757812, 19.212608337402344, 36.674903869628906, 54.13719177246094, 71.5994873046875, 89.06178283691406, 106.52407836914062, 123.98637390136719, 141.44866943359375, 158.91094970703125, 176.37326049804688, 193.83554077148438, 211.29783630371094, 228.7601318359375, 246.22242736816406, 263.6847229003906, 281.1470031738281, 298.60931396484375, 316.07159423828125, 333.53387451171875, 350.9961853027344, 368.45843505859375, 385.92071533203125, 403.3830261230469, 420.8453063964844, 438.3076171875, 455.7698974609375, 473.232177734375, 490.6944885253906, 508.15679931640625, 525.6190795898438, 543.0813598632812, 560.543701171875, 578.0059814453125, 595.46826171875, 612.9305419921875, 630.392822265625, 647.8551025390625, 665.3173828125, 682.7796630859375, 700.2420043945312, 717.7042846679688, 735.1665649414062, 752.6288452148438, 770.0911865234375, 787.553466796875, 805.0157470703125, 822.47802734375, 839.9403686523438, 857.4026489257812, 874.8649291992188, 892.3272094726562, 909.78955078125, 927.2518310546875]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 3.0, 7.0, 5.0, 10.0, 13.0, 15.0, 9.0, 25.0, 28.0, 16.0, 26.0, 37.0, 28.0, 32.0, 35.0, 37.0, 48.0, 57.0, 53.0, 48.0, 37.0, 42.0, 42.0, 40.0, 35.0, 34.0, 33.0, 31.0, 22.0, 22.0, 25.0, 23.0, 21.0, 12.0, 8.0, 12.0, 6.0, 8.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-191.6279296875, -184.66299438476562, -177.6980438232422, -170.7331085205078, -163.76815795898438, -156.80322265625, -149.83828735351562, -142.8733367919922, -135.9084014892578, -128.94346618652344, -121.978515625, -115.01358032226562, -108.04863739013672, -101.08369445800781, -94.1187515258789, -87.15380859375, -80.1888656616211, -73.22392272949219, -66.25897979736328, -59.29404067993164, -52.3291015625, -45.364158630371094, -38.39921569824219, -31.434276580810547, -24.46933364868164, -17.504392623901367, -10.539450645446777, -3.5745086669921875, 3.390432357788086, 10.35537338256836, 17.320316314697266, 24.285255432128906, 31.250198364257812, 38.21514129638672, 45.18008041381836, 52.145023345947266, 59.109962463378906, 66.07490539550781, 73.03984832763672, 80.00479125976562, 86.9697265625, 93.9346694946289, 100.89961242675781, 107.86454772949219, 114.8294906616211, 121.79443359375, 128.75936889648438, 135.7243194580078, 142.68927001953125, 149.65420532226562, 156.61915588378906, 163.58409118652344, 170.54904174804688, 177.51397705078125, 184.47891235351562, 191.44386291503906, 198.40879821777344, 205.3737335205078, 212.33868408203125, 219.30361938476562, 226.26856994628906, 233.23350524902344, 240.19845581054688, 247.16339111328125, 254.12832641601562]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 9.0, 16.0, 14.0, 23.0, 32.0, 37.0, 38.0, 57.0, 86.0, 135.0, 203.0, 301.0, 476.0, 851.0, 1540.0, 3284.0, 7747.0, 23431.0, 98074.0, 3262223.0, 699083.0, 66695.0, 17776.0, 6375.0, 2600.0, 1225.0, 662.0, 387.0, 255.0, 168.0, 110.0, 97.0, 58.0, 47.0, 32.0, 38.0, 18.0, 16.0, 12.0, 16.0, 6.0, 3.0, 5.0, 0.0, 3.0, 2.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0], "bins": [-145.125, -140.42578125, -135.7265625, -131.02734375, -126.328125, -121.62890625, -116.9296875, -112.23046875, -107.53125, -102.83203125, -98.1328125, -93.43359375, -88.734375, -84.03515625, -79.3359375, -74.63671875, -69.9375, -65.23828125, -60.5390625, -55.83984375, -51.140625, -46.44140625, -41.7421875, -37.04296875, -32.34375, -27.64453125, -22.9453125, -18.24609375, -13.546875, -8.84765625, -4.1484375, 0.55078125, 5.25, 9.94921875, 14.6484375, 19.34765625, 24.046875, 28.74609375, 33.4453125, 38.14453125, 42.84375, 47.54296875, 52.2421875, 56.94140625, 61.640625, 66.33984375, 71.0390625, 75.73828125, 80.4375, 85.13671875, 89.8359375, 94.53515625, 99.234375, 103.93359375, 108.6328125, 113.33203125, 118.03125, 122.73046875, 127.4296875, 132.12890625, 136.828125, 141.52734375, 146.2265625, 150.92578125, 155.625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 8.0, 7.0, 6.0, 12.0, 7.0, 20.0, 22.0, 28.0, 54.0, 40.0, 64.0, 72.0, 77.0, 66.0, 102.0, 70.0, 70.0, 65.0, 67.0, 32.0, 34.0, 37.0, 13.0, 16.0, 6.0, 7.0, 4.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.609375, -20.93505859375, -20.2607421875, -19.58642578125, -18.912109375, -18.23779296875, -17.5634765625, -16.88916015625, -16.21484375, -15.54052734375, -14.8662109375, -14.19189453125, -13.517578125, -12.84326171875, -12.1689453125, -11.49462890625, -10.8203125, -10.14599609375, -9.4716796875, -8.79736328125, -8.123046875, -7.44873046875, -6.7744140625, -6.10009765625, -5.42578125, -4.75146484375, -4.0771484375, -3.40283203125, -2.728515625, -2.05419921875, -1.3798828125, -0.70556640625, -0.03125, 0.64306640625, 1.3173828125, 1.99169921875, 2.666015625, 3.34033203125, 4.0146484375, 4.68896484375, 5.36328125, 6.03759765625, 6.7119140625, 7.38623046875, 8.060546875, 8.73486328125, 9.4091796875, 10.08349609375, 10.7578125, 11.43212890625, 12.1064453125, 12.78076171875, 13.455078125, 14.12939453125, 14.8037109375, 15.47802734375, 16.15234375, 16.82666015625, 17.5009765625, 18.17529296875, 18.849609375, 19.52392578125, 20.1982421875, 20.87255859375, 21.546875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 6.0, 9.0, 10.0, 14.0, 14.0, 18.0, 36.0, 41.0, 50.0, 63.0, 115.0, 157.0, 237.0, 415.0, 722.0, 1315.0, 2732.0, 6101.0, 14616.0, 39276.0, 129394.0, 922889.0, 2808316.0, 184037.0, 51014.0, 18247.0, 7418.0, 3343.0, 1592.0, 807.0, 477.0, 273.0, 177.0, 106.0, 72.0, 50.0, 32.0, 23.0, 15.0, 15.0, 12.0, 6.0, 5.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-86.4375, -83.904296875, -81.37109375, -78.837890625, -76.3046875, -73.771484375, -71.23828125, -68.705078125, -66.171875, -63.638671875, -61.10546875, -58.572265625, -56.0390625, -53.505859375, -50.97265625, -48.439453125, -45.90625, -43.373046875, -40.83984375, -38.306640625, -35.7734375, -33.240234375, -30.70703125, -28.173828125, -25.640625, -23.107421875, -20.57421875, -18.041015625, -15.5078125, -12.974609375, -10.44140625, -7.908203125, -5.375, -2.841796875, -0.30859375, 2.224609375, 4.7578125, 7.291015625, 9.82421875, 12.357421875, 14.890625, 17.423828125, 19.95703125, 22.490234375, 25.0234375, 27.556640625, 30.08984375, 32.623046875, 35.15625, 37.689453125, 40.22265625, 42.755859375, 45.2890625, 47.822265625, 50.35546875, 52.888671875, 55.421875, 57.955078125, 60.48828125, 63.021484375, 65.5546875, 68.087890625, 70.62109375, 73.154296875, 75.6875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 6.0, 11.0, 11.0, 22.0, 29.0, 33.0, 66.0, 71.0, 139.0, 279.0, 772.0, 1772.0, 373.0, 202.0, 102.0, 62.0, 43.0, 25.0, 9.0, 10.0, 15.0, 4.0, 2.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-54.46875, -53.208740234375, -51.94873046875, -50.688720703125, -49.4287109375, -48.168701171875, -46.90869140625, -45.648681640625, -44.388671875, -43.128662109375, -41.86865234375, -40.608642578125, -39.3486328125, -38.088623046875, -36.82861328125, -35.568603515625, -34.30859375, -33.048583984375, -31.78857421875, -30.528564453125, -29.2685546875, -28.008544921875, -26.74853515625, -25.488525390625, -24.228515625, -22.968505859375, -21.70849609375, -20.448486328125, -19.1884765625, -17.928466796875, -16.66845703125, -15.408447265625, -14.1484375, -12.888427734375, -11.62841796875, -10.368408203125, -9.1083984375, -7.848388671875, -6.58837890625, -5.328369140625, -4.068359375, -2.808349609375, -1.54833984375, -0.288330078125, 0.9716796875, 2.231689453125, 3.49169921875, 4.751708984375, 6.01171875, 7.271728515625, 8.53173828125, 9.791748046875, 11.0517578125, 12.311767578125, 13.57177734375, 14.831787109375, 16.091796875, 17.351806640625, 18.61181640625, 19.871826171875, 21.1318359375, 22.391845703125, 23.65185546875, 24.911865234375, 26.171875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 9.0, 22.0, 37.0, 61.0, 107.0, 161.0, 194.0, 174.0, 126.0, 62.0, 29.0, 20.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-550.94921875, -540.5137329101562, -530.0782470703125, -519.6427612304688, -509.207275390625, -498.7717590332031, -488.3362731933594, -477.9007873535156, -467.4653015136719, -457.0298156738281, -446.5943298339844, -436.1588439941406, -425.72332763671875, -415.287841796875, -404.85235595703125, -394.4168701171875, -383.98138427734375, -373.5458984375, -363.11041259765625, -352.6749267578125, -342.23944091796875, -331.8039245605469, -321.3684387207031, -310.9329528808594, -300.4974670410156, -290.0619812011719, -279.6264953613281, -269.1910095214844, -258.7554931640625, -248.3200225830078, -237.884521484375, -227.44903564453125, -217.01353454589844, -206.5780487060547, -196.14254760742188, -185.70706176757812, -175.27157592773438, -164.83609008789062, -154.40060424804688, -143.96510314941406, -133.5296173095703, -123.09413146972656, -112.65863800048828, -102.22314453125, -91.78765869140625, -81.3521728515625, -70.91667938232422, -60.48118591308594, -50.04570007324219, -39.61021041870117, -29.174720764160156, -18.73923110961914, -8.303741455078125, 2.1317481994628906, 12.567237854003906, 23.002731323242188, 33.43821716308594, 43.87370681762695, 54.30919647216797, 64.74468994140625, 75.18017578125, 85.61566162109375, 96.05115509033203, 106.48664855957031, 116.92213439941406]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 0.0, 6.0, 4.0, 6.0, 6.0, 7.0, 7.0, 10.0, 15.0, 15.0, 14.0, 13.0, 25.0, 22.0, 28.0, 24.0, 20.0, 32.0, 37.0, 35.0, 37.0, 40.0, 38.0, 45.0, 39.0, 31.0, 40.0, 38.0, 35.0, 30.0, 24.0, 33.0, 22.0, 22.0, 24.0, 28.0, 22.0, 20.0, 21.0, 14.0, 14.0, 8.0, 11.0, 14.0, 8.0, 6.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-89.22309875488281, -86.47863006591797, -83.73416137695312, -80.98970031738281, -78.24523162841797, -75.50076293945312, -72.75629425048828, -70.01182556152344, -67.26736450195312, -64.52289581298828, -61.7784309387207, -59.03396224975586, -56.28949737548828, -53.54502868652344, -50.800559997558594, -48.05609130859375, -45.311622619628906, -42.56715393066406, -39.822689056396484, -37.07822036743164, -34.33375549316406, -31.58928680419922, -28.844818115234375, -26.100351333618164, -23.355884552001953, -20.611417770385742, -17.86695098876953, -15.122482299804688, -12.378015518188477, -9.633548736572266, -6.889080047607422, -4.144613265991211, -1.400146484375, 1.3443207740783691, 4.088788032531738, 6.833255767822266, 9.577722549438477, 12.322189331054688, 15.066658020019531, 17.811124801635742, 20.555591583251953, 23.300058364868164, 26.044525146484375, 28.78899383544922, 31.53346061706543, 34.27792739868164, 37.022396087646484, 39.76686096191406, 42.511329650878906, 45.25579833984375, 48.00026321411133, 50.74473190307617, 53.48919677734375, 56.233665466308594, 58.97813415527344, 61.72260284423828, 64.46707153320312, 67.21154022216797, 69.95600891113281, 72.70046997070312, 75.44493865966797, 78.18940734863281, 80.93387603759766, 83.6783447265625, 86.42280578613281]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 6.0, 19.0, 31.0, 55.0, 71.0, 105.0, 195.0, 303.0, 551.0, 1176.0, 3177.0, 11266.0, 54645.0, 317257.0, 541564.0, 92486.0, 17933.0, 4441.0, 1615.0, 671.0, 390.0, 235.0, 144.0, 78.0, 52.0, 40.0, 11.0, 19.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.0625, -115.1142578125, -111.166015625, -107.2177734375, -103.26953125, -99.3212890625, -95.373046875, -91.4248046875, -87.4765625, -83.5283203125, -79.580078125, -75.6318359375, -71.68359375, -67.7353515625, -63.787109375, -59.8388671875, -55.890625, -51.9423828125, -47.994140625, -44.0458984375, -40.09765625, -36.1494140625, -32.201171875, -28.2529296875, -24.3046875, -20.3564453125, -16.408203125, -12.4599609375, -8.51171875, -4.5634765625, -0.615234375, 3.3330078125, 7.28125, 11.2294921875, 15.177734375, 19.1259765625, 23.07421875, 27.0224609375, 30.970703125, 34.9189453125, 38.8671875, 42.8154296875, 46.763671875, 50.7119140625, 54.66015625, 58.6083984375, 62.556640625, 66.5048828125, 70.453125, 74.4013671875, 78.349609375, 82.2978515625, 86.24609375, 90.1943359375, 94.142578125, 98.0908203125, 102.0390625, 105.9873046875, 109.935546875, 113.8837890625, 117.83203125, 121.7802734375, 125.728515625, 129.6767578125, 133.625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 9.0, 9.0, 9.0, 21.0, 12.0, 21.0, 32.0, 46.0, 58.0, 49.0, 86.0, 77.0, 77.0, 89.0, 63.0, 63.0, 65.0, 59.0, 54.0, 28.0, 28.0, 16.0, 7.0, 8.0, 8.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.125, -21.4287109375, -20.732421875, -20.0361328125, -19.33984375, -18.6435546875, -17.947265625, -17.2509765625, -16.5546875, -15.8583984375, -15.162109375, -14.4658203125, -13.76953125, -13.0732421875, -12.376953125, -11.6806640625, -10.984375, -10.2880859375, -9.591796875, -8.8955078125, -8.19921875, -7.5029296875, -6.806640625, -6.1103515625, -5.4140625, -4.7177734375, -4.021484375, -3.3251953125, -2.62890625, -1.9326171875, -1.236328125, -0.5400390625, 0.15625, 0.8525390625, 1.548828125, 2.2451171875, 2.94140625, 3.6376953125, 4.333984375, 5.0302734375, 5.7265625, 6.4228515625, 7.119140625, 7.8154296875, 8.51171875, 9.2080078125, 9.904296875, 10.6005859375, 11.296875, 11.9931640625, 12.689453125, 13.3857421875, 14.08203125, 14.7783203125, 15.474609375, 16.1708984375, 16.8671875, 17.5634765625, 18.259765625, 18.9560546875, 19.65234375, 20.3486328125, 21.044921875, 21.7412109375, 22.4375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 8.0, 13.0, 9.0, 22.0, 35.0, 40.0, 54.0, 89.0, 123.0, 147.0, 214.0, 327.0, 486.0, 970.0, 2074.0, 5295.0, 16433.0, 55532.0, 208369.0, 521224.0, 168286.0, 46473.0, 13825.0, 4417.0, 1765.0, 851.0, 501.0, 285.0, 199.0, 161.0, 90.0, 58.0, 53.0, 36.0, 24.0, 16.0, 18.0, 8.0, 7.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-69.8125, -67.841796875, -65.87109375, -63.900390625, -61.9296875, -59.958984375, -57.98828125, -56.017578125, -54.046875, -52.076171875, -50.10546875, -48.134765625, -46.1640625, -44.193359375, -42.22265625, -40.251953125, -38.28125, -36.310546875, -34.33984375, -32.369140625, -30.3984375, -28.427734375, -26.45703125, -24.486328125, -22.515625, -20.544921875, -18.57421875, -16.603515625, -14.6328125, -12.662109375, -10.69140625, -8.720703125, -6.75, -4.779296875, -2.80859375, -0.837890625, 1.1328125, 3.103515625, 5.07421875, 7.044921875, 9.015625, 10.986328125, 12.95703125, 14.927734375, 16.8984375, 18.869140625, 20.83984375, 22.810546875, 24.78125, 26.751953125, 28.72265625, 30.693359375, 32.6640625, 34.634765625, 36.60546875, 38.576171875, 40.546875, 42.517578125, 44.48828125, 46.458984375, 48.4296875, 50.400390625, 52.37109375, 54.341796875, 56.3125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 5.0, 2.0, 3.0, 5.0, 8.0, 5.0, 13.0, 8.0, 8.0, 11.0, 14.0, 16.0, 15.0, 17.0, 22.0, 23.0, 35.0, 30.0, 33.0, 28.0, 38.0, 41.0, 29.0, 33.0, 48.0, 38.0, 39.0, 40.0, 41.0, 38.0, 38.0, 41.0, 33.0, 37.0, 15.0, 20.0, 19.0, 21.0, 13.0, 18.0, 10.0, 14.0, 8.0, 6.0, 10.0, 9.0, 5.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.5625, -37.10888671875, -35.6552734375, -34.20166015625, -32.748046875, -31.29443359375, -29.8408203125, -28.38720703125, -26.93359375, -25.47998046875, -24.0263671875, -22.57275390625, -21.119140625, -19.66552734375, -18.2119140625, -16.75830078125, -15.3046875, -13.85107421875, -12.3974609375, -10.94384765625, -9.490234375, -8.03662109375, -6.5830078125, -5.12939453125, -3.67578125, -2.22216796875, -0.7685546875, 0.68505859375, 2.138671875, 3.59228515625, 5.0458984375, 6.49951171875, 7.953125, 9.40673828125, 10.8603515625, 12.31396484375, 13.767578125, 15.22119140625, 16.6748046875, 18.12841796875, 19.58203125, 21.03564453125, 22.4892578125, 23.94287109375, 25.396484375, 26.85009765625, 28.3037109375, 29.75732421875, 31.2109375, 32.66455078125, 34.1181640625, 35.57177734375, 37.025390625, 38.47900390625, 39.9326171875, 41.38623046875, 42.83984375, 44.29345703125, 45.7470703125, 47.20068359375, 48.654296875, 50.10791015625, 51.5615234375, 53.01513671875, 54.46875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 12.0, 14.0, 13.0, 36.0, 54.0, 71.0, 167.0, 279.0, 553.0, 1431.0, 3544.0, 10005.0, 31385.0, 103788.0, 414413.0, 352116.0, 89093.0, 27367.0, 8739.0, 3161.0, 1164.0, 552.0, 290.0, 129.0, 76.0, 30.0, 29.0, 15.0, 12.0, 6.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.765625, -21.887939453125, -21.01025390625, -20.132568359375, -19.2548828125, -18.377197265625, -17.49951171875, -16.621826171875, -15.744140625, -14.866455078125, -13.98876953125, -13.111083984375, -12.2333984375, -11.355712890625, -10.47802734375, -9.600341796875, -8.72265625, -7.844970703125, -6.96728515625, -6.089599609375, -5.2119140625, -4.334228515625, -3.45654296875, -2.578857421875, -1.701171875, -0.823486328125, 0.05419921875, 0.931884765625, 1.8095703125, 2.687255859375, 3.56494140625, 4.442626953125, 5.3203125, 6.197998046875, 7.07568359375, 7.953369140625, 8.8310546875, 9.708740234375, 10.58642578125, 11.464111328125, 12.341796875, 13.219482421875, 14.09716796875, 14.974853515625, 15.8525390625, 16.730224609375, 17.60791015625, 18.485595703125, 19.36328125, 20.240966796875, 21.11865234375, 21.996337890625, 22.8740234375, 23.751708984375, 24.62939453125, 25.507080078125, 26.384765625, 27.262451171875, 28.14013671875, 29.017822265625, 29.8955078125, 30.773193359375, 31.65087890625, 32.528564453125, 33.40625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 7.0, 13.0, 21.0, 23.0, 21.0, 34.0, 42.0, 62.0, 104.0, 183.0, 136.0, 86.0, 69.0, 31.0, 42.0, 30.0, 22.0, 14.0, 14.0, 6.0, 8.0, 8.0, 2.0, 5.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0], "bins": [-0.00711822509765625, -0.006952166557312012, -0.0067861080169677734, -0.006620049476623535, -0.006453990936279297, -0.006287932395935059, -0.00612187385559082, -0.005955815315246582, -0.005789756774902344, -0.0056236982345581055, -0.005457639694213867, -0.005291581153869629, -0.005125522613525391, -0.004959464073181152, -0.004793405532836914, -0.004627346992492676, -0.0044612884521484375, -0.004295229911804199, -0.004129171371459961, -0.003963112831115723, -0.0037970542907714844, -0.003630995750427246, -0.003464937210083008, -0.0032988786697387695, -0.0031328201293945312, -0.002966761589050293, -0.0028007030487060547, -0.0026346445083618164, -0.002468585968017578, -0.00230252742767334, -0.0021364688873291016, -0.0019704103469848633, -0.001804351806640625, -0.0016382932662963867, -0.0014722347259521484, -0.0013061761856079102, -0.0011401176452636719, -0.0009740591049194336, -0.0008080005645751953, -0.000641942024230957, -0.00047588348388671875, -0.00030982494354248047, -0.0001437664031982422, 2.2292137145996094e-05, 0.00018835067749023438, 0.00035440921783447266, 0.0005204677581787109, 0.0006865262985229492, 0.0008525848388671875, 0.0010186433792114258, 0.001184701919555664, 0.0013507604598999023, 0.0015168190002441406, 0.001682877540588379, 0.0018489360809326172, 0.0020149946212768555, 0.0021810531616210938, 0.002347111701965332, 0.0025131702423095703, 0.0026792287826538086, 0.002845287322998047, 0.003011345863342285, 0.0031774044036865234, 0.0033434629440307617, 0.003509521484375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 3.0, 18.0, 19.0, 26.0, 32.0, 48.0, 81.0, 112.0, 145.0, 264.0, 425.0, 806.0, 1679.0, 4152.0, 11972.0, 44153.0, 195948.0, 538912.0, 188145.0, 42307.0, 11777.0, 4041.0, 1641.0, 766.0, 400.0, 228.0, 139.0, 77.0, 67.0, 57.0, 26.0, 27.0, 17.0, 12.0, 6.0, 4.0, 7.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.28125, -32.2568359375, -31.232421875, -30.2080078125, -29.18359375, -28.1591796875, -27.134765625, -26.1103515625, -25.0859375, -24.0615234375, -23.037109375, -22.0126953125, -20.98828125, -19.9638671875, -18.939453125, -17.9150390625, -16.890625, -15.8662109375, -14.841796875, -13.8173828125, -12.79296875, -11.7685546875, -10.744140625, -9.7197265625, -8.6953125, -7.6708984375, -6.646484375, -5.6220703125, -4.59765625, -3.5732421875, -2.548828125, -1.5244140625, -0.5, 0.5244140625, 1.548828125, 2.5732421875, 3.59765625, 4.6220703125, 5.646484375, 6.6708984375, 7.6953125, 8.7197265625, 9.744140625, 10.7685546875, 11.79296875, 12.8173828125, 13.841796875, 14.8662109375, 15.890625, 16.9150390625, 17.939453125, 18.9638671875, 19.98828125, 21.0126953125, 22.037109375, 23.0615234375, 24.0859375, 25.1103515625, 26.134765625, 27.1591796875, 28.18359375, 29.2080078125, 30.232421875, 31.2568359375, 32.28125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 1.0, 5.0, 2.0, 11.0, 4.0, 5.0, 10.0, 10.0, 6.0, 19.0, 7.0, 16.0, 22.0, 37.0, 31.0, 38.0, 40.0, 61.0, 69.0, 69.0, 64.0, 63.0, 50.0, 57.0, 47.0, 51.0, 42.0, 37.0, 24.0, 20.0, 19.0, 14.0, 10.0, 8.0, 6.0, 4.0, 4.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-20.390625, -19.777099609375, -19.16357421875, -18.550048828125, -17.9365234375, -17.322998046875, -16.70947265625, -16.095947265625, -15.482421875, -14.868896484375, -14.25537109375, -13.641845703125, -13.0283203125, -12.414794921875, -11.80126953125, -11.187744140625, -10.57421875, -9.960693359375, -9.34716796875, -8.733642578125, -8.1201171875, -7.506591796875, -6.89306640625, -6.279541015625, -5.666015625, -5.052490234375, -4.43896484375, -3.825439453125, -3.2119140625, -2.598388671875, -1.98486328125, -1.371337890625, -0.7578125, -0.144287109375, 0.46923828125, 1.082763671875, 1.6962890625, 2.309814453125, 2.92333984375, 3.536865234375, 4.150390625, 4.763916015625, 5.37744140625, 5.990966796875, 6.6044921875, 7.218017578125, 7.83154296875, 8.445068359375, 9.05859375, 9.672119140625, 10.28564453125, 10.899169921875, 11.5126953125, 12.126220703125, 12.73974609375, 13.353271484375, 13.966796875, 14.580322265625, 15.19384765625, 15.807373046875, 16.4208984375, 17.034423828125, 17.64794921875, 18.261474609375, 18.875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 7.0, 34.0, 149.0, 324.0, 317.0, 139.0, 31.0, 10.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-314.1203308105469, -269.69305419921875, -225.26580810546875, -180.8385467529297, -136.41128540039062, -91.98402404785156, -47.5567626953125, -3.129486083984375, 41.297760009765625, 85.72502136230469, 130.15228271484375, 174.5795440673828, 219.00680541992188, 263.43408203125, 307.861328125, 352.2886047363281, 396.7158508300781, 441.14312744140625, 485.57037353515625, 529.9976196289062, 574.4249267578125, 618.8521728515625, 663.2794189453125, 707.7066650390625, 752.1339111328125, 796.5611572265625, 840.9884033203125, 885.4157104492188, 929.8429565429688, 974.2702026367188, 1018.697509765625, 1063.124755859375, 1107.552001953125, 1151.979248046875, 1196.406494140625, 1240.833740234375, 1285.260986328125, 1329.6883544921875, 1374.1156005859375, 1418.5428466796875, 1462.9700927734375, 1507.3973388671875, 1551.8245849609375, 1596.2518310546875, 1640.67919921875, 1685.1064453125, 1729.53369140625, 1773.9609375, 1818.38818359375, 1862.8154296875, 1907.24267578125, 1951.669921875, 1996.09716796875, 2040.5245361328125, 2084.95166015625, 2129.37890625, 2173.80615234375, 2218.2333984375, 2262.66064453125, 2307.087890625, 2351.51513671875, 2395.9423828125, 2440.36962890625, 2484.796875, 2529.224365234375]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 6.0, 2.0, 7.0, 12.0, 10.0, 9.0, 10.0, 14.0, 11.0, 22.0, 14.0, 22.0, 29.0, 32.0, 22.0, 39.0, 40.0, 39.0, 34.0, 34.0, 43.0, 44.0, 40.0, 40.0, 35.0, 41.0, 28.0, 35.0, 40.0, 24.0, 37.0, 17.0, 26.0, 17.0, 24.0, 12.0, 17.0, 11.0, 10.0, 9.0, 6.0, 8.0, 7.0, 9.0, 6.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0], "bins": [-268.91546630859375, -261.24969482421875, -253.58389282226562, -245.91812133789062, -238.25233459472656, -230.5865478515625, -222.9207763671875, -215.25498962402344, -207.58920288085938, -199.9234161376953, -192.25762939453125, -184.59185791015625, -176.9260711669922, -169.26028442382812, -161.59451293945312, -153.92872619628906, -146.262939453125, -138.59715270996094, -130.93136596679688, -123.26559448242188, -115.59980773925781, -107.93402099609375, -100.26824188232422, -92.60246276855469, -84.93667602539062, -77.27088928222656, -69.60511016845703, -61.939327239990234, -54.27354431152344, -46.60776138305664, -38.941978454589844, -31.276195526123047, -23.610397338867188, -15.94461441040039, -8.278831481933594, -0.6130485534667969, 7.052734375, 14.718517303466797, 22.384300231933594, 30.05008316040039, 37.71586608886719, 45.381649017333984, 53.04743194580078, 60.71321487426758, 68.37899780273438, 76.04478454589844, 83.71056365966797, 91.3763427734375, 99.04212951660156, 106.70791625976562, 114.37369537353516, 122.03947448730469, 129.70526123046875, 137.3710479736328, 145.03683471679688, 152.70260620117188, 160.36839294433594, 168.0341796875, 175.699951171875, 183.36573791503906, 191.03152465820312, 198.6973114013672, 206.36309814453125, 214.02886962890625, 221.6946563720703]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 12.0, 6.0, 23.0, 42.0, 44.0, 57.0, 108.0, 172.0, 286.0, 498.0, 885.0, 1770.0, 4170.0, 12197.0, 50039.0, 403614.0, 3489321.0, 186247.0, 30339.0, 8207.0, 3036.0, 1296.0, 721.0, 402.0, 265.0, 155.0, 92.0, 70.0, 59.0, 38.0, 31.0, 16.0, 6.0, 12.0, 10.0, 7.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-141.875, -137.19921875, -132.5234375, -127.84765625, -123.171875, -118.49609375, -113.8203125, -109.14453125, -104.46875, -99.79296875, -95.1171875, -90.44140625, -85.765625, -81.08984375, -76.4140625, -71.73828125, -67.0625, -62.38671875, -57.7109375, -53.03515625, -48.359375, -43.68359375, -39.0078125, -34.33203125, -29.65625, -24.98046875, -20.3046875, -15.62890625, -10.953125, -6.27734375, -1.6015625, 3.07421875, 7.75, 12.42578125, 17.1015625, 21.77734375, 26.453125, 31.12890625, 35.8046875, 40.48046875, 45.15625, 49.83203125, 54.5078125, 59.18359375, 63.859375, 68.53515625, 73.2109375, 77.88671875, 82.5625, 87.23828125, 91.9140625, 96.58984375, 101.265625, 105.94140625, 110.6171875, 115.29296875, 119.96875, 124.64453125, 129.3203125, 133.99609375, 138.671875, 143.34765625, 148.0234375, 152.69921875, 157.375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 6.0, 7.0, 16.0, 20.0, 20.0, 26.0, 43.0, 42.0, 56.0, 88.0, 55.0, 80.0, 82.0, 71.0, 74.0, 70.0, 60.0, 51.0, 39.0, 33.0, 16.0, 18.0, 8.0, 9.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.640625, -20.948974609375, -20.25732421875, -19.565673828125, -18.8740234375, -18.182373046875, -17.49072265625, -16.799072265625, -16.107421875, -15.415771484375, -14.72412109375, -14.032470703125, -13.3408203125, -12.649169921875, -11.95751953125, -11.265869140625, -10.57421875, -9.882568359375, -9.19091796875, -8.499267578125, -7.8076171875, -7.115966796875, -6.42431640625, -5.732666015625, -5.041015625, -4.349365234375, -3.65771484375, -2.966064453125, -2.2744140625, -1.582763671875, -0.89111328125, -0.199462890625, 0.4921875, 1.183837890625, 1.87548828125, 2.567138671875, 3.2587890625, 3.950439453125, 4.64208984375, 5.333740234375, 6.025390625, 6.717041015625, 7.40869140625, 8.100341796875, 8.7919921875, 9.483642578125, 10.17529296875, 10.866943359375, 11.55859375, 12.250244140625, 12.94189453125, 13.633544921875, 14.3251953125, 15.016845703125, 15.70849609375, 16.400146484375, 17.091796875, 17.783447265625, 18.47509765625, 19.166748046875, 19.8583984375, 20.550048828125, 21.24169921875, 21.933349609375, 22.625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 7.0, 4.0, 5.0, 12.0, 12.0, 30.0, 29.0, 35.0, 51.0, 75.0, 98.0, 154.0, 210.0, 353.0, 583.0, 1387.0, 4442.0, 21850.0, 157064.0, 3244146.0, 686403.0, 62185.0, 10351.0, 2526.0, 946.0, 485.0, 268.0, 161.0, 124.0, 76.0, 69.0, 35.0, 29.0, 16.0, 15.0, 18.0, 9.0, 9.0, 5.0, 3.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-139.625, -135.6103515625, -131.595703125, -127.5810546875, -123.56640625, -119.5517578125, -115.537109375, -111.5224609375, -107.5078125, -103.4931640625, -99.478515625, -95.4638671875, -91.44921875, -87.4345703125, -83.419921875, -79.4052734375, -75.390625, -71.3759765625, -67.361328125, -63.3466796875, -59.33203125, -55.3173828125, -51.302734375, -47.2880859375, -43.2734375, -39.2587890625, -35.244140625, -31.2294921875, -27.21484375, -23.2001953125, -19.185546875, -15.1708984375, -11.15625, -7.1416015625, -3.126953125, 0.8876953125, 4.90234375, 8.9169921875, 12.931640625, 16.9462890625, 20.9609375, 24.9755859375, 28.990234375, 33.0048828125, 37.01953125, 41.0341796875, 45.048828125, 49.0634765625, 53.078125, 57.0927734375, 61.107421875, 65.1220703125, 69.13671875, 73.1513671875, 77.166015625, 81.1806640625, 85.1953125, 89.2099609375, 93.224609375, 97.2392578125, 101.25390625, 105.2685546875, 109.283203125, 113.2978515625, 117.3125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 8.0, 17.0, 30.0, 59.0, 142.0, 333.0, 1158.0, 1628.0, 394.0, 158.0, 69.0, 44.0, 27.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.25, -67.7470703125, -65.244140625, -62.7412109375, -60.23828125, -57.7353515625, -55.232421875, -52.7294921875, -50.2265625, -47.7236328125, -45.220703125, -42.7177734375, -40.21484375, -37.7119140625, -35.208984375, -32.7060546875, -30.203125, -27.7001953125, -25.197265625, -22.6943359375, -20.19140625, -17.6884765625, -15.185546875, -12.6826171875, -10.1796875, -7.6767578125, -5.173828125, -2.6708984375, -0.16796875, 2.3349609375, 4.837890625, 7.3408203125, 9.84375, 12.3466796875, 14.849609375, 17.3525390625, 19.85546875, 22.3583984375, 24.861328125, 27.3642578125, 29.8671875, 32.3701171875, 34.873046875, 37.3759765625, 39.87890625, 42.3818359375, 44.884765625, 47.3876953125, 49.890625, 52.3935546875, 54.896484375, 57.3994140625, 59.90234375, 62.4052734375, 64.908203125, 67.4111328125, 69.9140625, 72.4169921875, 74.919921875, 77.4228515625, 79.92578125, 82.4287109375, 84.931640625, 87.4345703125, 89.9375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 4.0, 7.0, 8.0, 20.0, 24.0, 34.0, 41.0, 53.0, 70.0, 79.0, 87.0, 107.0, 82.0, 71.0, 79.0, 55.0, 56.0, 36.0, 22.0, 13.0, 15.0, 9.0, 4.0, 9.0, 1.0, 4.0, 0.0, 3.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-211.2149200439453, -203.9550018310547, -196.69508361816406, -189.43516540527344, -182.1752471923828, -174.9153289794922, -167.65541076660156, -160.39549255371094, -153.1355743408203, -145.8756561279297, -138.61573791503906, -131.35581970214844, -124.09590148925781, -116.83598327636719, -109.57606506347656, -102.31614685058594, -95.05622863769531, -87.79631042480469, -80.53639221191406, -73.27647399902344, -66.01655578613281, -58.75663757324219, -51.49671936035156, -44.23680114746094, -36.97688293457031, -29.716964721679688, -22.457046508789062, -15.197128295898438, -7.9372100830078125, -0.6772918701171875, 6.5826263427734375, 13.842544555664062, 21.10247802734375, 28.362396240234375, 35.622314453125, 42.882232666015625, 50.14215087890625, 57.402069091796875, 64.6619873046875, 71.92190551757812, 79.18182373046875, 86.44174194335938, 93.70166015625, 100.96157836914062, 108.22149658203125, 115.48141479492188, 122.7413330078125, 130.00125122070312, 137.26116943359375, 144.52108764648438, 151.781005859375, 159.04092407226562, 166.30084228515625, 173.56076049804688, 180.8206787109375, 188.08059692382812, 195.34051513671875, 202.60043334960938, 209.8603515625, 217.12026977539062, 224.38018798828125, 231.64010620117188, 238.9000244140625, 246.15994262695312, 253.41986083984375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 9.0, 10.0, 11.0, 21.0, 19.0, 21.0, 27.0, 28.0, 28.0, 32.0, 47.0, 37.0, 52.0, 60.0, 38.0, 38.0, 59.0, 43.0, 36.0, 49.0, 46.0, 42.0, 45.0, 26.0, 32.0, 16.0, 28.0, 25.0, 22.0, 13.0, 8.0, 13.0, 7.0, 4.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-126.20563507080078, -121.4463882446289, -116.68714141845703, -111.92789459228516, -107.16864776611328, -102.4094009399414, -97.65015411376953, -92.89090728759766, -88.13166046142578, -83.3724136352539, -78.61316680908203, -73.85391998291016, -69.09467315673828, -64.3354263305664, -59.57617950439453, -54.816932678222656, -50.05768585205078, -45.298439025878906, -40.53919219970703, -35.779945373535156, -31.02069854736328, -26.261451721191406, -21.50220489501953, -16.742958068847656, -11.983711242675781, -7.224464416503906, -2.4652175903320312, 2.2940292358398438, 7.053276062011719, 11.812522888183594, 16.57176971435547, 21.331016540527344, 26.090255737304688, 30.849502563476562, 35.60874938964844, 40.36799621582031, 45.12724304199219, 49.88648986816406, 54.64573669433594, 59.40498352050781, 64.16423034667969, 68.92347717285156, 73.68272399902344, 78.44197082519531, 83.20121765136719, 87.96046447753906, 92.71971130371094, 97.47895812988281, 102.23820495605469, 106.99745178222656, 111.75669860839844, 116.51594543457031, 121.27519226074219, 126.03443908691406, 130.79368591308594, 135.5529327392578, 140.3121795654297, 145.07142639160156, 149.83067321777344, 154.5899200439453, 159.3491668701172, 164.10841369628906, 168.86766052246094, 173.6269073486328, 178.3861541748047]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 9.0, 9.0, 10.0, 26.0, 18.0, 31.0, 66.0, 98.0, 177.0, 341.0, 613.0, 1445.0, 3971.0, 16158.0, 98447.0, 581589.0, 293256.0, 39792.0, 8039.0, 2416.0, 979.0, 489.0, 250.0, 139.0, 58.0, 31.0, 35.0, 21.0, 13.0, 14.0, 4.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-113.125, -109.05078125, -104.9765625, -100.90234375, -96.828125, -92.75390625, -88.6796875, -84.60546875, -80.53125, -76.45703125, -72.3828125, -68.30859375, -64.234375, -60.16015625, -56.0859375, -52.01171875, -47.9375, -43.86328125, -39.7890625, -35.71484375, -31.640625, -27.56640625, -23.4921875, -19.41796875, -15.34375, -11.26953125, -7.1953125, -3.12109375, 0.953125, 5.02734375, 9.1015625, 13.17578125, 17.25, 21.32421875, 25.3984375, 29.47265625, 33.546875, 37.62109375, 41.6953125, 45.76953125, 49.84375, 53.91796875, 57.9921875, 62.06640625, 66.140625, 70.21484375, 74.2890625, 78.36328125, 82.4375, 86.51171875, 90.5859375, 94.66015625, 98.734375, 102.80859375, 106.8828125, 110.95703125, 115.03125, 119.10546875, 123.1796875, 127.25390625, 131.328125, 135.40234375, 139.4765625, 143.55078125, 147.625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 9.0, 8.0, 24.0, 10.0, 28.0, 39.0, 51.0, 58.0, 76.0, 67.0, 77.0, 73.0, 75.0, 89.0, 70.0, 56.0, 44.0, 40.0, 40.0, 23.0, 7.0, 9.0, 8.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.65625, -20.92138671875, -20.1865234375, -19.45166015625, -18.716796875, -17.98193359375, -17.2470703125, -16.51220703125, -15.77734375, -15.04248046875, -14.3076171875, -13.57275390625, -12.837890625, -12.10302734375, -11.3681640625, -10.63330078125, -9.8984375, -9.16357421875, -8.4287109375, -7.69384765625, -6.958984375, -6.22412109375, -5.4892578125, -4.75439453125, -4.01953125, -3.28466796875, -2.5498046875, -1.81494140625, -1.080078125, -0.34521484375, 0.3896484375, 1.12451171875, 1.859375, 2.59423828125, 3.3291015625, 4.06396484375, 4.798828125, 5.53369140625, 6.2685546875, 7.00341796875, 7.73828125, 8.47314453125, 9.2080078125, 9.94287109375, 10.677734375, 11.41259765625, 12.1474609375, 12.88232421875, 13.6171875, 14.35205078125, 15.0869140625, 15.82177734375, 16.556640625, 17.29150390625, 18.0263671875, 18.76123046875, 19.49609375, 20.23095703125, 20.9658203125, 21.70068359375, 22.435546875, 23.17041015625, 23.9052734375, 24.64013671875, 25.375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 7.0, 6.0, 8.0, 8.0, 15.0, 20.0, 36.0, 44.0, 63.0, 92.0, 112.0, 179.0, 235.0, 319.0, 521.0, 898.0, 1672.0, 3566.0, 8933.0, 25334.0, 83466.0, 328810.0, 426043.0, 114575.0, 33360.0, 11262.0, 4282.0, 1934.0, 992.0, 545.0, 374.0, 222.0, 179.0, 122.0, 88.0, 58.0, 64.0, 35.0, 26.0, 13.0, 11.0, 4.0, 8.0, 8.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-62.0625, -60.001953125, -57.94140625, -55.880859375, -53.8203125, -51.759765625, -49.69921875, -47.638671875, -45.578125, -43.517578125, -41.45703125, -39.396484375, -37.3359375, -35.275390625, -33.21484375, -31.154296875, -29.09375, -27.033203125, -24.97265625, -22.912109375, -20.8515625, -18.791015625, -16.73046875, -14.669921875, -12.609375, -10.548828125, -8.48828125, -6.427734375, -4.3671875, -2.306640625, -0.24609375, 1.814453125, 3.875, 5.935546875, 7.99609375, 10.056640625, 12.1171875, 14.177734375, 16.23828125, 18.298828125, 20.359375, 22.419921875, 24.48046875, 26.541015625, 28.6015625, 30.662109375, 32.72265625, 34.783203125, 36.84375, 38.904296875, 40.96484375, 43.025390625, 45.0859375, 47.146484375, 49.20703125, 51.267578125, 53.328125, 55.388671875, 57.44921875, 59.509765625, 61.5703125, 63.630859375, 65.69140625, 67.751953125, 69.8125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 8.0, 6.0, 8.0, 11.0, 13.0, 18.0, 22.0, 19.0, 33.0, 21.0, 35.0, 40.0, 37.0, 36.0, 49.0, 52.0, 50.0, 59.0, 60.0, 59.0, 44.0, 42.0, 40.0, 41.0, 35.0, 28.0, 24.0, 11.0, 25.0, 22.0, 11.0, 7.0, 8.0, 9.0, 5.0, 8.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-68.8125, -66.6806640625, -64.548828125, -62.4169921875, -60.28515625, -58.1533203125, -56.021484375, -53.8896484375, -51.7578125, -49.6259765625, -47.494140625, -45.3623046875, -43.23046875, -41.0986328125, -38.966796875, -36.8349609375, -34.703125, -32.5712890625, -30.439453125, -28.3076171875, -26.17578125, -24.0439453125, -21.912109375, -19.7802734375, -17.6484375, -15.5166015625, -13.384765625, -11.2529296875, -9.12109375, -6.9892578125, -4.857421875, -2.7255859375, -0.59375, 1.5380859375, 3.669921875, 5.8017578125, 7.93359375, 10.0654296875, 12.197265625, 14.3291015625, 16.4609375, 18.5927734375, 20.724609375, 22.8564453125, 24.98828125, 27.1201171875, 29.251953125, 31.3837890625, 33.515625, 35.6474609375, 37.779296875, 39.9111328125, 42.04296875, 44.1748046875, 46.306640625, 48.4384765625, 50.5703125, 52.7021484375, 54.833984375, 56.9658203125, 59.09765625, 61.2294921875, 63.361328125, 65.4931640625, 67.625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 8.0, 9.0, 17.0, 25.0, 34.0, 50.0, 104.0, 174.0, 349.0, 742.0, 2026.0, 8144.0, 43827.0, 261641.0, 546005.0, 152831.0, 24955.0, 4902.0, 1434.0, 561.0, 294.0, 169.0, 98.0, 51.0, 37.0, 18.0, 13.0, 13.0, 9.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-31.609375, -30.600830078125, -29.59228515625, -28.583740234375, -27.5751953125, -26.566650390625, -25.55810546875, -24.549560546875, -23.541015625, -22.532470703125, -21.52392578125, -20.515380859375, -19.5068359375, -18.498291015625, -17.48974609375, -16.481201171875, -15.47265625, -14.464111328125, -13.45556640625, -12.447021484375, -11.4384765625, -10.429931640625, -9.42138671875, -8.412841796875, -7.404296875, -6.395751953125, -5.38720703125, -4.378662109375, -3.3701171875, -2.361572265625, -1.35302734375, -0.344482421875, 0.6640625, 1.672607421875, 2.68115234375, 3.689697265625, 4.6982421875, 5.706787109375, 6.71533203125, 7.723876953125, 8.732421875, 9.740966796875, 10.74951171875, 11.758056640625, 12.7666015625, 13.775146484375, 14.78369140625, 15.792236328125, 16.80078125, 17.809326171875, 18.81787109375, 19.826416015625, 20.8349609375, 21.843505859375, 22.85205078125, 23.860595703125, 24.869140625, 25.877685546875, 26.88623046875, 27.894775390625, 28.9033203125, 29.911865234375, 30.92041015625, 31.928955078125, 32.9375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 7.0, 8.0, 17.0, 11.0, 19.0, 23.0, 35.0, 41.0, 65.0, 87.0, 97.0, 93.0, 111.0, 88.0, 52.0, 54.0, 45.0, 36.0, 28.0, 21.0, 19.0, 6.0, 10.0, 12.0, 6.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005023956298828125, -0.0048789381980896, -0.004733920097351074, -0.004588901996612549, -0.0044438838958740234, -0.004298865795135498, -0.004153847694396973, -0.004008829593658447, -0.003863811492919922, -0.0037187933921813965, -0.003573775291442871, -0.0034287571907043457, -0.0032837390899658203, -0.003138720989227295, -0.0029937028884887695, -0.002848684787750244, -0.0027036666870117188, -0.0025586485862731934, -0.002413630485534668, -0.0022686123847961426, -0.002123594284057617, -0.001978576183319092, -0.0018335580825805664, -0.001688539981842041, -0.0015435218811035156, -0.0013985037803649902, -0.0012534856796264648, -0.0011084675788879395, -0.0009634494781494141, -0.0008184313774108887, -0.0006734132766723633, -0.0005283951759338379, -0.0003833770751953125, -0.0002383589744567871, -9.334087371826172e-05, 5.167722702026367e-05, 0.00019669532775878906, 0.00034171342849731445, 0.00048673152923583984, 0.0006317496299743652, 0.0007767677307128906, 0.000921785831451416, 0.0010668039321899414, 0.0012118220329284668, 0.0013568401336669922, 0.0015018582344055176, 0.001646876335144043, 0.0017918944358825684, 0.0019369125366210938, 0.002081930637359619, 0.0022269487380981445, 0.00237196683883667, 0.0025169849395751953, 0.0026620030403137207, 0.002807021141052246, 0.0029520392417907715, 0.003097057342529297, 0.0032420754432678223, 0.0033870935440063477, 0.003532111644744873, 0.0036771297454833984, 0.003822147846221924, 0.003967165946960449, 0.004112184047698975, 0.0042572021484375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 13.0, 14.0, 16.0, 33.0, 54.0, 92.0, 173.0, 249.0, 501.0, 982.0, 2387.0, 7658.0, 36065.0, 194647.0, 529780.0, 221065.0, 41417.0, 8537.0, 2658.0, 1001.0, 493.0, 287.0, 147.0, 104.0, 54.0, 32.0, 31.0, 18.0, 11.0, 12.0, 6.0, 9.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.1875, -33.168212890625, -32.14892578125, -31.129638671875, -30.1103515625, -29.091064453125, -28.07177734375, -27.052490234375, -26.033203125, -25.013916015625, -23.99462890625, -22.975341796875, -21.9560546875, -20.936767578125, -19.91748046875, -18.898193359375, -17.87890625, -16.859619140625, -15.84033203125, -14.821044921875, -13.8017578125, -12.782470703125, -11.76318359375, -10.743896484375, -9.724609375, -8.705322265625, -7.68603515625, -6.666748046875, -5.6474609375, -4.628173828125, -3.60888671875, -2.589599609375, -1.5703125, -0.551025390625, 0.46826171875, 1.487548828125, 2.5068359375, 3.526123046875, 4.54541015625, 5.564697265625, 6.583984375, 7.603271484375, 8.62255859375, 9.641845703125, 10.6611328125, 11.680419921875, 12.69970703125, 13.718994140625, 14.73828125, 15.757568359375, 16.77685546875, 17.796142578125, 18.8154296875, 19.834716796875, 20.85400390625, 21.873291015625, 22.892578125, 23.911865234375, 24.93115234375, 25.950439453125, 26.9697265625, 27.989013671875, 29.00830078125, 30.027587890625, 31.046875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 4.0, 10.0, 10.0, 9.0, 11.0, 25.0, 28.0, 38.0, 35.0, 62.0, 70.0, 79.0, 91.0, 95.0, 82.0, 64.0, 73.0, 51.0, 40.0, 26.0, 28.0, 18.0, 17.0, 13.0, 8.0, 1.0, 4.0, 4.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.71875, -26.935791015625, -26.15283203125, -25.369873046875, -24.5869140625, -23.803955078125, -23.02099609375, -22.238037109375, -21.455078125, -20.672119140625, -19.88916015625, -19.106201171875, -18.3232421875, -17.540283203125, -16.75732421875, -15.974365234375, -15.19140625, -14.408447265625, -13.62548828125, -12.842529296875, -12.0595703125, -11.276611328125, -10.49365234375, -9.710693359375, -8.927734375, -8.144775390625, -7.36181640625, -6.578857421875, -5.7958984375, -5.012939453125, -4.22998046875, -3.447021484375, -2.6640625, -1.881103515625, -1.09814453125, -0.315185546875, 0.4677734375, 1.250732421875, 2.03369140625, 2.816650390625, 3.599609375, 4.382568359375, 5.16552734375, 5.948486328125, 6.7314453125, 7.514404296875, 8.29736328125, 9.080322265625, 9.86328125, 10.646240234375, 11.42919921875, 12.212158203125, 12.9951171875, 13.778076171875, 14.56103515625, 15.343994140625, 16.126953125, 16.909912109375, 17.69287109375, 18.475830078125, 19.2587890625, 20.041748046875, 20.82470703125, 21.607666015625, 22.390625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 6.0, 13.0, 6.0, 21.0, 45.0, 78.0, 89.0, 132.0, 145.0, 124.0, 121.0, 70.0, 62.0, 42.0, 23.0, 10.0, 8.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-862.804931640625, -845.1047973632812, -827.4046630859375, -809.7045288085938, -792.00439453125, -774.3042602539062, -756.6041259765625, -738.904052734375, -721.203857421875, -703.5037231445312, -685.8035888671875, -668.1034545898438, -650.4033203125, -632.7031860351562, -615.0030517578125, -597.302978515625, -579.6028442382812, -561.9027099609375, -544.2025756835938, -526.50244140625, -508.80230712890625, -491.1021728515625, -473.4020690917969, -455.7019348144531, -438.0018005371094, -420.3016662597656, -402.6015319824219, -384.9013977050781, -367.2012939453125, -349.50115966796875, -331.801025390625, -314.10089111328125, -296.40069580078125, -278.7005615234375, -261.00042724609375, -243.30030822753906, -225.6001739501953, -207.90003967285156, -190.19992065429688, -172.49978637695312, -154.79965209960938, -137.09951782226562, -119.3993911743164, -101.69926452636719, -83.99913024902344, -66.29899597167969, -48.59886932373047, -30.89874267578125, -13.1986083984375, 4.501522064208984, 22.20165252685547, 39.90178298950195, 57.60191345214844, 75.30204772949219, 93.0021743774414, 110.70230102539062, 128.40243530273438, 146.10256958007812, 163.80270385742188, 181.50282287597656, 199.2029571533203, 216.90309143066406, 234.60321044921875, 252.3033447265625, 270.00347900390625]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 6.0, 5.0, 12.0, 19.0, 17.0, 20.0, 27.0, 31.0, 37.0, 44.0, 36.0, 56.0, 55.0, 55.0, 67.0, 52.0, 52.0, 50.0, 56.0, 56.0, 53.0, 37.0, 34.0, 26.0, 22.0, 15.0, 17.0, 9.0, 6.0, 11.0, 5.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-460.99365234375, -448.9089660644531, -436.82427978515625, -424.7395935058594, -412.6549072265625, -400.5702209472656, -388.48553466796875, -376.40081787109375, -364.316162109375, -352.2314758300781, -340.14678955078125, -328.0621032714844, -315.9774169921875, -303.8927307128906, -291.80804443359375, -279.72332763671875, -267.6386413574219, -255.553955078125, -243.46926879882812, -231.38458251953125, -219.29989624023438, -207.2152099609375, -195.13050842285156, -183.0458221435547, -170.9611358642578, -158.87644958496094, -146.79176330566406, -134.70706176757812, -122.62238311767578, -110.5376968383789, -98.4530029296875, -86.36831665039062, -74.28363037109375, -62.198944091796875, -50.114253997802734, -38.029563903808594, -25.94487762451172, -13.860191345214844, -1.7754974365234375, 10.309188842773438, 22.393875122070312, 34.47856140136719, 46.56325149536133, 58.64794158935547, 70.73262786865234, 82.81731414794922, 94.90200805664062, 106.9866943359375, 119.07138061523438, 131.15606689453125, 143.24075317382812, 155.325439453125, 167.41012573242188, 179.49481201171875, 191.5795135498047, 203.66419982910156, 215.74888610839844, 227.8335723876953, 239.9182586669922, 252.00296020507812, 264.087646484375, 276.1723327636719, 288.25701904296875, 300.3417053222656, 312.4263916015625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 3.0, 9.0, 19.0, 20.0, 35.0, 42.0, 94.0, 152.0, 220.0, 453.0, 952.0, 2554.0, 8702.0, 58596.0, 4066785.0, 44032.0, 7387.0, 2336.0, 917.0, 407.0, 189.0, 135.0, 87.0, 43.0, 21.0, 24.0, 14.0, 15.0, 5.0, 5.0, 3.0, 8.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-220.75, -213.5, -206.25, -199.0, -191.75, -184.5, -177.25, -170.0, -162.75, -155.5, -148.25, -141.0, -133.75, -126.5, -119.25, -112.0, -104.75, -97.5, -90.25, -83.0, -75.75, -68.5, -61.25, -54.0, -46.75, -39.5, -32.25, -25.0, -17.75, -10.5, -3.25, 4.0, 11.25, 18.5, 25.75, 33.0, 40.25, 47.5, 54.75, 62.0, 69.25, 76.5, 83.75, 91.0, 98.25, 105.5, 112.75, 120.0, 127.25, 134.5, 141.75, 149.0, 156.25, 163.5, 170.75, 178.0, 185.25, 192.5, 199.75, 207.0, 214.25, 221.5, 228.75, 236.0, 243.25]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 4.0, 10.0, 6.0, 7.0, 10.0, 31.0, 20.0, 29.0, 42.0, 36.0, 54.0, 69.0, 63.0, 72.0, 60.0, 61.0, 77.0, 54.0, 58.0, 40.0, 42.0, 32.0, 31.0, 16.0, 17.0, 20.0, 8.0, 12.0, 8.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.359375, -19.64990234375, -18.9404296875, -18.23095703125, -17.521484375, -16.81201171875, -16.1025390625, -15.39306640625, -14.68359375, -13.97412109375, -13.2646484375, -12.55517578125, -11.845703125, -11.13623046875, -10.4267578125, -9.71728515625, -9.0078125, -8.29833984375, -7.5888671875, -6.87939453125, -6.169921875, -5.46044921875, -4.7509765625, -4.04150390625, -3.33203125, -2.62255859375, -1.9130859375, -1.20361328125, -0.494140625, 0.21533203125, 0.9248046875, 1.63427734375, 2.34375, 3.05322265625, 3.7626953125, 4.47216796875, 5.181640625, 5.89111328125, 6.6005859375, 7.31005859375, 8.01953125, 8.72900390625, 9.4384765625, 10.14794921875, 10.857421875, 11.56689453125, 12.2763671875, 12.98583984375, 13.6953125, 14.40478515625, 15.1142578125, 15.82373046875, 16.533203125, 17.24267578125, 17.9521484375, 18.66162109375, 19.37109375, 20.08056640625, 20.7900390625, 21.49951171875, 22.208984375, 22.91845703125, 23.6279296875, 24.33740234375, 25.046875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 6.0, 13.0, 8.0, 18.0, 27.0, 50.0, 103.0, 215.0, 519.0, 1113.0, 2900.0, 8706.0, 43873.0, 3901007.0, 207708.0, 19636.0, 5155.0, 1818.0, 781.0, 321.0, 145.0, 75.0, 38.0, 20.0, 15.0, 10.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-162.375, -158.0771484375, -153.779296875, -149.4814453125, -145.18359375, -140.8857421875, -136.587890625, -132.2900390625, -127.9921875, -123.6943359375, -119.396484375, -115.0986328125, -110.80078125, -106.5029296875, -102.205078125, -97.9072265625, -93.609375, -89.3115234375, -85.013671875, -80.7158203125, -76.41796875, -72.1201171875, -67.822265625, -63.5244140625, -59.2265625, -54.9287109375, -50.630859375, -46.3330078125, -42.03515625, -37.7373046875, -33.439453125, -29.1416015625, -24.84375, -20.5458984375, -16.248046875, -11.9501953125, -7.65234375, -3.3544921875, 0.943359375, 5.2412109375, 9.5390625, 13.8369140625, 18.134765625, 22.4326171875, 26.73046875, 31.0283203125, 35.326171875, 39.6240234375, 43.921875, 48.2197265625, 52.517578125, 56.8154296875, 61.11328125, 65.4111328125, 69.708984375, 74.0068359375, 78.3046875, 82.6025390625, 86.900390625, 91.1982421875, 95.49609375, 99.7939453125, 104.091796875, 108.3896484375, 112.6875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 6.0, 3.0, 8.0, 8.0, 7.0, 20.0, 20.0, 26.0, 43.0, 100.0, 177.0, 2657.0, 599.0, 150.0, 88.0, 53.0, 27.0, 27.0, 12.0, 10.0, 4.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.359375, -16.9130859375, -16.466796875, -16.0205078125, -15.57421875, -15.1279296875, -14.681640625, -14.2353515625, -13.7890625, -13.3427734375, -12.896484375, -12.4501953125, -12.00390625, -11.5576171875, -11.111328125, -10.6650390625, -10.21875, -9.7724609375, -9.326171875, -8.8798828125, -8.43359375, -7.9873046875, -7.541015625, -7.0947265625, -6.6484375, -6.2021484375, -5.755859375, -5.3095703125, -4.86328125, -4.4169921875, -3.970703125, -3.5244140625, -3.078125, -2.6318359375, -2.185546875, -1.7392578125, -1.29296875, -0.8466796875, -0.400390625, 0.0458984375, 0.4921875, 0.9384765625, 1.384765625, 1.8310546875, 2.27734375, 2.7236328125, 3.169921875, 3.6162109375, 4.0625, 4.5087890625, 4.955078125, 5.4013671875, 5.84765625, 6.2939453125, 6.740234375, 7.1865234375, 7.6328125, 8.0791015625, 8.525390625, 8.9716796875, 9.41796875, 9.8642578125, 10.310546875, 10.7568359375, 11.203125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 12.0, 4.0, 9.0, 19.0, 13.0, 42.0, 51.0, 57.0, 70.0, 82.0, 88.0, 86.0, 91.0, 88.0, 73.0, 70.0, 39.0, 36.0, 23.0, 10.0, 9.0, 7.0, 9.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-87.95367431640625, -85.9128646850586, -83.87205505371094, -81.83124542236328, -79.79043579101562, -77.74961853027344, -75.70880889892578, -73.66799926757812, -71.62718963623047, -69.58638000488281, -67.54557037353516, -65.5047607421875, -63.46394729614258, -61.42313766479492, -59.38232421875, -57.341514587402344, -55.30070495605469, -53.25989532470703, -51.219085693359375, -49.17827224731445, -47.1374626159668, -45.09665298461914, -43.05583953857422, -41.01502990722656, -38.974220275878906, -36.93341064453125, -34.892601013183594, -32.85178756713867, -30.810977935791016, -28.77016830444336, -26.72935676574707, -24.68854522705078, -22.647735595703125, -20.60692596435547, -18.56611442565918, -16.52530288696289, -14.484493255615234, -12.443682670593262, -10.402872085571289, -8.362061500549316, -6.321250915527344, -4.280440330505371, -2.2396297454833984, -0.19881916046142578, 1.8419914245605469, 3.8828020095825195, 5.923612594604492, 7.964423179626465, 10.005233764648438, 12.04604434967041, 14.086854934692383, 16.127666473388672, 18.168476104736328, 20.209285736083984, 22.250097274780273, 24.290908813476562, 26.33171844482422, 28.372528076171875, 30.413339614868164, 32.45415115356445, 34.49496078491211, 36.535770416259766, 38.57658386230469, 40.617393493652344, 42.658203125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 9.0, 11.0, 13.0, 13.0, 16.0, 23.0, 22.0, 26.0, 31.0, 26.0, 39.0, 37.0, 45.0, 40.0, 44.0, 43.0, 33.0, 33.0, 47.0, 38.0, 36.0, 34.0, 43.0, 40.0, 25.0, 29.0, 25.0, 27.0, 22.0, 17.0, 13.0, 10.0, 14.0, 14.0, 7.0, 7.0, 7.0, 11.0, 3.0, 3.0, 1.0, 8.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-34.16252899169922, -33.09475326538086, -32.0269775390625, -30.95920181274414, -29.89142608642578, -28.823650360107422, -27.75587272644043, -26.68809700012207, -25.62032127380371, -24.55254554748535, -23.484769821166992, -22.416994094848633, -21.34921646118164, -20.28144073486328, -19.213665008544922, -18.145889282226562, -17.078113555908203, -16.010337829589844, -14.942562103271484, -13.874785423278809, -12.80700969696045, -11.73923397064209, -10.671457290649414, -9.603681564331055, -8.535905838012695, -7.468130111694336, -6.400353908538818, -5.332577705383301, -4.264801979064941, -3.197026252746582, -2.1292500495910645, -1.0614738464355469, 0.0063018798828125, 1.074077844619751, 2.1418538093566895, 3.209629774093628, 4.277405738830566, 5.345181465148926, 6.412957668304443, 7.480733871459961, 8.54850959777832, 9.61628532409668, 10.684061050415039, 11.751837730407715, 12.819613456726074, 13.887389183044434, 14.95516586303711, 16.02294158935547, 17.090717315673828, 18.158493041992188, 19.226268768310547, 20.294044494628906, 21.361820220947266, 22.429595947265625, 23.497373580932617, 24.565149307250977, 25.632925033569336, 26.700700759887695, 27.768476486206055, 28.836252212524414, 29.904029846191406, 30.971805572509766, 32.039581298828125, 33.107357025146484, 34.175132751464844]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 6.0, 13.0, 10.0, 24.0, 34.0, 39.0, 44.0, 58.0, 118.0, 176.0, 265.0, 430.0, 680.0, 1137.0, 2198.0, 4648.0, 10888.0, 27319.0, 72210.0, 197389.0, 367353.0, 225728.0, 83004.0, 31511.0, 12307.0, 5325.0, 2413.0, 1270.0, 665.0, 429.0, 270.0, 183.0, 125.0, 78.0, 57.0, 46.0, 30.0, 21.0, 13.0, 12.0, 8.0, 3.0, 5.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-60.09375, -58.3037109375, -56.513671875, -54.7236328125, -52.93359375, -51.1435546875, -49.353515625, -47.5634765625, -45.7734375, -43.9833984375, -42.193359375, -40.4033203125, -38.61328125, -36.8232421875, -35.033203125, -33.2431640625, -31.453125, -29.6630859375, -27.873046875, -26.0830078125, -24.29296875, -22.5029296875, -20.712890625, -18.9228515625, -17.1328125, -15.3427734375, -13.552734375, -11.7626953125, -9.97265625, -8.1826171875, -6.392578125, -4.6025390625, -2.8125, -1.0224609375, 0.767578125, 2.5576171875, 4.34765625, 6.1376953125, 7.927734375, 9.7177734375, 11.5078125, 13.2978515625, 15.087890625, 16.8779296875, 18.66796875, 20.4580078125, 22.248046875, 24.0380859375, 25.828125, 27.6181640625, 29.408203125, 31.1982421875, 32.98828125, 34.7783203125, 36.568359375, 38.3583984375, 40.1484375, 41.9384765625, 43.728515625, 45.5185546875, 47.30859375, 49.0986328125, 50.888671875, 52.6787109375, 54.46875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 4.0, 5.0, 7.0, 11.0, 14.0, 11.0, 22.0, 30.0, 40.0, 40.0, 47.0, 46.0, 49.0, 62.0, 81.0, 52.0, 64.0, 76.0, 52.0, 50.0, 39.0, 42.0, 24.0, 35.0, 26.0, 18.0, 16.0, 9.0, 9.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.9375, -20.229248046875, -19.52099609375, -18.812744140625, -18.1044921875, -17.396240234375, -16.68798828125, -15.979736328125, -15.271484375, -14.563232421875, -13.85498046875, -13.146728515625, -12.4384765625, -11.730224609375, -11.02197265625, -10.313720703125, -9.60546875, -8.897216796875, -8.18896484375, -7.480712890625, -6.7724609375, -6.064208984375, -5.35595703125, -4.647705078125, -3.939453125, -3.231201171875, -2.52294921875, -1.814697265625, -1.1064453125, -0.398193359375, 0.31005859375, 1.018310546875, 1.7265625, 2.434814453125, 3.14306640625, 3.851318359375, 4.5595703125, 5.267822265625, 5.97607421875, 6.684326171875, 7.392578125, 8.100830078125, 8.80908203125, 9.517333984375, 10.2255859375, 10.933837890625, 11.64208984375, 12.350341796875, 13.05859375, 13.766845703125, 14.47509765625, 15.183349609375, 15.8916015625, 16.599853515625, 17.30810546875, 18.016357421875, 18.724609375, 19.432861328125, 20.14111328125, 20.849365234375, 21.5576171875, 22.265869140625, 22.97412109375, 23.682373046875, 24.390625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 2.0, 2.0, 11.0, 9.0, 12.0, 26.0, 35.0, 65.0, 80.0, 168.0, 246.0, 403.0, 723.0, 1325.0, 3873.0, 21812.0, 213083.0, 697701.0, 92719.0, 11213.0, 2508.0, 1048.0, 567.0, 350.0, 195.0, 126.0, 87.0, 62.0, 40.0, 16.0, 16.0, 10.0, 4.0, 7.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-113.3125, -110.01171875, -106.7109375, -103.41015625, -100.109375, -96.80859375, -93.5078125, -90.20703125, -86.90625, -83.60546875, -80.3046875, -77.00390625, -73.703125, -70.40234375, -67.1015625, -63.80078125, -60.5, -57.19921875, -53.8984375, -50.59765625, -47.296875, -43.99609375, -40.6953125, -37.39453125, -34.09375, -30.79296875, -27.4921875, -24.19140625, -20.890625, -17.58984375, -14.2890625, -10.98828125, -7.6875, -4.38671875, -1.0859375, 2.21484375, 5.515625, 8.81640625, 12.1171875, 15.41796875, 18.71875, 22.01953125, 25.3203125, 28.62109375, 31.921875, 35.22265625, 38.5234375, 41.82421875, 45.125, 48.42578125, 51.7265625, 55.02734375, 58.328125, 61.62890625, 64.9296875, 68.23046875, 71.53125, 74.83203125, 78.1328125, 81.43359375, 84.734375, 88.03515625, 91.3359375, 94.63671875, 97.9375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 5.0, 12.0, 5.0, 16.0, 10.0, 13.0, 19.0, 23.0, 33.0, 22.0, 32.0, 33.0, 34.0, 32.0, 41.0, 37.0, 42.0, 40.0, 46.0, 47.0, 42.0, 46.0, 53.0, 31.0, 48.0, 29.0, 22.0, 28.0, 22.0, 18.0, 25.0, 16.0, 11.0, 7.0, 13.0, 10.0, 7.0, 6.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.4375, -62.23046875, -60.0234375, -57.81640625, -55.609375, -53.40234375, -51.1953125, -48.98828125, -46.78125, -44.57421875, -42.3671875, -40.16015625, -37.953125, -35.74609375, -33.5390625, -31.33203125, -29.125, -26.91796875, -24.7109375, -22.50390625, -20.296875, -18.08984375, -15.8828125, -13.67578125, -11.46875, -9.26171875, -7.0546875, -4.84765625, -2.640625, -0.43359375, 1.7734375, 3.98046875, 6.1875, 8.39453125, 10.6015625, 12.80859375, 15.015625, 17.22265625, 19.4296875, 21.63671875, 23.84375, 26.05078125, 28.2578125, 30.46484375, 32.671875, 34.87890625, 37.0859375, 39.29296875, 41.5, 43.70703125, 45.9140625, 48.12109375, 50.328125, 52.53515625, 54.7421875, 56.94921875, 59.15625, 61.36328125, 63.5703125, 65.77734375, 67.984375, 70.19140625, 72.3984375, 74.60546875, 76.8125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 0.0, 5.0, 6.0, 7.0, 14.0, 13.0, 17.0, 27.0, 43.0, 58.0, 64.0, 102.0, 171.0, 256.0, 483.0, 852.0, 1675.0, 3644.0, 8717.0, 22809.0, 74167.0, 291430.0, 454634.0, 130355.0, 36271.0, 12627.0, 5143.0, 2313.0, 1130.0, 570.0, 325.0, 214.0, 130.0, 85.0, 55.0, 47.0, 21.0, 17.0, 14.0, 14.0, 10.0, 11.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.8125, -21.065673828125, -20.31884765625, -19.572021484375, -18.8251953125, -18.078369140625, -17.33154296875, -16.584716796875, -15.837890625, -15.091064453125, -14.34423828125, -13.597412109375, -12.8505859375, -12.103759765625, -11.35693359375, -10.610107421875, -9.86328125, -9.116455078125, -8.36962890625, -7.622802734375, -6.8759765625, -6.129150390625, -5.38232421875, -4.635498046875, -3.888671875, -3.141845703125, -2.39501953125, -1.648193359375, -0.9013671875, -0.154541015625, 0.59228515625, 1.339111328125, 2.0859375, 2.832763671875, 3.57958984375, 4.326416015625, 5.0732421875, 5.820068359375, 6.56689453125, 7.313720703125, 8.060546875, 8.807373046875, 9.55419921875, 10.301025390625, 11.0478515625, 11.794677734375, 12.54150390625, 13.288330078125, 14.03515625, 14.781982421875, 15.52880859375, 16.275634765625, 17.0224609375, 17.769287109375, 18.51611328125, 19.262939453125, 20.009765625, 20.756591796875, 21.50341796875, 22.250244140625, 22.9970703125, 23.743896484375, 24.49072265625, 25.237548828125, 25.984375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 7.0, 7.0, 10.0, 12.0, 14.0, 22.0, 19.0, 30.0, 34.0, 50.0, 48.0, 74.0, 73.0, 82.0, 80.0, 73.0, 76.0, 62.0, 37.0, 36.0, 27.0, 34.0, 14.0, 20.0, 8.0, 8.0, 10.0, 8.0, 5.0, 2.0, 1.0, 6.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0038967132568359375, -0.0037879645824432373, -0.003679215908050537, -0.003570467233657837, -0.0034617185592651367, -0.0033529698848724365, -0.0032442212104797363, -0.003135472536087036, -0.003026723861694336, -0.0029179751873016357, -0.0028092265129089355, -0.0027004778385162354, -0.002591729164123535, -0.002482980489730835, -0.0023742318153381348, -0.0022654831409454346, -0.0021567344665527344, -0.002047985792160034, -0.001939237117767334, -0.0018304884433746338, -0.0017217397689819336, -0.0016129910945892334, -0.0015042424201965332, -0.001395493745803833, -0.0012867450714111328, -0.0011779963970184326, -0.0010692477226257324, -0.0009604990482330322, -0.000851750373840332, -0.0007430016994476318, -0.0006342530250549316, -0.0005255043506622314, -0.00041675567626953125, -0.00030800700187683105, -0.00019925832748413086, -9.050965309143066e-05, 1.823902130126953e-05, 0.00012698769569396973, 0.00023573637008666992, 0.0003444850444793701, 0.0004532337188720703, 0.0005619823932647705, 0.0006707310676574707, 0.0007794797420501709, 0.0008882284164428711, 0.0009969770908355713, 0.0011057257652282715, 0.0012144744396209717, 0.0013232231140136719, 0.001431971788406372, 0.0015407204627990723, 0.0016494691371917725, 0.0017582178115844727, 0.0018669664859771729, 0.001975715160369873, 0.0020844638347625732, 0.0021932125091552734, 0.0023019611835479736, 0.002410709857940674, 0.002519458532333374, 0.0026282072067260742, 0.0027369558811187744, 0.0028457045555114746, 0.002954453229904175, 0.003063201904296875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 7.0, 22.0, 34.0, 41.0, 60.0, 119.0, 200.0, 422.0, 1075.0, 4072.0, 25106.0, 385583.0, 587790.0, 36429.0, 5204.0, 1378.0, 511.0, 207.0, 114.0, 59.0, 31.0, 30.0, 18.0, 10.0, 13.0, 5.0, 5.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.0625, -57.37890625, -55.6953125, -54.01171875, -52.328125, -50.64453125, -48.9609375, -47.27734375, -45.59375, -43.91015625, -42.2265625, -40.54296875, -38.859375, -37.17578125, -35.4921875, -33.80859375, -32.125, -30.44140625, -28.7578125, -27.07421875, -25.390625, -23.70703125, -22.0234375, -20.33984375, -18.65625, -16.97265625, -15.2890625, -13.60546875, -11.921875, -10.23828125, -8.5546875, -6.87109375, -5.1875, -3.50390625, -1.8203125, -0.13671875, 1.546875, 3.23046875, 4.9140625, 6.59765625, 8.28125, 9.96484375, 11.6484375, 13.33203125, 15.015625, 16.69921875, 18.3828125, 20.06640625, 21.75, 23.43359375, 25.1171875, 26.80078125, 28.484375, 30.16796875, 31.8515625, 33.53515625, 35.21875, 36.90234375, 38.5859375, 40.26953125, 41.953125, 43.63671875, 45.3203125, 47.00390625, 48.6875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 11.0, 10.0, 20.0, 35.0, 48.0, 61.0, 80.0, 130.0, 132.0, 146.0, 101.0, 90.0, 38.0, 39.0, 21.0, 7.0, 14.0, 4.0, 4.0, 5.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.21875, -50.93603515625, -49.6533203125, -48.37060546875, -47.087890625, -45.80517578125, -44.5224609375, -43.23974609375, -41.95703125, -40.67431640625, -39.3916015625, -38.10888671875, -36.826171875, -35.54345703125, -34.2607421875, -32.97802734375, -31.6953125, -30.41259765625, -29.1298828125, -27.84716796875, -26.564453125, -25.28173828125, -23.9990234375, -22.71630859375, -21.43359375, -20.15087890625, -18.8681640625, -17.58544921875, -16.302734375, -15.02001953125, -13.7373046875, -12.45458984375, -11.171875, -9.88916015625, -8.6064453125, -7.32373046875, -6.041015625, -4.75830078125, -3.4755859375, -2.19287109375, -0.91015625, 0.37255859375, 1.6552734375, 2.93798828125, 4.220703125, 5.50341796875, 6.7861328125, 8.06884765625, 9.3515625, 10.63427734375, 11.9169921875, 13.19970703125, 14.482421875, 15.76513671875, 17.0478515625, 18.33056640625, 19.61328125, 20.89599609375, 22.1787109375, 23.46142578125, 24.744140625, 26.02685546875, 27.3095703125, 28.59228515625, 29.875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 10.0, 27.0, 47.0, 68.0, 110.0, 169.0, 162.0, 133.0, 100.0, 77.0, 48.0, 23.0, 14.0, 4.0, 6.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-349.2296142578125, -328.0545654296875, -306.8795166015625, -285.7044982910156, -264.5294494628906, -243.35440063476562, -222.1793670654297, -201.00433349609375, -179.82928466796875, -158.65423583984375, -137.4792022705078, -116.30416107177734, -95.12911987304688, -73.9540786743164, -52.77903747558594, -31.60400390625, -10.428955078125, 10.746086120605469, 31.921127319335938, 53.096168518066406, 74.27120971679688, 95.44625091552734, 116.62129211425781, 137.79632568359375, 158.97137451171875, 180.14642333984375, 201.3214569091797, 222.49649047851562, 243.67153930664062, 264.8465881347656, 286.0216064453125, 307.1966552734375, 328.3717041015625, 349.5467529296875, 370.7218017578125, 391.8968200683594, 413.0718688964844, 434.2469177246094, 455.42193603515625, 476.59698486328125, 497.77203369140625, 518.9470825195312, 540.1221313476562, 561.2971801757812, 582.47216796875, 603.647216796875, 624.822265625, 645.997314453125, 667.17236328125, 688.347412109375, 709.5224609375, 730.697509765625, 751.87255859375, 773.0475463867188, 794.2225952148438, 815.3976440429688, 836.5726928710938, 857.7477416992188, 878.9227905273438, 900.0978393554688, 921.2728271484375, 942.4478759765625, 963.6229248046875, 984.7979736328125, 1005.9730224609375]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 0.0, 3.0, 4.0, 4.0, 6.0, 5.0, 10.0, 8.0, 10.0, 9.0, 24.0, 12.0, 33.0, 22.0, 26.0, 32.0, 32.0, 21.0, 35.0, 42.0, 47.0, 42.0, 50.0, 43.0, 43.0, 38.0, 39.0, 26.0, 42.0, 42.0, 43.0, 34.0, 32.0, 19.0, 24.0, 23.0, 16.0, 10.0, 9.0, 9.0, 7.0, 6.0, 4.0, 8.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-333.5670166015625, -322.6954345703125, -311.8238525390625, -300.9522705078125, -290.0806884765625, -279.2091064453125, -268.3375244140625, -257.4659423828125, -246.5943603515625, -235.7227783203125, -224.8511962890625, -213.9796142578125, -203.1080322265625, -192.2364501953125, -181.3648681640625, -170.4932861328125, -159.6217041015625, -148.7501220703125, -137.8785400390625, -127.0069580078125, -116.1353759765625, -105.2637939453125, -94.3922119140625, -83.5206298828125, -72.6490478515625, -61.7774658203125, -50.9058837890625, -40.0343017578125, -29.1627197265625, -18.2911376953125, -7.4195556640625, 3.4520263671875, 14.3236083984375, 25.1951904296875, 36.0667724609375, 46.9383544921875, 57.8099365234375, 68.6815185546875, 79.5531005859375, 90.4246826171875, 101.2962646484375, 112.1678466796875, 123.0394287109375, 133.9110107421875, 144.7825927734375, 155.6541748046875, 166.5257568359375, 177.3973388671875, 188.2689208984375, 199.1405029296875, 210.0120849609375, 220.8836669921875, 231.7552490234375, 242.6268310546875, 253.4984130859375, 264.3699951171875, 275.2415771484375, 286.1131591796875, 296.9847412109375, 307.8563232421875, 318.7279052734375, 329.5994873046875, 340.4710693359375, 351.3426513671875, 362.2142333984375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 7.0, 7.0, 14.0, 23.0, 24.0, 47.0, 85.0, 123.0, 200.0, 359.0, 725.0, 1604.0, 4013.0, 13559.0, 87485.0, 3984518.0, 81205.0, 13106.0, 3961.0, 1565.0, 696.0, 363.0, 229.0, 132.0, 68.0, 51.0, 32.0, 12.0, 21.0, 14.0, 7.0, 4.0, 6.0, 6.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.0, -132.015625, -127.03125, -122.046875, -117.0625, -112.078125, -107.09375, -102.109375, -97.125, -92.140625, -87.15625, -82.171875, -77.1875, -72.203125, -67.21875, -62.234375, -57.25, -52.265625, -47.28125, -42.296875, -37.3125, -32.328125, -27.34375, -22.359375, -17.375, -12.390625, -7.40625, -2.421875, 2.5625, 7.546875, 12.53125, 17.515625, 22.5, 27.484375, 32.46875, 37.453125, 42.4375, 47.421875, 52.40625, 57.390625, 62.375, 67.359375, 72.34375, 77.328125, 82.3125, 87.296875, 92.28125, 97.265625, 102.25, 107.234375, 112.21875, 117.203125, 122.1875, 127.171875, 132.15625, 137.140625, 142.125, 147.109375, 152.09375, 157.078125, 162.0625, 167.046875, 172.03125, 177.015625, 182.0]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 3.0, 5.0, 5.0, 11.0, 11.0, 20.0, 19.0, 26.0, 37.0, 23.0, 39.0, 55.0, 44.0, 53.0, 66.0, 70.0, 65.0, 75.0, 59.0, 59.0, 53.0, 31.0, 33.0, 38.0, 34.0, 13.0, 18.0, 7.0, 5.0, 9.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-21.3125, -20.600341796875, -19.88818359375, -19.176025390625, -18.4638671875, -17.751708984375, -17.03955078125, -16.327392578125, -15.615234375, -14.903076171875, -14.19091796875, -13.478759765625, -12.7666015625, -12.054443359375, -11.34228515625, -10.630126953125, -9.91796875, -9.205810546875, -8.49365234375, -7.781494140625, -7.0693359375, -6.357177734375, -5.64501953125, -4.932861328125, -4.220703125, -3.508544921875, -2.79638671875, -2.084228515625, -1.3720703125, -0.659912109375, 0.05224609375, 0.764404296875, 1.4765625, 2.188720703125, 2.90087890625, 3.613037109375, 4.3251953125, 5.037353515625, 5.74951171875, 6.461669921875, 7.173828125, 7.885986328125, 8.59814453125, 9.310302734375, 10.0224609375, 10.734619140625, 11.44677734375, 12.158935546875, 12.87109375, 13.583251953125, 14.29541015625, 15.007568359375, 15.7197265625, 16.431884765625, 17.14404296875, 17.856201171875, 18.568359375, 19.280517578125, 19.99267578125, 20.704833984375, 21.4169921875, 22.129150390625, 22.84130859375, 23.553466796875, 24.265625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 10.0, 11.0, 12.0, 11.0, 20.0, 20.0, 48.0, 70.0, 99.0, 142.0, 228.0, 394.0, 651.0, 1264.0, 2619.0, 5856.0, 16034.0, 55093.0, 508501.0, 3491311.0, 77198.0, 20740.0, 7470.0, 3093.0, 1449.0, 818.0, 401.0, 263.0, 159.0, 102.0, 56.0, 34.0, 29.0, 19.0, 20.0, 5.0, 8.0, 7.0, 9.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.0, -70.4033203125, -67.806640625, -65.2099609375, -62.61328125, -60.0166015625, -57.419921875, -54.8232421875, -52.2265625, -49.6298828125, -47.033203125, -44.4365234375, -41.83984375, -39.2431640625, -36.646484375, -34.0498046875, -31.453125, -28.8564453125, -26.259765625, -23.6630859375, -21.06640625, -18.4697265625, -15.873046875, -13.2763671875, -10.6796875, -8.0830078125, -5.486328125, -2.8896484375, -0.29296875, 2.3037109375, 4.900390625, 7.4970703125, 10.09375, 12.6904296875, 15.287109375, 17.8837890625, 20.48046875, 23.0771484375, 25.673828125, 28.2705078125, 30.8671875, 33.4638671875, 36.060546875, 38.6572265625, 41.25390625, 43.8505859375, 46.447265625, 49.0439453125, 51.640625, 54.2373046875, 56.833984375, 59.4306640625, 62.02734375, 64.6240234375, 67.220703125, 69.8173828125, 72.4140625, 75.0107421875, 77.607421875, 80.2041015625, 82.80078125, 85.3974609375, 87.994140625, 90.5908203125, 93.1875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 6.0, 8.0, 6.0, 10.0, 14.0, 14.0, 32.0, 41.0, 76.0, 97.0, 230.0, 2551.0, 556.0, 166.0, 89.0, 42.0, 36.0, 28.0, 25.0, 13.0, 16.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0078125, -11.4805908203125, -10.953369140625, -10.4261474609375, -9.89892578125, -9.3717041015625, -8.844482421875, -8.3172607421875, -7.7900390625, -7.2628173828125, -6.735595703125, -6.2083740234375, -5.68115234375, -5.1539306640625, -4.626708984375, -4.0994873046875, -3.572265625, -3.0450439453125, -2.517822265625, -1.9906005859375, -1.46337890625, -0.9361572265625, -0.408935546875, 0.1182861328125, 0.6455078125, 1.1727294921875, 1.699951171875, 2.2271728515625, 2.75439453125, 3.2816162109375, 3.808837890625, 4.3360595703125, 4.86328125, 5.3905029296875, 5.917724609375, 6.4449462890625, 6.97216796875, 7.4993896484375, 8.026611328125, 8.5538330078125, 9.0810546875, 9.6082763671875, 10.135498046875, 10.6627197265625, 11.18994140625, 11.7171630859375, 12.244384765625, 12.7716064453125, 13.298828125, 13.8260498046875, 14.353271484375, 14.8804931640625, 15.40771484375, 15.9349365234375, 16.462158203125, 16.9893798828125, 17.5166015625, 18.0438232421875, 18.571044921875, 19.0982666015625, 19.62548828125, 20.1527099609375, 20.679931640625, 21.2071533203125, 21.734375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 7.0, 15.0, 33.0, 33.0, 81.0, 99.0, 131.0, 158.0, 122.0, 109.0, 84.0, 46.0, 34.0, 19.0, 9.0, 11.0, 7.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.72802734375, -83.01950073242188, -79.31096649169922, -75.6024398803711, -71.89390563964844, -68.18537902832031, -64.47685241699219, -60.7683219909668, -57.059791564941406, -53.351261138916016, -49.642730712890625, -45.9342041015625, -42.22567367553711, -38.51714324951172, -34.808616638183594, -31.100086212158203, -27.391555786132812, -23.683025360107422, -19.974496841430664, -16.265968322753906, -12.557437896728516, -8.848907470703125, -5.140378952026367, -1.4318504333496094, 2.2766799926757812, 5.9852094650268555, 9.69373893737793, 13.402268409729004, 17.110797882080078, 20.81932830810547, 24.527856826782227, 28.236385345458984, 31.944915771484375, 35.653446197509766, 39.361976623535156, 43.07050323486328, 46.77903366088867, 50.48756408691406, 54.19609069824219, 57.90462112426758, 61.61315155029297, 65.3216781616211, 69.03021240234375, 72.73873901367188, 76.447265625, 80.15579986572266, 83.86432647705078, 87.57286071777344, 91.28138732910156, 94.98991394042969, 98.69844818115234, 102.40697479248047, 106.11550903320312, 109.82403564453125, 113.53256225585938, 117.2410888671875, 120.94962310791016, 124.65814971923828, 128.36668395996094, 132.07521057128906, 135.7837371826172, 139.49227905273438, 143.2008056640625, 146.90933227539062, 150.61785888671875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 11.0, 16.0, 6.0, 7.0, 11.0, 22.0, 18.0, 23.0, 26.0, 24.0, 29.0, 26.0, 41.0, 27.0, 25.0, 35.0, 47.0, 45.0, 33.0, 38.0, 60.0, 44.0, 34.0, 33.0, 34.0, 29.0, 32.0, 24.0, 27.0, 21.0, 17.0, 15.0, 21.0, 23.0, 16.0, 9.0, 7.0, 5.0, 7.0, 5.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-44.682899475097656, -43.43684768676758, -42.190792083740234, -40.944740295410156, -39.69868850708008, -38.45263671875, -37.206581115722656, -35.96052932739258, -34.7144775390625, -33.46842575073242, -32.22237014770508, -30.976318359375, -29.730266571044922, -28.48421287536621, -27.2381591796875, -25.992107391357422, -24.74605369567871, -23.5, -22.253948211669922, -21.00789451599121, -19.761842727661133, -18.515789031982422, -17.269737243652344, -16.023683547973633, -14.777630805969238, -13.531578063964844, -12.28552532196045, -11.039472579956055, -9.793418884277344, -8.547367095947266, -7.301313400268555, -6.05526065826416, -4.809207916259766, -3.563155174255371, -2.3171021938323975, -1.0710492134094238, 0.1750035285949707, 1.4210562705993652, 2.667109489440918, 3.9131622314453125, 5.159214973449707, 6.405267715454102, 7.651320457458496, 8.89737319946289, 10.143426895141602, 11.38947868347168, 12.63553237915039, 13.881585121154785, 15.12763786315918, 16.37369155883789, 17.61974334716797, 18.86579704284668, 20.111848831176758, 21.35790252685547, 22.603954315185547, 23.850008010864258, 25.09606170654297, 26.34211540222168, 27.588167190551758, 28.83422088623047, 30.080272674560547, 31.326326370239258, 32.57238006591797, 33.81843185424805, 35.064483642578125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 5.0, 13.0, 24.0, 19.0, 18.0, 54.0, 81.0, 111.0, 192.0, 298.0, 601.0, 1187.0, 2622.0, 5884.0, 16027.0, 47227.0, 148620.0, 367751.0, 299356.0, 104417.0, 33644.0, 11794.0, 4521.0, 1835.0, 986.0, 481.0, 271.0, 186.0, 107.0, 73.0, 39.0, 36.0, 20.0, 17.0, 12.0, 8.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.4375, -49.822265625, -48.20703125, -46.591796875, -44.9765625, -43.361328125, -41.74609375, -40.130859375, -38.515625, -36.900390625, -35.28515625, -33.669921875, -32.0546875, -30.439453125, -28.82421875, -27.208984375, -25.59375, -23.978515625, -22.36328125, -20.748046875, -19.1328125, -17.517578125, -15.90234375, -14.287109375, -12.671875, -11.056640625, -9.44140625, -7.826171875, -6.2109375, -4.595703125, -2.98046875, -1.365234375, 0.25, 1.865234375, 3.48046875, 5.095703125, 6.7109375, 8.326171875, 9.94140625, 11.556640625, 13.171875, 14.787109375, 16.40234375, 18.017578125, 19.6328125, 21.248046875, 22.86328125, 24.478515625, 26.09375, 27.708984375, 29.32421875, 30.939453125, 32.5546875, 34.169921875, 35.78515625, 37.400390625, 39.015625, 40.630859375, 42.24609375, 43.861328125, 45.4765625, 47.091796875, 48.70703125, 50.322265625, 51.9375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 6.0, 6.0, 14.0, 21.0, 29.0, 24.0, 21.0, 24.0, 35.0, 48.0, 50.0, 47.0, 58.0, 67.0, 41.0, 67.0, 57.0, 57.0, 61.0, 49.0, 36.0, 41.0, 34.0, 26.0, 20.0, 11.0, 11.0, 9.0, 9.0, 3.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-22.421875, -21.691650390625, -20.96142578125, -20.231201171875, -19.5009765625, -18.770751953125, -18.04052734375, -17.310302734375, -16.580078125, -15.849853515625, -15.11962890625, -14.389404296875, -13.6591796875, -12.928955078125, -12.19873046875, -11.468505859375, -10.73828125, -10.008056640625, -9.27783203125, -8.547607421875, -7.8173828125, -7.087158203125, -6.35693359375, -5.626708984375, -4.896484375, -4.166259765625, -3.43603515625, -2.705810546875, -1.9755859375, -1.245361328125, -0.51513671875, 0.215087890625, 0.9453125, 1.675537109375, 2.40576171875, 3.135986328125, 3.8662109375, 4.596435546875, 5.32666015625, 6.056884765625, 6.787109375, 7.517333984375, 8.24755859375, 8.977783203125, 9.7080078125, 10.438232421875, 11.16845703125, 11.898681640625, 12.62890625, 13.359130859375, 14.08935546875, 14.819580078125, 15.5498046875, 16.280029296875, 17.01025390625, 17.740478515625, 18.470703125, 19.200927734375, 19.93115234375, 20.661376953125, 21.3916015625, 22.121826171875, 22.85205078125, 23.582275390625, 24.3125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 10.0, 14.0, 33.0, 52.0, 102.0, 205.0, 445.0, 873.0, 2228.0, 15214.0, 672271.0, 344929.0, 8897.0, 1811.0, 760.0, 350.0, 206.0, 84.0, 34.0, 20.0, 10.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.0, -142.083984375, -137.16796875, -132.251953125, -127.3359375, -122.419921875, -117.50390625, -112.587890625, -107.671875, -102.755859375, -97.83984375, -92.923828125, -88.0078125, -83.091796875, -78.17578125, -73.259765625, -68.34375, -63.427734375, -58.51171875, -53.595703125, -48.6796875, -43.763671875, -38.84765625, -33.931640625, -29.015625, -24.099609375, -19.18359375, -14.267578125, -9.3515625, -4.435546875, 0.48046875, 5.396484375, 10.3125, 15.228515625, 20.14453125, 25.060546875, 29.9765625, 34.892578125, 39.80859375, 44.724609375, 49.640625, 54.556640625, 59.47265625, 64.388671875, 69.3046875, 74.220703125, 79.13671875, 84.052734375, 88.96875, 93.884765625, 98.80078125, 103.716796875, 108.6328125, 113.548828125, 118.46484375, 123.380859375, 128.296875, 133.212890625, 138.12890625, 143.044921875, 147.9609375, 152.876953125, 157.79296875, 162.708984375, 167.625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 3.0, 0.0, 11.0, 10.0, 12.0, 9.0, 22.0, 16.0, 14.0, 34.0, 25.0, 32.0, 31.0, 40.0, 38.0, 44.0, 48.0, 40.0, 39.0, 62.0, 51.0, 37.0, 61.0, 38.0, 38.0, 34.0, 29.0, 37.0, 33.0, 18.0, 19.0, 9.0, 5.0, 11.0, 11.0, 7.0, 5.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-80.0, -77.3701171875, -74.740234375, -72.1103515625, -69.48046875, -66.8505859375, -64.220703125, -61.5908203125, -58.9609375, -56.3310546875, -53.701171875, -51.0712890625, -48.44140625, -45.8115234375, -43.181640625, -40.5517578125, -37.921875, -35.2919921875, -32.662109375, -30.0322265625, -27.40234375, -24.7724609375, -22.142578125, -19.5126953125, -16.8828125, -14.2529296875, -11.623046875, -8.9931640625, -6.36328125, -3.7333984375, -1.103515625, 1.5263671875, 4.15625, 6.7861328125, 9.416015625, 12.0458984375, 14.67578125, 17.3056640625, 19.935546875, 22.5654296875, 25.1953125, 27.8251953125, 30.455078125, 33.0849609375, 35.71484375, 38.3447265625, 40.974609375, 43.6044921875, 46.234375, 48.8642578125, 51.494140625, 54.1240234375, 56.75390625, 59.3837890625, 62.013671875, 64.6435546875, 67.2734375, 69.9033203125, 72.533203125, 75.1630859375, 77.79296875, 80.4228515625, 83.052734375, 85.6826171875, 88.3125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 16.0, 24.0, 44.0, 59.0, 113.0, 265.0, 767.0, 3195.0, 44200.0, 955077.0, 40290.0, 3187.0, 778.0, 272.0, 118.0, 68.0, 29.0, 17.0, 11.0, 6.0, 6.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.75, -76.2490234375, -73.748046875, -71.2470703125, -68.74609375, -66.2451171875, -63.744140625, -61.2431640625, -58.7421875, -56.2412109375, -53.740234375, -51.2392578125, -48.73828125, -46.2373046875, -43.736328125, -41.2353515625, -38.734375, -36.2333984375, -33.732421875, -31.2314453125, -28.73046875, -26.2294921875, -23.728515625, -21.2275390625, -18.7265625, -16.2255859375, -13.724609375, -11.2236328125, -8.72265625, -6.2216796875, -3.720703125, -1.2197265625, 1.28125, 3.7822265625, 6.283203125, 8.7841796875, 11.28515625, 13.7861328125, 16.287109375, 18.7880859375, 21.2890625, 23.7900390625, 26.291015625, 28.7919921875, 31.29296875, 33.7939453125, 36.294921875, 38.7958984375, 41.296875, 43.7978515625, 46.298828125, 48.7998046875, 51.30078125, 53.8017578125, 56.302734375, 58.8037109375, 61.3046875, 63.8056640625, 66.306640625, 68.8076171875, 71.30859375, 73.8095703125, 76.310546875, 78.8115234375, 81.3125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 6.0, 10.0, 3.0, 9.0, 12.0, 15.0, 19.0, 30.0, 38.0, 48.0, 55.0, 63.0, 103.0, 108.0, 95.0, 93.0, 71.0, 52.0, 40.0, 32.0, 23.0, 15.0, 6.0, 11.0, 6.0, 9.0, 6.0, 5.0, 1.0, 6.0, 2.0, 4.0, 2.0], "bins": [-0.00531005859375, -0.005191385746002197, -0.0050727128982543945, -0.004954040050506592, -0.004835367202758789, -0.004716694355010986, -0.004598021507263184, -0.004479348659515381, -0.004360675811767578, -0.004242002964019775, -0.004123330116271973, -0.00400465726852417, -0.003885984420776367, -0.0037673115730285645, -0.0036486387252807617, -0.003529965877532959, -0.0034112930297851562, -0.0032926201820373535, -0.0031739473342895508, -0.003055274486541748, -0.0029366016387939453, -0.0028179287910461426, -0.00269925594329834, -0.002580583095550537, -0.0024619102478027344, -0.0023432374000549316, -0.002224564552307129, -0.002105891704559326, -0.0019872188568115234, -0.0018685460090637207, -0.001749873161315918, -0.0016312003135681152, -0.0015125274658203125, -0.0013938546180725098, -0.001275181770324707, -0.0011565089225769043, -0.0010378360748291016, -0.0009191632270812988, -0.0008004903793334961, -0.0006818175315856934, -0.0005631446838378906, -0.0004444718360900879, -0.00032579898834228516, -0.00020712614059448242, -8.845329284667969e-05, 3.0219554901123047e-05, 0.00014889240264892578, 0.0002675652503967285, 0.00038623809814453125, 0.000504910945892334, 0.0006235837936401367, 0.0007422566413879395, 0.0008609294891357422, 0.000979602336883545, 0.0010982751846313477, 0.0012169480323791504, 0.0013356208801269531, 0.0014542937278747559, 0.0015729665756225586, 0.0016916394233703613, 0.001810312271118164, 0.0019289851188659668, 0.0020476579666137695, 0.0021663308143615723, 0.002285003662109375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 5.0, 4.0, 13.0, 21.0, 22.0, 41.0, 75.0, 117.0, 192.0, 400.0, 1115.0, 3756.0, 25911.0, 784818.0, 217924.0, 10466.0, 2254.0, 739.0, 284.0, 151.0, 77.0, 64.0, 42.0, 21.0, 15.0, 10.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.8125, -59.8056640625, -57.798828125, -55.7919921875, -53.78515625, -51.7783203125, -49.771484375, -47.7646484375, -45.7578125, -43.7509765625, -41.744140625, -39.7373046875, -37.73046875, -35.7236328125, -33.716796875, -31.7099609375, -29.703125, -27.6962890625, -25.689453125, -23.6826171875, -21.67578125, -19.6689453125, -17.662109375, -15.6552734375, -13.6484375, -11.6416015625, -9.634765625, -7.6279296875, -5.62109375, -3.6142578125, -1.607421875, 0.3994140625, 2.40625, 4.4130859375, 6.419921875, 8.4267578125, 10.43359375, 12.4404296875, 14.447265625, 16.4541015625, 18.4609375, 20.4677734375, 22.474609375, 24.4814453125, 26.48828125, 28.4951171875, 30.501953125, 32.5087890625, 34.515625, 36.5224609375, 38.529296875, 40.5361328125, 42.54296875, 44.5498046875, 46.556640625, 48.5634765625, 50.5703125, 52.5771484375, 54.583984375, 56.5908203125, 58.59765625, 60.6044921875, 62.611328125, 64.6181640625, 66.625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 7.0, 4.0, 5.0, 22.0, 46.0, 107.0, 217.0, 205.0, 193.0, 107.0, 35.0, 23.0, 8.0, 6.0, 8.0, 5.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.859375, -28.842041015625, -26.82470703125, -24.807373046875, -22.7900390625, -20.772705078125, -18.75537109375, -16.738037109375, -14.720703125, -12.703369140625, -10.68603515625, -8.668701171875, -6.6513671875, -4.634033203125, -2.61669921875, -0.599365234375, 1.41796875, 3.435302734375, 5.45263671875, 7.469970703125, 9.4873046875, 11.504638671875, 13.52197265625, 15.539306640625, 17.556640625, 19.573974609375, 21.59130859375, 23.608642578125, 25.6259765625, 27.643310546875, 29.66064453125, 31.677978515625, 33.6953125, 35.712646484375, 37.72998046875, 39.747314453125, 41.7646484375, 43.781982421875, 45.79931640625, 47.816650390625, 49.833984375, 51.851318359375, 53.86865234375, 55.885986328125, 57.9033203125, 59.920654296875, 61.93798828125, 63.955322265625, 65.97265625, 67.989990234375, 70.00732421875, 72.024658203125, 74.0419921875, 76.059326171875, 78.07666015625, 80.093994140625, 82.111328125, 84.128662109375, 86.14599609375, 88.163330078125, 90.1806640625, 92.197998046875, 94.21533203125, 96.232666015625, 98.25]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 8.0, 16.0, 85.0, 198.0, 320.0, 240.0, 97.0, 26.0, 13.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-312.1193542480469, -271.5897216796875, -231.06005859375, -190.53042602539062, -150.0007781982422, -109.47113037109375, -68.94149780273438, -28.411834716796875, 12.1177978515625, 52.64744186401367, 93.17708587646484, 133.70672607421875, 174.2363739013672, 214.76602172851562, 255.295654296875, 295.8253173828125, 336.3549499511719, 376.88458251953125, 417.41424560546875, 457.9438781738281, 498.4735107421875, 539.003173828125, 579.5328369140625, 620.0625, 660.5921020507812, 701.1217651367188, 741.6513671875, 782.1810302734375, 822.710693359375, 863.2403564453125, 903.7699584960938, 944.2996215820312, 984.8292236328125, 1025.35888671875, 1065.8885498046875, 1106.418212890625, 1146.94775390625, 1187.4774169921875, 1228.007080078125, 1268.5367431640625, 1309.06640625, 1349.5960693359375, 1390.125732421875, 1430.6552734375, 1471.1849365234375, 1511.714599609375, 1552.2442626953125, 1592.77392578125, 1633.303466796875, 1673.8331298828125, 1714.36279296875, 1754.892333984375, 1795.4219970703125, 1835.95166015625, 1876.4813232421875, 1917.010986328125, 1957.5406494140625, 1998.0703125, 2038.5999755859375, 2079.129638671875, 2119.6591796875, 2160.18896484375, 2200.718505859375, 2241.248046875, 2281.77783203125]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 2.0, 2.0, 7.0, 7.0, 19.0, 9.0, 6.0, 12.0, 12.0, 19.0, 25.0, 20.0, 37.0, 40.0, 31.0, 57.0, 39.0, 52.0, 47.0, 37.0, 56.0, 59.0, 50.0, 43.0, 50.0, 43.0, 32.0, 25.0, 27.0, 21.0, 21.0, 13.0, 14.0, 14.0, 10.0, 9.0, 5.0, 7.0, 7.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-373.48114013671875, -361.5601806640625, -349.6391906738281, -337.7182312011719, -325.7972412109375, -313.87628173828125, -301.955322265625, -290.0343322753906, -278.1133728027344, -266.1924133300781, -254.27142333984375, -242.3504638671875, -230.4294891357422, -218.50851440429688, -206.58753967285156, -194.66656494140625, -182.74559020996094, -170.82461547851562, -158.9036407470703, -146.982666015625, -135.06170654296875, -123.14073181152344, -111.21975708007812, -99.29878997802734, -87.37781524658203, -75.45684051513672, -63.53587341308594, -51.614898681640625, -39.69392776489258, -27.77295684814453, -15.851982116699219, -3.9310150146484375, 7.989959716796875, 19.910930633544922, 31.8319034576416, 43.75287628173828, 55.67384719848633, 67.59481811523438, 79.51579284667969, 91.43675994873047, 103.35773468017578, 115.2787094116211, 127.19967651367188, 139.1206512451172, 151.0416259765625, 162.96258544921875, 174.88357543945312, 186.80453491210938, 198.7255096435547, 210.646484375, 222.5674591064453, 234.48843383789062, 246.40939331054688, 258.33038330078125, 270.2513427734375, 282.17230224609375, 294.0932922363281, 306.0142517089844, 317.93524169921875, 329.856201171875, 341.7771911621094, 353.6981506347656, 365.619140625, 377.54010009765625, 389.4610595703125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 10.0, 10.0, 12.0, 22.0, 26.0, 36.0, 66.0, 76.0, 130.0, 195.0, 325.0, 607.0, 994.0, 2014.0, 4417.0, 10664.0, 44278.0, 4059196.0, 50600.0, 11242.0, 4514.0, 2124.0, 1149.0, 575.0, 364.0, 211.0, 154.0, 89.0, 58.0, 43.0, 18.0, 20.0, 9.0, 9.0, 3.0, 5.0, 5.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-119.6875, -115.8916015625, -112.095703125, -108.2998046875, -104.50390625, -100.7080078125, -96.912109375, -93.1162109375, -89.3203125, -85.5244140625, -81.728515625, -77.9326171875, -74.13671875, -70.3408203125, -66.544921875, -62.7490234375, -58.953125, -55.1572265625, -51.361328125, -47.5654296875, -43.76953125, -39.9736328125, -36.177734375, -32.3818359375, -28.5859375, -24.7900390625, -20.994140625, -17.1982421875, -13.40234375, -9.6064453125, -5.810546875, -2.0146484375, 1.78125, 5.5771484375, 9.373046875, 13.1689453125, 16.96484375, 20.7607421875, 24.556640625, 28.3525390625, 32.1484375, 35.9443359375, 39.740234375, 43.5361328125, 47.33203125, 51.1279296875, 54.923828125, 58.7197265625, 62.515625, 66.3115234375, 70.107421875, 73.9033203125, 77.69921875, 81.4951171875, 85.291015625, 89.0869140625, 92.8828125, 96.6787109375, 100.474609375, 104.2705078125, 108.06640625, 111.8623046875, 115.658203125, 119.4541015625, 123.25]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 7.0, 11.0, 2.0, 11.0, 14.0, 27.0, 33.0, 39.0, 40.0, 47.0, 51.0, 64.0, 75.0, 63.0, 80.0, 62.0, 73.0, 56.0, 51.0, 43.0, 26.0, 27.0, 22.0, 17.0, 16.0, 13.0, 8.0, 10.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-28.875, -28.02734375, -27.1796875, -26.33203125, -25.484375, -24.63671875, -23.7890625, -22.94140625, -22.09375, -21.24609375, -20.3984375, -19.55078125, -18.703125, -17.85546875, -17.0078125, -16.16015625, -15.3125, -14.46484375, -13.6171875, -12.76953125, -11.921875, -11.07421875, -10.2265625, -9.37890625, -8.53125, -7.68359375, -6.8359375, -5.98828125, -5.140625, -4.29296875, -3.4453125, -2.59765625, -1.75, -0.90234375, -0.0546875, 0.79296875, 1.640625, 2.48828125, 3.3359375, 4.18359375, 5.03125, 5.87890625, 6.7265625, 7.57421875, 8.421875, 9.26953125, 10.1171875, 10.96484375, 11.8125, 12.66015625, 13.5078125, 14.35546875, 15.203125, 16.05078125, 16.8984375, 17.74609375, 18.59375, 19.44140625, 20.2890625, 21.13671875, 21.984375, 22.83203125, 23.6796875, 24.52734375, 25.375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 1.0, 7.0, 6.0, 7.0, 15.0, 27.0, 28.0, 30.0, 74.0, 84.0, 137.0, 169.0, 269.0, 476.0, 734.0, 1479.0, 2870.0, 6762.0, 19320.0, 187115.0, 3928118.0, 30077.0, 8869.0, 3675.0, 1661.0, 855.0, 467.0, 292.0, 208.0, 132.0, 92.0, 67.0, 39.0, 32.0, 32.0, 24.0, 15.0, 10.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.3125, -75.0693359375, -71.826171875, -68.5830078125, -65.33984375, -62.0966796875, -58.853515625, -55.6103515625, -52.3671875, -49.1240234375, -45.880859375, -42.6376953125, -39.39453125, -36.1513671875, -32.908203125, -29.6650390625, -26.421875, -23.1787109375, -19.935546875, -16.6923828125, -13.44921875, -10.2060546875, -6.962890625, -3.7197265625, -0.4765625, 2.7666015625, 6.009765625, 9.2529296875, 12.49609375, 15.7392578125, 18.982421875, 22.2255859375, 25.46875, 28.7119140625, 31.955078125, 35.1982421875, 38.44140625, 41.6845703125, 44.927734375, 48.1708984375, 51.4140625, 54.6572265625, 57.900390625, 61.1435546875, 64.38671875, 67.6298828125, 70.873046875, 74.1162109375, 77.359375, 80.6025390625, 83.845703125, 87.0888671875, 90.33203125, 93.5751953125, 96.818359375, 100.0615234375, 103.3046875, 106.5478515625, 109.791015625, 113.0341796875, 116.27734375, 119.5205078125, 122.763671875, 126.0068359375, 129.25]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 4.0, 8.0, 6.0, 8.0, 12.0, 40.0, 83.0, 3285.0, 439.0, 93.0, 31.0, 20.0, 13.0, 7.0, 7.0, 5.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.4375, -23.69482421875, -22.9521484375, -22.20947265625, -21.466796875, -20.72412109375, -19.9814453125, -19.23876953125, -18.49609375, -17.75341796875, -17.0107421875, -16.26806640625, -15.525390625, -14.78271484375, -14.0400390625, -13.29736328125, -12.5546875, -11.81201171875, -11.0693359375, -10.32666015625, -9.583984375, -8.84130859375, -8.0986328125, -7.35595703125, -6.61328125, -5.87060546875, -5.1279296875, -4.38525390625, -3.642578125, -2.89990234375, -2.1572265625, -1.41455078125, -0.671875, 0.07080078125, 0.8134765625, 1.55615234375, 2.298828125, 3.04150390625, 3.7841796875, 4.52685546875, 5.26953125, 6.01220703125, 6.7548828125, 7.49755859375, 8.240234375, 8.98291015625, 9.7255859375, 10.46826171875, 11.2109375, 11.95361328125, 12.6962890625, 13.43896484375, 14.181640625, 14.92431640625, 15.6669921875, 16.40966796875, 17.15234375, 17.89501953125, 18.6376953125, 19.38037109375, 20.123046875, 20.86572265625, 21.6083984375, 22.35107421875, 23.09375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 8.0, 10.0, 5.0, 9.0, 11.0, 26.0, 28.0, 40.0, 58.0, 73.0, 95.0, 104.0, 90.0, 102.0, 101.0, 78.0, 48.0, 42.0, 24.0, 20.0, 13.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.728843688964844, -48.334014892578125, -45.939186096191406, -43.54435729980469, -41.14952850341797, -38.75469970703125, -36.35987091064453, -33.96504211425781, -31.570215225219727, -29.175386428833008, -26.78055763244629, -24.385730743408203, -21.990901947021484, -19.596073150634766, -17.201244354248047, -14.806415557861328, -12.41158676147461, -10.01675796508789, -7.62192964553833, -5.2271013259887695, -2.832272529602051, -0.43744373321533203, 1.9573841094970703, 4.352212905883789, 6.747041702270508, 9.141870498657227, 11.536699295043945, 13.931527137756348, 16.32635498046875, 18.72118377685547, 21.116012573242188, 23.510841369628906, 25.905670166015625, 28.300498962402344, 30.695327758789062, 33.09015655517578, 35.4849853515625, 37.87981414794922, 40.27464294433594, 42.669471740722656, 45.064300537109375, 47.459129333496094, 49.85395812988281, 52.24878692626953, 54.64361572265625, 57.03844451904297, 59.43327331542969, 61.828102111816406, 64.22293090820312, 66.61775970458984, 69.01258850097656, 71.40741729736328, 73.80224609375, 76.19707489013672, 78.59190368652344, 80.98673248291016, 83.38155364990234, 85.77638244628906, 88.17121124267578, 90.5660400390625, 92.96086883544922, 95.35569763183594, 97.75052642822266, 100.14535522460938, 102.5401840209961]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 8.0, 9.0, 7.0, 9.0, 5.0, 12.0, 9.0, 21.0, 19.0, 21.0, 27.0, 32.0, 25.0, 23.0, 31.0, 42.0, 30.0, 43.0, 28.0, 41.0, 42.0, 43.0, 40.0, 45.0, 36.0, 32.0, 47.0, 37.0, 29.0, 18.0, 32.0, 25.0, 19.0, 11.0, 12.0, 10.0, 6.0, 16.0, 7.0, 10.0, 7.0, 6.0, 6.0, 6.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-33.992958068847656, -32.957664489746094, -31.9223690032959, -30.887075424194336, -29.851781845092773, -28.816486358642578, -27.781192779541016, -26.745899200439453, -25.71060562133789, -24.675312042236328, -23.640016555786133, -22.60472297668457, -21.569429397583008, -20.534133911132812, -19.49884033203125, -18.463546752929688, -17.428251266479492, -16.39295768737793, -15.35766315460205, -14.322368621826172, -13.28707504272461, -12.25178050994873, -11.216485977172852, -10.181192398071289, -9.14589786529541, -8.110603332519531, -7.075309753417969, -6.04001522064209, -5.004721164703369, -3.9694271087646484, -2.9341325759887695, -1.8988385200500488, -0.8635444641113281, 0.17174971103668213, 1.2070438861846924, 2.242338180541992, 3.277632236480713, 4.312926292419434, 5.3482208251953125, 6.383514881134033, 7.418808937072754, 8.454103469848633, 9.489397048950195, 10.524691581726074, 11.559986114501953, 12.595279693603516, 13.630574226379395, 14.665868759155273, 15.701162338256836, 16.7364559173584, 17.771751403808594, 18.807044982910156, 19.84233856201172, 20.87763214111328, 21.912927627563477, 22.94822120666504, 23.983516693115234, 25.018810272216797, 26.054105758666992, 27.089399337768555, 28.124692916870117, 29.159988403320312, 30.195281982421875, 31.230575561523438, 32.265869140625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 7.0, 7.0, 16.0, 33.0, 31.0, 86.0, 149.0, 265.0, 518.0, 1157.0, 2775.0, 8022.0, 27098.0, 105403.0, 383085.0, 377551.0, 103199.0, 26142.0, 7956.0, 2824.0, 1135.0, 497.0, 259.0, 141.0, 75.0, 36.0, 31.0, 22.0, 10.0, 12.0, 5.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.84375, -57.00439453125, -55.1650390625, -53.32568359375, -51.486328125, -49.64697265625, -47.8076171875, -45.96826171875, -44.12890625, -42.28955078125, -40.4501953125, -38.61083984375, -36.771484375, -34.93212890625, -33.0927734375, -31.25341796875, -29.4140625, -27.57470703125, -25.7353515625, -23.89599609375, -22.056640625, -20.21728515625, -18.3779296875, -16.53857421875, -14.69921875, -12.85986328125, -11.0205078125, -9.18115234375, -7.341796875, -5.50244140625, -3.6630859375, -1.82373046875, 0.015625, 1.85498046875, 3.6943359375, 5.53369140625, 7.373046875, 9.21240234375, 11.0517578125, 12.89111328125, 14.73046875, 16.56982421875, 18.4091796875, 20.24853515625, 22.087890625, 23.92724609375, 25.7666015625, 27.60595703125, 29.4453125, 31.28466796875, 33.1240234375, 34.96337890625, 36.802734375, 38.64208984375, 40.4814453125, 42.32080078125, 44.16015625, 45.99951171875, 47.8388671875, 49.67822265625, 51.517578125, 53.35693359375, 55.1962890625, 57.03564453125, 58.875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 5.0, 5.0, 5.0, 11.0, 8.0, 13.0, 13.0, 27.0, 24.0, 31.0, 41.0, 42.0, 58.0, 46.0, 57.0, 65.0, 69.0, 45.0, 73.0, 64.0, 64.0, 45.0, 39.0, 26.0, 27.0, 17.0, 17.0, 20.0, 7.0, 11.0, 9.0, 7.0, 4.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-27.96875, -27.1396484375, -26.310546875, -25.4814453125, -24.65234375, -23.8232421875, -22.994140625, -22.1650390625, -21.3359375, -20.5068359375, -19.677734375, -18.8486328125, -18.01953125, -17.1904296875, -16.361328125, -15.5322265625, -14.703125, -13.8740234375, -13.044921875, -12.2158203125, -11.38671875, -10.5576171875, -9.728515625, -8.8994140625, -8.0703125, -7.2412109375, -6.412109375, -5.5830078125, -4.75390625, -3.9248046875, -3.095703125, -2.2666015625, -1.4375, -0.6083984375, 0.220703125, 1.0498046875, 1.87890625, 2.7080078125, 3.537109375, 4.3662109375, 5.1953125, 6.0244140625, 6.853515625, 7.6826171875, 8.51171875, 9.3408203125, 10.169921875, 10.9990234375, 11.828125, 12.6572265625, 13.486328125, 14.3154296875, 15.14453125, 15.9736328125, 16.802734375, 17.6318359375, 18.4609375, 19.2900390625, 20.119140625, 20.9482421875, 21.77734375, 22.6064453125, 23.435546875, 24.2646484375, 25.09375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 11.0, 18.0, 24.0, 36.0, 43.0, 93.0, 126.0, 194.0, 314.0, 477.0, 875.0, 1686.0, 5586.0, 46802.0, 706049.0, 263027.0, 16880.0, 3305.0, 1240.0, 647.0, 438.0, 232.0, 163.0, 104.0, 68.0, 39.0, 25.0, 20.0, 15.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.875, -65.71484375, -62.5546875, -59.39453125, -56.234375, -53.07421875, -49.9140625, -46.75390625, -43.59375, -40.43359375, -37.2734375, -34.11328125, -30.953125, -27.79296875, -24.6328125, -21.47265625, -18.3125, -15.15234375, -11.9921875, -8.83203125, -5.671875, -2.51171875, 0.6484375, 3.80859375, 6.96875, 10.12890625, 13.2890625, 16.44921875, 19.609375, 22.76953125, 25.9296875, 29.08984375, 32.25, 35.41015625, 38.5703125, 41.73046875, 44.890625, 48.05078125, 51.2109375, 54.37109375, 57.53125, 60.69140625, 63.8515625, 67.01171875, 70.171875, 73.33203125, 76.4921875, 79.65234375, 82.8125, 85.97265625, 89.1328125, 92.29296875, 95.453125, 98.61328125, 101.7734375, 104.93359375, 108.09375, 111.25390625, 114.4140625, 117.57421875, 120.734375, 123.89453125, 127.0546875, 130.21484375, 133.375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 10.0, 8.0, 17.0, 21.0, 18.0, 29.0, 39.0, 42.0, 57.0, 59.0, 63.0, 76.0, 78.0, 66.0, 72.0, 68.0, 58.0, 51.0, 39.0, 37.0, 29.0, 19.0, 12.0, 13.0, 8.0, 8.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-185.25, -180.783203125, -176.31640625, -171.849609375, -167.3828125, -162.916015625, -158.44921875, -153.982421875, -149.515625, -145.048828125, -140.58203125, -136.115234375, -131.6484375, -127.181640625, -122.71484375, -118.248046875, -113.78125, -109.314453125, -104.84765625, -100.380859375, -95.9140625, -91.447265625, -86.98046875, -82.513671875, -78.046875, -73.580078125, -69.11328125, -64.646484375, -60.1796875, -55.712890625, -51.24609375, -46.779296875, -42.3125, -37.845703125, -33.37890625, -28.912109375, -24.4453125, -19.978515625, -15.51171875, -11.044921875, -6.578125, -2.111328125, 2.35546875, 6.822265625, 11.2890625, 15.755859375, 20.22265625, 24.689453125, 29.15625, 33.623046875, 38.08984375, 42.556640625, 47.0234375, 51.490234375, 55.95703125, 60.423828125, 64.890625, 69.357421875, 73.82421875, 78.291015625, 82.7578125, 87.224609375, 91.69140625, 96.158203125, 100.625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 6.0, 4.0, 5.0, 6.0, 9.0, 11.0, 14.0, 28.0, 27.0, 38.0, 64.0, 87.0, 130.0, 242.0, 481.0, 1224.0, 4872.0, 40474.0, 774147.0, 208867.0, 13804.0, 2385.0, 802.0, 320.0, 201.0, 87.0, 62.0, 43.0, 29.0, 25.0, 11.0, 11.0, 11.0, 8.0, 10.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.21875, -41.76708984375, -40.3154296875, -38.86376953125, -37.412109375, -35.96044921875, -34.5087890625, -33.05712890625, -31.60546875, -30.15380859375, -28.7021484375, -27.25048828125, -25.798828125, -24.34716796875, -22.8955078125, -21.44384765625, -19.9921875, -18.54052734375, -17.0888671875, -15.63720703125, -14.185546875, -12.73388671875, -11.2822265625, -9.83056640625, -8.37890625, -6.92724609375, -5.4755859375, -4.02392578125, -2.572265625, -1.12060546875, 0.3310546875, 1.78271484375, 3.234375, 4.68603515625, 6.1376953125, 7.58935546875, 9.041015625, 10.49267578125, 11.9443359375, 13.39599609375, 14.84765625, 16.29931640625, 17.7509765625, 19.20263671875, 20.654296875, 22.10595703125, 23.5576171875, 25.00927734375, 26.4609375, 27.91259765625, 29.3642578125, 30.81591796875, 32.267578125, 33.71923828125, 35.1708984375, 36.62255859375, 38.07421875, 39.52587890625, 40.9775390625, 42.42919921875, 43.880859375, 45.33251953125, 46.7841796875, 48.23583984375, 49.6875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 4.0, 5.0, 6.0, 8.0, 8.0, 20.0, 14.0, 24.0, 36.0, 40.0, 56.0, 93.0, 113.0, 129.0, 112.0, 92.0, 66.0, 36.0, 31.0, 17.0, 17.0, 16.0, 16.0, 11.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.003875732421875, -0.0037534236907958984, -0.003631114959716797, -0.0035088062286376953, -0.0033864974975585938, -0.003264188766479492, -0.0031418800354003906, -0.003019571304321289, -0.0028972625732421875, -0.002774953842163086, -0.0026526451110839844, -0.002530336380004883, -0.0024080276489257812, -0.0022857189178466797, -0.002163410186767578, -0.0020411014556884766, -0.001918792724609375, -0.0017964839935302734, -0.0016741752624511719, -0.0015518665313720703, -0.0014295578002929688, -0.0013072490692138672, -0.0011849403381347656, -0.001062631607055664, -0.0009403228759765625, -0.0008180141448974609, -0.0006957054138183594, -0.0005733966827392578, -0.00045108795166015625, -0.0003287792205810547, -0.00020647048950195312, -8.416175842285156e-05, 3.814697265625e-05, 0.00016045570373535156, 0.0002827644348144531, 0.0004050731658935547, 0.0005273818969726562, 0.0006496906280517578, 0.0007719993591308594, 0.0008943080902099609, 0.0010166168212890625, 0.001138925552368164, 0.0012612342834472656, 0.0013835430145263672, 0.0015058517456054688, 0.0016281604766845703, 0.0017504692077636719, 0.0018727779388427734, 0.001995086669921875, 0.0021173954010009766, 0.002239704132080078, 0.0023620128631591797, 0.0024843215942382812, 0.002606630325317383, 0.0027289390563964844, 0.002851247787475586, 0.0029735565185546875, 0.003095865249633789, 0.0032181739807128906, 0.003340482711791992, 0.0034627914428710938, 0.0035851001739501953, 0.003707408905029297, 0.0038297176361083984, 0.0039520263671875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 13.0, 29.0, 64.0, 102.0, 196.0, 421.0, 1246.0, 7709.0, 188352.0, 823240.0, 23409.0, 2547.0, 691.0, 268.0, 119.0, 69.0, 37.0, 18.0, 8.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.5625, -64.49609375, -62.4296875, -60.36328125, -58.296875, -56.23046875, -54.1640625, -52.09765625, -50.03125, -47.96484375, -45.8984375, -43.83203125, -41.765625, -39.69921875, -37.6328125, -35.56640625, -33.5, -31.43359375, -29.3671875, -27.30078125, -25.234375, -23.16796875, -21.1015625, -19.03515625, -16.96875, -14.90234375, -12.8359375, -10.76953125, -8.703125, -6.63671875, -4.5703125, -2.50390625, -0.4375, 1.62890625, 3.6953125, 5.76171875, 7.828125, 9.89453125, 11.9609375, 14.02734375, 16.09375, 18.16015625, 20.2265625, 22.29296875, 24.359375, 26.42578125, 28.4921875, 30.55859375, 32.625, 34.69140625, 36.7578125, 38.82421875, 40.890625, 42.95703125, 45.0234375, 47.08984375, 49.15625, 51.22265625, 53.2890625, 55.35546875, 57.421875, 59.48828125, 61.5546875, 63.62109375, 65.6875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 1.0, 7.0, 8.0, 9.0, 13.0, 22.0, 18.0, 32.0, 58.0, 56.0, 83.0, 126.0, 118.0, 113.0, 87.0, 70.0, 59.0, 35.0, 22.0, 12.0, 9.0, 7.0, 6.0, 10.0, 7.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.9375, -29.84814453125, -28.7587890625, -27.66943359375, -26.580078125, -25.49072265625, -24.4013671875, -23.31201171875, -22.22265625, -21.13330078125, -20.0439453125, -18.95458984375, -17.865234375, -16.77587890625, -15.6865234375, -14.59716796875, -13.5078125, -12.41845703125, -11.3291015625, -10.23974609375, -9.150390625, -8.06103515625, -6.9716796875, -5.88232421875, -4.79296875, -3.70361328125, -2.6142578125, -1.52490234375, -0.435546875, 0.65380859375, 1.7431640625, 2.83251953125, 3.921875, 5.01123046875, 6.1005859375, 7.18994140625, 8.279296875, 9.36865234375, 10.4580078125, 11.54736328125, 12.63671875, 13.72607421875, 14.8154296875, 15.90478515625, 16.994140625, 18.08349609375, 19.1728515625, 20.26220703125, 21.3515625, 22.44091796875, 23.5302734375, 24.61962890625, 25.708984375, 26.79833984375, 27.8876953125, 28.97705078125, 30.06640625, 31.15576171875, 32.2451171875, 33.33447265625, 34.423828125, 35.51318359375, 36.6025390625, 37.69189453125, 38.78125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 10.0, 20.0, 70.0, 176.0, 306.0, 261.0, 111.0, 27.0, 17.0, 6.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-839.79931640625, -805.8283081054688, -771.8572387695312, -737.88623046875, -703.9151611328125, -669.9441528320312, -635.97314453125, -602.0020751953125, -568.031005859375, -534.0599975585938, -500.08892822265625, -466.117919921875, -432.1468505859375, -398.17584228515625, -364.2048034667969, -330.2337646484375, -296.26275634765625, -262.2917175292969, -228.3206787109375, -194.3496551513672, -160.3786163330078, -126.40757751464844, -92.43655395507812, -58.46551513671875, -24.494476318359375, 9.476558685302734, 43.447593688964844, 77.41862487792969, 111.38966369628906, 145.36070251464844, 179.33172607421875, 213.30276489257812, 247.2738037109375, 281.2448425292969, 315.21588134765625, 349.1868896484375, 383.157958984375, 417.12896728515625, 451.1000061035156, 485.071044921875, 519.0421142578125, 553.0131225585938, 586.9841918945312, 620.9552001953125, 654.92626953125, 688.8972778320312, 722.8682861328125, 756.83935546875, 790.8103637695312, 824.7813720703125, 858.75244140625, 892.7234497070312, 926.6945190429688, 960.66552734375, 994.6365966796875, 1028.607666015625, 1062.57861328125, 1096.5496826171875, 1130.5206298828125, 1164.49169921875, 1198.4627685546875, 1232.433837890625, 1266.40478515625, 1300.3758544921875, 1334.346923828125]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 6.0, 4.0, 7.0, 16.0, 7.0, 15.0, 18.0, 20.0, 27.0, 10.0, 26.0, 32.0, 34.0, 38.0, 31.0, 34.0, 38.0, 49.0, 32.0, 43.0, 44.0, 49.0, 45.0, 39.0, 41.0, 37.0, 35.0, 34.0, 30.0, 32.0, 18.0, 24.0, 16.0, 13.0, 8.0, 8.0, 7.0, 10.0, 3.0, 6.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-383.5564270019531, -372.88934326171875, -362.22222900390625, -351.5551452636719, -340.8880615234375, -330.220947265625, -319.5538635253906, -308.88677978515625, -298.21966552734375, -287.5525817871094, -276.8854675292969, -266.2183837890625, -255.55128479003906, -244.88418579101562, -234.21710205078125, -223.5500030517578, -212.88290405273438, -202.21580505371094, -191.5487060546875, -180.88162231445312, -170.2145233154297, -159.54742431640625, -148.88034057617188, -138.21324157714844, -127.546142578125, -116.87904357910156, -106.21195220947266, -95.54486083984375, -84.87776184082031, -74.21066284179688, -63.54357147216797, -52.87648010253906, -42.2093505859375, -31.542255401611328, -20.875160217285156, -10.208065032958984, 0.4590301513671875, 11.12612533569336, 21.79322052001953, 32.46031188964844, 43.127410888671875, 53.79450607299805, 64.46160125732422, 75.12869262695312, 85.79579162597656, 96.462890625, 107.1299819946289, 117.79707336425781, 128.46417236328125, 139.1312713623047, 149.79837036132812, 160.4654541015625, 171.13255310058594, 181.79965209960938, 192.46673583984375, 203.1338348388672, 213.80093383789062, 224.46803283691406, 235.1351318359375, 245.80221557617188, 256.46929931640625, 267.13641357421875, 277.8034973144531, 288.4705810546875, 299.1376953125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 8.0, 4.0, 13.0, 16.0, 35.0, 41.0, 61.0, 102.0, 170.0, 321.0, 633.0, 1458.0, 3431.0, 9323.0, 38308.0, 3936131.0, 174795.0, 19267.0, 5754.0, 2209.0, 1034.0, 493.0, 266.0, 144.0, 81.0, 66.0, 32.0, 23.0, 17.0, 11.0, 10.0, 12.0, 4.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-101.3125, -97.79296875, -94.2734375, -90.75390625, -87.234375, -83.71484375, -80.1953125, -76.67578125, -73.15625, -69.63671875, -66.1171875, -62.59765625, -59.078125, -55.55859375, -52.0390625, -48.51953125, -45.0, -41.48046875, -37.9609375, -34.44140625, -30.921875, -27.40234375, -23.8828125, -20.36328125, -16.84375, -13.32421875, -9.8046875, -6.28515625, -2.765625, 0.75390625, 4.2734375, 7.79296875, 11.3125, 14.83203125, 18.3515625, 21.87109375, 25.390625, 28.91015625, 32.4296875, 35.94921875, 39.46875, 42.98828125, 46.5078125, 50.02734375, 53.546875, 57.06640625, 60.5859375, 64.10546875, 67.625, 71.14453125, 74.6640625, 78.18359375, 81.703125, 85.22265625, 88.7421875, 92.26171875, 95.78125, 99.30078125, 102.8203125, 106.33984375, 109.859375, 113.37890625, 116.8984375, 120.41796875, 123.9375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 3.0, 5.0, 10.0, 11.0, 16.0, 33.0, 24.0, 39.0, 47.0, 62.0, 78.0, 77.0, 76.0, 93.0, 78.0, 81.0, 54.0, 47.0, 45.0, 32.0, 22.0, 26.0, 15.0, 6.0, 7.0, 1.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-41.6875, -40.64501953125, -39.6025390625, -38.56005859375, -37.517578125, -36.47509765625, -35.4326171875, -34.39013671875, -33.34765625, -32.30517578125, -31.2626953125, -30.22021484375, -29.177734375, -28.13525390625, -27.0927734375, -26.05029296875, -25.0078125, -23.96533203125, -22.9228515625, -21.88037109375, -20.837890625, -19.79541015625, -18.7529296875, -17.71044921875, -16.66796875, -15.62548828125, -14.5830078125, -13.54052734375, -12.498046875, -11.45556640625, -10.4130859375, -9.37060546875, -8.328125, -7.28564453125, -6.2431640625, -5.20068359375, -4.158203125, -3.11572265625, -2.0732421875, -1.03076171875, 0.01171875, 1.05419921875, 2.0966796875, 3.13916015625, 4.181640625, 5.22412109375, 6.2666015625, 7.30908203125, 8.3515625, 9.39404296875, 10.4365234375, 11.47900390625, 12.521484375, 13.56396484375, 14.6064453125, 15.64892578125, 16.69140625, 17.73388671875, 18.7763671875, 19.81884765625, 20.861328125, 21.90380859375, 22.9462890625, 23.98876953125, 25.03125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 3.0, 5.0, 6.0, 6.0, 15.0, 19.0, 34.0, 40.0, 56.0, 66.0, 113.0, 201.0, 293.0, 412.0, 630.0, 1142.0, 2163.0, 4407.0, 10245.0, 30675.0, 194341.0, 3821474.0, 92151.0, 20431.0, 7490.0, 3495.0, 1753.0, 936.0, 603.0, 328.0, 242.0, 163.0, 116.0, 61.0, 39.0, 45.0, 17.0, 18.0, 21.0, 8.0, 9.0, 3.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-59.34375, -57.4501953125, -55.556640625, -53.6630859375, -51.76953125, -49.8759765625, -47.982421875, -46.0888671875, -44.1953125, -42.3017578125, -40.408203125, -38.5146484375, -36.62109375, -34.7275390625, -32.833984375, -30.9404296875, -29.046875, -27.1533203125, -25.259765625, -23.3662109375, -21.47265625, -19.5791015625, -17.685546875, -15.7919921875, -13.8984375, -12.0048828125, -10.111328125, -8.2177734375, -6.32421875, -4.4306640625, -2.537109375, -0.6435546875, 1.25, 3.1435546875, 5.037109375, 6.9306640625, 8.82421875, 10.7177734375, 12.611328125, 14.5048828125, 16.3984375, 18.2919921875, 20.185546875, 22.0791015625, 23.97265625, 25.8662109375, 27.759765625, 29.6533203125, 31.546875, 33.4404296875, 35.333984375, 37.2275390625, 39.12109375, 41.0146484375, 42.908203125, 44.8017578125, 46.6953125, 48.5888671875, 50.482421875, 52.3759765625, 54.26953125, 56.1630859375, 58.056640625, 59.9501953125, 61.84375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 5.0, 8.0, 6.0, 6.0, 17.0, 30.0, 37.0, 50.0, 62.0, 124.0, 378.0, 2708.0, 300.0, 116.0, 66.0, 41.0, 30.0, 22.0, 11.0, 6.0, 10.0, 8.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.78125, -19.15185546875, -18.5224609375, -17.89306640625, -17.263671875, -16.63427734375, -16.0048828125, -15.37548828125, -14.74609375, -14.11669921875, -13.4873046875, -12.85791015625, -12.228515625, -11.59912109375, -10.9697265625, -10.34033203125, -9.7109375, -9.08154296875, -8.4521484375, -7.82275390625, -7.193359375, -6.56396484375, -5.9345703125, -5.30517578125, -4.67578125, -4.04638671875, -3.4169921875, -2.78759765625, -2.158203125, -1.52880859375, -0.8994140625, -0.27001953125, 0.359375, 0.98876953125, 1.6181640625, 2.24755859375, 2.876953125, 3.50634765625, 4.1357421875, 4.76513671875, 5.39453125, 6.02392578125, 6.6533203125, 7.28271484375, 7.912109375, 8.54150390625, 9.1708984375, 9.80029296875, 10.4296875, 11.05908203125, 11.6884765625, 12.31787109375, 12.947265625, 13.57666015625, 14.2060546875, 14.83544921875, 15.46484375, 16.09423828125, 16.7236328125, 17.35302734375, 17.982421875, 18.61181640625, 19.2412109375, 19.87060546875, 20.5]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 1.0, 5.0, 5.0, 17.0, 20.0, 20.0, 25.0, 42.0, 40.0, 68.0, 70.0, 98.0, 114.0, 96.0, 93.0, 74.0, 59.0, 53.0, 30.0, 27.0, 14.0, 13.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-102.06675720214844, -99.00914001464844, -95.95153045654297, -92.8939208984375, -89.8363037109375, -86.7786865234375, -83.72107696533203, -80.66346740722656, -77.60585021972656, -74.54823303222656, -71.4906234741211, -68.43301391601562, -65.37539672851562, -62.31778335571289, -59.260169982910156, -56.20255661010742, -53.14494323730469, -50.08732986450195, -47.02971649169922, -43.972103118896484, -40.91448974609375, -37.856876373291016, -34.79926300048828, -31.741649627685547, -28.684036254882812, -25.626422882080078, -22.568809509277344, -19.51119613647461, -16.453582763671875, -13.39596939086914, -10.338356018066406, -7.280742645263672, -4.2231292724609375, -1.1655158996582031, 1.8920974731445312, 4.949710845947266, 8.00732421875, 11.064937591552734, 14.122550964355469, 17.180164337158203, 20.237777709960938, 23.295391082763672, 26.353004455566406, 29.41061782836914, 32.468231201171875, 35.52584457397461, 38.583457946777344, 41.64107131958008, 44.69868469238281, 47.75629806518555, 50.81391143798828, 53.871524810791016, 56.92913818359375, 59.986751556396484, 63.04436492919922, 66.10197448730469, 69.15959167480469, 72.21720886230469, 75.27481842041016, 78.33242797851562, 81.39004516601562, 84.44766235351562, 87.5052719116211, 90.56288146972656, 93.62049865722656]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 11.0, 9.0, 9.0, 6.0, 20.0, 15.0, 20.0, 17.0, 14.0, 22.0, 26.0, 33.0, 33.0, 46.0, 40.0, 43.0, 44.0, 50.0, 46.0, 48.0, 48.0, 46.0, 53.0, 47.0, 34.0, 35.0, 36.0, 26.0, 16.0, 29.0, 16.0, 16.0, 12.0, 10.0, 3.0, 4.0, 2.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.46294403076172, -61.66453170776367, -59.866119384765625, -58.06770706176758, -56.26929473876953, -54.470882415771484, -52.67247009277344, -50.87405776977539, -49.075645446777344, -47.2772331237793, -45.47882080078125, -43.6804084777832, -41.881996154785156, -40.08358383178711, -38.28517150878906, -36.486759185791016, -34.68834686279297, -32.88993453979492, -31.091522216796875, -29.293109893798828, -27.49469757080078, -25.696285247802734, -23.897872924804688, -22.09946060180664, -20.301044464111328, -18.50263214111328, -16.704219818115234, -14.905807495117188, -13.10739517211914, -11.308981895446777, -9.51056957244873, -7.712157249450684, -5.913745880126953, -4.115333557128906, -2.3169209957122803, -0.5185084342956543, 1.2799038887023926, 3.0783166885375977, 4.8767290115356445, 6.675141334533691, 8.473553657531738, 10.271965980529785, 12.070378303527832, 13.868791580200195, 15.667203903198242, 17.46561622619629, 19.264028549194336, 21.062440872192383, 22.86085319519043, 24.659265518188477, 26.457677841186523, 28.25609016418457, 30.054502487182617, 31.852916717529297, 33.651329040527344, 35.44974136352539, 37.24815368652344, 39.046566009521484, 40.84497833251953, 42.64339065551758, 44.441802978515625, 46.24021530151367, 48.03862762451172, 49.837039947509766, 51.63545227050781]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 5.0, 9.0, 8.0, 7.0, 16.0, 17.0, 29.0, 43.0, 63.0, 111.0, 156.0, 227.0, 372.0, 652.0, 1175.0, 2221.0, 4894.0, 11477.0, 29517.0, 81389.0, 224506.0, 399909.0, 182838.0, 66699.0, 24105.0, 9448.0, 4109.0, 1983.0, 1047.0, 572.0, 348.0, 194.0, 135.0, 91.0, 43.0, 45.0, 28.0, 14.0, 11.0, 12.0, 8.0, 6.0, 5.0, 2.0, 2.0, 0.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-62.21875, -60.29833984375, -58.3779296875, -56.45751953125, -54.537109375, -52.61669921875, -50.6962890625, -48.77587890625, -46.85546875, -44.93505859375, -43.0146484375, -41.09423828125, -39.173828125, -37.25341796875, -35.3330078125, -33.41259765625, -31.4921875, -29.57177734375, -27.6513671875, -25.73095703125, -23.810546875, -21.89013671875, -19.9697265625, -18.04931640625, -16.12890625, -14.20849609375, -12.2880859375, -10.36767578125, -8.447265625, -6.52685546875, -4.6064453125, -2.68603515625, -0.765625, 1.15478515625, 3.0751953125, 4.99560546875, 6.916015625, 8.83642578125, 10.7568359375, 12.67724609375, 14.59765625, 16.51806640625, 18.4384765625, 20.35888671875, 22.279296875, 24.19970703125, 26.1201171875, 28.04052734375, 29.9609375, 31.88134765625, 33.8017578125, 35.72216796875, 37.642578125, 39.56298828125, 41.4833984375, 43.40380859375, 45.32421875, 47.24462890625, 49.1650390625, 51.08544921875, 53.005859375, 54.92626953125, 56.8466796875, 58.76708984375, 60.6875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 2.0, 7.0, 11.0, 12.0, 15.0, 17.0, 23.0, 35.0, 44.0, 41.0, 62.0, 56.0, 65.0, 69.0, 82.0, 68.0, 73.0, 54.0, 58.0, 38.0, 36.0, 29.0, 28.0, 25.0, 12.0, 10.0, 8.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-33.625, -32.701416015625, -31.77783203125, -30.854248046875, -29.9306640625, -29.007080078125, -28.08349609375, -27.159912109375, -26.236328125, -25.312744140625, -24.38916015625, -23.465576171875, -22.5419921875, -21.618408203125, -20.69482421875, -19.771240234375, -18.84765625, -17.924072265625, -17.00048828125, -16.076904296875, -15.1533203125, -14.229736328125, -13.30615234375, -12.382568359375, -11.458984375, -10.535400390625, -9.61181640625, -8.688232421875, -7.7646484375, -6.841064453125, -5.91748046875, -4.993896484375, -4.0703125, -3.146728515625, -2.22314453125, -1.299560546875, -0.3759765625, 0.547607421875, 1.47119140625, 2.394775390625, 3.318359375, 4.241943359375, 5.16552734375, 6.089111328125, 7.0126953125, 7.936279296875, 8.85986328125, 9.783447265625, 10.70703125, 11.630615234375, 12.55419921875, 13.477783203125, 14.4013671875, 15.324951171875, 16.24853515625, 17.172119140625, 18.095703125, 19.019287109375, 19.94287109375, 20.866455078125, 21.7900390625, 22.713623046875, 23.63720703125, 24.560791015625, 25.484375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 2.0, 3.0, 3.0, 5.0, 6.0, 7.0, 5.0, 13.0, 21.0, 16.0, 23.0, 30.0, 36.0, 58.0, 87.0, 104.0, 183.0, 277.0, 418.0, 777.0, 1479.0, 4427.0, 18393.0, 135911.0, 712175.0, 146622.0, 19379.0, 4485.0, 1551.0, 753.0, 412.0, 278.0, 169.0, 120.0, 92.0, 62.0, 51.0, 24.0, 30.0, 21.0, 16.0, 4.0, 6.0, 8.0, 8.0, 4.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.0, -77.9453125, -74.890625, -71.8359375, -68.78125, -65.7265625, -62.671875, -59.6171875, -56.5625, -53.5078125, -50.453125, -47.3984375, -44.34375, -41.2890625, -38.234375, -35.1796875, -32.125, -29.0703125, -26.015625, -22.9609375, -19.90625, -16.8515625, -13.796875, -10.7421875, -7.6875, -4.6328125, -1.578125, 1.4765625, 4.53125, 7.5859375, 10.640625, 13.6953125, 16.75, 19.8046875, 22.859375, 25.9140625, 28.96875, 32.0234375, 35.078125, 38.1328125, 41.1875, 44.2421875, 47.296875, 50.3515625, 53.40625, 56.4609375, 59.515625, 62.5703125, 65.625, 68.6796875, 71.734375, 74.7890625, 77.84375, 80.8984375, 83.953125, 87.0078125, 90.0625, 93.1171875, 96.171875, 99.2265625, 102.28125, 105.3359375, 108.390625, 111.4453125, 114.5]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 11.0, 9.0, 14.0, 11.0, 10.0, 19.0, 22.0, 22.0, 21.0, 26.0, 42.0, 39.0, 45.0, 48.0, 50.0, 53.0, 60.0, 43.0, 48.0, 50.0, 53.0, 45.0, 29.0, 34.0, 32.0, 31.0, 20.0, 29.0, 17.0, 20.0, 12.0, 7.0, 5.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-96.0, -93.3427734375, -90.685546875, -88.0283203125, -85.37109375, -82.7138671875, -80.056640625, -77.3994140625, -74.7421875, -72.0849609375, -69.427734375, -66.7705078125, -64.11328125, -61.4560546875, -58.798828125, -56.1416015625, -53.484375, -50.8271484375, -48.169921875, -45.5126953125, -42.85546875, -40.1982421875, -37.541015625, -34.8837890625, -32.2265625, -29.5693359375, -26.912109375, -24.2548828125, -21.59765625, -18.9404296875, -16.283203125, -13.6259765625, -10.96875, -8.3115234375, -5.654296875, -2.9970703125, -0.33984375, 2.3173828125, 4.974609375, 7.6318359375, 10.2890625, 12.9462890625, 15.603515625, 18.2607421875, 20.91796875, 23.5751953125, 26.232421875, 28.8896484375, 31.546875, 34.2041015625, 36.861328125, 39.5185546875, 42.17578125, 44.8330078125, 47.490234375, 50.1474609375, 52.8046875, 55.4619140625, 58.119140625, 60.7763671875, 63.43359375, 66.0908203125, 68.748046875, 71.4052734375, 74.0625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 5.0, 12.0, 15.0, 21.0, 41.0, 48.0, 90.0, 196.0, 401.0, 867.0, 2558.0, 10359.0, 68254.0, 604173.0, 316037.0, 35899.0, 6373.0, 1809.0, 698.0, 325.0, 168.0, 83.0, 57.0, 37.0, 12.0, 7.0, 11.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.046875, -21.081787109375, -20.11669921875, -19.151611328125, -18.1865234375, -17.221435546875, -16.25634765625, -15.291259765625, -14.326171875, -13.361083984375, -12.39599609375, -11.430908203125, -10.4658203125, -9.500732421875, -8.53564453125, -7.570556640625, -6.60546875, -5.640380859375, -4.67529296875, -3.710205078125, -2.7451171875, -1.780029296875, -0.81494140625, 0.150146484375, 1.115234375, 2.080322265625, 3.04541015625, 4.010498046875, 4.9755859375, 5.940673828125, 6.90576171875, 7.870849609375, 8.8359375, 9.801025390625, 10.76611328125, 11.731201171875, 12.6962890625, 13.661376953125, 14.62646484375, 15.591552734375, 16.556640625, 17.521728515625, 18.48681640625, 19.451904296875, 20.4169921875, 21.382080078125, 22.34716796875, 23.312255859375, 24.27734375, 25.242431640625, 26.20751953125, 27.172607421875, 28.1376953125, 29.102783203125, 30.06787109375, 31.032958984375, 31.998046875, 32.963134765625, 33.92822265625, 34.893310546875, 35.8583984375, 36.823486328125, 37.78857421875, 38.753662109375, 39.71875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 5.0, 6.0, 9.0, 15.0, 17.0, 21.0, 27.0, 23.0, 31.0, 45.0, 75.0, 107.0, 131.0, 119.0, 73.0, 56.0, 55.0, 42.0, 28.0, 30.0, 17.0, 14.0, 15.0, 6.0, 4.0, 7.0, 6.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004486083984375, -0.004326164722442627, -0.004166245460510254, -0.004006326198577881, -0.003846406936645508, -0.0036864876747131348, -0.0035265684127807617, -0.0033666491508483887, -0.0032067298889160156, -0.0030468106269836426, -0.0028868913650512695, -0.0027269721031188965, -0.0025670528411865234, -0.0024071335792541504, -0.0022472143173217773, -0.0020872950553894043, -0.0019273757934570312, -0.0017674565315246582, -0.0016075372695922852, -0.0014476180076599121, -0.001287698745727539, -0.001127779483795166, -0.000967860221862793, -0.0008079409599304199, -0.0006480216979980469, -0.00048810243606567383, -0.0003281831741333008, -0.00016826391220092773, -8.344650268554688e-06, 0.00015157461166381836, 0.0003114938735961914, 0.00047141313552856445, 0.0006313323974609375, 0.0007912516593933105, 0.0009511709213256836, 0.0011110901832580566, 0.0012710094451904297, 0.0014309287071228027, 0.0015908479690551758, 0.0017507672309875488, 0.0019106864929199219, 0.002070605754852295, 0.002230525016784668, 0.002390444278717041, 0.002550363540649414, 0.002710282802581787, 0.00287020206451416, 0.003030121326446533, 0.0031900405883789062, 0.0033499598503112793, 0.0035098791122436523, 0.0036697983741760254, 0.0038297176361083984, 0.0039896368980407715, 0.0041495561599731445, 0.004309475421905518, 0.004469394683837891, 0.004629313945770264, 0.004789233207702637, 0.00494915246963501, 0.005109071731567383, 0.005268990993499756, 0.005428910255432129, 0.005588829517364502, 0.005748748779296875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 8.0, 8.0, 12.0, 29.0, 57.0, 72.0, 170.0, 306.0, 666.0, 1739.0, 7314.0, 76359.0, 799994.0, 147079.0, 11071.0, 2084.0, 804.0, 352.0, 186.0, 122.0, 55.0, 25.0, 11.0, 15.0, 10.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.109375, -28.777587890625, -27.44580078125, -26.114013671875, -24.7822265625, -23.450439453125, -22.11865234375, -20.786865234375, -19.455078125, -18.123291015625, -16.79150390625, -15.459716796875, -14.1279296875, -12.796142578125, -11.46435546875, -10.132568359375, -8.80078125, -7.468994140625, -6.13720703125, -4.805419921875, -3.4736328125, -2.141845703125, -0.81005859375, 0.521728515625, 1.853515625, 3.185302734375, 4.51708984375, 5.848876953125, 7.1806640625, 8.512451171875, 9.84423828125, 11.176025390625, 12.5078125, 13.839599609375, 15.17138671875, 16.503173828125, 17.8349609375, 19.166748046875, 20.49853515625, 21.830322265625, 23.162109375, 24.493896484375, 25.82568359375, 27.157470703125, 28.4892578125, 29.821044921875, 31.15283203125, 32.484619140625, 33.81640625, 35.148193359375, 36.47998046875, 37.811767578125, 39.1435546875, 40.475341796875, 41.80712890625, 43.138916015625, 44.470703125, 45.802490234375, 47.13427734375, 48.466064453125, 49.7978515625, 51.129638671875, 52.46142578125, 53.793212890625, 55.125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 8.0, 3.0, 7.0, 9.0, 12.0, 19.0, 17.0, 26.0, 32.0, 26.0, 26.0, 36.0, 42.0, 64.0, 45.0, 45.0, 71.0, 62.0, 56.0, 60.0, 47.0, 49.0, 44.0, 29.0, 32.0, 20.0, 15.0, 14.0, 17.0, 9.0, 14.0, 13.0, 6.0, 6.0, 4.0, 3.0, 2.0, 7.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.25, -19.65625, -19.0625, -18.46875, -17.875, -17.28125, -16.6875, -16.09375, -15.5, -14.90625, -14.3125, -13.71875, -13.125, -12.53125, -11.9375, -11.34375, -10.75, -10.15625, -9.5625, -8.96875, -8.375, -7.78125, -7.1875, -6.59375, -6.0, -5.40625, -4.8125, -4.21875, -3.625, -3.03125, -2.4375, -1.84375, -1.25, -0.65625, -0.0625, 0.53125, 1.125, 1.71875, 2.3125, 2.90625, 3.5, 4.09375, 4.6875, 5.28125, 5.875, 6.46875, 7.0625, 7.65625, 8.25, 8.84375, 9.4375, 10.03125, 10.625, 11.21875, 11.8125, 12.40625, 13.0, 13.59375, 14.1875, 14.78125, 15.375, 15.96875, 16.5625, 17.15625, 17.75]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 10.0, 56.0, 245.0, 430.0, 210.0, 44.0, 10.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-664.328369140625, -600.9441528320312, -537.5599975585938, -474.17578125, -410.7915954589844, -347.40740966796875, -284.023193359375, -220.63900756835938, -157.25482177734375, -93.8706283569336, -30.486434936523438, 32.89776611328125, 96.28195190429688, 159.6661376953125, 223.05035400390625, 286.4345397949219, 349.8187255859375, 413.2029113769531, 476.58709716796875, 539.9713134765625, 603.35546875, 666.7396850585938, 730.1239013671875, 793.508056640625, 856.8922729492188, 920.2764892578125, 983.66064453125, 1047.044921875, 1110.4290771484375, 1173.813232421875, 1237.197509765625, 1300.5816650390625, 1363.9658203125, 1427.3499755859375, 1490.7342529296875, 1554.118408203125, 1617.5025634765625, 1680.88671875, 1744.27099609375, 1807.6551513671875, 1871.039306640625, 1934.4234619140625, 1997.8077392578125, 2061.19189453125, 2124.576171875, 2187.960205078125, 2251.344482421875, 2314.728759765625, 2378.11279296875, 2441.4970703125, 2504.881103515625, 2568.265380859375, 2631.649658203125, 2695.03369140625, 2758.41796875, 2821.80224609375, 2885.1865234375, 2948.57080078125, 3011.954833984375, 3075.339111328125, 3138.723388671875, 3202.107421875, 3265.49169921875, 3328.8759765625, 3392.260009765625]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 1.0, 4.0, 4.0, 10.0, 14.0, 15.0, 7.0, 14.0, 16.0, 32.0, 18.0, 37.0, 41.0, 36.0, 55.0, 62.0, 63.0, 56.0, 56.0, 52.0, 54.0, 40.0, 39.0, 55.0, 38.0, 28.0, 29.0, 22.0, 27.0, 17.0, 10.0, 13.0, 7.0, 8.0, 8.0, 1.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-326.4562683105469, -313.5807800292969, -300.705322265625, -287.829833984375, -274.9543762207031, -262.0788879394531, -249.2034149169922, -236.32794189453125, -223.4524688720703, -210.57699584960938, -197.70152282714844, -184.8260498046875, -171.9505615234375, -159.07510375976562, -146.19961547851562, -133.3241424560547, -120.44866943359375, -107.57319641113281, -94.69772338867188, -81.8222427368164, -68.94676971435547, -56.07129669189453, -43.19581604003906, -30.320343017578125, -17.444869995117188, -4.569395065307617, 8.306079864501953, 21.181556701660156, 34.057029724121094, 46.93250274658203, 59.8079833984375, 72.68345642089844, 85.5589599609375, 98.43443298339844, 111.30990600585938, 124.18538665771484, 137.06085205078125, 149.93634033203125, 162.8118133544922, 175.68728637695312, 188.56275939941406, 201.438232421875, 214.31370544433594, 227.18917846679688, 240.06466674804688, 252.94012451171875, 265.81561279296875, 278.69110107421875, 291.5665588378906, 304.4420471191406, 317.3175048828125, 330.1929931640625, 343.0684509277344, 355.9439392089844, 368.81939697265625, 381.69488525390625, 394.57037353515625, 407.44586181640625, 420.3213195800781, 433.1968078613281, 446.072265625, 458.94775390625, 471.8232421875, 484.6986999511719, 497.57415771484375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 1.0, 13.0, 18.0, 34.0, 41.0, 74.0, 160.0, 303.0, 750.0, 1757.0, 5009.0, 18738.0, 108123.0, 2945614.0, 1031156.0, 63566.0, 12635.0, 3696.0, 1359.0, 596.0, 285.0, 133.0, 90.0, 39.0, 37.0, 22.0, 17.0, 7.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.5, -65.240234375, -62.98046875, -60.720703125, -58.4609375, -56.201171875, -53.94140625, -51.681640625, -49.421875, -47.162109375, -44.90234375, -42.642578125, -40.3828125, -38.123046875, -35.86328125, -33.603515625, -31.34375, -29.083984375, -26.82421875, -24.564453125, -22.3046875, -20.044921875, -17.78515625, -15.525390625, -13.265625, -11.005859375, -8.74609375, -6.486328125, -4.2265625, -1.966796875, 0.29296875, 2.552734375, 4.8125, 7.072265625, 9.33203125, 11.591796875, 13.8515625, 16.111328125, 18.37109375, 20.630859375, 22.890625, 25.150390625, 27.41015625, 29.669921875, 31.9296875, 34.189453125, 36.44921875, 38.708984375, 40.96875, 43.228515625, 45.48828125, 47.748046875, 50.0078125, 52.267578125, 54.52734375, 56.787109375, 59.046875, 61.306640625, 63.56640625, 65.826171875, 68.0859375, 70.345703125, 72.60546875, 74.865234375, 77.125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 7.0, 5.0, 6.0, 6.0, 18.0, 16.0, 16.0, 20.0, 33.0, 37.0, 31.0, 33.0, 42.0, 61.0, 68.0, 63.0, 76.0, 54.0, 61.0, 48.0, 60.0, 42.0, 37.0, 31.0, 26.0, 27.0, 20.0, 10.0, 15.0, 6.0, 6.0, 8.0, 2.0, 3.0, 3.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-21.265625, -20.547119140625, -19.82861328125, -19.110107421875, -18.3916015625, -17.673095703125, -16.95458984375, -16.236083984375, -15.517578125, -14.799072265625, -14.08056640625, -13.362060546875, -12.6435546875, -11.925048828125, -11.20654296875, -10.488037109375, -9.76953125, -9.051025390625, -8.33251953125, -7.614013671875, -6.8955078125, -6.177001953125, -5.45849609375, -4.739990234375, -4.021484375, -3.302978515625, -2.58447265625, -1.865966796875, -1.1474609375, -0.428955078125, 0.28955078125, 1.008056640625, 1.7265625, 2.445068359375, 3.16357421875, 3.882080078125, 4.6005859375, 5.319091796875, 6.03759765625, 6.756103515625, 7.474609375, 8.193115234375, 8.91162109375, 9.630126953125, 10.3486328125, 11.067138671875, 11.78564453125, 12.504150390625, 13.22265625, 13.941162109375, 14.65966796875, 15.378173828125, 16.0966796875, 16.815185546875, 17.53369140625, 18.252197265625, 18.970703125, 19.689208984375, 20.40771484375, 21.126220703125, 21.8447265625, 22.563232421875, 23.28173828125, 24.000244140625, 24.71875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 7.0, 8.0, 7.0, 8.0, 17.0, 17.0, 31.0, 49.0, 125.0, 205.0, 427.0, 1051.0, 3144.0, 12364.0, 76986.0, 2855718.0, 1178103.0, 52257.0, 9431.0, 2583.0, 836.0, 407.0, 195.0, 122.0, 66.0, 31.0, 29.0, 19.0, 16.0, 4.0, 5.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-86.6875, -84.2041015625, -81.720703125, -79.2373046875, -76.75390625, -74.2705078125, -71.787109375, -69.3037109375, -66.8203125, -64.3369140625, -61.853515625, -59.3701171875, -56.88671875, -54.4033203125, -51.919921875, -49.4365234375, -46.953125, -44.4697265625, -41.986328125, -39.5029296875, -37.01953125, -34.5361328125, -32.052734375, -29.5693359375, -27.0859375, -24.6025390625, -22.119140625, -19.6357421875, -17.15234375, -14.6689453125, -12.185546875, -9.7021484375, -7.21875, -4.7353515625, -2.251953125, 0.2314453125, 2.71484375, 5.1982421875, 7.681640625, 10.1650390625, 12.6484375, 15.1318359375, 17.615234375, 20.0986328125, 22.58203125, 25.0654296875, 27.548828125, 30.0322265625, 32.515625, 34.9990234375, 37.482421875, 39.9658203125, 42.44921875, 44.9326171875, 47.416015625, 49.8994140625, 52.3828125, 54.8662109375, 57.349609375, 59.8330078125, 62.31640625, 64.7998046875, 67.283203125, 69.7666015625, 72.25]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 1.0, 4.0, 3.0, 8.0, 15.0, 15.0, 20.0, 25.0, 56.0, 90.0, 144.0, 300.0, 633.0, 1146.0, 749.0, 349.0, 197.0, 114.0, 65.0, 41.0, 38.0, 16.0, 9.0, 7.0, 5.0, 5.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.34375, -49.25439453125, -47.1650390625, -45.07568359375, -42.986328125, -40.89697265625, -38.8076171875, -36.71826171875, -34.62890625, -32.53955078125, -30.4501953125, -28.36083984375, -26.271484375, -24.18212890625, -22.0927734375, -20.00341796875, -17.9140625, -15.82470703125, -13.7353515625, -11.64599609375, -9.556640625, -7.46728515625, -5.3779296875, -3.28857421875, -1.19921875, 0.89013671875, 2.9794921875, 5.06884765625, 7.158203125, 9.24755859375, 11.3369140625, 13.42626953125, 15.515625, 17.60498046875, 19.6943359375, 21.78369140625, 23.873046875, 25.96240234375, 28.0517578125, 30.14111328125, 32.23046875, 34.31982421875, 36.4091796875, 38.49853515625, 40.587890625, 42.67724609375, 44.7666015625, 46.85595703125, 48.9453125, 51.03466796875, 53.1240234375, 55.21337890625, 57.302734375, 59.39208984375, 61.4814453125, 63.57080078125, 65.66015625, 67.74951171875, 69.8388671875, 71.92822265625, 74.017578125, 76.10693359375, 78.1962890625, 80.28564453125, 82.375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 11.0, 26.0, 53.0, 138.0, 232.0, 226.0, 133.0, 93.0, 42.0, 15.0, 9.0, 8.0, 2.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-734.3699951171875, -711.4608154296875, -688.5516357421875, -665.6424560546875, -642.7332763671875, -619.8240966796875, -596.9149169921875, -574.0057373046875, -551.0965576171875, -528.1873779296875, -505.2781982421875, -482.3690185546875, -459.4598388671875, -436.5506591796875, -413.6414794921875, -390.7322998046875, -367.8231201171875, -344.9139404296875, -322.0047607421875, -299.0955810546875, -276.1864013671875, -253.2772216796875, -230.3680419921875, -207.4588623046875, -184.5496826171875, -161.6405029296875, -138.7313232421875, -115.8221435546875, -92.9129638671875, -70.0037841796875, -47.0946044921875, -24.1854248046875, -1.27618408203125, 21.63299560546875, 44.54217529296875, 67.45135498046875, 90.36053466796875, 113.26971435546875, 136.17889404296875, 159.08807373046875, 181.99725341796875, 204.90643310546875, 227.81561279296875, 250.72479248046875, 273.63397216796875, 296.54315185546875, 319.45233154296875, 342.36151123046875, 365.27069091796875, 388.17987060546875, 411.08905029296875, 433.99822998046875, 456.90740966796875, 479.81658935546875, 502.72576904296875, 525.6349487304688, 548.5441284179688, 571.4533081054688, 594.3624877929688, 617.2716674804688, 640.1808471679688, 663.0900268554688, 685.9992065429688, 708.9083862304688, 731.8175659179688]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 6.0, 5.0, 14.0, 16.0, 13.0, 20.0, 17.0, 34.0, 26.0, 43.0, 30.0, 40.0, 42.0, 49.0, 54.0, 44.0, 61.0, 57.0, 57.0, 52.0, 40.0, 30.0, 49.0, 31.0, 30.0, 30.0, 16.0, 24.0, 16.0, 8.0, 9.0, 10.0, 4.0, 5.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-266.94854736328125, -258.3462829589844, -249.74400329589844, -241.1417236328125, -232.53945922851562, -223.93719482421875, -215.3349151611328, -206.73263549804688, -198.13037109375, -189.52810668945312, -180.9258270263672, -172.32354736328125, -163.72128295898438, -155.1190185546875, -146.51673889160156, -137.91445922851562, -129.31219482421875, -120.70992279052734, -112.10765075683594, -103.50537872314453, -94.90310668945312, -86.30083465576172, -77.69856262207031, -69.0962905883789, -60.4940185546875, -51.891746520996094, -43.28947448730469, -34.68720245361328, -26.084930419921875, -17.48265838623047, -8.880386352539062, -0.27811431884765625, 8.32415771484375, 16.926429748535156, 25.528701782226562, 34.13097381591797, 42.733245849609375, 51.33551788330078, 59.93778991699219, 68.5400619506836, 77.142333984375, 85.7446060180664, 94.34687805175781, 102.94915008544922, 111.55142211914062, 120.15369415283203, 128.75596618652344, 137.35824584960938, 145.96051025390625, 154.56277465820312, 163.16505432128906, 171.767333984375, 180.36959838867188, 188.97186279296875, 197.5741424560547, 206.17642211914062, 214.7786865234375, 223.38095092773438, 231.9832305908203, 240.58551025390625, 249.18777465820312, 257.7900390625, 266.392333984375, 274.9945983886719, 283.59686279296875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 7.0, 7.0, 15.0, 17.0, 31.0, 48.0, 93.0, 119.0, 215.0, 371.0, 835.0, 1771.0, 3938.0, 10504.0, 31021.0, 99929.0, 392748.0, 367411.0, 93260.0, 28984.0, 10039.0, 3878.0, 1718.0, 742.0, 347.0, 198.0, 133.0, 67.0, 34.0, 28.0, 15.0, 10.0, 6.0, 7.0, 2.0, 7.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-74.5, -72.58837890625, -70.6767578125, -68.76513671875, -66.853515625, -64.94189453125, -63.0302734375, -61.11865234375, -59.20703125, -57.29541015625, -55.3837890625, -53.47216796875, -51.560546875, -49.64892578125, -47.7373046875, -45.82568359375, -43.9140625, -42.00244140625, -40.0908203125, -38.17919921875, -36.267578125, -34.35595703125, -32.4443359375, -30.53271484375, -28.62109375, -26.70947265625, -24.7978515625, -22.88623046875, -20.974609375, -19.06298828125, -17.1513671875, -15.23974609375, -13.328125, -11.41650390625, -9.5048828125, -7.59326171875, -5.681640625, -3.77001953125, -1.8583984375, 0.05322265625, 1.96484375, 3.87646484375, 5.7880859375, 7.69970703125, 9.611328125, 11.52294921875, 13.4345703125, 15.34619140625, 17.2578125, 19.16943359375, 21.0810546875, 22.99267578125, 24.904296875, 26.81591796875, 28.7275390625, 30.63916015625, 32.55078125, 34.46240234375, 36.3740234375, 38.28564453125, 40.197265625, 42.10888671875, 44.0205078125, 45.93212890625, 47.84375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 8.0, 7.0, 14.0, 16.0, 13.0, 24.0, 26.0, 45.0, 30.0, 47.0, 67.0, 61.0, 50.0, 73.0, 54.0, 66.0, 67.0, 40.0, 45.0, 43.0, 48.0, 36.0, 25.0, 21.0, 14.0, 14.0, 11.0, 3.0, 6.0, 7.0, 1.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-22.078125, -21.35009765625, -20.6220703125, -19.89404296875, -19.166015625, -18.43798828125, -17.7099609375, -16.98193359375, -16.25390625, -15.52587890625, -14.7978515625, -14.06982421875, -13.341796875, -12.61376953125, -11.8857421875, -11.15771484375, -10.4296875, -9.70166015625, -8.9736328125, -8.24560546875, -7.517578125, -6.78955078125, -6.0615234375, -5.33349609375, -4.60546875, -3.87744140625, -3.1494140625, -2.42138671875, -1.693359375, -0.96533203125, -0.2373046875, 0.49072265625, 1.21875, 1.94677734375, 2.6748046875, 3.40283203125, 4.130859375, 4.85888671875, 5.5869140625, 6.31494140625, 7.04296875, 7.77099609375, 8.4990234375, 9.22705078125, 9.955078125, 10.68310546875, 11.4111328125, 12.13916015625, 12.8671875, 13.59521484375, 14.3232421875, 15.05126953125, 15.779296875, 16.50732421875, 17.2353515625, 17.96337890625, 18.69140625, 19.41943359375, 20.1474609375, 20.87548828125, 21.603515625, 22.33154296875, 23.0595703125, 23.78759765625, 24.515625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 5.0, 9.0, 13.0, 15.0, 19.0, 28.0, 38.0, 56.0, 85.0, 135.0, 238.0, 433.0, 821.0, 1879.0, 6205.0, 66074.0, 857591.0, 102792.0, 7960.0, 2121.0, 874.0, 438.0, 250.0, 173.0, 100.0, 60.0, 40.0, 19.0, 20.0, 18.0, 12.0, 2.0, 8.0, 2.0, 6.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-127.8125, -124.115234375, -120.41796875, -116.720703125, -113.0234375, -109.326171875, -105.62890625, -101.931640625, -98.234375, -94.537109375, -90.83984375, -87.142578125, -83.4453125, -79.748046875, -76.05078125, -72.353515625, -68.65625, -64.958984375, -61.26171875, -57.564453125, -53.8671875, -50.169921875, -46.47265625, -42.775390625, -39.078125, -35.380859375, -31.68359375, -27.986328125, -24.2890625, -20.591796875, -16.89453125, -13.197265625, -9.5, -5.802734375, -2.10546875, 1.591796875, 5.2890625, 8.986328125, 12.68359375, 16.380859375, 20.078125, 23.775390625, 27.47265625, 31.169921875, 34.8671875, 38.564453125, 42.26171875, 45.958984375, 49.65625, 53.353515625, 57.05078125, 60.748046875, 64.4453125, 68.142578125, 71.83984375, 75.537109375, 79.234375, 82.931640625, 86.62890625, 90.326171875, 94.0234375, 97.720703125, 101.41796875, 105.115234375, 108.8125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 3.0, 9.0, 13.0, 14.0, 13.0, 21.0, 20.0, 27.0, 32.0, 28.0, 26.0, 27.0, 46.0, 35.0, 43.0, 48.0, 52.0, 39.0, 43.0, 58.0, 39.0, 45.0, 33.0, 46.0, 41.0, 36.0, 18.0, 21.0, 26.0, 28.0, 17.0, 10.0, 4.0, 10.0, 2.0, 7.0, 2.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-77.8125, -75.61474609375, -73.4169921875, -71.21923828125, -69.021484375, -66.82373046875, -64.6259765625, -62.42822265625, -60.23046875, -58.03271484375, -55.8349609375, -53.63720703125, -51.439453125, -49.24169921875, -47.0439453125, -44.84619140625, -42.6484375, -40.45068359375, -38.2529296875, -36.05517578125, -33.857421875, -31.65966796875, -29.4619140625, -27.26416015625, -25.06640625, -22.86865234375, -20.6708984375, -18.47314453125, -16.275390625, -14.07763671875, -11.8798828125, -9.68212890625, -7.484375, -5.28662109375, -3.0888671875, -0.89111328125, 1.306640625, 3.50439453125, 5.7021484375, 7.89990234375, 10.09765625, 12.29541015625, 14.4931640625, 16.69091796875, 18.888671875, 21.08642578125, 23.2841796875, 25.48193359375, 27.6796875, 29.87744140625, 32.0751953125, 34.27294921875, 36.470703125, 38.66845703125, 40.8662109375, 43.06396484375, 45.26171875, 47.45947265625, 49.6572265625, 51.85498046875, 54.052734375, 56.25048828125, 58.4482421875, 60.64599609375, 62.84375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 4.0, 6.0, 1.0, 9.0, 15.0, 23.0, 40.0, 49.0, 71.0, 139.0, 265.0, 743.0, 3135.0, 36056.0, 909496.0, 91629.0, 5102.0, 1009.0, 341.0, 171.0, 73.0, 61.0, 46.0, 24.0, 10.0, 7.0, 5.0, 11.0, 1.0, 6.0, 0.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.46875, -41.77294921875, -40.0771484375, -38.38134765625, -36.685546875, -34.98974609375, -33.2939453125, -31.59814453125, -29.90234375, -28.20654296875, -26.5107421875, -24.81494140625, -23.119140625, -21.42333984375, -19.7275390625, -18.03173828125, -16.3359375, -14.64013671875, -12.9443359375, -11.24853515625, -9.552734375, -7.85693359375, -6.1611328125, -4.46533203125, -2.76953125, -1.07373046875, 0.6220703125, 2.31787109375, 4.013671875, 5.70947265625, 7.4052734375, 9.10107421875, 10.796875, 12.49267578125, 14.1884765625, 15.88427734375, 17.580078125, 19.27587890625, 20.9716796875, 22.66748046875, 24.36328125, 26.05908203125, 27.7548828125, 29.45068359375, 31.146484375, 32.84228515625, 34.5380859375, 36.23388671875, 37.9296875, 39.62548828125, 41.3212890625, 43.01708984375, 44.712890625, 46.40869140625, 48.1044921875, 49.80029296875, 51.49609375, 53.19189453125, 54.8876953125, 56.58349609375, 58.279296875, 59.97509765625, 61.6708984375, 63.36669921875, 65.0625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 5.0, 6.0, 1.0, 7.0, 5.0, 5.0, 7.0, 14.0, 14.0, 19.0, 10.0, 22.0, 32.0, 39.0, 46.0, 74.0, 84.0, 132.0, 118.0, 81.0, 61.0, 51.0, 30.0, 23.0, 21.0, 12.0, 18.0, 10.0, 13.0, 5.0, 8.0, 9.0, 5.0, 2.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0035114288330078125, -0.0033857524394989014, -0.0032600760459899902, -0.003134399652481079, -0.003008723258972168, -0.002883046865463257, -0.0027573704719543457, -0.0026316940784454346, -0.0025060176849365234, -0.0023803412914276123, -0.002254664897918701, -0.00212898850440979, -0.002003312110900879, -0.0018776357173919678, -0.0017519593238830566, -0.0016262829303741455, -0.0015006065368652344, -0.0013749301433563232, -0.0012492537498474121, -0.001123577356338501, -0.0009979009628295898, -0.0008722245693206787, -0.0007465481758117676, -0.0006208717823028564, -0.0004951953887939453, -0.0003695189952850342, -0.00024384260177612305, -0.00011816620826721191, 7.510185241699219e-06, 0.00013318657875061035, 0.0002588629722595215, 0.0003845393657684326, 0.0005102157592773438, 0.0006358921527862549, 0.000761568546295166, 0.0008872449398040771, 0.0010129213333129883, 0.0011385977268218994, 0.0012642741203308105, 0.0013899505138397217, 0.0015156269073486328, 0.001641303300857544, 0.001766979694366455, 0.0018926560878753662, 0.0020183324813842773, 0.0021440088748931885, 0.0022696852684020996, 0.0023953616619110107, 0.002521038055419922, 0.002646714448928833, 0.002772390842437744, 0.0028980672359466553, 0.0030237436294555664, 0.0031494200229644775, 0.0032750964164733887, 0.0034007728099823, 0.003526449203491211, 0.003652125597000122, 0.003777801990509033, 0.0039034783840179443, 0.0040291547775268555, 0.004154831171035767, 0.004280507564544678, 0.004406183958053589, 0.0045318603515625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 9.0, 6.0, 15.0, 22.0, 31.0, 38.0, 64.0, 89.0, 130.0, 255.0, 477.0, 1075.0, 3029.0, 14420.0, 254126.0, 735664.0, 31528.0, 4734.0, 1441.0, 626.0, 311.0, 160.0, 100.0, 59.0, 49.0, 25.0, 22.0, 13.0, 8.0, 2.0, 3.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.375, -43.076171875, -41.77734375, -40.478515625, -39.1796875, -37.880859375, -36.58203125, -35.283203125, -33.984375, -32.685546875, -31.38671875, -30.087890625, -28.7890625, -27.490234375, -26.19140625, -24.892578125, -23.59375, -22.294921875, -20.99609375, -19.697265625, -18.3984375, -17.099609375, -15.80078125, -14.501953125, -13.203125, -11.904296875, -10.60546875, -9.306640625, -8.0078125, -6.708984375, -5.41015625, -4.111328125, -2.8125, -1.513671875, -0.21484375, 1.083984375, 2.3828125, 3.681640625, 4.98046875, 6.279296875, 7.578125, 8.876953125, 10.17578125, 11.474609375, 12.7734375, 14.072265625, 15.37109375, 16.669921875, 17.96875, 19.267578125, 20.56640625, 21.865234375, 23.1640625, 24.462890625, 25.76171875, 27.060546875, 28.359375, 29.658203125, 30.95703125, 32.255859375, 33.5546875, 34.853515625, 36.15234375, 37.451171875, 38.75]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 7.0, 14.0, 23.0, 28.0, 42.0, 62.0, 78.0, 136.0, 159.0, 142.0, 114.0, 78.0, 39.0, 22.0, 19.0, 10.0, 8.0, 4.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-49.78125, -48.555908203125, -47.33056640625, -46.105224609375, -44.8798828125, -43.654541015625, -42.42919921875, -41.203857421875, -39.978515625, -38.753173828125, -37.52783203125, -36.302490234375, -35.0771484375, -33.851806640625, -32.62646484375, -31.401123046875, -30.17578125, -28.950439453125, -27.72509765625, -26.499755859375, -25.2744140625, -24.049072265625, -22.82373046875, -21.598388671875, -20.373046875, -19.147705078125, -17.92236328125, -16.697021484375, -15.4716796875, -14.246337890625, -13.02099609375, -11.795654296875, -10.5703125, -9.344970703125, -8.11962890625, -6.894287109375, -5.6689453125, -4.443603515625, -3.21826171875, -1.992919921875, -0.767578125, 0.457763671875, 1.68310546875, 2.908447265625, 4.1337890625, 5.359130859375, 6.58447265625, 7.809814453125, 9.03515625, 10.260498046875, 11.48583984375, 12.711181640625, 13.9365234375, 15.161865234375, 16.38720703125, 17.612548828125, 18.837890625, 20.063232421875, 21.28857421875, 22.513916015625, 23.7392578125, 24.964599609375, 26.18994140625, 27.415283203125, 28.640625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 14.0, 32.0, 88.0, 198.0, 270.0, 204.0, 104.0, 43.0, 23.0, 14.0, 5.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-498.6337890625, -474.1600036621094, -449.68621826171875, -425.21240234375, -400.7386169433594, -376.26483154296875, -351.791015625, -327.3172302246094, -302.84344482421875, -278.3696594238281, -253.89585876464844, -229.42205810546875, -204.94827270507812, -180.4744873046875, -156.0006866455078, -131.52688598632812, -107.0531005859375, -82.57930755615234, -58.10551452636719, -33.63172149658203, -9.157928466796875, 15.315864562988281, 39.78965759277344, 64.26345825195312, 88.73724365234375, 113.2110366821289, 137.68482971191406, 162.15863037109375, 186.63241577148438, 211.106201171875, 235.5800018310547, 260.0538024902344, 284.527587890625, 309.0013732910156, 333.47515869140625, 357.948974609375, 382.4227600097656, 406.89654541015625, 431.370361328125, 455.8441467285156, 480.31793212890625, 504.7917175292969, 529.2655029296875, 553.7393188476562, 578.213134765625, 602.6868896484375, 627.1607055664062, 651.634521484375, 676.1082763671875, 700.5820922851562, 725.0558471679688, 749.5296630859375, 774.00341796875, 798.4772338867188, 822.9510498046875, 847.4248046875, 871.8986206054688, 896.3724365234375, 920.84619140625, 945.3200073242188, 969.7938232421875, 994.267578125, 1018.7413940429688, 1043.2152099609375, 1067.68896484375]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 5.0, 5.0, 5.0, 12.0, 14.0, 9.0, 20.0, 21.0, 27.0, 22.0, 28.0, 36.0, 36.0, 29.0, 45.0, 58.0, 48.0, 49.0, 74.0, 55.0, 59.0, 50.0, 43.0, 42.0, 35.0, 31.0, 19.0, 15.0, 28.0, 20.0, 16.0, 7.0, 9.0, 8.0, 8.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-340.7347412109375, -330.76318359375, -320.7916259765625, -310.820068359375, -300.8485107421875, -290.876953125, -280.9053955078125, -270.933837890625, -260.9622802734375, -250.99072265625, -241.0191650390625, -231.047607421875, -221.0760498046875, -211.1044921875, -201.13291931152344, -191.16136169433594, -181.18978881835938, -171.21823120117188, -161.24667358398438, -151.27511596679688, -141.30355834960938, -131.33200073242188, -121.36042785644531, -111.38887023925781, -101.41731262207031, -91.44575500488281, -81.47419738769531, -71.50263214111328, -61.53107452392578, -51.55951690673828, -41.587955474853516, -31.61639404296875, -21.644805908203125, -11.673246383666992, -1.7016868591308594, 8.269872665405273, 18.241432189941406, 28.212989807128906, 38.18455123901367, 48.15611267089844, 58.12767028808594, 68.09922790527344, 78.07078552246094, 88.04235076904297, 98.01390838623047, 107.98546600341797, 117.95703125, 127.9285888671875, 137.900146484375, 147.8717041015625, 157.84326171875, 167.8148193359375, 177.786376953125, 187.7579345703125, 197.72950744628906, 207.70106506347656, 217.67262268066406, 227.64418029785156, 237.61573791503906, 247.58729553222656, 257.5588684082031, 267.5304260253906, 277.5019836425781, 287.4735412597656, 297.4450988769531]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 7.0, 9.0, 21.0, 21.0, 29.0, 33.0, 55.0, 131.0, 183.0, 329.0, 696.0, 1556.0, 3804.0, 10465.0, 38890.0, 292841.0, 3507547.0, 282224.0, 38204.0, 10391.0, 3764.0, 1567.0, 643.0, 342.0, 208.0, 103.0, 66.0, 56.0, 36.0, 19.0, 14.0, 11.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.875, -44.37060546875, -42.8662109375, -41.36181640625, -39.857421875, -38.35302734375, -36.8486328125, -35.34423828125, -33.83984375, -32.33544921875, -30.8310546875, -29.32666015625, -27.822265625, -26.31787109375, -24.8134765625, -23.30908203125, -21.8046875, -20.30029296875, -18.7958984375, -17.29150390625, -15.787109375, -14.28271484375, -12.7783203125, -11.27392578125, -9.76953125, -8.26513671875, -6.7607421875, -5.25634765625, -3.751953125, -2.24755859375, -0.7431640625, 0.76123046875, 2.265625, 3.77001953125, 5.2744140625, 6.77880859375, 8.283203125, 9.78759765625, 11.2919921875, 12.79638671875, 14.30078125, 15.80517578125, 17.3095703125, 18.81396484375, 20.318359375, 21.82275390625, 23.3271484375, 24.83154296875, 26.3359375, 27.84033203125, 29.3447265625, 30.84912109375, 32.353515625, 33.85791015625, 35.3623046875, 36.86669921875, 38.37109375, 39.87548828125, 41.3798828125, 42.88427734375, 44.388671875, 45.89306640625, 47.3974609375, 48.90185546875, 50.40625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 5.0, 14.0, 6.0, 7.0, 15.0, 12.0, 25.0, 30.0, 37.0, 45.0, 57.0, 64.0, 63.0, 65.0, 55.0, 60.0, 83.0, 65.0, 56.0, 35.0, 39.0, 43.0, 27.0, 22.0, 16.0, 11.0, 13.0, 14.0, 2.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.625, -21.889404296875, -21.15380859375, -20.418212890625, -19.6826171875, -18.947021484375, -18.21142578125, -17.475830078125, -16.740234375, -16.004638671875, -15.26904296875, -14.533447265625, -13.7978515625, -13.062255859375, -12.32666015625, -11.591064453125, -10.85546875, -10.119873046875, -9.38427734375, -8.648681640625, -7.9130859375, -7.177490234375, -6.44189453125, -5.706298828125, -4.970703125, -4.235107421875, -3.49951171875, -2.763916015625, -2.0283203125, -1.292724609375, -0.55712890625, 0.178466796875, 0.9140625, 1.649658203125, 2.38525390625, 3.120849609375, 3.8564453125, 4.592041015625, 5.32763671875, 6.063232421875, 6.798828125, 7.534423828125, 8.27001953125, 9.005615234375, 9.7412109375, 10.476806640625, 11.21240234375, 11.947998046875, 12.68359375, 13.419189453125, 14.15478515625, 14.890380859375, 15.6259765625, 16.361572265625, 17.09716796875, 17.832763671875, 18.568359375, 19.303955078125, 20.03955078125, 20.775146484375, 21.5107421875, 22.246337890625, 22.98193359375, 23.717529296875, 24.453125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 7.0, 11.0, 10.0, 20.0, 22.0, 37.0, 54.0, 99.0, 133.0, 273.0, 480.0, 777.0, 1427.0, 2820.0, 5508.0, 11802.0, 29706.0, 92721.0, 521512.0, 2881772.0, 499189.0, 92201.0, 29738.0, 11998.0, 5513.0, 2918.0, 1571.0, 863.0, 457.0, 235.0, 139.0, 93.0, 56.0, 35.0, 17.0, 19.0, 12.0, 3.0, 10.0, 4.0, 3.0, 4.0, 0.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.796875, -29.81884765625, -28.8408203125, -27.86279296875, -26.884765625, -25.90673828125, -24.9287109375, -23.95068359375, -22.97265625, -21.99462890625, -21.0166015625, -20.03857421875, -19.060546875, -18.08251953125, -17.1044921875, -16.12646484375, -15.1484375, -14.17041015625, -13.1923828125, -12.21435546875, -11.236328125, -10.25830078125, -9.2802734375, -8.30224609375, -7.32421875, -6.34619140625, -5.3681640625, -4.39013671875, -3.412109375, -2.43408203125, -1.4560546875, -0.47802734375, 0.5, 1.47802734375, 2.4560546875, 3.43408203125, 4.412109375, 5.39013671875, 6.3681640625, 7.34619140625, 8.32421875, 9.30224609375, 10.2802734375, 11.25830078125, 12.236328125, 13.21435546875, 14.1923828125, 15.17041015625, 16.1484375, 17.12646484375, 18.1044921875, 19.08251953125, 20.060546875, 21.03857421875, 22.0166015625, 22.99462890625, 23.97265625, 24.95068359375, 25.9287109375, 26.90673828125, 27.884765625, 28.86279296875, 29.8408203125, 30.81884765625, 31.796875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 4.0, 3.0, 6.0, 8.0, 6.0, 19.0, 18.0, 21.0, 24.0, 54.0, 65.0, 94.0, 136.0, 251.0, 463.0, 834.0, 794.0, 486.0, 255.0, 182.0, 112.0, 66.0, 38.0, 34.0, 29.0, 7.0, 14.0, 13.0, 11.0, 7.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.0, -35.7666015625, -34.533203125, -33.2998046875, -32.06640625, -30.8330078125, -29.599609375, -28.3662109375, -27.1328125, -25.8994140625, -24.666015625, -23.4326171875, -22.19921875, -20.9658203125, -19.732421875, -18.4990234375, -17.265625, -16.0322265625, -14.798828125, -13.5654296875, -12.33203125, -11.0986328125, -9.865234375, -8.6318359375, -7.3984375, -6.1650390625, -4.931640625, -3.6982421875, -2.46484375, -1.2314453125, 0.001953125, 1.2353515625, 2.46875, 3.7021484375, 4.935546875, 6.1689453125, 7.40234375, 8.6357421875, 9.869140625, 11.1025390625, 12.3359375, 13.5693359375, 14.802734375, 16.0361328125, 17.26953125, 18.5029296875, 19.736328125, 20.9697265625, 22.203125, 23.4365234375, 24.669921875, 25.9033203125, 27.13671875, 28.3701171875, 29.603515625, 30.8369140625, 32.0703125, 33.3037109375, 34.537109375, 35.7705078125, 37.00390625, 38.2373046875, 39.470703125, 40.7041015625, 41.9375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 6.0, 5.0, 10.0, 22.0, 70.0, 141.0, 275.0, 243.0, 143.0, 48.0, 20.0, 10.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-519.0661010742188, -501.0537414550781, -483.0414123535156, -465.029052734375, -447.0167236328125, -429.0043640136719, -410.99200439453125, -392.97967529296875, -374.9673156738281, -356.9549560546875, -338.942626953125, -320.9302673339844, -302.91790771484375, -284.90557861328125, -266.8932189941406, -248.88087463378906, -230.8685302734375, -212.85618591308594, -194.84384155273438, -176.83148193359375, -158.8191375732422, -140.80679321289062, -122.79444122314453, -104.78208923339844, -86.76974487304688, -68.75740051269531, -50.74504852294922, -32.73270034790039, -14.720352172851562, 3.2919921875, 21.304344177246094, 39.31669616699219, 57.32904052734375, 75.34138488769531, 93.3537368774414, 111.3660888671875, 129.37843322753906, 147.39077758789062, 165.40313720703125, 183.4154815673828, 201.42782592773438, 219.44017028808594, 237.4525146484375, 255.46487426757812, 273.47723388671875, 291.48956298828125, 309.5019226074219, 327.5142822265625, 345.526611328125, 363.5389709472656, 381.5513000488281, 399.56365966796875, 417.57598876953125, 435.5883483886719, 453.6007080078125, 471.613037109375, 489.6253967285156, 507.63775634765625, 525.6500854492188, 543.6624145507812, 561.6748046875, 579.6871337890625, 597.699462890625, 615.7118530273438, 633.7241821289062]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 2.0, 13.0, 17.0, 6.0, 12.0, 24.0, 22.0, 25.0, 25.0, 39.0, 44.0, 44.0, 48.0, 49.0, 63.0, 65.0, 61.0, 63.0, 63.0, 50.0, 39.0, 32.0, 31.0, 30.0, 33.0, 22.0, 22.0, 10.0, 10.0, 6.0, 6.0, 2.0, 2.0, 2.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-232.88919067382812, -226.7714080810547, -220.65362548828125, -214.53582763671875, -208.4180450439453, -202.30026245117188, -196.18247985839844, -190.064697265625, -183.9468994140625, -177.82911682128906, -171.71133422851562, -165.59353637695312, -159.4757537841797, -153.35797119140625, -147.2401885986328, -141.12240600585938, -135.00462341308594, -128.8868408203125, -122.76905059814453, -116.6512680053711, -110.53347778320312, -104.41569519042969, -98.29791259765625, -92.18013000488281, -86.06233978271484, -79.9445571899414, -73.82676696777344, -67.708984375, -61.5911979675293, -55.473411560058594, -49.355628967285156, -43.23784255981445, -37.12005615234375, -31.002269744873047, -24.884485244750977, -18.766700744628906, -12.648914337158203, -6.5311279296875, -0.4133453369140625, 5.704441070556641, 11.822227478027344, 17.940013885498047, 24.057798385620117, 30.175582885742188, 36.29336929321289, 42.411155700683594, 48.52893829345703, 54.646724700927734, 60.76451110839844, 66.88229370117188, 73.00008392333984, 79.11786651611328, 85.23565673828125, 91.35343933105469, 97.47122192382812, 103.58900451660156, 109.70679473876953, 115.82457733154297, 121.94236755371094, 128.06015014648438, 134.1779327392578, 140.29571533203125, 146.41351318359375, 152.5312957763672, 158.64907836914062]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 6.0, 2.0, 4.0, 5.0, 7.0, 15.0, 18.0, 11.0, 29.0, 57.0, 78.0, 123.0, 177.0, 317.0, 534.0, 1027.0, 1856.0, 3789.0, 8344.0, 19460.0, 50334.0, 155024.0, 431578.0, 249975.0, 76224.0, 27791.0, 11331.0, 5163.0, 2327.0, 1284.0, 658.0, 354.0, 238.0, 131.0, 72.0, 78.0, 40.0, 24.0, 25.0, 12.0, 14.0, 5.0, 5.0, 2.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-43.3125, -41.9013671875, -40.490234375, -39.0791015625, -37.66796875, -36.2568359375, -34.845703125, -33.4345703125, -32.0234375, -30.6123046875, -29.201171875, -27.7900390625, -26.37890625, -24.9677734375, -23.556640625, -22.1455078125, -20.734375, -19.3232421875, -17.912109375, -16.5009765625, -15.08984375, -13.6787109375, -12.267578125, -10.8564453125, -9.4453125, -8.0341796875, -6.623046875, -5.2119140625, -3.80078125, -2.3896484375, -0.978515625, 0.4326171875, 1.84375, 3.2548828125, 4.666015625, 6.0771484375, 7.48828125, 8.8994140625, 10.310546875, 11.7216796875, 13.1328125, 14.5439453125, 15.955078125, 17.3662109375, 18.77734375, 20.1884765625, 21.599609375, 23.0107421875, 24.421875, 25.8330078125, 27.244140625, 28.6552734375, 30.06640625, 31.4775390625, 32.888671875, 34.2998046875, 35.7109375, 37.1220703125, 38.533203125, 39.9443359375, 41.35546875, 42.7666015625, 44.177734375, 45.5888671875, 47.0]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 5.0, 6.0, 8.0, 16.0, 10.0, 20.0, 19.0, 31.0, 27.0, 43.0, 55.0, 54.0, 59.0, 71.0, 60.0, 46.0, 66.0, 68.0, 54.0, 45.0, 44.0, 34.0, 29.0, 24.0, 30.0, 18.0, 12.0, 14.0, 11.0, 3.0, 4.0, 8.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-20.921875, -20.2099609375, -19.498046875, -18.7861328125, -18.07421875, -17.3623046875, -16.650390625, -15.9384765625, -15.2265625, -14.5146484375, -13.802734375, -13.0908203125, -12.37890625, -11.6669921875, -10.955078125, -10.2431640625, -9.53125, -8.8193359375, -8.107421875, -7.3955078125, -6.68359375, -5.9716796875, -5.259765625, -4.5478515625, -3.8359375, -3.1240234375, -2.412109375, -1.7001953125, -0.98828125, -0.2763671875, 0.435546875, 1.1474609375, 1.859375, 2.5712890625, 3.283203125, 3.9951171875, 4.70703125, 5.4189453125, 6.130859375, 6.8427734375, 7.5546875, 8.2666015625, 8.978515625, 9.6904296875, 10.40234375, 11.1142578125, 11.826171875, 12.5380859375, 13.25, 13.9619140625, 14.673828125, 15.3857421875, 16.09765625, 16.8095703125, 17.521484375, 18.2333984375, 18.9453125, 19.6572265625, 20.369140625, 21.0810546875, 21.79296875, 22.5048828125, 23.216796875, 23.9287109375, 24.640625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 5.0, 5.0, 10.0, 9.0, 17.0, 26.0, 21.0, 33.0, 48.0, 74.0, 108.0, 165.0, 255.0, 483.0, 927.0, 2213.0, 6987.0, 30102.0, 194346.0, 680504.0, 105142.0, 18817.0, 4656.0, 1690.0, 790.0, 409.0, 263.0, 145.0, 76.0, 48.0, 47.0, 35.0, 29.0, 20.0, 11.0, 7.0, 9.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0], "bins": [-87.0625, -84.90478515625, -82.7470703125, -80.58935546875, -78.431640625, -76.27392578125, -74.1162109375, -71.95849609375, -69.80078125, -67.64306640625, -65.4853515625, -63.32763671875, -61.169921875, -59.01220703125, -56.8544921875, -54.69677734375, -52.5390625, -50.38134765625, -48.2236328125, -46.06591796875, -43.908203125, -41.75048828125, -39.5927734375, -37.43505859375, -35.27734375, -33.11962890625, -30.9619140625, -28.80419921875, -26.646484375, -24.48876953125, -22.3310546875, -20.17333984375, -18.015625, -15.85791015625, -13.7001953125, -11.54248046875, -9.384765625, -7.22705078125, -5.0693359375, -2.91162109375, -0.75390625, 1.40380859375, 3.5615234375, 5.71923828125, 7.876953125, 10.03466796875, 12.1923828125, 14.35009765625, 16.5078125, 18.66552734375, 20.8232421875, 22.98095703125, 25.138671875, 27.29638671875, 29.4541015625, 31.61181640625, 33.76953125, 35.92724609375, 38.0849609375, 40.24267578125, 42.400390625, 44.55810546875, 46.7158203125, 48.87353515625, 51.03125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 8.0, 5.0, 5.0, 12.0, 6.0, 8.0, 15.0, 13.0, 16.0, 15.0, 23.0, 23.0, 27.0, 22.0, 19.0, 35.0, 26.0, 32.0, 32.0, 37.0, 37.0, 24.0, 42.0, 37.0, 42.0, 47.0, 23.0, 42.0, 33.0, 46.0, 32.0, 30.0, 23.0, 28.0, 19.0, 20.0, 13.0, 19.0, 10.0, 10.0, 8.0, 7.0, 3.0, 9.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-51.25, -49.5703125, -47.890625, -46.2109375, -44.53125, -42.8515625, -41.171875, -39.4921875, -37.8125, -36.1328125, -34.453125, -32.7734375, -31.09375, -29.4140625, -27.734375, -26.0546875, -24.375, -22.6953125, -21.015625, -19.3359375, -17.65625, -15.9765625, -14.296875, -12.6171875, -10.9375, -9.2578125, -7.578125, -5.8984375, -4.21875, -2.5390625, -0.859375, 0.8203125, 2.5, 4.1796875, 5.859375, 7.5390625, 9.21875, 10.8984375, 12.578125, 14.2578125, 15.9375, 17.6171875, 19.296875, 20.9765625, 22.65625, 24.3359375, 26.015625, 27.6953125, 29.375, 31.0546875, 32.734375, 34.4140625, 36.09375, 37.7734375, 39.453125, 41.1328125, 42.8125, 44.4921875, 46.171875, 47.8515625, 49.53125, 51.2109375, 52.890625, 54.5703125, 56.25]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 1.0, 3.0, 6.0, 7.0, 0.0, 3.0, 10.0, 9.0, 15.0, 20.0, 25.0, 41.0, 59.0, 101.0, 250.0, 528.0, 1472.0, 6477.0, 74201.0, 863922.0, 91378.0, 7305.0, 1645.0, 525.0, 229.0, 119.0, 58.0, 44.0, 21.0, 16.0, 13.0, 8.0, 8.0, 5.0, 1.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-37.71875, -36.4833984375, -35.248046875, -34.0126953125, -32.77734375, -31.5419921875, -30.306640625, -29.0712890625, -27.8359375, -26.6005859375, -25.365234375, -24.1298828125, -22.89453125, -21.6591796875, -20.423828125, -19.1884765625, -17.953125, -16.7177734375, -15.482421875, -14.2470703125, -13.01171875, -11.7763671875, -10.541015625, -9.3056640625, -8.0703125, -6.8349609375, -5.599609375, -4.3642578125, -3.12890625, -1.8935546875, -0.658203125, 0.5771484375, 1.8125, 3.0478515625, 4.283203125, 5.5185546875, 6.75390625, 7.9892578125, 9.224609375, 10.4599609375, 11.6953125, 12.9306640625, 14.166015625, 15.4013671875, 16.63671875, 17.8720703125, 19.107421875, 20.3427734375, 21.578125, 22.8134765625, 24.048828125, 25.2841796875, 26.51953125, 27.7548828125, 28.990234375, 30.2255859375, 31.4609375, 32.6962890625, 33.931640625, 35.1669921875, 36.40234375, 37.6376953125, 38.873046875, 40.1083984375, 41.34375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 4.0, 7.0, 12.0, 4.0, 10.0, 11.0, 11.0, 16.0, 16.0, 22.0, 31.0, 39.0, 53.0, 51.0, 62.0, 78.0, 119.0, 97.0, 66.0, 60.0, 49.0, 38.0, 29.0, 24.0, 16.0, 9.0, 7.0, 14.0, 6.0, 8.0, 2.0, 4.0, 5.0, 7.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0031871795654296875, -0.0030864179134368896, -0.002985656261444092, -0.002884894609451294, -0.002784132957458496, -0.0026833713054656982, -0.0025826096534729004, -0.0024818480014801025, -0.0023810863494873047, -0.002280324697494507, -0.002179563045501709, -0.002078801393508911, -0.0019780397415161133, -0.0018772780895233154, -0.0017765164375305176, -0.0016757547855377197, -0.0015749931335449219, -0.001474231481552124, -0.0013734698295593262, -0.0012727081775665283, -0.0011719465255737305, -0.0010711848735809326, -0.0009704232215881348, -0.0008696615695953369, -0.0007688999176025391, -0.0006681382656097412, -0.0005673766136169434, -0.0004666149616241455, -0.00036585330963134766, -0.0002650916576385498, -0.00016433000564575195, -6.35683536529541e-05, 3.719329833984375e-05, 0.0001379549503326416, 0.00023871660232543945, 0.0003394782543182373, 0.00044023990631103516, 0.000541001558303833, 0.0006417632102966309, 0.0007425248622894287, 0.0008432865142822266, 0.0009440481662750244, 0.0010448098182678223, 0.0011455714702606201, 0.001246333122253418, 0.0013470947742462158, 0.0014478564262390137, 0.0015486180782318115, 0.0016493797302246094, 0.0017501413822174072, 0.001850903034210205, 0.001951664686203003, 0.0020524263381958008, 0.0021531879901885986, 0.0022539496421813965, 0.0023547112941741943, 0.002455472946166992, 0.00255623459815979, 0.002656996250152588, 0.0027577579021453857, 0.0028585195541381836, 0.0029592812061309814, 0.0030600428581237793, 0.003160804510116577, 0.003261566162109375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 8.0, 11.0, 16.0, 15.0, 32.0, 49.0, 78.0, 124.0, 197.0, 381.0, 763.0, 1741.0, 4964.0, 20367.0, 166016.0, 735871.0, 96833.0, 14318.0, 3791.0, 1410.0, 672.0, 377.0, 176.0, 113.0, 83.0, 52.0, 25.0, 22.0, 16.0, 9.0, 7.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.40625, -22.581787109375, -21.75732421875, -20.932861328125, -20.1083984375, -19.283935546875, -18.45947265625, -17.635009765625, -16.810546875, -15.986083984375, -15.16162109375, -14.337158203125, -13.5126953125, -12.688232421875, -11.86376953125, -11.039306640625, -10.21484375, -9.390380859375, -8.56591796875, -7.741455078125, -6.9169921875, -6.092529296875, -5.26806640625, -4.443603515625, -3.619140625, -2.794677734375, -1.97021484375, -1.145751953125, -0.3212890625, 0.503173828125, 1.32763671875, 2.152099609375, 2.9765625, 3.801025390625, 4.62548828125, 5.449951171875, 6.2744140625, 7.098876953125, 7.92333984375, 8.747802734375, 9.572265625, 10.396728515625, 11.22119140625, 12.045654296875, 12.8701171875, 13.694580078125, 14.51904296875, 15.343505859375, 16.16796875, 16.992431640625, 17.81689453125, 18.641357421875, 19.4658203125, 20.290283203125, 21.11474609375, 21.939208984375, 22.763671875, 23.588134765625, 24.41259765625, 25.237060546875, 26.0615234375, 26.885986328125, 27.71044921875, 28.534912109375, 29.359375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 6.0, 3.0, 7.0, 5.0, 8.0, 11.0, 19.0, 22.0, 43.0, 44.0, 58.0, 58.0, 95.0, 106.0, 110.0, 94.0, 72.0, 68.0, 47.0, 46.0, 27.0, 14.0, 6.0, 11.0, 10.0, 8.0, 1.0, 5.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.3125, -21.597412109375, -20.88232421875, -20.167236328125, -19.4521484375, -18.737060546875, -18.02197265625, -17.306884765625, -16.591796875, -15.876708984375, -15.16162109375, -14.446533203125, -13.7314453125, -13.016357421875, -12.30126953125, -11.586181640625, -10.87109375, -10.156005859375, -9.44091796875, -8.725830078125, -8.0107421875, -7.295654296875, -6.58056640625, -5.865478515625, -5.150390625, -4.435302734375, -3.72021484375, -3.005126953125, -2.2900390625, -1.574951171875, -0.85986328125, -0.144775390625, 0.5703125, 1.285400390625, 2.00048828125, 2.715576171875, 3.4306640625, 4.145751953125, 4.86083984375, 5.575927734375, 6.291015625, 7.006103515625, 7.72119140625, 8.436279296875, 9.1513671875, 9.866455078125, 10.58154296875, 11.296630859375, 12.01171875, 12.726806640625, 13.44189453125, 14.156982421875, 14.8720703125, 15.587158203125, 16.30224609375, 17.017333984375, 17.732421875, 18.447509765625, 19.16259765625, 19.877685546875, 20.5927734375, 21.307861328125, 22.02294921875, 22.738037109375, 23.453125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 9.0, 14.0, 37.0, 83.0, 142.0, 202.0, 229.0, 148.0, 66.0, 32.0, 13.0, 6.0, 5.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-354.76593017578125, -336.0225524902344, -317.2791748046875, -298.5357971191406, -279.79241943359375, -261.04901123046875, -242.30563354492188, -223.562255859375, -204.81887817382812, -186.07550048828125, -167.33212280273438, -148.58872985839844, -129.84535217285156, -111.10197448730469, -92.35858917236328, -73.61520385742188, -54.871826171875, -36.12844467163086, -17.38506317138672, 1.3583183288574219, 20.101699829101562, 38.84507751464844, 57.588462829589844, 76.33184814453125, 95.07522583007812, 113.818603515625, 132.56198120117188, 151.3053741455078, 170.0487518310547, 188.79212951660156, 207.5355224609375, 226.27890014648438, 245.0223388671875, 263.7657165527344, 282.50909423828125, 301.2524719238281, 319.995849609375, 338.7392578125, 357.4826354980469, 376.22601318359375, 394.9693908691406, 413.7127685546875, 432.4561462402344, 451.19952392578125, 469.94293212890625, 488.686279296875, 507.4296875, 526.173095703125, 544.9164428710938, 563.6598510742188, 582.4031982421875, 601.1466064453125, 619.8899536132812, 638.6333618164062, 657.376708984375, 676.1201171875, 694.863525390625, 713.60693359375, 732.3502807617188, 751.0936889648438, 769.8370361328125, 788.5804443359375, 807.3237915039062, 826.0671997070312, 844.810546875]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 2.0, 2.0, 2.0, 7.0, 5.0, 10.0, 7.0, 4.0, 13.0, 13.0, 16.0, 15.0, 17.0, 21.0, 28.0, 22.0, 23.0, 36.0, 39.0, 42.0, 35.0, 46.0, 44.0, 56.0, 52.0, 38.0, 47.0, 38.0, 37.0, 34.0, 29.0, 34.0, 31.0, 26.0, 22.0, 25.0, 13.0, 13.0, 8.0, 14.0, 9.0, 6.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-239.80885314941406, -232.10250854492188, -224.39614868164062, -216.68980407714844, -208.98345947265625, -201.27711486816406, -193.57077026367188, -185.86441040039062, -178.15806579589844, -170.45172119140625, -162.745361328125, -155.0390167236328, -147.33267211914062, -139.62632751464844, -131.91998291015625, -124.213623046875, -116.50727844238281, -108.80093383789062, -101.0945816040039, -93.38822937011719, -85.681884765625, -77.97554016113281, -70.2691879272461, -62.56283950805664, -54.85649108886719, -47.150142669677734, -39.44379425048828, -31.737445831298828, -24.031097412109375, -16.324748992919922, -8.618400573730469, -0.9120521545410156, 6.794281005859375, 14.500629425048828, 22.20697784423828, 29.913326263427734, 37.61967468261719, 45.32602310180664, 53.032371520996094, 60.73871994018555, 68.445068359375, 76.15141296386719, 83.8577651977539, 91.56411743164062, 99.27046203613281, 106.976806640625, 114.68315887451172, 122.38951110839844, 130.09585571289062, 137.8022003173828, 145.508544921875, 153.21490478515625, 160.92124938964844, 168.62759399414062, 176.33395385742188, 184.04029846191406, 191.74664306640625, 199.45298767089844, 207.15933227539062, 214.86569213867188, 222.57203674316406, 230.27838134765625, 237.9847412109375, 245.6910858154297, 253.39743041992188]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 7.0, 5.0, 13.0, 17.0, 14.0, 30.0, 39.0, 59.0, 100.0, 165.0, 301.0, 518.0, 1005.0, 2194.0, 4992.0, 12806.0, 38807.0, 147231.0, 895032.0, 2398496.0, 544207.0, 102121.0, 28669.0, 9783.0, 3852.0, 1763.0, 837.0, 460.0, 266.0, 151.0, 89.0, 68.0, 46.0, 37.0, 30.0, 14.0, 12.0, 15.0, 6.0, 6.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-23.46875, -22.6416015625, -21.814453125, -20.9873046875, -20.16015625, -19.3330078125, -18.505859375, -17.6787109375, -16.8515625, -16.0244140625, -15.197265625, -14.3701171875, -13.54296875, -12.7158203125, -11.888671875, -11.0615234375, -10.234375, -9.4072265625, -8.580078125, -7.7529296875, -6.92578125, -6.0986328125, -5.271484375, -4.4443359375, -3.6171875, -2.7900390625, -1.962890625, -1.1357421875, -0.30859375, 0.5185546875, 1.345703125, 2.1728515625, 3.0, 3.8271484375, 4.654296875, 5.4814453125, 6.30859375, 7.1357421875, 7.962890625, 8.7900390625, 9.6171875, 10.4443359375, 11.271484375, 12.0986328125, 12.92578125, 13.7529296875, 14.580078125, 15.4072265625, 16.234375, 17.0615234375, 17.888671875, 18.7158203125, 19.54296875, 20.3701171875, 21.197265625, 22.0244140625, 22.8515625, 23.6787109375, 24.505859375, 25.3330078125, 26.16015625, 26.9873046875, 27.814453125, 28.6416015625, 29.46875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 11.0, 8.0, 13.0, 23.0, 33.0, 30.0, 39.0, 42.0, 66.0, 65.0, 56.0, 50.0, 62.0, 83.0, 68.0, 54.0, 57.0, 51.0, 37.0, 40.0, 30.0, 21.0, 14.0, 9.0, 13.0, 12.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-22.296875, -21.5703125, -20.84375, -20.1171875, -19.390625, -18.6640625, -17.9375, -17.2109375, -16.484375, -15.7578125, -15.03125, -14.3046875, -13.578125, -12.8515625, -12.125, -11.3984375, -10.671875, -9.9453125, -9.21875, -8.4921875, -7.765625, -7.0390625, -6.3125, -5.5859375, -4.859375, -4.1328125, -3.40625, -2.6796875, -1.953125, -1.2265625, -0.5, 0.2265625, 0.953125, 1.6796875, 2.40625, 3.1328125, 3.859375, 4.5859375, 5.3125, 6.0390625, 6.765625, 7.4921875, 8.21875, 8.9453125, 9.671875, 10.3984375, 11.125, 11.8515625, 12.578125, 13.3046875, 14.03125, 14.7578125, 15.484375, 16.2109375, 16.9375, 17.6640625, 18.390625, 19.1171875, 19.84375, 20.5703125, 21.296875, 22.0234375, 22.75, 23.4765625, 24.203125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 6.0, 0.0, 5.0, 14.0, 13.0, 18.0, 24.0, 41.0, 70.0, 105.0, 217.0, 412.0, 949.0, 2695.0, 8453.0, 34324.0, 196254.0, 2555527.0, 1248742.0, 113224.0, 23144.0, 6357.0, 2123.0, 765.0, 375.0, 164.0, 106.0, 53.0, 47.0, 16.0, 17.0, 10.0, 3.0, 5.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.875, -39.591796875, -38.30859375, -37.025390625, -35.7421875, -34.458984375, -33.17578125, -31.892578125, -30.609375, -29.326171875, -28.04296875, -26.759765625, -25.4765625, -24.193359375, -22.91015625, -21.626953125, -20.34375, -19.060546875, -17.77734375, -16.494140625, -15.2109375, -13.927734375, -12.64453125, -11.361328125, -10.078125, -8.794921875, -7.51171875, -6.228515625, -4.9453125, -3.662109375, -2.37890625, -1.095703125, 0.1875, 1.470703125, 2.75390625, 4.037109375, 5.3203125, 6.603515625, 7.88671875, 9.169921875, 10.453125, 11.736328125, 13.01953125, 14.302734375, 15.5859375, 16.869140625, 18.15234375, 19.435546875, 20.71875, 22.001953125, 23.28515625, 24.568359375, 25.8515625, 27.134765625, 28.41796875, 29.701171875, 30.984375, 32.267578125, 33.55078125, 34.833984375, 36.1171875, 37.400390625, 38.68359375, 39.966796875, 41.25]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 5.0, 3.0, 4.0, 7.0, 9.0, 12.0, 15.0, 12.0, 20.0, 29.0, 37.0, 44.0, 58.0, 76.0, 105.0, 130.0, 192.0, 296.0, 389.0, 503.0, 505.0, 430.0, 313.0, 224.0, 156.0, 127.0, 87.0, 54.0, 42.0, 40.0, 35.0, 25.0, 22.0, 16.0, 8.0, 8.0, 6.0, 7.0, 6.0, 3.0, 4.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-30.109375, -29.074951171875, -28.04052734375, -27.006103515625, -25.9716796875, -24.937255859375, -23.90283203125, -22.868408203125, -21.833984375, -20.799560546875, -19.76513671875, -18.730712890625, -17.6962890625, -16.661865234375, -15.62744140625, -14.593017578125, -13.55859375, -12.524169921875, -11.48974609375, -10.455322265625, -9.4208984375, -8.386474609375, -7.35205078125, -6.317626953125, -5.283203125, -4.248779296875, -3.21435546875, -2.179931640625, -1.1455078125, -0.111083984375, 0.92333984375, 1.957763671875, 2.9921875, 4.026611328125, 5.06103515625, 6.095458984375, 7.1298828125, 8.164306640625, 9.19873046875, 10.233154296875, 11.267578125, 12.302001953125, 13.33642578125, 14.370849609375, 15.4052734375, 16.439697265625, 17.47412109375, 18.508544921875, 19.54296875, 20.577392578125, 21.61181640625, 22.646240234375, 23.6806640625, 24.715087890625, 25.74951171875, 26.783935546875, 27.818359375, 28.852783203125, 29.88720703125, 30.921630859375, 31.9560546875, 32.990478515625, 34.02490234375, 35.059326171875, 36.09375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 13.0, 19.0, 25.0, 63.0, 154.0, 198.0, 206.0, 161.0, 80.0, 43.0, 16.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-368.93560791015625, -351.4669189453125, -333.9981994628906, -316.52947998046875, -299.060791015625, -281.59210205078125, -264.1233825683594, -246.65467834472656, -229.18597412109375, -211.71726989746094, -194.24856567382812, -176.7798614501953, -159.3111572265625, -141.8424530029297, -124.37374877929688, -106.90504455566406, -89.43634033203125, -71.96763610839844, -54.498931884765625, -37.03022766113281, -19.5615234375, -2.0928192138671875, 15.375885009765625, 32.84458923339844, 50.31329345703125, 67.78199768066406, 85.25070190429688, 102.71940612792969, 120.1881103515625, 137.6568145751953, 155.12551879882812, 172.59422302246094, 190.0628662109375, 207.5315704345703, 225.00027465820312, 242.46897888183594, 259.93768310546875, 277.4063720703125, 294.8750915527344, 312.34381103515625, 329.8125, 347.28118896484375, 364.7499084472656, 382.2186279296875, 399.68731689453125, 417.156005859375, 434.6247253417969, 452.09344482421875, 469.5621337890625, 487.03082275390625, 504.4995422363281, 521.96826171875, 539.4369506835938, 556.9056396484375, 574.3743896484375, 591.8430786132812, 609.311767578125, 626.7804565429688, 644.2491455078125, 661.7178955078125, 679.1865844726562, 696.6552734375, 714.1240234375, 731.5927124023438, 749.0614013671875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 6.0, 5.0, 9.0, 11.0, 10.0, 25.0, 16.0, 35.0, 36.0, 47.0, 49.0, 65.0, 56.0, 52.0, 84.0, 81.0, 71.0, 64.0, 61.0, 40.0, 42.0, 34.0, 29.0, 23.0, 11.0, 17.0, 9.0, 6.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-228.9528045654297, -219.63490295410156, -210.3170166015625, -200.99911499023438, -191.68121337890625, -182.36331176757812, -173.04541015625, -163.72752380371094, -154.4096221923828, -145.0917205810547, -135.77383422851562, -126.4559326171875, -117.13803100585938, -107.82012939453125, -98.50223541259766, -89.18434143066406, -79.86643981933594, -70.54853820800781, -61.23064422607422, -51.91274642944336, -42.5948486328125, -33.27695083618164, -23.95905303955078, -14.641159057617188, -5.3232574462890625, 3.994640350341797, 13.312538146972656, 22.630435943603516, 31.948333740234375, 41.266231536865234, 50.584129333496094, 59.90202331542969, 69.21990966796875, 78.53781127929688, 87.85570526123047, 97.17359924316406, 106.49150085449219, 115.80940246582031, 125.1272964477539, 134.4451904296875, 143.76309204101562, 153.08099365234375, 162.39889526367188, 171.71678161621094, 181.03468322753906, 190.3525848388672, 199.67047119140625, 208.98837280273438, 218.3062744140625, 227.62417602539062, 236.94207763671875, 246.2599639892578, 255.57786560058594, 264.895751953125, 274.2136535644531, 283.53155517578125, 292.8494567871094, 302.1673583984375, 311.4852600097656, 320.80316162109375, 330.12103271484375, 339.4389343261719, 348.7568359375, 358.0747375488281, 367.39263916015625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 8.0, 14.0, 11.0, 14.0, 17.0, 28.0, 43.0, 62.0, 77.0, 118.0, 162.0, 280.0, 440.0, 772.0, 1412.0, 2620.0, 5191.0, 11386.0, 27034.0, 65894.0, 157826.0, 332175.0, 255070.0, 108109.0, 44473.0, 18664.0, 8127.0, 3883.0, 1930.0, 1061.0, 602.0, 345.0, 214.0, 140.0, 97.0, 56.0, 58.0, 41.0, 38.0, 18.0, 16.0, 8.0, 8.0, 5.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-35.96875, -34.87158203125, -33.7744140625, -32.67724609375, -31.580078125, -30.48291015625, -29.3857421875, -28.28857421875, -27.19140625, -26.09423828125, -24.9970703125, -23.89990234375, -22.802734375, -21.70556640625, -20.6083984375, -19.51123046875, -18.4140625, -17.31689453125, -16.2197265625, -15.12255859375, -14.025390625, -12.92822265625, -11.8310546875, -10.73388671875, -9.63671875, -8.53955078125, -7.4423828125, -6.34521484375, -5.248046875, -4.15087890625, -3.0537109375, -1.95654296875, -0.859375, 0.23779296875, 1.3349609375, 2.43212890625, 3.529296875, 4.62646484375, 5.7236328125, 6.82080078125, 7.91796875, 9.01513671875, 10.1123046875, 11.20947265625, 12.306640625, 13.40380859375, 14.5009765625, 15.59814453125, 16.6953125, 17.79248046875, 18.8896484375, 19.98681640625, 21.083984375, 22.18115234375, 23.2783203125, 24.37548828125, 25.47265625, 26.56982421875, 27.6669921875, 28.76416015625, 29.861328125, 30.95849609375, 32.0556640625, 33.15283203125, 34.25]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 12.0, 2.0, 9.0, 11.0, 13.0, 24.0, 30.0, 23.0, 38.0, 45.0, 54.0, 58.0, 59.0, 61.0, 72.0, 64.0, 62.0, 56.0, 55.0, 43.0, 47.0, 41.0, 35.0, 29.0, 17.0, 12.0, 10.0, 3.0, 7.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-21.3125, -20.599365234375, -19.88623046875, -19.173095703125, -18.4599609375, -17.746826171875, -17.03369140625, -16.320556640625, -15.607421875, -14.894287109375, -14.18115234375, -13.468017578125, -12.7548828125, -12.041748046875, -11.32861328125, -10.615478515625, -9.90234375, -9.189208984375, -8.47607421875, -7.762939453125, -7.0498046875, -6.336669921875, -5.62353515625, -4.910400390625, -4.197265625, -3.484130859375, -2.77099609375, -2.057861328125, -1.3447265625, -0.631591796875, 0.08154296875, 0.794677734375, 1.5078125, 2.220947265625, 2.93408203125, 3.647216796875, 4.3603515625, 5.073486328125, 5.78662109375, 6.499755859375, 7.212890625, 7.926025390625, 8.63916015625, 9.352294921875, 10.0654296875, 10.778564453125, 11.49169921875, 12.204833984375, 12.91796875, 13.631103515625, 14.34423828125, 15.057373046875, 15.7705078125, 16.483642578125, 17.19677734375, 17.909912109375, 18.623046875, 19.336181640625, 20.04931640625, 20.762451171875, 21.4755859375, 22.188720703125, 22.90185546875, 23.614990234375, 24.328125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 8.0, 4.0, 18.0, 15.0, 26.0, 32.0, 39.0, 60.0, 91.0, 155.0, 205.0, 368.0, 604.0, 1089.0, 2167.0, 5434.0, 30777.0, 475876.0, 490164.0, 30936.0, 5622.0, 2171.0, 1049.0, 620.0, 347.0, 221.0, 140.0, 89.0, 75.0, 44.0, 28.0, 21.0, 16.0, 17.0, 7.0, 8.0, 8.0, 7.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.1875, -100.3212890625, -97.455078125, -94.5888671875, -91.72265625, -88.8564453125, -85.990234375, -83.1240234375, -80.2578125, -77.3916015625, -74.525390625, -71.6591796875, -68.79296875, -65.9267578125, -63.060546875, -60.1943359375, -57.328125, -54.4619140625, -51.595703125, -48.7294921875, -45.86328125, -42.9970703125, -40.130859375, -37.2646484375, -34.3984375, -31.5322265625, -28.666015625, -25.7998046875, -22.93359375, -20.0673828125, -17.201171875, -14.3349609375, -11.46875, -8.6025390625, -5.736328125, -2.8701171875, -0.00390625, 2.8623046875, 5.728515625, 8.5947265625, 11.4609375, 14.3271484375, 17.193359375, 20.0595703125, 22.92578125, 25.7919921875, 28.658203125, 31.5244140625, 34.390625, 37.2568359375, 40.123046875, 42.9892578125, 45.85546875, 48.7216796875, 51.587890625, 54.4541015625, 57.3203125, 60.1865234375, 63.052734375, 65.9189453125, 68.78515625, 71.6513671875, 74.517578125, 77.3837890625, 80.25]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 5.0, 1.0, 8.0, 8.0, 7.0, 9.0, 14.0, 17.0, 22.0, 22.0, 37.0, 30.0, 32.0, 32.0, 52.0, 58.0, 34.0, 53.0, 54.0, 46.0, 51.0, 38.0, 39.0, 35.0, 44.0, 36.0, 40.0, 29.0, 30.0, 32.0, 13.0, 16.0, 18.0, 12.0, 7.0, 4.0, 4.0, 2.0, 3.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-69.0, -66.5927734375, -64.185546875, -61.7783203125, -59.37109375, -56.9638671875, -54.556640625, -52.1494140625, -49.7421875, -47.3349609375, -44.927734375, -42.5205078125, -40.11328125, -37.7060546875, -35.298828125, -32.8916015625, -30.484375, -28.0771484375, -25.669921875, -23.2626953125, -20.85546875, -18.4482421875, -16.041015625, -13.6337890625, -11.2265625, -8.8193359375, -6.412109375, -4.0048828125, -1.59765625, 0.8095703125, 3.216796875, 5.6240234375, 8.03125, 10.4384765625, 12.845703125, 15.2529296875, 17.66015625, 20.0673828125, 22.474609375, 24.8818359375, 27.2890625, 29.6962890625, 32.103515625, 34.5107421875, 36.91796875, 39.3251953125, 41.732421875, 44.1396484375, 46.546875, 48.9541015625, 51.361328125, 53.7685546875, 56.17578125, 58.5830078125, 60.990234375, 63.3974609375, 65.8046875, 68.2119140625, 70.619140625, 73.0263671875, 75.43359375, 77.8408203125, 80.248046875, 82.6552734375, 85.0625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 6.0, 5.0, 11.0, 13.0, 16.0, 27.0, 30.0, 61.0, 104.0, 144.0, 303.0, 625.0, 1649.0, 7050.0, 57928.0, 744085.0, 212395.0, 18881.0, 3225.0, 973.0, 433.0, 218.0, 122.0, 78.0, 44.0, 28.0, 24.0, 11.0, 15.0, 12.0, 7.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.546875, -24.7900390625, -24.033203125, -23.2763671875, -22.51953125, -21.7626953125, -21.005859375, -20.2490234375, -19.4921875, -18.7353515625, -17.978515625, -17.2216796875, -16.46484375, -15.7080078125, -14.951171875, -14.1943359375, -13.4375, -12.6806640625, -11.923828125, -11.1669921875, -10.41015625, -9.6533203125, -8.896484375, -8.1396484375, -7.3828125, -6.6259765625, -5.869140625, -5.1123046875, -4.35546875, -3.5986328125, -2.841796875, -2.0849609375, -1.328125, -0.5712890625, 0.185546875, 0.9423828125, 1.69921875, 2.4560546875, 3.212890625, 3.9697265625, 4.7265625, 5.4833984375, 6.240234375, 6.9970703125, 7.75390625, 8.5107421875, 9.267578125, 10.0244140625, 10.78125, 11.5380859375, 12.294921875, 13.0517578125, 13.80859375, 14.5654296875, 15.322265625, 16.0791015625, 16.8359375, 17.5927734375, 18.349609375, 19.1064453125, 19.86328125, 20.6201171875, 21.376953125, 22.1337890625, 22.890625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 7.0, 3.0, 5.0, 6.0, 9.0, 15.0, 16.0, 12.0, 19.0, 19.0, 21.0, 29.0, 39.0, 52.0, 39.0, 75.0, 108.0, 106.0, 92.0, 61.0, 46.0, 45.0, 31.0, 20.0, 20.0, 15.0, 14.0, 7.0, 12.0, 9.0, 8.0, 13.0, 5.0, 9.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00330352783203125, -0.003193795680999756, -0.0030840635299682617, -0.0029743313789367676, -0.0028645992279052734, -0.0027548670768737793, -0.002645134925842285, -0.002535402774810791, -0.002425670623779297, -0.0023159384727478027, -0.0022062063217163086, -0.0020964741706848145, -0.0019867420196533203, -0.0018770098686218262, -0.001767277717590332, -0.0016575455665588379, -0.0015478134155273438, -0.0014380812644958496, -0.0013283491134643555, -0.0012186169624328613, -0.0011088848114013672, -0.000999152660369873, -0.0008894205093383789, -0.0007796883583068848, -0.0006699562072753906, -0.0005602240562438965, -0.00045049190521240234, -0.0003407597541809082, -0.00023102760314941406, -0.00012129545211791992, -1.1563301086425781e-05, 9.816884994506836e-05, 0.0002079010009765625, 0.00031763315200805664, 0.0004273653030395508, 0.0005370974540710449, 0.0006468296051025391, 0.0007565617561340332, 0.0008662939071655273, 0.0009760260581970215, 0.0010857582092285156, 0.0011954903602600098, 0.001305222511291504, 0.001414954662322998, 0.0015246868133544922, 0.0016344189643859863, 0.0017441511154174805, 0.0018538832664489746, 0.0019636154174804688, 0.002073347568511963, 0.002183079719543457, 0.002292811870574951, 0.0024025440216064453, 0.0025122761726379395, 0.0026220083236694336, 0.0027317404747009277, 0.002841472625732422, 0.002951204776763916, 0.00306093692779541, 0.0031706690788269043, 0.0032804012298583984, 0.0033901333808898926, 0.0034998655319213867, 0.003609597682952881, 0.003719329833984375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 8.0, 6.0, 11.0, 15.0, 16.0, 18.0, 28.0, 59.0, 46.0, 67.0, 84.0, 154.0, 224.0, 330.0, 518.0, 869.0, 1738.0, 3684.0, 10095.0, 41938.0, 302061.0, 596766.0, 66708.0, 13624.0, 4622.0, 2009.0, 1043.0, 604.0, 360.0, 253.0, 166.0, 129.0, 84.0, 47.0, 31.0, 34.0, 25.0, 23.0, 16.0, 5.0, 8.0, 8.0, 7.0, 3.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.53125, -14.0146484375, -13.498046875, -12.9814453125, -12.46484375, -11.9482421875, -11.431640625, -10.9150390625, -10.3984375, -9.8818359375, -9.365234375, -8.8486328125, -8.33203125, -7.8154296875, -7.298828125, -6.7822265625, -6.265625, -5.7490234375, -5.232421875, -4.7158203125, -4.19921875, -3.6826171875, -3.166015625, -2.6494140625, -2.1328125, -1.6162109375, -1.099609375, -0.5830078125, -0.06640625, 0.4501953125, 0.966796875, 1.4833984375, 2.0, 2.5166015625, 3.033203125, 3.5498046875, 4.06640625, 4.5830078125, 5.099609375, 5.6162109375, 6.1328125, 6.6494140625, 7.166015625, 7.6826171875, 8.19921875, 8.7158203125, 9.232421875, 9.7490234375, 10.265625, 10.7822265625, 11.298828125, 11.8154296875, 12.33203125, 12.8486328125, 13.365234375, 13.8818359375, 14.3984375, 14.9150390625, 15.431640625, 15.9482421875, 16.46484375, 16.9814453125, 17.498046875, 18.0146484375, 18.53125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 7.0, 14.0, 18.0, 11.0, 21.0, 30.0, 28.0, 32.0, 38.0, 48.0, 66.0, 55.0, 72.0, 86.0, 68.0, 80.0, 61.0, 54.0, 41.0, 35.0, 20.0, 30.0, 23.0, 15.0, 14.0, 2.0, 10.0, 7.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.90625, -15.3974609375, -14.888671875, -14.3798828125, -13.87109375, -13.3623046875, -12.853515625, -12.3447265625, -11.8359375, -11.3271484375, -10.818359375, -10.3095703125, -9.80078125, -9.2919921875, -8.783203125, -8.2744140625, -7.765625, -7.2568359375, -6.748046875, -6.2392578125, -5.73046875, -5.2216796875, -4.712890625, -4.2041015625, -3.6953125, -3.1865234375, -2.677734375, -2.1689453125, -1.66015625, -1.1513671875, -0.642578125, -0.1337890625, 0.375, 0.8837890625, 1.392578125, 1.9013671875, 2.41015625, 2.9189453125, 3.427734375, 3.9365234375, 4.4453125, 4.9541015625, 5.462890625, 5.9716796875, 6.48046875, 6.9892578125, 7.498046875, 8.0068359375, 8.515625, 9.0244140625, 9.533203125, 10.0419921875, 10.55078125, 11.0595703125, 11.568359375, 12.0771484375, 12.5859375, 13.0947265625, 13.603515625, 14.1123046875, 14.62109375, 15.1298828125, 15.638671875, 16.1474609375, 16.65625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 10.0, 16.0, 15.0, 26.0, 65.0, 117.0, 190.0, 245.0, 139.0, 94.0, 39.0, 20.0, 7.0, 9.0, 5.0, 4.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-676.3380737304688, -661.01611328125, -645.694091796875, -630.3721313476562, -615.0501708984375, -599.7281494140625, -584.4061889648438, -569.084228515625, -553.76220703125, -538.4402465820312, -523.1182250976562, -507.7962646484375, -492.4742736816406, -477.15228271484375, -461.830322265625, -446.5083312988281, -431.18634033203125, -415.8643493652344, -400.5423889160156, -385.22039794921875, -369.8984069824219, -354.576416015625, -339.25445556640625, -323.9324645996094, -308.6105041503906, -293.28851318359375, -277.966552734375, -262.6445617675781, -247.32257080078125, -232.00059509277344, -216.67861938476562, -201.35662841796875, -186.03463745117188, -170.71266174316406, -155.3906707763672, -140.06869506835938, -124.7467041015625, -109.42472839355469, -94.10274505615234, -78.78076171875, -63.458778381347656, -48.13679504394531, -32.81481170654297, -17.49283218383789, -2.170848846435547, 13.151130676269531, 28.473114013671875, 43.79509735107422, 59.11708068847656, 74.4390640258789, 89.76104736328125, 105.08302307128906, 120.40501403808594, 135.72698974609375, 151.04898071289062, 166.37095642089844, 181.69293212890625, 197.01490783691406, 212.33689880371094, 227.65887451171875, 242.98086547851562, 258.3028564453125, 273.62481689453125, 288.9468078613281, 304.268798828125]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 8.0, 9.0, 4.0, 9.0, 12.0, 6.0, 21.0, 15.0, 18.0, 37.0, 28.0, 36.0, 42.0, 26.0, 34.0, 55.0, 61.0, 63.0, 94.0, 65.0, 50.0, 39.0, 34.0, 32.0, 31.0, 27.0, 30.0, 19.0, 14.0, 17.0, 19.0, 5.0, 10.0, 4.0, 5.0, 4.0, 6.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-347.7723388671875, -337.8692321777344, -327.96612548828125, -318.0630187988281, -308.159912109375, -298.2568054199219, -288.35369873046875, -278.45062255859375, -268.5474853515625, -258.6443786621094, -248.74127197265625, -238.83816528320312, -228.93505859375, -219.03195190429688, -209.1288604736328, -199.2257537841797, -189.32266235351562, -179.4195556640625, -169.51644897460938, -159.61334228515625, -149.71023559570312, -139.80712890625, -129.90403747558594, -120.00093078613281, -110.09782409667969, -100.19471740722656, -90.29161071777344, -80.38851165771484, -70.48540496826172, -60.582298278808594, -50.679195404052734, -40.776092529296875, -30.872955322265625, -20.969850540161133, -11.06674575805664, -1.1636409759521484, 8.739463806152344, 18.64257049560547, 28.545673370361328, 38.44877624511719, 48.35188293457031, 58.25498962402344, 68.15809631347656, 78.06119537353516, 87.96430206298828, 97.8674087524414, 107.7705078125, 117.67361450195312, 127.57672119140625, 137.47982788085938, 147.3829345703125, 157.28604125976562, 167.18914794921875, 177.09225463867188, 186.99534606933594, 196.89845275878906, 206.8015594482422, 216.7046661376953, 226.60777282714844, 236.51087951660156, 246.41397094726562, 256.31707763671875, 266.2201843261719, 276.123291015625, 286.0263977050781]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 5.0, 5.0, 14.0, 22.0, 37.0, 55.0, 120.0, 229.0, 470.0, 1176.0, 3073.0, 10243.0, 42843.0, 326889.0, 2895487.0, 813525.0, 77343.0, 15426.0, 4471.0, 1523.0, 670.0, 281.0, 147.0, 82.0, 53.0, 41.0, 14.0, 17.0, 10.0, 7.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.515625, -28.486083984375, -27.45654296875, -26.427001953125, -25.3974609375, -24.367919921875, -23.33837890625, -22.308837890625, -21.279296875, -20.249755859375, -19.22021484375, -18.190673828125, -17.1611328125, -16.131591796875, -15.10205078125, -14.072509765625, -13.04296875, -12.013427734375, -10.98388671875, -9.954345703125, -8.9248046875, -7.895263671875, -6.86572265625, -5.836181640625, -4.806640625, -3.777099609375, -2.74755859375, -1.718017578125, -0.6884765625, 0.341064453125, 1.37060546875, 2.400146484375, 3.4296875, 4.459228515625, 5.48876953125, 6.518310546875, 7.5478515625, 8.577392578125, 9.60693359375, 10.636474609375, 11.666015625, 12.695556640625, 13.72509765625, 14.754638671875, 15.7841796875, 16.813720703125, 17.84326171875, 18.872802734375, 19.90234375, 20.931884765625, 21.96142578125, 22.990966796875, 24.0205078125, 25.050048828125, 26.07958984375, 27.109130859375, 28.138671875, 29.168212890625, 30.19775390625, 31.227294921875, 32.2568359375, 33.286376953125, 34.31591796875, 35.345458984375, 36.375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 7.0, 10.0, 8.0, 13.0, 8.0, 19.0, 26.0, 31.0, 28.0, 43.0, 47.0, 48.0, 44.0, 55.0, 65.0, 59.0, 63.0, 54.0, 64.0, 44.0, 44.0, 44.0, 40.0, 31.0, 20.0, 25.0, 17.0, 13.0, 6.0, 6.0, 7.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-19.515625, -18.83740234375, -18.1591796875, -17.48095703125, -16.802734375, -16.12451171875, -15.4462890625, -14.76806640625, -14.08984375, -13.41162109375, -12.7333984375, -12.05517578125, -11.376953125, -10.69873046875, -10.0205078125, -9.34228515625, -8.6640625, -7.98583984375, -7.3076171875, -6.62939453125, -5.951171875, -5.27294921875, -4.5947265625, -3.91650390625, -3.23828125, -2.56005859375, -1.8818359375, -1.20361328125, -0.525390625, 0.15283203125, 0.8310546875, 1.50927734375, 2.1875, 2.86572265625, 3.5439453125, 4.22216796875, 4.900390625, 5.57861328125, 6.2568359375, 6.93505859375, 7.61328125, 8.29150390625, 8.9697265625, 9.64794921875, 10.326171875, 11.00439453125, 11.6826171875, 12.36083984375, 13.0390625, 13.71728515625, 14.3955078125, 15.07373046875, 15.751953125, 16.43017578125, 17.1083984375, 17.78662109375, 18.46484375, 19.14306640625, 19.8212890625, 20.49951171875, 21.177734375, 21.85595703125, 22.5341796875, 23.21240234375, 23.890625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 7.0, 8.0, 6.0, 13.0, 14.0, 17.0, 33.0, 58.0, 88.0, 157.0, 297.0, 664.0, 1554.0, 4203.0, 13980.0, 64304.0, 719418.0, 3113223.0, 223387.0, 36680.0, 9658.0, 3442.0, 1452.0, 674.0, 334.0, 230.0, 145.0, 81.0, 49.0, 35.0, 24.0, 15.0, 7.0, 12.0, 2.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-41.875, -40.578125, -39.28125, -37.984375, -36.6875, -35.390625, -34.09375, -32.796875, -31.5, -30.203125, -28.90625, -27.609375, -26.3125, -25.015625, -23.71875, -22.421875, -21.125, -19.828125, -18.53125, -17.234375, -15.9375, -14.640625, -13.34375, -12.046875, -10.75, -9.453125, -8.15625, -6.859375, -5.5625, -4.265625, -2.96875, -1.671875, -0.375, 0.921875, 2.21875, 3.515625, 4.8125, 6.109375, 7.40625, 8.703125, 10.0, 11.296875, 12.59375, 13.890625, 15.1875, 16.484375, 17.78125, 19.078125, 20.375, 21.671875, 22.96875, 24.265625, 25.5625, 26.859375, 28.15625, 29.453125, 30.75, 32.046875, 33.34375, 34.640625, 35.9375, 37.234375, 38.53125, 39.828125, 41.125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 3.0, 0.0, 6.0, 3.0, 5.0, 7.0, 7.0, 17.0, 15.0, 30.0, 50.0, 65.0, 143.0, 281.0, 551.0, 877.0, 847.0, 520.0, 246.0, 133.0, 86.0, 58.0, 40.0, 23.0, 19.0, 16.0, 10.0, 5.0, 8.0, 4.0, 0.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.625, -30.90234375, -29.1796875, -27.45703125, -25.734375, -24.01171875, -22.2890625, -20.56640625, -18.84375, -17.12109375, -15.3984375, -13.67578125, -11.953125, -10.23046875, -8.5078125, -6.78515625, -5.0625, -3.33984375, -1.6171875, 0.10546875, 1.828125, 3.55078125, 5.2734375, 6.99609375, 8.71875, 10.44140625, 12.1640625, 13.88671875, 15.609375, 17.33203125, 19.0546875, 20.77734375, 22.5, 24.22265625, 25.9453125, 27.66796875, 29.390625, 31.11328125, 32.8359375, 34.55859375, 36.28125, 38.00390625, 39.7265625, 41.44921875, 43.171875, 44.89453125, 46.6171875, 48.33984375, 50.0625, 51.78515625, 53.5078125, 55.23046875, 56.953125, 58.67578125, 60.3984375, 62.12109375, 63.84375, 65.56640625, 67.2890625, 69.01171875, 70.734375, 72.45703125, 74.1796875, 75.90234375, 77.625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 31.0, 64.0, 131.0, 216.0, 263.0, 143.0, 75.0, 31.0, 15.0, 5.0, 7.0, 4.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-428.302734375, -410.3797607421875, -392.456787109375, -374.5338439941406, -356.6108703613281, -338.6878967285156, -320.76495361328125, -302.84197998046875, -284.91900634765625, -266.99603271484375, -249.0730743408203, -231.15011596679688, -213.22714233398438, -195.30416870117188, -177.38121032714844, -159.458251953125, -141.5352783203125, -123.61231231689453, -105.68934631347656, -87.7663803100586, -69.84341430664062, -51.920448303222656, -33.99748229980469, -16.07451629638672, 1.84844970703125, 19.77141571044922, 37.69438171386719, 55.617347717285156, 73.54031372070312, 91.4632797241211, 109.38624572753906, 127.30921173095703, 145.23223876953125, 163.15521240234375, 181.0781707763672, 199.00112915039062, 216.92410278320312, 234.84707641601562, 252.77003479003906, 270.6929931640625, 288.615966796875, 306.5389404296875, 324.4619140625, 342.3848571777344, 360.3078308105469, 378.2308044433594, 396.15374755859375, 414.07672119140625, 431.99969482421875, 449.92266845703125, 467.84564208984375, 485.7685852050781, 503.6915588378906, 521.614501953125, 539.5374755859375, 557.46044921875, 575.3834228515625, 593.306396484375, 611.2293701171875, 629.15234375, 647.0753173828125, 664.9982299804688, 682.9212036132812, 700.8441772460938, 718.7671508789062]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 2.0, 3.0, 10.0, 11.0, 20.0, 13.0, 19.0, 40.0, 39.0, 50.0, 55.0, 52.0, 61.0, 66.0, 57.0, 71.0, 74.0, 67.0, 58.0, 54.0, 35.0, 32.0, 38.0, 20.0, 20.0, 12.0, 9.0, 8.0, 7.0, 3.0, 0.0, 0.0, 2.0, 3.0], "bins": [-404.4827880859375, -395.73114013671875, -386.9794921875, -378.22784423828125, -369.4761962890625, -360.72454833984375, -351.972900390625, -343.22125244140625, -334.4696044921875, -325.71795654296875, -316.96630859375, -308.21466064453125, -299.4630126953125, -290.71136474609375, -281.959716796875, -273.20806884765625, -264.4563903808594, -255.70474243164062, -246.95309448242188, -238.20144653320312, -229.44979858398438, -220.69815063476562, -211.9464874267578, -203.19483947753906, -194.4431915283203, -185.69154357910156, -176.9398956298828, -168.18824768066406, -159.43658447265625, -150.6849365234375, -141.93328857421875, -133.181640625, -124.43002319335938, -115.67837524414062, -106.92672729492188, -98.1750717163086, -89.42342376708984, -80.6717758178711, -71.92012023925781, -63.16847229003906, -54.41682434082031, -45.66517639160156, -36.91352462768555, -28.161874771118164, -19.41022491455078, -10.658576965332031, -1.9069252014160156, 6.8447265625, 15.59637451171875, 24.348024368286133, 33.099674224853516, 41.85132598876953, 50.60297393798828, 59.35462188720703, 68.10627746582031, 76.85792541503906, 85.60957336425781, 94.36122131347656, 103.11286926269531, 111.8645248413086, 120.61617279052734, 129.36782836914062, 138.11947631835938, 146.87112426757812, 155.62277221679688]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 11.0, 10.0, 14.0, 20.0, 35.0, 42.0, 54.0, 86.0, 141.0, 198.0, 360.0, 573.0, 1098.0, 1866.0, 3598.0, 6731.0, 13620.0, 30019.0, 71353.0, 190099.0, 372944.0, 212491.0, 79620.0, 33091.0, 14969.0, 7093.0, 3609.0, 1986.0, 1087.0, 638.0, 431.0, 245.0, 155.0, 78.0, 55.0, 51.0, 26.0, 19.0, 15.0, 9.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.609375, -30.607666015625, -29.60595703125, -28.604248046875, -27.6025390625, -26.600830078125, -25.59912109375, -24.597412109375, -23.595703125, -22.593994140625, -21.59228515625, -20.590576171875, -19.5888671875, -18.587158203125, -17.58544921875, -16.583740234375, -15.58203125, -14.580322265625, -13.57861328125, -12.576904296875, -11.5751953125, -10.573486328125, -9.57177734375, -8.570068359375, -7.568359375, -6.566650390625, -5.56494140625, -4.563232421875, -3.5615234375, -2.559814453125, -1.55810546875, -0.556396484375, 0.4453125, 1.447021484375, 2.44873046875, 3.450439453125, 4.4521484375, 5.453857421875, 6.45556640625, 7.457275390625, 8.458984375, 9.460693359375, 10.46240234375, 11.464111328125, 12.4658203125, 13.467529296875, 14.46923828125, 15.470947265625, 16.47265625, 17.474365234375, 18.47607421875, 19.477783203125, 20.4794921875, 21.481201171875, 22.48291015625, 23.484619140625, 24.486328125, 25.488037109375, 26.48974609375, 27.491455078125, 28.4931640625, 29.494873046875, 30.49658203125, 31.498291015625, 32.5]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 11.0, 14.0, 9.0, 14.0, 23.0, 18.0, 23.0, 32.0, 39.0, 43.0, 42.0, 67.0, 57.0, 50.0, 53.0, 78.0, 63.0, 55.0, 48.0, 61.0, 38.0, 29.0, 28.0, 22.0, 22.0, 18.0, 6.0, 5.0, 12.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-19.53125, -18.848388671875, -18.16552734375, -17.482666015625, -16.7998046875, -16.116943359375, -15.43408203125, -14.751220703125, -14.068359375, -13.385498046875, -12.70263671875, -12.019775390625, -11.3369140625, -10.654052734375, -9.97119140625, -9.288330078125, -8.60546875, -7.922607421875, -7.23974609375, -6.556884765625, -5.8740234375, -5.191162109375, -4.50830078125, -3.825439453125, -3.142578125, -2.459716796875, -1.77685546875, -1.093994140625, -0.4111328125, 0.271728515625, 0.95458984375, 1.637451171875, 2.3203125, 3.003173828125, 3.68603515625, 4.368896484375, 5.0517578125, 5.734619140625, 6.41748046875, 7.100341796875, 7.783203125, 8.466064453125, 9.14892578125, 9.831787109375, 10.5146484375, 11.197509765625, 11.88037109375, 12.563232421875, 13.24609375, 13.928955078125, 14.61181640625, 15.294677734375, 15.9775390625, 16.660400390625, 17.34326171875, 18.026123046875, 18.708984375, 19.391845703125, 20.07470703125, 20.757568359375, 21.4404296875, 22.123291015625, 22.80615234375, 23.489013671875, 24.171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 10.0, 15.0, 23.0, 32.0, 41.0, 63.0, 96.0, 156.0, 204.0, 369.0, 530.0, 866.0, 1657.0, 3743.0, 13423.0, 85766.0, 748121.0, 162616.0, 20902.0, 5027.0, 2028.0, 1063.0, 642.0, 378.0, 249.0, 163.0, 110.0, 76.0, 63.0, 29.0, 22.0, 15.0, 14.0, 7.0, 6.0, 7.0, 1.0, 6.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-77.0, -74.7109375, -72.421875, -70.1328125, -67.84375, -65.5546875, -63.265625, -60.9765625, -58.6875, -56.3984375, -54.109375, -51.8203125, -49.53125, -47.2421875, -44.953125, -42.6640625, -40.375, -38.0859375, -35.796875, -33.5078125, -31.21875, -28.9296875, -26.640625, -24.3515625, -22.0625, -19.7734375, -17.484375, -15.1953125, -12.90625, -10.6171875, -8.328125, -6.0390625, -3.75, -1.4609375, 0.828125, 3.1171875, 5.40625, 7.6953125, 9.984375, 12.2734375, 14.5625, 16.8515625, 19.140625, 21.4296875, 23.71875, 26.0078125, 28.296875, 30.5859375, 32.875, 35.1640625, 37.453125, 39.7421875, 42.03125, 44.3203125, 46.609375, 48.8984375, 51.1875, 53.4765625, 55.765625, 58.0546875, 60.34375, 62.6328125, 64.921875, 67.2109375, 69.5]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 1.0, 5.0, 6.0, 6.0, 5.0, 6.0, 6.0, 16.0, 15.0, 14.0, 17.0, 25.0, 36.0, 24.0, 32.0, 32.0, 50.0, 45.0, 40.0, 39.0, 47.0, 47.0, 53.0, 48.0, 52.0, 31.0, 39.0, 32.0, 36.0, 25.0, 19.0, 25.0, 27.0, 13.0, 19.0, 14.0, 14.0, 9.0, 10.0, 1.0, 7.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-69.1875, -67.2275390625, -65.267578125, -63.3076171875, -61.34765625, -59.3876953125, -57.427734375, -55.4677734375, -53.5078125, -51.5478515625, -49.587890625, -47.6279296875, -45.66796875, -43.7080078125, -41.748046875, -39.7880859375, -37.828125, -35.8681640625, -33.908203125, -31.9482421875, -29.98828125, -28.0283203125, -26.068359375, -24.1083984375, -22.1484375, -20.1884765625, -18.228515625, -16.2685546875, -14.30859375, -12.3486328125, -10.388671875, -8.4287109375, -6.46875, -4.5087890625, -2.548828125, -0.5888671875, 1.37109375, 3.3310546875, 5.291015625, 7.2509765625, 9.2109375, 11.1708984375, 13.130859375, 15.0908203125, 17.05078125, 19.0107421875, 20.970703125, 22.9306640625, 24.890625, 26.8505859375, 28.810546875, 30.7705078125, 32.73046875, 34.6904296875, 36.650390625, 38.6103515625, 40.5703125, 42.5302734375, 44.490234375, 46.4501953125, 48.41015625, 50.3701171875, 52.330078125, 54.2900390625, 56.25]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 9.0, 7.0, 12.0, 17.0, 19.0, 38.0, 43.0, 77.0, 92.0, 172.0, 375.0, 731.0, 2084.0, 8908.0, 64161.0, 776486.0, 171333.0, 18342.0, 3527.0, 1047.0, 456.0, 222.0, 134.0, 77.0, 45.0, 35.0, 31.0, 24.0, 14.0, 11.0, 8.0, 3.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.453125, -16.79931640625, -16.1455078125, -15.49169921875, -14.837890625, -14.18408203125, -13.5302734375, -12.87646484375, -12.22265625, -11.56884765625, -10.9150390625, -10.26123046875, -9.607421875, -8.95361328125, -8.2998046875, -7.64599609375, -6.9921875, -6.33837890625, -5.6845703125, -5.03076171875, -4.376953125, -3.72314453125, -3.0693359375, -2.41552734375, -1.76171875, -1.10791015625, -0.4541015625, 0.19970703125, 0.853515625, 1.50732421875, 2.1611328125, 2.81494140625, 3.46875, 4.12255859375, 4.7763671875, 5.43017578125, 6.083984375, 6.73779296875, 7.3916015625, 8.04541015625, 8.69921875, 9.35302734375, 10.0068359375, 10.66064453125, 11.314453125, 11.96826171875, 12.6220703125, 13.27587890625, 13.9296875, 14.58349609375, 15.2373046875, 15.89111328125, 16.544921875, 17.19873046875, 17.8525390625, 18.50634765625, 19.16015625, 19.81396484375, 20.4677734375, 21.12158203125, 21.775390625, 22.42919921875, 23.0830078125, 23.73681640625, 24.390625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 5.0, 6.0, 4.0, 3.0, 6.0, 7.0, 14.0, 10.0, 17.0, 12.0, 22.0, 27.0, 48.0, 48.0, 82.0, 119.0, 138.0, 111.0, 70.0, 48.0, 43.0, 26.0, 23.0, 17.0, 17.0, 22.0, 13.0, 8.0, 6.0, 6.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.00366973876953125, -0.003556668758392334, -0.003443598747253418, -0.003330528736114502, -0.003217458724975586, -0.00310438871383667, -0.002991318702697754, -0.002878248691558838, -0.002765178680419922, -0.002652108669281006, -0.00253903865814209, -0.002425968647003174, -0.002312898635864258, -0.002199828624725342, -0.0020867586135864258, -0.0019736886024475098, -0.0018606185913085938, -0.0017475485801696777, -0.0016344785690307617, -0.0015214085578918457, -0.0014083385467529297, -0.0012952685356140137, -0.0011821985244750977, -0.0010691285133361816, -0.0009560585021972656, -0.0008429884910583496, -0.0007299184799194336, -0.0006168484687805176, -0.0005037784576416016, -0.00039070844650268555, -0.00027763843536376953, -0.00016456842422485352, -5.14984130859375e-05, 6.157159805297852e-05, 0.00017464160919189453, 0.00028771162033081055, 0.00040078163146972656, 0.0005138516426086426, 0.0006269216537475586, 0.0007399916648864746, 0.0008530616760253906, 0.0009661316871643066, 0.0010792016983032227, 0.0011922717094421387, 0.0013053417205810547, 0.0014184117317199707, 0.0015314817428588867, 0.0016445517539978027, 0.0017576217651367188, 0.0018706917762756348, 0.0019837617874145508, 0.002096831798553467, 0.002209901809692383, 0.002322971820831299, 0.002436041831970215, 0.002549111843109131, 0.002662181854248047, 0.002775251865386963, 0.002888321876525879, 0.003001391887664795, 0.003114461898803711, 0.003227531909942627, 0.003340601921081543, 0.003453671932220459, 0.003566741943359375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 23.0, 16.0, 22.0, 39.0, 70.0, 167.0, 315.0, 547.0, 1277.0, 3435.0, 14415.0, 161009.0, 797280.0, 57896.0, 7933.0, 2291.0, 950.0, 427.0, 210.0, 101.0, 63.0, 23.0, 20.0, 7.0, 8.0, 5.0, 3.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.453125, -21.8173828125, -21.181640625, -20.5458984375, -19.91015625, -19.2744140625, -18.638671875, -18.0029296875, -17.3671875, -16.7314453125, -16.095703125, -15.4599609375, -14.82421875, -14.1884765625, -13.552734375, -12.9169921875, -12.28125, -11.6455078125, -11.009765625, -10.3740234375, -9.73828125, -9.1025390625, -8.466796875, -7.8310546875, -7.1953125, -6.5595703125, -5.923828125, -5.2880859375, -4.65234375, -4.0166015625, -3.380859375, -2.7451171875, -2.109375, -1.4736328125, -0.837890625, -0.2021484375, 0.43359375, 1.0693359375, 1.705078125, 2.3408203125, 2.9765625, 3.6123046875, 4.248046875, 4.8837890625, 5.51953125, 6.1552734375, 6.791015625, 7.4267578125, 8.0625, 8.6982421875, 9.333984375, 9.9697265625, 10.60546875, 11.2412109375, 11.876953125, 12.5126953125, 13.1484375, 13.7841796875, 14.419921875, 15.0556640625, 15.69140625, 16.3271484375, 16.962890625, 17.5986328125, 18.234375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 3.0, 9.0, 9.0, 9.0, 24.0, 13.0, 11.0, 16.0, 28.0, 39.0, 37.0, 61.0, 59.0, 70.0, 79.0, 65.0, 90.0, 61.0, 52.0, 38.0, 45.0, 34.0, 27.0, 28.0, 20.0, 7.0, 16.0, 7.0, 11.0, 5.0, 6.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.46875, -10.099853515625, -9.73095703125, -9.362060546875, -8.9931640625, -8.624267578125, -8.25537109375, -7.886474609375, -7.517578125, -7.148681640625, -6.77978515625, -6.410888671875, -6.0419921875, -5.673095703125, -5.30419921875, -4.935302734375, -4.56640625, -4.197509765625, -3.82861328125, -3.459716796875, -3.0908203125, -2.721923828125, -2.35302734375, -1.984130859375, -1.615234375, -1.246337890625, -0.87744140625, -0.508544921875, -0.1396484375, 0.229248046875, 0.59814453125, 0.967041015625, 1.3359375, 1.704833984375, 2.07373046875, 2.442626953125, 2.8115234375, 3.180419921875, 3.54931640625, 3.918212890625, 4.287109375, 4.656005859375, 5.02490234375, 5.393798828125, 5.7626953125, 6.131591796875, 6.50048828125, 6.869384765625, 7.23828125, 7.607177734375, 7.97607421875, 8.344970703125, 8.7138671875, 9.082763671875, 9.45166015625, 9.820556640625, 10.189453125, 10.558349609375, 10.92724609375, 11.296142578125, 11.6650390625, 12.033935546875, 12.40283203125, 12.771728515625, 13.140625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 6.0, 14.0, 39.0, 65.0, 182.0, 284.0, 193.0, 107.0, 49.0, 23.0, 11.0, 8.0, 6.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-566.0093383789062, -550.6088256835938, -535.2083740234375, -519.807861328125, -504.4073791503906, -489.00689697265625, -473.6064147949219, -458.2059326171875, -442.805419921875, -427.4049377441406, -412.00445556640625, -396.60394287109375, -381.2034606933594, -365.802978515625, -350.4024963378906, -335.00201416015625, -319.60150146484375, -304.2010192871094, -288.800537109375, -273.4000244140625, -257.9995422363281, -242.59906005859375, -227.19857788085938, -211.79808044433594, -196.39761352539062, -180.99713134765625, -165.5966339111328, -150.19615173339844, -134.795654296875, -119.39517211914062, -103.99468231201172, -88.59419250488281, -73.19369506835938, -57.79320526123047, -42.39271545410156, -26.992229461669922, -11.591739654541016, 3.808746337890625, 19.20923614501953, 34.60972595214844, 50.010215759277344, 65.41070556640625, 80.81119537353516, 96.21168518066406, 111.61216735839844, 127.01265716552734, 142.41314697265625, 157.81362915039062, 173.21412658691406, 188.61460876464844, 204.01510620117188, 219.41558837890625, 234.8160858154297, 250.21656799316406, 265.6170654296875, 281.0175476074219, 296.41802978515625, 311.8185119628906, 327.218994140625, 342.6195068359375, 358.0199890136719, 373.42047119140625, 388.8209533691406, 404.221435546875, 419.6219482421875]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 5.0, 1.0, 6.0, 3.0, 4.0, 10.0, 13.0, 12.0, 10.0, 21.0, 23.0, 24.0, 17.0, 26.0, 30.0, 24.0, 29.0, 34.0, 38.0, 48.0, 58.0, 72.0, 65.0, 52.0, 44.0, 41.0, 30.0, 38.0, 34.0, 25.0, 21.0, 26.0, 15.0, 17.0, 14.0, 17.0, 11.0, 10.0, 6.0, 8.0, 4.0, 6.0, 3.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-199.12289428710938, -191.53216552734375, -183.94142150878906, -176.35069274902344, -168.75994873046875, -161.16921997070312, -153.5784912109375, -145.9877471923828, -138.3970184326172, -130.80628967285156, -123.21554565429688, -115.62481689453125, -108.0340805053711, -100.44334411621094, -92.85260772705078, -85.26187133789062, -77.67113494873047, -70.08039855957031, -62.48966598510742, -54.898929595947266, -47.308197021484375, -39.71746063232422, -32.12672424316406, -24.535991668701172, -16.945255279541016, -9.354520797729492, -1.7637853622436523, 5.8269500732421875, 13.417684555053711, 21.008419036865234, 28.59915542602539, 36.18988800048828, 43.78062438964844, 51.371360778808594, 58.962093353271484, 66.55282592773438, 74.14356231689453, 81.73429870605469, 89.32503509521484, 96.915771484375, 104.50650024414062, 112.09723663330078, 119.68797302246094, 127.27870178222656, 134.86944580078125, 142.46017456054688, 150.0509033203125, 157.6416473388672, 165.23239135742188, 172.8231201171875, 180.4138641357422, 188.0045928955078, 195.5953369140625, 203.18606567382812, 210.77679443359375, 218.36753845214844, 225.95826721191406, 233.5489959716797, 241.13973999023438, 248.73046875, 256.3211975097656, 263.91192626953125, 271.502685546875, 279.0934143066406, 286.68414306640625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 3.0, 5.0, 6.0, 12.0, 22.0, 20.0, 20.0, 43.0, 60.0, 68.0, 96.0, 165.0, 274.0, 484.0, 878.0, 1573.0, 3396.0, 7974.0, 24701.0, 124338.0, 1216053.0, 2452150.0, 297871.0, 43155.0, 11485.0, 4564.0, 2169.0, 1064.0, 610.0, 380.0, 217.0, 128.0, 84.0, 52.0, 35.0, 34.0, 25.0, 21.0, 9.0, 12.0, 6.0, 3.0, 0.0, 4.0, 3.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.65625, -24.833984375, -24.01171875, -23.189453125, -22.3671875, -21.544921875, -20.72265625, -19.900390625, -19.078125, -18.255859375, -17.43359375, -16.611328125, -15.7890625, -14.966796875, -14.14453125, -13.322265625, -12.5, -11.677734375, -10.85546875, -10.033203125, -9.2109375, -8.388671875, -7.56640625, -6.744140625, -5.921875, -5.099609375, -4.27734375, -3.455078125, -2.6328125, -1.810546875, -0.98828125, -0.166015625, 0.65625, 1.478515625, 2.30078125, 3.123046875, 3.9453125, 4.767578125, 5.58984375, 6.412109375, 7.234375, 8.056640625, 8.87890625, 9.701171875, 10.5234375, 11.345703125, 12.16796875, 12.990234375, 13.8125, 14.634765625, 15.45703125, 16.279296875, 17.1015625, 17.923828125, 18.74609375, 19.568359375, 20.390625, 21.212890625, 22.03515625, 22.857421875, 23.6796875, 24.501953125, 25.32421875, 26.146484375, 26.96875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 7.0, 6.0, 11.0, 13.0, 12.0, 28.0, 18.0, 22.0, 28.0, 38.0, 46.0, 50.0, 47.0, 65.0, 64.0, 53.0, 47.0, 57.0, 66.0, 61.0, 48.0, 40.0, 33.0, 22.0, 22.0, 34.0, 21.0, 11.0, 6.0, 8.0, 8.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.640625, -17.972412109375, -17.30419921875, -16.635986328125, -15.9677734375, -15.299560546875, -14.63134765625, -13.963134765625, -13.294921875, -12.626708984375, -11.95849609375, -11.290283203125, -10.6220703125, -9.953857421875, -9.28564453125, -8.617431640625, -7.94921875, -7.281005859375, -6.61279296875, -5.944580078125, -5.2763671875, -4.608154296875, -3.93994140625, -3.271728515625, -2.603515625, -1.935302734375, -1.26708984375, -0.598876953125, 0.0693359375, 0.737548828125, 1.40576171875, 2.073974609375, 2.7421875, 3.410400390625, 4.07861328125, 4.746826171875, 5.4150390625, 6.083251953125, 6.75146484375, 7.419677734375, 8.087890625, 8.756103515625, 9.42431640625, 10.092529296875, 10.7607421875, 11.428955078125, 12.09716796875, 12.765380859375, 13.43359375, 14.101806640625, 14.77001953125, 15.438232421875, 16.1064453125, 16.774658203125, 17.44287109375, 18.111083984375, 18.779296875, 19.447509765625, 20.11572265625, 20.783935546875, 21.4521484375, 22.120361328125, 22.78857421875, 23.456787109375, 24.125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 3.0, 7.0, 7.0, 15.0, 15.0, 35.0, 45.0, 60.0, 114.0, 210.0, 432.0, 1112.0, 3151.0, 11685.0, 72234.0, 2225509.0, 1798473.0, 64908.0, 11227.0, 3010.0, 1031.0, 435.0, 211.0, 123.0, 67.0, 62.0, 37.0, 16.0, 21.0, 11.0, 5.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.8125, -33.3603515625, -31.908203125, -30.4560546875, -29.00390625, -27.5517578125, -26.099609375, -24.6474609375, -23.1953125, -21.7431640625, -20.291015625, -18.8388671875, -17.38671875, -15.9345703125, -14.482421875, -13.0302734375, -11.578125, -10.1259765625, -8.673828125, -7.2216796875, -5.76953125, -4.3173828125, -2.865234375, -1.4130859375, 0.0390625, 1.4912109375, 2.943359375, 4.3955078125, 5.84765625, 7.2998046875, 8.751953125, 10.2041015625, 11.65625, 13.1083984375, 14.560546875, 16.0126953125, 17.46484375, 18.9169921875, 20.369140625, 21.8212890625, 23.2734375, 24.7255859375, 26.177734375, 27.6298828125, 29.08203125, 30.5341796875, 31.986328125, 33.4384765625, 34.890625, 36.3427734375, 37.794921875, 39.2470703125, 40.69921875, 42.1513671875, 43.603515625, 45.0556640625, 46.5078125, 47.9599609375, 49.412109375, 50.8642578125, 52.31640625, 53.7685546875, 55.220703125, 56.6728515625, 58.125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 8.0, 10.0, 15.0, 19.0, 24.0, 30.0, 47.0, 85.0, 134.0, 210.0, 393.0, 632.0, 790.0, 639.0, 434.0, 210.0, 140.0, 73.0, 48.0, 26.0, 23.0, 30.0, 13.0, 9.0, 5.0, 6.0, 3.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.5625, -29.32080078125, -28.0791015625, -26.83740234375, -25.595703125, -24.35400390625, -23.1123046875, -21.87060546875, -20.62890625, -19.38720703125, -18.1455078125, -16.90380859375, -15.662109375, -14.42041015625, -13.1787109375, -11.93701171875, -10.6953125, -9.45361328125, -8.2119140625, -6.97021484375, -5.728515625, -4.48681640625, -3.2451171875, -2.00341796875, -0.76171875, 0.47998046875, 1.7216796875, 2.96337890625, 4.205078125, 5.44677734375, 6.6884765625, 7.93017578125, 9.171875, 10.41357421875, 11.6552734375, 12.89697265625, 14.138671875, 15.38037109375, 16.6220703125, 17.86376953125, 19.10546875, 20.34716796875, 21.5888671875, 22.83056640625, 24.072265625, 25.31396484375, 26.5556640625, 27.79736328125, 29.0390625, 30.28076171875, 31.5224609375, 32.76416015625, 34.005859375, 35.24755859375, 36.4892578125, 37.73095703125, 38.97265625, 40.21435546875, 41.4560546875, 42.69775390625, 43.939453125, 45.18115234375, 46.4228515625, 47.66455078125, 48.90625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 14.0, 37.0, 157.0, 356.0, 287.0, 99.0, 24.0, 13.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-724.652587890625, -702.5910034179688, -680.5293579101562, -658.4677734375, -636.4061279296875, -614.3445434570312, -592.282958984375, -570.2213134765625, -548.1597290039062, -526.09814453125, -504.0364990234375, -481.97491455078125, -459.9132995605469, -437.8516845703125, -415.7900695800781, -393.72845458984375, -371.6668395996094, -349.605224609375, -327.5436096191406, -305.48199462890625, -283.42041015625, -261.3587951660156, -239.29718017578125, -217.23558044433594, -195.17396545410156, -173.1123504638672, -151.05075073242188, -128.9891357421875, -106.92752838134766, -84.86592102050781, -62.80430603027344, -40.742706298828125, -18.68109130859375, 3.3805179595947266, 25.442127227783203, 47.50373840332031, 69.56534576416016, 91.626953125, 113.68856811523438, 135.7501678466797, 157.81178283691406, 179.87339782714844, 201.93499755859375, 223.99661254882812, 246.0582275390625, 268.11981201171875, 290.18145751953125, 312.2430419921875, 334.3046569824219, 356.36627197265625, 378.4278869628906, 400.489501953125, 422.55108642578125, 444.6127014160156, 466.67431640625, 488.73590087890625, 510.79754638671875, 532.859130859375, 554.9207763671875, 576.9823608398438, 599.0440063476562, 621.1055908203125, 643.167236328125, 665.2288208007812, 687.2904052734375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 6.0, 13.0, 8.0, 16.0, 13.0, 19.0, 17.0, 13.0, 27.0, 38.0, 35.0, 30.0, 35.0, 43.0, 43.0, 41.0, 55.0, 50.0, 45.0, 58.0, 48.0, 42.0, 41.0, 45.0, 24.0, 24.0, 30.0, 23.0, 15.0, 12.0, 21.0, 13.0, 15.0, 9.0, 6.0, 6.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-146.69329833984375, -141.41461181640625, -136.13592529296875, -130.85723876953125, -125.57854461669922, -120.29985809326172, -115.02116394042969, -109.74247741699219, -104.46379089355469, -99.18510437011719, -93.90641784667969, -88.62772369384766, -83.34903717041016, -78.07035064697266, -72.79165649414062, -67.51296997070312, -62.234283447265625, -56.955596923828125, -51.67690658569336, -46.398216247558594, -41.119529724121094, -35.840843200683594, -30.562152862548828, -25.283462524414062, -20.004776000976562, -14.72608757019043, -9.447399139404297, -4.168710708618164, 1.1099777221679688, 6.388666152954102, 11.667354583740234, 16.946044921875, 22.2247314453125, 27.503419876098633, 32.782108306884766, 38.06079864501953, 43.33948516845703, 48.61817169189453, 53.8968620300293, 59.17555236816406, 64.45423889160156, 69.73292541503906, 75.01161193847656, 80.2903060913086, 85.5689926147461, 90.8476791381836, 96.12637329101562, 101.40505981445312, 106.68374633789062, 111.96243286132812, 117.24111938476562, 122.51981353759766, 127.79850006103516, 133.0771942138672, 138.3558807373047, 143.6345672607422, 148.9132537841797, 154.1919403076172, 159.4706268310547, 164.7493133544922, 170.02801513671875, 175.30670166015625, 180.58538818359375, 185.86407470703125, 191.14276123046875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 6.0, 3.0, 5.0, 6.0, 6.0, 9.0, 22.0, 28.0, 45.0, 49.0, 98.0, 129.0, 223.0, 418.0, 755.0, 1435.0, 3012.0, 6507.0, 15646.0, 42884.0, 126853.0, 319138.0, 325674.0, 131781.0, 44615.0, 16171.0, 6740.0, 3004.0, 1442.0, 791.0, 415.0, 226.0, 141.0, 81.0, 61.0, 52.0, 25.0, 23.0, 9.0, 10.0, 7.0, 5.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.375, -23.56298828125, -22.7509765625, -21.93896484375, -21.126953125, -20.31494140625, -19.5029296875, -18.69091796875, -17.87890625, -17.06689453125, -16.2548828125, -15.44287109375, -14.630859375, -13.81884765625, -13.0068359375, -12.19482421875, -11.3828125, -10.57080078125, -9.7587890625, -8.94677734375, -8.134765625, -7.32275390625, -6.5107421875, -5.69873046875, -4.88671875, -4.07470703125, -3.2626953125, -2.45068359375, -1.638671875, -0.82666015625, -0.0146484375, 0.79736328125, 1.609375, 2.42138671875, 3.2333984375, 4.04541015625, 4.857421875, 5.66943359375, 6.4814453125, 7.29345703125, 8.10546875, 8.91748046875, 9.7294921875, 10.54150390625, 11.353515625, 12.16552734375, 12.9775390625, 13.78955078125, 14.6015625, 15.41357421875, 16.2255859375, 17.03759765625, 17.849609375, 18.66162109375, 19.4736328125, 20.28564453125, 21.09765625, 21.90966796875, 22.7216796875, 23.53369140625, 24.345703125, 25.15771484375, 25.9697265625, 26.78173828125, 27.59375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 7.0, 7.0, 12.0, 12.0, 15.0, 17.0, 18.0, 30.0, 29.0, 35.0, 41.0, 60.0, 59.0, 54.0, 67.0, 47.0, 51.0, 46.0, 56.0, 42.0, 42.0, 44.0, 33.0, 33.0, 27.0, 28.0, 21.0, 13.0, 17.0, 6.0, 7.0, 7.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.109375, -16.468994140625, -15.82861328125, -15.188232421875, -14.5478515625, -13.907470703125, -13.26708984375, -12.626708984375, -11.986328125, -11.345947265625, -10.70556640625, -10.065185546875, -9.4248046875, -8.784423828125, -8.14404296875, -7.503662109375, -6.86328125, -6.222900390625, -5.58251953125, -4.942138671875, -4.3017578125, -3.661376953125, -3.02099609375, -2.380615234375, -1.740234375, -1.099853515625, -0.45947265625, 0.180908203125, 0.8212890625, 1.461669921875, 2.10205078125, 2.742431640625, 3.3828125, 4.023193359375, 4.66357421875, 5.303955078125, 5.9443359375, 6.584716796875, 7.22509765625, 7.865478515625, 8.505859375, 9.146240234375, 9.78662109375, 10.427001953125, 11.0673828125, 11.707763671875, 12.34814453125, 12.988525390625, 13.62890625, 14.269287109375, 14.90966796875, 15.550048828125, 16.1904296875, 16.830810546875, 17.47119140625, 18.111572265625, 18.751953125, 19.392333984375, 20.03271484375, 20.673095703125, 21.3134765625, 21.953857421875, 22.59423828125, 23.234619140625, 23.875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 4.0, 9.0, 16.0, 25.0, 39.0, 51.0, 81.0, 146.0, 308.0, 714.0, 2034.0, 7183.0, 37290.0, 298868.0, 621885.0, 64353.0, 10954.0, 2798.0, 925.0, 408.0, 184.0, 115.0, 59.0, 31.0, 19.0, 15.0, 11.0, 8.0, 6.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.0625, -48.4013671875, -46.740234375, -45.0791015625, -43.41796875, -41.7568359375, -40.095703125, -38.4345703125, -36.7734375, -35.1123046875, -33.451171875, -31.7900390625, -30.12890625, -28.4677734375, -26.806640625, -25.1455078125, -23.484375, -21.8232421875, -20.162109375, -18.5009765625, -16.83984375, -15.1787109375, -13.517578125, -11.8564453125, -10.1953125, -8.5341796875, -6.873046875, -5.2119140625, -3.55078125, -1.8896484375, -0.228515625, 1.4326171875, 3.09375, 4.7548828125, 6.416015625, 8.0771484375, 9.73828125, 11.3994140625, 13.060546875, 14.7216796875, 16.3828125, 18.0439453125, 19.705078125, 21.3662109375, 23.02734375, 24.6884765625, 26.349609375, 28.0107421875, 29.671875, 31.3330078125, 32.994140625, 34.6552734375, 36.31640625, 37.9775390625, 39.638671875, 41.2998046875, 42.9609375, 44.6220703125, 46.283203125, 47.9443359375, 49.60546875, 51.2666015625, 52.927734375, 54.5888671875, 56.25]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 7.0, 6.0, 9.0, 15.0, 24.0, 17.0, 18.0, 24.0, 31.0, 26.0, 32.0, 44.0, 47.0, 44.0, 48.0, 50.0, 47.0, 42.0, 36.0, 50.0, 42.0, 50.0, 45.0, 39.0, 35.0, 29.0, 28.0, 19.0, 16.0, 13.0, 12.0, 12.0, 6.0, 4.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 3.0], "bins": [-73.125, -71.17919921875, -69.2333984375, -67.28759765625, -65.341796875, -63.39599609375, -61.4501953125, -59.50439453125, -57.55859375, -55.61279296875, -53.6669921875, -51.72119140625, -49.775390625, -47.82958984375, -45.8837890625, -43.93798828125, -41.9921875, -40.04638671875, -38.1005859375, -36.15478515625, -34.208984375, -32.26318359375, -30.3173828125, -28.37158203125, -26.42578125, -24.47998046875, -22.5341796875, -20.58837890625, -18.642578125, -16.69677734375, -14.7509765625, -12.80517578125, -10.859375, -8.91357421875, -6.9677734375, -5.02197265625, -3.076171875, -1.13037109375, 0.8154296875, 2.76123046875, 4.70703125, 6.65283203125, 8.5986328125, 10.54443359375, 12.490234375, 14.43603515625, 16.3818359375, 18.32763671875, 20.2734375, 22.21923828125, 24.1650390625, 26.11083984375, 28.056640625, 30.00244140625, 31.9482421875, 33.89404296875, 35.83984375, 37.78564453125, 39.7314453125, 41.67724609375, 43.623046875, 45.56884765625, 47.5146484375, 49.46044921875, 51.40625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 4.0, 6.0, 8.0, 9.0, 11.0, 25.0, 39.0, 58.0, 84.0, 145.0, 283.0, 582.0, 1147.0, 3358.0, 11381.0, 50913.0, 287257.0, 591155.0, 78452.0, 16296.0, 4434.0, 1496.0, 646.0, 283.0, 152.0, 105.0, 61.0, 39.0, 34.0, 26.0, 15.0, 10.0, 7.0, 7.0, 4.0, 6.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-10.796875, -10.498046875, -10.19921875, -9.900390625, -9.6015625, -9.302734375, -9.00390625, -8.705078125, -8.40625, -8.107421875, -7.80859375, -7.509765625, -7.2109375, -6.912109375, -6.61328125, -6.314453125, -6.015625, -5.716796875, -5.41796875, -5.119140625, -4.8203125, -4.521484375, -4.22265625, -3.923828125, -3.625, -3.326171875, -3.02734375, -2.728515625, -2.4296875, -2.130859375, -1.83203125, -1.533203125, -1.234375, -0.935546875, -0.63671875, -0.337890625, -0.0390625, 0.259765625, 0.55859375, 0.857421875, 1.15625, 1.455078125, 1.75390625, 2.052734375, 2.3515625, 2.650390625, 2.94921875, 3.248046875, 3.546875, 3.845703125, 4.14453125, 4.443359375, 4.7421875, 5.041015625, 5.33984375, 5.638671875, 5.9375, 6.236328125, 6.53515625, 6.833984375, 7.1328125, 7.431640625, 7.73046875, 8.029296875, 8.328125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 4.0, 3.0, 8.0, 12.0, 7.0, 10.0, 9.0, 29.0, 35.0, 50.0, 65.0, 80.0, 107.0, 135.0, 115.0, 103.0, 60.0, 47.0, 38.0, 18.0, 22.0, 14.0, 3.0, 9.0, 4.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023784637451171875, -0.0023027658462524414, -0.0022270679473876953, -0.0021513700485229492, -0.002075672149658203, -0.001999974250793457, -0.001924276351928711, -0.0018485784530639648, -0.0017728805541992188, -0.0016971826553344727, -0.0016214847564697266, -0.0015457868576049805, -0.0014700889587402344, -0.0013943910598754883, -0.0013186931610107422, -0.001242995262145996, -0.00116729736328125, -0.001091599464416504, -0.0010159015655517578, -0.0009402036666870117, -0.0008645057678222656, -0.0007888078689575195, -0.0007131099700927734, -0.0006374120712280273, -0.0005617141723632812, -0.00048601627349853516, -0.00041031837463378906, -0.00033462047576904297, -0.0002589225769042969, -0.00018322467803955078, -0.00010752677917480469, -3.1828880310058594e-05, 4.38690185546875e-05, 0.0001195669174194336, 0.0001952648162841797, 0.0002709627151489258, 0.0003466606140136719, 0.00042235851287841797, 0.0004980564117431641, 0.0005737543106079102, 0.0006494522094726562, 0.0007251501083374023, 0.0008008480072021484, 0.0008765459060668945, 0.0009522438049316406, 0.0010279417037963867, 0.0011036396026611328, 0.001179337501525879, 0.001255035400390625, 0.001330733299255371, 0.0014064311981201172, 0.0014821290969848633, 0.0015578269958496094, 0.0016335248947143555, 0.0017092227935791016, 0.0017849206924438477, 0.0018606185913085938, 0.0019363164901733398, 0.002012014389038086, 0.002087712287902832, 0.002163410186767578, 0.0022391080856323242, 0.0023148059844970703, 0.0023905038833618164, 0.0024662017822265625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 8.0, 6.0, 10.0, 10.0, 11.0, 19.0, 32.0, 39.0, 53.0, 94.0, 160.0, 341.0, 707.0, 1543.0, 4042.0, 13263.0, 61250.0, 481474.0, 405758.0, 59754.0, 12928.0, 4072.0, 1516.0, 671.0, 323.0, 185.0, 103.0, 59.0, 38.0, 26.0, 18.0, 12.0, 11.0, 5.0, 2.0, 3.0, 2.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.25, -7.919921875, -7.58984375, -7.259765625, -6.9296875, -6.599609375, -6.26953125, -5.939453125, -5.609375, -5.279296875, -4.94921875, -4.619140625, -4.2890625, -3.958984375, -3.62890625, -3.298828125, -2.96875, -2.638671875, -2.30859375, -1.978515625, -1.6484375, -1.318359375, -0.98828125, -0.658203125, -0.328125, 0.001953125, 0.33203125, 0.662109375, 0.9921875, 1.322265625, 1.65234375, 1.982421875, 2.3125, 2.642578125, 2.97265625, 3.302734375, 3.6328125, 3.962890625, 4.29296875, 4.623046875, 4.953125, 5.283203125, 5.61328125, 5.943359375, 6.2734375, 6.603515625, 6.93359375, 7.263671875, 7.59375, 7.923828125, 8.25390625, 8.583984375, 8.9140625, 9.244140625, 9.57421875, 9.904296875, 10.234375, 10.564453125, 10.89453125, 11.224609375, 11.5546875, 11.884765625, 12.21484375, 12.544921875, 12.875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 9.0, 7.0, 11.0, 11.0, 6.0, 17.0, 21.0, 27.0, 27.0, 43.0, 46.0, 52.0, 55.0, 70.0, 69.0, 68.0, 69.0, 61.0, 66.0, 56.0, 38.0, 23.0, 30.0, 16.0, 19.0, 10.0, 14.0, 10.0, 11.0, 4.0, 4.0, 6.0, 8.0, 2.0, 2.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.078125, -6.827392578125, -6.57666015625, -6.325927734375, -6.0751953125, -5.824462890625, -5.57373046875, -5.322998046875, -5.072265625, -4.821533203125, -4.57080078125, -4.320068359375, -4.0693359375, -3.818603515625, -3.56787109375, -3.317138671875, -3.06640625, -2.815673828125, -2.56494140625, -2.314208984375, -2.0634765625, -1.812744140625, -1.56201171875, -1.311279296875, -1.060546875, -0.809814453125, -0.55908203125, -0.308349609375, -0.0576171875, 0.193115234375, 0.44384765625, 0.694580078125, 0.9453125, 1.196044921875, 1.44677734375, 1.697509765625, 1.9482421875, 2.198974609375, 2.44970703125, 2.700439453125, 2.951171875, 3.201904296875, 3.45263671875, 3.703369140625, 3.9541015625, 4.204833984375, 4.45556640625, 4.706298828125, 4.95703125, 5.207763671875, 5.45849609375, 5.709228515625, 5.9599609375, 6.210693359375, 6.46142578125, 6.712158203125, 6.962890625, 7.213623046875, 7.46435546875, 7.715087890625, 7.9658203125, 8.216552734375, 8.46728515625, 8.718017578125, 8.96875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 5.0, 14.0, 17.0, 39.0, 89.0, 168.0, 310.0, 181.0, 98.0, 33.0, 27.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-606.7669677734375, -594.0113525390625, -581.2557373046875, -568.5000610351562, -555.7444458007812, -542.9888305664062, -530.2332153320312, -517.4776000976562, -504.7219543457031, -491.9663391113281, -479.210693359375, -466.455078125, -453.699462890625, -440.9438171386719, -428.1882019042969, -415.43255615234375, -402.67694091796875, -389.92132568359375, -377.1656799316406, -364.4100646972656, -351.6544189453125, -338.8988037109375, -326.1431884765625, -313.3875732421875, -300.6319274902344, -287.8763122558594, -275.12066650390625, -262.36505126953125, -249.6094207763672, -236.85379028320312, -224.09817504882812, -211.34254455566406, -198.58688354492188, -185.8312530517578, -173.07562255859375, -160.32000732421875, -147.5643768310547, -134.80874633789062, -122.0531234741211, -109.29750061035156, -96.5418701171875, -83.78623962402344, -71.0306167602539, -58.27499008178711, -45.51936340332031, -32.763736724853516, -20.00811004638672, -7.2524871826171875, 5.503143310546875, 18.258769989013672, 31.01439666748047, 43.770023345947266, 56.52565002441406, 69.28128051757812, 82.03690338134766, 94.79252624511719, 107.54815673828125, 120.30378723144531, 133.05941772460938, 145.81503295898438, 158.57066345214844, 171.3262939453125, 184.0819091796875, 196.83753967285156, 209.59317016601562]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 9.0, 8.0, 9.0, 11.0, 11.0, 11.0, 17.0, 24.0, 17.0, 29.0, 28.0, 35.0, 33.0, 33.0, 46.0, 49.0, 79.0, 86.0, 84.0, 41.0, 44.0, 32.0, 31.0, 33.0, 22.0, 29.0, 33.0, 13.0, 13.0, 17.0, 12.0, 6.0, 11.0, 9.0, 8.0, 9.0, 1.0, 5.0, 6.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-220.49673461914062, -212.74285888671875, -204.9889678955078, -197.23509216308594, -189.48121643066406, -181.72732543945312, -173.97344970703125, -166.21957397460938, -158.46568298339844, -150.71180725097656, -142.95791625976562, -135.20404052734375, -127.45015716552734, -119.69627380371094, -111.94239807128906, -104.18851470947266, -96.43463897705078, -88.68075561523438, -80.9268798828125, -73.1729965209961, -65.41911315917969, -57.66523361206055, -49.911354064941406, -42.157470703125, -34.40359115600586, -26.649709701538086, -18.895828247070312, -11.141948699951172, -3.3880672454833984, 4.365814208984375, 12.119693756103516, 19.873577117919922, 27.627456665039062, 35.3813362121582, 43.13521957397461, 50.88909912109375, 58.642982482910156, 66.39686584472656, 74.15074157714844, 81.90462493896484, 89.65850830078125, 97.41239166259766, 105.16626739501953, 112.92015075683594, 120.67403411865234, 128.42791748046875, 136.18179321289062, 143.9356689453125, 151.68954467773438, 159.44342041015625, 167.1973114013672, 174.95118713378906, 182.70506286621094, 190.45895385742188, 198.21282958984375, 205.96670532226562, 213.72059631347656, 221.47447204589844, 229.22836303710938, 236.98223876953125, 244.73611450195312, 252.49000549316406, 260.243896484375, 267.9977722167969, 275.75164794921875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 9.0, 8.0, 14.0, 14.0, 25.0, 33.0, 44.0, 88.0, 137.0, 222.0, 362.0, 639.0, 1305.0, 2677.0, 5859.0, 14531.0, 45595.0, 197626.0, 991298.0, 2075615.0, 668873.0, 136142.0, 33735.0, 10826.0, 4293.0, 1928.0, 978.0, 579.0, 303.0, 172.0, 109.0, 76.0, 42.0, 33.0, 22.0, 13.0, 13.0, 14.0, 8.0, 1.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.640625, -15.14208984375, -14.6435546875, -14.14501953125, -13.646484375, -13.14794921875, -12.6494140625, -12.15087890625, -11.65234375, -11.15380859375, -10.6552734375, -10.15673828125, -9.658203125, -9.15966796875, -8.6611328125, -8.16259765625, -7.6640625, -7.16552734375, -6.6669921875, -6.16845703125, -5.669921875, -5.17138671875, -4.6728515625, -4.17431640625, -3.67578125, -3.17724609375, -2.6787109375, -2.18017578125, -1.681640625, -1.18310546875, -0.6845703125, -0.18603515625, 0.3125, 0.81103515625, 1.3095703125, 1.80810546875, 2.306640625, 2.80517578125, 3.3037109375, 3.80224609375, 4.30078125, 4.79931640625, 5.2978515625, 5.79638671875, 6.294921875, 6.79345703125, 7.2919921875, 7.79052734375, 8.2890625, 8.78759765625, 9.2861328125, 9.78466796875, 10.283203125, 10.78173828125, 11.2802734375, 11.77880859375, 12.27734375, 12.77587890625, 13.2744140625, 13.77294921875, 14.271484375, 14.77001953125, 15.2685546875, 15.76708984375, 16.265625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 5.0, 0.0, 4.0, 1.0, 6.0, 2.0, 7.0, 6.0, 11.0, 13.0, 18.0, 16.0, 25.0, 32.0, 30.0, 21.0, 37.0, 43.0, 51.0, 55.0, 56.0, 50.0, 54.0, 46.0, 43.0, 67.0, 35.0, 43.0, 41.0, 41.0, 34.0, 23.0, 20.0, 20.0, 14.0, 11.0, 11.0, 9.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.890625, -15.289306640625, -14.68798828125, -14.086669921875, -13.4853515625, -12.884033203125, -12.28271484375, -11.681396484375, -11.080078125, -10.478759765625, -9.87744140625, -9.276123046875, -8.6748046875, -8.073486328125, -7.47216796875, -6.870849609375, -6.26953125, -5.668212890625, -5.06689453125, -4.465576171875, -3.8642578125, -3.262939453125, -2.66162109375, -2.060302734375, -1.458984375, -0.857666015625, -0.25634765625, 0.344970703125, 0.9462890625, 1.547607421875, 2.14892578125, 2.750244140625, 3.3515625, 3.952880859375, 4.55419921875, 5.155517578125, 5.7568359375, 6.358154296875, 6.95947265625, 7.560791015625, 8.162109375, 8.763427734375, 9.36474609375, 9.966064453125, 10.5673828125, 11.168701171875, 11.77001953125, 12.371337890625, 12.97265625, 13.573974609375, 14.17529296875, 14.776611328125, 15.3779296875, 15.979248046875, 16.58056640625, 17.181884765625, 17.783203125, 18.384521484375, 18.98583984375, 19.587158203125, 20.1884765625, 20.789794921875, 21.39111328125, 21.992431640625, 22.59375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 3.0, 4.0, 7.0, 7.0, 7.0, 19.0, 19.0, 38.0, 61.0, 101.0, 137.0, 398.0, 1271.0, 6478.0, 54622.0, 2897339.0, 1196139.0, 31236.0, 4521.0, 1044.0, 373.0, 178.0, 105.0, 71.0, 36.0, 20.0, 18.0, 10.0, 11.0, 4.0, 5.0, 4.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.78125, -52.36181640625, -50.9423828125, -49.52294921875, -48.103515625, -46.68408203125, -45.2646484375, -43.84521484375, -42.42578125, -41.00634765625, -39.5869140625, -38.16748046875, -36.748046875, -35.32861328125, -33.9091796875, -32.48974609375, -31.0703125, -29.65087890625, -28.2314453125, -26.81201171875, -25.392578125, -23.97314453125, -22.5537109375, -21.13427734375, -19.71484375, -18.29541015625, -16.8759765625, -15.45654296875, -14.037109375, -12.61767578125, -11.1982421875, -9.77880859375, -8.359375, -6.93994140625, -5.5205078125, -4.10107421875, -2.681640625, -1.26220703125, 0.1572265625, 1.57666015625, 2.99609375, 4.41552734375, 5.8349609375, 7.25439453125, 8.673828125, 10.09326171875, 11.5126953125, 12.93212890625, 14.3515625, 15.77099609375, 17.1904296875, 18.60986328125, 20.029296875, 21.44873046875, 22.8681640625, 24.28759765625, 25.70703125, 27.12646484375, 28.5458984375, 29.96533203125, 31.384765625, 32.80419921875, 34.2236328125, 35.64306640625, 37.0625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 14.0, 10.0, 20.0, 34.0, 51.0, 70.0, 184.0, 267.0, 462.0, 757.0, 749.0, 600.0, 363.0, 184.0, 117.0, 44.0, 44.0, 26.0, 20.0, 8.0, 9.0, 6.0, 7.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.421875, -19.305908203125, -18.18994140625, -17.073974609375, -15.9580078125, -14.842041015625, -13.72607421875, -12.610107421875, -11.494140625, -10.378173828125, -9.26220703125, -8.146240234375, -7.0302734375, -5.914306640625, -4.79833984375, -3.682373046875, -2.56640625, -1.450439453125, -0.33447265625, 0.781494140625, 1.8974609375, 3.013427734375, 4.12939453125, 5.245361328125, 6.361328125, 7.477294921875, 8.59326171875, 9.709228515625, 10.8251953125, 11.941162109375, 13.05712890625, 14.173095703125, 15.2890625, 16.405029296875, 17.52099609375, 18.636962890625, 19.7529296875, 20.868896484375, 21.98486328125, 23.100830078125, 24.216796875, 25.332763671875, 26.44873046875, 27.564697265625, 28.6806640625, 29.796630859375, 30.91259765625, 32.028564453125, 33.14453125, 34.260498046875, 35.37646484375, 36.492431640625, 37.6083984375, 38.724365234375, 39.84033203125, 40.956298828125, 42.072265625, 43.188232421875, 44.30419921875, 45.420166015625, 46.5361328125, 47.652099609375, 48.76806640625, 49.884033203125, 51.0]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 8.0, 40.0, 89.0, 195.0, 266.0, 189.0, 112.0, 58.0, 20.0, 7.0, 8.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-226.63174438476562, -215.13035583496094, -203.62896728515625, -192.12759399414062, -180.62620544433594, -169.12481689453125, -157.62344360351562, -146.12205505371094, -134.62066650390625, -123.11927795410156, -111.6178970336914, -100.11651611328125, -88.61512756347656, -77.11373901367188, -65.61235809326172, -54.11097717285156, -42.609588623046875, -31.108203887939453, -19.60681915283203, -8.10543441772461, 3.3959503173828125, 14.897335052490234, 26.398719787597656, 37.90010070800781, 49.4014892578125, 60.90287399291992, 72.40425872802734, 83.9056396484375, 95.40702819824219, 106.90841674804688, 118.40979766845703, 129.9111785888672, 141.41253662109375, 152.91392517089844, 164.41531372070312, 175.91668701171875, 187.41807556152344, 198.91946411132812, 210.42083740234375, 221.92222595214844, 233.42361450195312, 244.9250030517578, 256.4263916015625, 267.9277648925781, 279.42913818359375, 290.9305419921875, 302.4319152832031, 313.93328857421875, 325.4346923828125, 336.9360656738281, 348.4374694824219, 359.9388427734375, 371.44024658203125, 382.9416198730469, 394.4429931640625, 405.94439697265625, 417.4457702636719, 428.9471435546875, 440.44854736328125, 451.9499206542969, 463.4512939453125, 474.95269775390625, 486.4540710449219, 497.9554443359375, 509.45684814453125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 5.0, 12.0, 15.0, 14.0, 16.0, 16.0, 24.0, 21.0, 35.0, 36.0, 31.0, 58.0, 43.0, 69.0, 55.0, 61.0, 73.0, 61.0, 56.0, 44.0, 37.0, 42.0, 42.0, 24.0, 24.0, 22.0, 15.0, 11.0, 7.0, 7.0, 5.0, 4.0, 10.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-172.08407592773438, -167.24609375, -162.4081268310547, -157.57015991210938, -152.732177734375, -147.89419555664062, -143.0562286376953, -138.21826171875, -133.38027954101562, -128.54229736328125, -123.70433044433594, -118.8663558959961, -114.02838134765625, -109.1904067993164, -104.35243225097656, -99.51445770263672, -94.67648315429688, -89.83850860595703, -85.00053405761719, -80.16255950927734, -75.3245849609375, -70.48661041259766, -65.64863586425781, -60.81066131591797, -55.972686767578125, -51.13471221923828, -46.29673767089844, -41.458763122558594, -36.62078857421875, -31.782814025878906, -26.944839477539062, -22.10686492919922, -17.268905639648438, -12.430931091308594, -7.59295654296875, -2.7549819946289062, 2.0829925537109375, 6.920967102050781, 11.758941650390625, 16.59691619873047, 21.434890747070312, 26.272865295410156, 31.11083984375, 35.948814392089844, 40.78678894042969, 45.62476348876953, 50.462738037109375, 55.30071258544922, 60.13868713378906, 64.9766616821289, 69.81463623046875, 74.6526107788086, 79.49058532714844, 84.32855987548828, 89.16653442382812, 94.00450897216797, 98.84248352050781, 103.68045806884766, 108.5184326171875, 113.35640716552734, 118.19438171386719, 123.03235626220703, 127.87033081054688, 132.70831298828125, 137.54627990722656]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 17.0, 15.0, 20.0, 30.0, 43.0, 73.0, 121.0, 197.0, 361.0, 598.0, 1092.0, 2155.0, 4328.0, 9998.0, 23598.0, 60687.0, 164255.0, 345789.0, 265438.0, 102615.0, 38464.0, 15242.0, 6796.0, 3018.0, 1555.0, 811.0, 490.0, 266.0, 164.0, 115.0, 68.0, 49.0, 24.0, 23.0, 11.0, 6.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.375, -18.701416015625, -18.02783203125, -17.354248046875, -16.6806640625, -16.007080078125, -15.33349609375, -14.659912109375, -13.986328125, -13.312744140625, -12.63916015625, -11.965576171875, -11.2919921875, -10.618408203125, -9.94482421875, -9.271240234375, -8.59765625, -7.924072265625, -7.25048828125, -6.576904296875, -5.9033203125, -5.229736328125, -4.55615234375, -3.882568359375, -3.208984375, -2.535400390625, -1.86181640625, -1.188232421875, -0.5146484375, 0.158935546875, 0.83251953125, 1.506103515625, 2.1796875, 2.853271484375, 3.52685546875, 4.200439453125, 4.8740234375, 5.547607421875, 6.22119140625, 6.894775390625, 7.568359375, 8.241943359375, 8.91552734375, 9.589111328125, 10.2626953125, 10.936279296875, 11.60986328125, 12.283447265625, 12.95703125, 13.630615234375, 14.30419921875, 14.977783203125, 15.6513671875, 16.324951171875, 16.99853515625, 17.672119140625, 18.345703125, 19.019287109375, 19.69287109375, 20.366455078125, 21.0400390625, 21.713623046875, 22.38720703125, 23.060791015625, 23.734375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 5.0, 7.0, 4.0, 4.0, 14.0, 8.0, 10.0, 24.0, 20.0, 30.0, 26.0, 32.0, 29.0, 37.0, 52.0, 60.0, 45.0, 55.0, 58.0, 43.0, 57.0, 57.0, 50.0, 41.0, 36.0, 40.0, 31.0, 20.0, 24.0, 24.0, 20.0, 11.0, 7.0, 10.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.03125, -15.42822265625, -14.8251953125, -14.22216796875, -13.619140625, -13.01611328125, -12.4130859375, -11.81005859375, -11.20703125, -10.60400390625, -10.0009765625, -9.39794921875, -8.794921875, -8.19189453125, -7.5888671875, -6.98583984375, -6.3828125, -5.77978515625, -5.1767578125, -4.57373046875, -3.970703125, -3.36767578125, -2.7646484375, -2.16162109375, -1.55859375, -0.95556640625, -0.3525390625, 0.25048828125, 0.853515625, 1.45654296875, 2.0595703125, 2.66259765625, 3.265625, 3.86865234375, 4.4716796875, 5.07470703125, 5.677734375, 6.28076171875, 6.8837890625, 7.48681640625, 8.08984375, 8.69287109375, 9.2958984375, 9.89892578125, 10.501953125, 11.10498046875, 11.7080078125, 12.31103515625, 12.9140625, 13.51708984375, 14.1201171875, 14.72314453125, 15.326171875, 15.92919921875, 16.5322265625, 17.13525390625, 17.73828125, 18.34130859375, 18.9443359375, 19.54736328125, 20.150390625, 20.75341796875, 21.3564453125, 21.95947265625, 22.5625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 17.0, 12.0, 14.0, 17.0, 31.0, 39.0, 40.0, 73.0, 81.0, 135.0, 175.0, 251.0, 363.0, 544.0, 949.0, 1759.0, 4064.0, 11319.0, 40445.0, 178185.0, 626778.0, 135235.0, 31314.0, 9227.0, 3369.0, 1569.0, 804.0, 561.0, 339.0, 226.0, 145.0, 122.0, 83.0, 61.0, 52.0, 35.0, 26.0, 24.0, 14.0, 11.0, 11.0, 9.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.921875, -30.905517578125, -29.88916015625, -28.872802734375, -27.8564453125, -26.840087890625, -25.82373046875, -24.807373046875, -23.791015625, -22.774658203125, -21.75830078125, -20.741943359375, -19.7255859375, -18.709228515625, -17.69287109375, -16.676513671875, -15.66015625, -14.643798828125, -13.62744140625, -12.611083984375, -11.5947265625, -10.578369140625, -9.56201171875, -8.545654296875, -7.529296875, -6.512939453125, -5.49658203125, -4.480224609375, -3.4638671875, -2.447509765625, -1.43115234375, -0.414794921875, 0.6015625, 1.617919921875, 2.63427734375, 3.650634765625, 4.6669921875, 5.683349609375, 6.69970703125, 7.716064453125, 8.732421875, 9.748779296875, 10.76513671875, 11.781494140625, 12.7978515625, 13.814208984375, 14.83056640625, 15.846923828125, 16.86328125, 17.879638671875, 18.89599609375, 19.912353515625, 20.9287109375, 21.945068359375, 22.96142578125, 23.977783203125, 24.994140625, 26.010498046875, 27.02685546875, 28.043212890625, 29.0595703125, 30.075927734375, 31.09228515625, 32.108642578125, 33.125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 6.0, 7.0, 16.0, 16.0, 14.0, 15.0, 30.0, 29.0, 37.0, 31.0, 30.0, 41.0, 36.0, 49.0, 50.0, 64.0, 49.0, 60.0, 33.0, 45.0, 32.0, 41.0, 29.0, 31.0, 31.0, 23.0, 30.0, 24.0, 19.0, 14.0, 13.0, 7.0, 3.0, 5.0, 6.0, 4.0, 3.0, 2.0, 4.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.65625, -48.87646484375, -47.0966796875, -45.31689453125, -43.537109375, -41.75732421875, -39.9775390625, -38.19775390625, -36.41796875, -34.63818359375, -32.8583984375, -31.07861328125, -29.298828125, -27.51904296875, -25.7392578125, -23.95947265625, -22.1796875, -20.39990234375, -18.6201171875, -16.84033203125, -15.060546875, -13.28076171875, -11.5009765625, -9.72119140625, -7.94140625, -6.16162109375, -4.3818359375, -2.60205078125, -0.822265625, 0.95751953125, 2.7373046875, 4.51708984375, 6.296875, 8.07666015625, 9.8564453125, 11.63623046875, 13.416015625, 15.19580078125, 16.9755859375, 18.75537109375, 20.53515625, 22.31494140625, 24.0947265625, 25.87451171875, 27.654296875, 29.43408203125, 31.2138671875, 32.99365234375, 34.7734375, 36.55322265625, 38.3330078125, 40.11279296875, 41.892578125, 43.67236328125, 45.4521484375, 47.23193359375, 49.01171875, 50.79150390625, 52.5712890625, 54.35107421875, 56.130859375, 57.91064453125, 59.6904296875, 61.47021484375, 63.25]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 2.0, 13.0, 15.0, 10.0, 26.0, 43.0, 55.0, 98.0, 193.0, 295.0, 580.0, 1318.0, 3135.0, 8912.0, 29052.0, 142221.0, 719361.0, 106591.0, 24078.0, 7479.0, 2745.0, 1127.0, 526.0, 260.0, 152.0, 91.0, 46.0, 47.0, 29.0, 15.0, 7.0, 13.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.59765625, -6.34796142578125, -6.0982666015625, -5.84857177734375, -5.598876953125, -5.34918212890625, -5.0994873046875, -4.84979248046875, -4.60009765625, -4.35040283203125, -4.1007080078125, -3.85101318359375, -3.601318359375, -3.35162353515625, -3.1019287109375, -2.85223388671875, -2.6025390625, -2.35284423828125, -2.1031494140625, -1.85345458984375, -1.603759765625, -1.35406494140625, -1.1043701171875, -0.85467529296875, -0.60498046875, -0.35528564453125, -0.1055908203125, 0.14410400390625, 0.393798828125, 0.64349365234375, 0.8931884765625, 1.14288330078125, 1.392578125, 1.64227294921875, 1.8919677734375, 2.14166259765625, 2.391357421875, 2.64105224609375, 2.8907470703125, 3.14044189453125, 3.39013671875, 3.63983154296875, 3.8895263671875, 4.13922119140625, 4.388916015625, 4.63861083984375, 4.8883056640625, 5.13800048828125, 5.3876953125, 5.63739013671875, 5.8870849609375, 6.13677978515625, 6.386474609375, 6.63616943359375, 6.8858642578125, 7.13555908203125, 7.38525390625, 7.63494873046875, 7.8846435546875, 8.13433837890625, 8.384033203125, 8.63372802734375, 8.8834228515625, 9.13311767578125, 9.3828125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 8.0, 1.0, 4.0, 6.0, 7.0, 9.0, 16.0, 16.0, 29.0, 49.0, 86.0, 129.0, 181.0, 170.0, 111.0, 54.0, 37.0, 24.0, 17.0, 16.0, 16.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0029430389404296875, -0.0028631985187530518, -0.002783358097076416, -0.0027035176753997803, -0.0026236772537231445, -0.002543836832046509, -0.002463996410369873, -0.0023841559886932373, -0.0023043155670166016, -0.002224475145339966, -0.00214463472366333, -0.0020647943019866943, -0.0019849538803100586, -0.0019051134586334229, -0.0018252730369567871, -0.0017454326152801514, -0.0016655921936035156, -0.0015857517719268799, -0.0015059113502502441, -0.0014260709285736084, -0.0013462305068969727, -0.001266390085220337, -0.0011865496635437012, -0.0011067092418670654, -0.0010268688201904297, -0.0009470283985137939, -0.0008671879768371582, -0.0007873475551605225, -0.0007075071334838867, -0.000627666711807251, -0.0005478262901306152, -0.0004679858684539795, -0.00038814544677734375, -0.000308305025100708, -0.00022846460342407227, -0.00014862418174743652, -6.878376007080078e-05, 1.1056661605834961e-05, 9.08970832824707e-05, 0.00017073750495910645, 0.0002505779266357422, 0.00033041834831237793, 0.00041025876998901367, 0.0004900991916656494, 0.0005699396133422852, 0.0006497800350189209, 0.0007296204566955566, 0.0008094608783721924, 0.0008893013000488281, 0.0009691417217254639, 0.0010489821434020996, 0.0011288225650787354, 0.001208662986755371, 0.0012885034084320068, 0.0013683438301086426, 0.0014481842517852783, 0.001528024673461914, 0.0016078650951385498, 0.0016877055168151855, 0.0017675459384918213, 0.001847386360168457, 0.0019272267818450928, 0.0020070672035217285, 0.0020869076251983643, 0.002166748046875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 13.0, 11.0, 14.0, 25.0, 36.0, 42.0, 51.0, 95.0, 179.0, 229.0, 393.0, 781.0, 1599.0, 3568.0, 10009.0, 34870.0, 170444.0, 687990.0, 101815.0, 23666.0, 7097.0, 2740.0, 1292.0, 630.0, 367.0, 203.0, 117.0, 83.0, 63.0, 31.0, 30.0, 23.0, 11.0, 12.0, 11.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2109375, -7.9571533203125, -7.703369140625, -7.4495849609375, -7.19580078125, -6.9420166015625, -6.688232421875, -6.4344482421875, -6.1806640625, -5.9268798828125, -5.673095703125, -5.4193115234375, -5.16552734375, -4.9117431640625, -4.657958984375, -4.4041748046875, -4.150390625, -3.8966064453125, -3.642822265625, -3.3890380859375, -3.13525390625, -2.8814697265625, -2.627685546875, -2.3739013671875, -2.1201171875, -1.8663330078125, -1.612548828125, -1.3587646484375, -1.10498046875, -0.8511962890625, -0.597412109375, -0.3436279296875, -0.08984375, 0.1639404296875, 0.417724609375, 0.6715087890625, 0.92529296875, 1.1790771484375, 1.432861328125, 1.6866455078125, 1.9404296875, 2.1942138671875, 2.447998046875, 2.7017822265625, 2.95556640625, 3.2093505859375, 3.463134765625, 3.7169189453125, 3.970703125, 4.2244873046875, 4.478271484375, 4.7320556640625, 4.98583984375, 5.2396240234375, 5.493408203125, 5.7471923828125, 6.0009765625, 6.2547607421875, 6.508544921875, 6.7623291015625, 7.01611328125, 7.2698974609375, 7.523681640625, 7.7774658203125, 8.03125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 4.0, 8.0, 10.0, 8.0, 17.0, 18.0, 23.0, 38.0, 33.0, 43.0, 70.0, 76.0, 88.0, 89.0, 89.0, 77.0, 67.0, 39.0, 46.0, 38.0, 25.0, 21.0, 13.0, 11.0, 9.0, 10.0, 1.0, 4.0, 1.0, 6.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.84375, -7.569580078125, -7.29541015625, -7.021240234375, -6.7470703125, -6.472900390625, -6.19873046875, -5.924560546875, -5.650390625, -5.376220703125, -5.10205078125, -4.827880859375, -4.5537109375, -4.279541015625, -4.00537109375, -3.731201171875, -3.45703125, -3.182861328125, -2.90869140625, -2.634521484375, -2.3603515625, -2.086181640625, -1.81201171875, -1.537841796875, -1.263671875, -0.989501953125, -0.71533203125, -0.441162109375, -0.1669921875, 0.107177734375, 0.38134765625, 0.655517578125, 0.9296875, 1.203857421875, 1.47802734375, 1.752197265625, 2.0263671875, 2.300537109375, 2.57470703125, 2.848876953125, 3.123046875, 3.397216796875, 3.67138671875, 3.945556640625, 4.2197265625, 4.493896484375, 4.76806640625, 5.042236328125, 5.31640625, 5.590576171875, 5.86474609375, 6.138916015625, 6.4130859375, 6.687255859375, 6.96142578125, 7.235595703125, 7.509765625, 7.783935546875, 8.05810546875, 8.332275390625, 8.6064453125, 8.880615234375, 9.15478515625, 9.428955078125, 9.703125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 12.0, 28.0, 42.0, 98.0, 198.0, 342.0, 133.0, 72.0, 31.0, 16.0, 11.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-318.91046142578125, -308.029052734375, -297.1476745605469, -286.2662658691406, -275.3848876953125, -264.50347900390625, -253.6220703125, -242.7406768798828, -231.85928344726562, -220.97789001464844, -210.09649658203125, -199.215087890625, -188.3336944580078, -177.45230102539062, -166.57089233398438, -155.6894989013672, -144.80810546875, -133.9267120361328, -123.0453109741211, -112.16390991210938, -101.28251647949219, -90.401123046875, -79.51972198486328, -68.63832092285156, -57.756927490234375, -46.87553024291992, -35.99413299560547, -25.112735748291016, -14.231338500976562, -3.3499412536621094, 7.531455993652344, 18.412857055664062, 29.294281005859375, 40.17567825317383, 51.05707550048828, 61.938472747802734, 72.81986999511719, 83.70126342773438, 94.5826644897461, 105.46406555175781, 116.345458984375, 127.22685241699219, 138.10824584960938, 148.98965454101562, 159.8710479736328, 170.75244140625, 181.63385009765625, 192.51524353027344, 203.39663696289062, 214.2780303955078, 225.159423828125, 236.04083251953125, 246.92222595214844, 257.8036193847656, 268.6850280761719, 279.56640625, 290.44781494140625, 301.3292236328125, 312.2106018066406, 323.0920104980469, 333.973388671875, 344.85479736328125, 355.7362060546875, 366.61761474609375, 377.4989929199219]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 10.0, 12.0, 9.0, 5.0, 14.0, 17.0, 20.0, 15.0, 13.0, 26.0, 26.0, 26.0, 26.0, 37.0, 46.0, 70.0, 79.0, 93.0, 85.0, 53.0, 32.0, 40.0, 38.0, 27.0, 26.0, 20.0, 16.0, 14.0, 15.0, 14.0, 17.0, 7.0, 11.0, 10.0, 2.0, 4.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-212.47348022460938, -205.71902465820312, -198.96456909179688, -192.2101287841797, -185.45567321777344, -178.7012176513672, -171.94677734375, -165.19232177734375, -158.4378662109375, -151.68341064453125, -144.928955078125, -138.1745147705078, -131.42005920410156, -124.66560363769531, -117.9111557006836, -111.15670776367188, -104.40225219726562, -97.64779663085938, -90.89334869384766, -84.13890075683594, -77.38444519042969, -70.62998962402344, -63.87554168701172, -57.121089935302734, -50.36663818359375, -43.612186431884766, -36.85773468017578, -30.103282928466797, -23.348831176757812, -16.594379425048828, -9.839927673339844, -3.0854759216308594, 3.668975830078125, 10.42342758178711, 17.177879333496094, 23.932331085205078, 30.686782836914062, 37.44123458862305, 44.19568634033203, 50.950138092041016, 57.70458984375, 64.45904541015625, 71.21349334716797, 77.96794128417969, 84.72239685058594, 91.47685241699219, 98.2313003540039, 104.98574829101562, 111.74020385742188, 118.49465942382812, 125.24910736083984, 132.00355529785156, 138.7580108642578, 145.51246643066406, 152.26690673828125, 159.0213623046875, 165.77581787109375, 172.5302734375, 179.28472900390625, 186.03916931152344, 192.7936248779297, 199.54808044433594, 206.30252075195312, 213.05697631835938, 219.81143188476562]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 2.0, 13.0, 17.0, 20.0, 30.0, 75.0, 125.0, 294.0, 709.0, 2756.0, 15258.0, 167309.0, 2613241.0, 1317059.0, 67194.0, 7507.0, 1602.0, 549.0, 241.0, 106.0, 61.0, 38.0, 30.0, 18.0, 11.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.046875, -20.989013671875, -19.93115234375, -18.873291015625, -17.8154296875, -16.757568359375, -15.69970703125, -14.641845703125, -13.583984375, -12.526123046875, -11.46826171875, -10.410400390625, -9.3525390625, -8.294677734375, -7.23681640625, -6.178955078125, -5.12109375, -4.063232421875, -3.00537109375, -1.947509765625, -0.8896484375, 0.168212890625, 1.22607421875, 2.283935546875, 3.341796875, 4.399658203125, 5.45751953125, 6.515380859375, 7.5732421875, 8.631103515625, 9.68896484375, 10.746826171875, 11.8046875, 12.862548828125, 13.92041015625, 14.978271484375, 16.0361328125, 17.093994140625, 18.15185546875, 19.209716796875, 20.267578125, 21.325439453125, 22.38330078125, 23.441162109375, 24.4990234375, 25.556884765625, 26.61474609375, 27.672607421875, 28.73046875, 29.788330078125, 30.84619140625, 31.904052734375, 32.9619140625, 34.019775390625, 35.07763671875, 36.135498046875, 37.193359375, 38.251220703125, 39.30908203125, 40.366943359375, 41.4248046875, 42.482666015625, 43.54052734375, 44.598388671875, 45.65625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 7.0, 4.0, 8.0, 10.0, 12.0, 9.0, 25.0, 21.0, 24.0, 32.0, 37.0, 47.0, 42.0, 44.0, 54.0, 48.0, 53.0, 55.0, 60.0, 56.0, 56.0, 51.0, 39.0, 36.0, 37.0, 33.0, 18.0, 20.0, 15.0, 13.0, 8.0, 8.0, 3.0, 4.0, 2.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.59375, -15.98681640625, -15.3798828125, -14.77294921875, -14.166015625, -13.55908203125, -12.9521484375, -12.34521484375, -11.73828125, -11.13134765625, -10.5244140625, -9.91748046875, -9.310546875, -8.70361328125, -8.0966796875, -7.48974609375, -6.8828125, -6.27587890625, -5.6689453125, -5.06201171875, -4.455078125, -3.84814453125, -3.2412109375, -2.63427734375, -2.02734375, -1.42041015625, -0.8134765625, -0.20654296875, 0.400390625, 1.00732421875, 1.6142578125, 2.22119140625, 2.828125, 3.43505859375, 4.0419921875, 4.64892578125, 5.255859375, 5.86279296875, 6.4697265625, 7.07666015625, 7.68359375, 8.29052734375, 8.8974609375, 9.50439453125, 10.111328125, 10.71826171875, 11.3251953125, 11.93212890625, 12.5390625, 13.14599609375, 13.7529296875, 14.35986328125, 14.966796875, 15.57373046875, 16.1806640625, 16.78759765625, 17.39453125, 18.00146484375, 18.6083984375, 19.21533203125, 19.822265625, 20.42919921875, 21.0361328125, 21.64306640625, 22.25]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 4.0, 4.0, 6.0, 9.0, 20.0, 14.0, 19.0, 30.0, 39.0, 55.0, 114.0, 194.0, 385.0, 980.0, 3459.0, 16478.0, 228685.0, 3649084.0, 271282.0, 17771.0, 3626.0, 1134.0, 386.0, 183.0, 107.0, 72.0, 31.0, 26.0, 18.0, 16.0, 12.0, 10.0, 6.0, 3.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0], "bins": [-39.71875, -38.49755859375, -37.2763671875, -36.05517578125, -34.833984375, -33.61279296875, -32.3916015625, -31.17041015625, -29.94921875, -28.72802734375, -27.5068359375, -26.28564453125, -25.064453125, -23.84326171875, -22.6220703125, -21.40087890625, -20.1796875, -18.95849609375, -17.7373046875, -16.51611328125, -15.294921875, -14.07373046875, -12.8525390625, -11.63134765625, -10.41015625, -9.18896484375, -7.9677734375, -6.74658203125, -5.525390625, -4.30419921875, -3.0830078125, -1.86181640625, -0.640625, 0.58056640625, 1.8017578125, 3.02294921875, 4.244140625, 5.46533203125, 6.6865234375, 7.90771484375, 9.12890625, 10.35009765625, 11.5712890625, 12.79248046875, 14.013671875, 15.23486328125, 16.4560546875, 17.67724609375, 18.8984375, 20.11962890625, 21.3408203125, 22.56201171875, 23.783203125, 25.00439453125, 26.2255859375, 27.44677734375, 28.66796875, 29.88916015625, 31.1103515625, 32.33154296875, 33.552734375, 34.77392578125, 35.9951171875, 37.21630859375, 38.4375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 1.0, 9.0, 12.0, 12.0, 19.0, 39.0, 43.0, 76.0, 134.0, 195.0, 272.0, 446.0, 599.0, 652.0, 542.0, 342.0, 238.0, 146.0, 80.0, 70.0, 54.0, 19.0, 15.0, 16.0, 10.0, 4.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.015625, -29.030029296875, -28.04443359375, -27.058837890625, -26.0732421875, -25.087646484375, -24.10205078125, -23.116455078125, -22.130859375, -21.145263671875, -20.15966796875, -19.174072265625, -18.1884765625, -17.202880859375, -16.21728515625, -15.231689453125, -14.24609375, -13.260498046875, -12.27490234375, -11.289306640625, -10.3037109375, -9.318115234375, -8.33251953125, -7.346923828125, -6.361328125, -5.375732421875, -4.39013671875, -3.404541015625, -2.4189453125, -1.433349609375, -0.44775390625, 0.537841796875, 1.5234375, 2.509033203125, 3.49462890625, 4.480224609375, 5.4658203125, 6.451416015625, 7.43701171875, 8.422607421875, 9.408203125, 10.393798828125, 11.37939453125, 12.364990234375, 13.3505859375, 14.336181640625, 15.32177734375, 16.307373046875, 17.29296875, 18.278564453125, 19.26416015625, 20.249755859375, 21.2353515625, 22.220947265625, 23.20654296875, 24.192138671875, 25.177734375, 26.163330078125, 27.14892578125, 28.134521484375, 29.1201171875, 30.105712890625, 31.09130859375, 32.076904296875, 33.0625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 11.0, 20.0, 41.0, 117.0, 264.0, 309.0, 165.0, 48.0, 14.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-675.2928466796875, -660.3777465820312, -645.4627075195312, -630.547607421875, -615.632568359375, -600.7174682617188, -585.8024291992188, -570.8873291015625, -555.9722900390625, -541.0571899414062, -526.1421508789062, -511.2270812988281, -496.31201171875, -481.3969421386719, -466.48187255859375, -451.5667724609375, -436.6517028808594, -421.73663330078125, -406.8215637207031, -391.906494140625, -376.9914245605469, -362.07635498046875, -347.1612548828125, -332.2462158203125, -317.33111572265625, -302.4160461425781, -287.5009765625, -272.5859069824219, -257.67083740234375, -242.75576782226562, -227.84068298339844, -212.9256134033203, -198.01052856445312, -183.095458984375, -168.18038940429688, -153.26531982421875, -138.35025024414062, -123.43517303466797, -108.52009582519531, -93.60502624511719, -78.68995666503906, -63.77488708496094, -48.85981369018555, -33.944740295410156, -19.02967071533203, -4.114601135253906, 10.80047607421875, 25.715545654296875, 40.630615234375, 55.545684814453125, 70.46075439453125, 85.3758316040039, 100.29090118408203, 115.20597076416016, 130.1210479736328, 145.03611755371094, 159.95118713378906, 174.8662567138672, 189.7813262939453, 204.6964111328125, 219.61148071289062, 234.52655029296875, 249.44161987304688, 264.356689453125, 279.2717590332031]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 0.0, 4.0, 2.0, 5.0, 4.0, 8.0, 15.0, 16.0, 10.0, 12.0, 18.0, 15.0, 16.0, 24.0, 24.0, 28.0, 18.0, 34.0, 47.0, 33.0, 39.0, 41.0, 36.0, 30.0, 40.0, 36.0, 35.0, 43.0, 27.0, 36.0, 33.0, 26.0, 28.0, 31.0, 29.0, 25.0, 20.0, 22.0, 21.0, 11.0, 12.0, 8.0, 9.0, 6.0, 11.0, 3.0, 2.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-129.9894561767578, -126.17731475830078, -122.36516571044922, -118.55302429199219, -114.74087524414062, -110.9287338256836, -107.11659240722656, -103.304443359375, -99.49230194091797, -95.68016052246094, -91.86801147460938, -88.05587005615234, -84.24372863769531, -80.43157958984375, -76.61943817138672, -72.80729675292969, -68.99514770507812, -65.1830062866211, -61.37085723876953, -57.5587158203125, -53.7465705871582, -49.934425354003906, -46.122283935546875, -42.31013870239258, -38.49799346923828, -34.685848236083984, -30.87370491027832, -27.061561584472656, -23.24941635131836, -19.437271118164062, -15.625127792358398, -11.812984466552734, -8.000839233398438, -4.188694953918457, -0.37655067443847656, 3.435593605041504, 7.247737884521484, 11.059883117675781, 14.872026443481445, 18.68416976928711, 22.496315002441406, 26.308460235595703, 30.120603561401367, 33.93274688720703, 37.74489212036133, 41.557037353515625, 45.369178771972656, 49.18132400512695, 52.99346923828125, 56.80561447143555, 60.617759704589844, 64.42990112304688, 68.24205017089844, 72.05419158935547, 75.8663330078125, 79.67848205566406, 83.4906234741211, 87.30276489257812, 91.11491394042969, 94.92705535888672, 98.73919677734375, 102.55134582519531, 106.36348724365234, 110.17562866210938, 113.98777770996094]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 8.0, 3.0, 16.0, 16.0, 35.0, 62.0, 88.0, 122.0, 221.0, 287.0, 476.0, 856.0, 1562.0, 3030.0, 6335.0, 13825.0, 34181.0, 92223.0, 254336.0, 375443.0, 163774.0, 59249.0, 22749.0, 9858.0, 4482.0, 2278.0, 1231.0, 657.0, 429.0, 255.0, 156.0, 90.0, 68.0, 37.0, 44.0, 27.0, 16.0, 10.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-24.546875, -23.809326171875, -23.07177734375, -22.334228515625, -21.5966796875, -20.859130859375, -20.12158203125, -19.384033203125, -18.646484375, -17.908935546875, -17.17138671875, -16.433837890625, -15.6962890625, -14.958740234375, -14.22119140625, -13.483642578125, -12.74609375, -12.008544921875, -11.27099609375, -10.533447265625, -9.7958984375, -9.058349609375, -8.32080078125, -7.583251953125, -6.845703125, -6.108154296875, -5.37060546875, -4.633056640625, -3.8955078125, -3.157958984375, -2.42041015625, -1.682861328125, -0.9453125, -0.207763671875, 0.52978515625, 1.267333984375, 2.0048828125, 2.742431640625, 3.47998046875, 4.217529296875, 4.955078125, 5.692626953125, 6.43017578125, 7.167724609375, 7.9052734375, 8.642822265625, 9.38037109375, 10.117919921875, 10.85546875, 11.593017578125, 12.33056640625, 13.068115234375, 13.8056640625, 14.543212890625, 15.28076171875, 16.018310546875, 16.755859375, 17.493408203125, 18.23095703125, 18.968505859375, 19.7060546875, 20.443603515625, 21.18115234375, 21.918701171875, 22.65625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 5.0, 7.0, 8.0, 3.0, 15.0, 22.0, 24.0, 31.0, 37.0, 26.0, 48.0, 41.0, 43.0, 46.0, 49.0, 58.0, 73.0, 61.0, 43.0, 58.0, 39.0, 47.0, 34.0, 23.0, 35.0, 29.0, 22.0, 13.0, 9.0, 7.0, 9.0, 5.0, 2.0, 4.0, 6.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.625, -16.0166015625, -15.408203125, -14.7998046875, -14.19140625, -13.5830078125, -12.974609375, -12.3662109375, -11.7578125, -11.1494140625, -10.541015625, -9.9326171875, -9.32421875, -8.7158203125, -8.107421875, -7.4990234375, -6.890625, -6.2822265625, -5.673828125, -5.0654296875, -4.45703125, -3.8486328125, -3.240234375, -2.6318359375, -2.0234375, -1.4150390625, -0.806640625, -0.1982421875, 0.41015625, 1.0185546875, 1.626953125, 2.2353515625, 2.84375, 3.4521484375, 4.060546875, 4.6689453125, 5.27734375, 5.8857421875, 6.494140625, 7.1025390625, 7.7109375, 8.3193359375, 8.927734375, 9.5361328125, 10.14453125, 10.7529296875, 11.361328125, 11.9697265625, 12.578125, 13.1865234375, 13.794921875, 14.4033203125, 15.01171875, 15.6201171875, 16.228515625, 16.8369140625, 17.4453125, 18.0537109375, 18.662109375, 19.2705078125, 19.87890625, 20.4873046875, 21.095703125, 21.7041015625, 22.3125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 6.0, 5.0, 5.0, 3.0, 5.0, 4.0, 13.0, 15.0, 21.0, 24.0, 35.0, 50.0, 55.0, 67.0, 115.0, 108.0, 198.0, 224.0, 325.0, 514.0, 753.0, 1226.0, 2198.0, 4966.0, 15461.0, 69731.0, 677927.0, 220224.0, 36122.0, 9548.0, 3515.0, 1849.0, 1021.0, 638.0, 421.0, 330.0, 225.0, 131.0, 123.0, 90.0, 58.0, 43.0, 39.0, 34.0, 30.0, 17.0, 15.0, 9.0, 16.0, 3.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0], "bins": [-42.09375, -40.88427734375, -39.6748046875, -38.46533203125, -37.255859375, -36.04638671875, -34.8369140625, -33.62744140625, -32.41796875, -31.20849609375, -29.9990234375, -28.78955078125, -27.580078125, -26.37060546875, -25.1611328125, -23.95166015625, -22.7421875, -21.53271484375, -20.3232421875, -19.11376953125, -17.904296875, -16.69482421875, -15.4853515625, -14.27587890625, -13.06640625, -11.85693359375, -10.6474609375, -9.43798828125, -8.228515625, -7.01904296875, -5.8095703125, -4.60009765625, -3.390625, -2.18115234375, -0.9716796875, 0.23779296875, 1.447265625, 2.65673828125, 3.8662109375, 5.07568359375, 6.28515625, 7.49462890625, 8.7041015625, 9.91357421875, 11.123046875, 12.33251953125, 13.5419921875, 14.75146484375, 15.9609375, 17.17041015625, 18.3798828125, 19.58935546875, 20.798828125, 22.00830078125, 23.2177734375, 24.42724609375, 25.63671875, 26.84619140625, 28.0556640625, 29.26513671875, 30.474609375, 31.68408203125, 32.8935546875, 34.10302734375, 35.3125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 7.0, 10.0, 12.0, 14.0, 19.0, 14.0, 27.0, 26.0, 23.0, 34.0, 32.0, 31.0, 43.0, 39.0, 51.0, 42.0, 48.0, 46.0, 44.0, 53.0, 52.0, 41.0, 34.0, 40.0, 31.0, 30.0, 26.0, 22.0, 14.0, 16.0, 11.0, 12.0, 9.0, 7.0, 5.0, 5.0, 3.0, 2.0, 3.0, 5.0, 5.0, 2.0, 1.0, 0.0, 4.0], "bins": [-65.5, -63.67626953125, -61.8525390625, -60.02880859375, -58.205078125, -56.38134765625, -54.5576171875, -52.73388671875, -50.91015625, -49.08642578125, -47.2626953125, -45.43896484375, -43.615234375, -41.79150390625, -39.9677734375, -38.14404296875, -36.3203125, -34.49658203125, -32.6728515625, -30.84912109375, -29.025390625, -27.20166015625, -25.3779296875, -23.55419921875, -21.73046875, -19.90673828125, -18.0830078125, -16.25927734375, -14.435546875, -12.61181640625, -10.7880859375, -8.96435546875, -7.140625, -5.31689453125, -3.4931640625, -1.66943359375, 0.154296875, 1.97802734375, 3.8017578125, 5.62548828125, 7.44921875, 9.27294921875, 11.0966796875, 12.92041015625, 14.744140625, 16.56787109375, 18.3916015625, 20.21533203125, 22.0390625, 23.86279296875, 25.6865234375, 27.51025390625, 29.333984375, 31.15771484375, 32.9814453125, 34.80517578125, 36.62890625, 38.45263671875, 40.2763671875, 42.10009765625, 43.923828125, 45.74755859375, 47.5712890625, 49.39501953125, 51.21875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 4.0, 5.0, 7.0, 13.0, 12.0, 17.0, 33.0, 53.0, 61.0, 57.0, 141.0, 263.0, 566.0, 1407.0, 5103.0, 32928.0, 900049.0, 95150.0, 9066.0, 2100.0, 745.0, 301.0, 167.0, 93.0, 61.0, 35.0, 40.0, 18.0, 12.0, 10.0, 7.0, 5.0, 8.0, 7.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.28125, -12.8748779296875, -12.468505859375, -12.0621337890625, -11.65576171875, -11.2493896484375, -10.843017578125, -10.4366455078125, -10.0302734375, -9.6239013671875, -9.217529296875, -8.8111572265625, -8.40478515625, -7.9984130859375, -7.592041015625, -7.1856689453125, -6.779296875, -6.3729248046875, -5.966552734375, -5.5601806640625, -5.15380859375, -4.7474365234375, -4.341064453125, -3.9346923828125, -3.5283203125, -3.1219482421875, -2.715576171875, -2.3092041015625, -1.90283203125, -1.4964599609375, -1.090087890625, -0.6837158203125, -0.27734375, 0.1290283203125, 0.535400390625, 0.9417724609375, 1.34814453125, 1.7545166015625, 2.160888671875, 2.5672607421875, 2.9736328125, 3.3800048828125, 3.786376953125, 4.1927490234375, 4.59912109375, 5.0054931640625, 5.411865234375, 5.8182373046875, 6.224609375, 6.6309814453125, 7.037353515625, 7.4437255859375, 7.85009765625, 8.2564697265625, 8.662841796875, 9.0692138671875, 9.4755859375, 9.8819580078125, 10.288330078125, 10.6947021484375, 11.10107421875, 11.5074462890625, 11.913818359375, 12.3201904296875, 12.7265625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 4.0, 2.0, 11.0, 3.0, 11.0, 20.0, 40.0, 60.0, 157.0, 299.0, 176.0, 86.0, 35.0, 27.0, 12.0, 14.0, 5.0, 8.0, 7.0, 1.0, 5.0, 0.0, 5.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00255584716796875, -0.00244748592376709, -0.0023391246795654297, -0.0022307634353637695, -0.0021224021911621094, -0.0020140409469604492, -0.001905679702758789, -0.001797318458557129, -0.0016889572143554688, -0.0015805959701538086, -0.0014722347259521484, -0.0013638734817504883, -0.0012555122375488281, -0.001147150993347168, -0.0010387897491455078, -0.0009304285049438477, -0.0008220672607421875, -0.0007137060165405273, -0.0006053447723388672, -0.000496983528137207, -0.0003886222839355469, -0.0002802610397338867, -0.00017189979553222656, -6.35385513305664e-05, 4.482269287109375e-05, 0.0001531839370727539, 0.00026154518127441406, 0.0003699064254760742, 0.0004782676696777344, 0.0005866289138793945, 0.0006949901580810547, 0.0008033514022827148, 0.000911712646484375, 0.0010200738906860352, 0.0011284351348876953, 0.0012367963790893555, 0.0013451576232910156, 0.0014535188674926758, 0.001561880111694336, 0.001670241355895996, 0.0017786026000976562, 0.0018869638442993164, 0.0019953250885009766, 0.0021036863327026367, 0.002212047576904297, 0.002320408821105957, 0.002428770065307617, 0.0025371313095092773, 0.0026454925537109375, 0.0027538537979125977, 0.002862215042114258, 0.002970576286315918, 0.003078937530517578, 0.0031872987747192383, 0.0032956600189208984, 0.0034040212631225586, 0.0035123825073242188, 0.003620743751525879, 0.003729104995727539, 0.0038374662399291992, 0.003945827484130859, 0.0040541887283325195, 0.00416254997253418, 0.00427091121673584, 0.0043792724609375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 7.0, 5.0, 26.0, 22.0, 30.0, 37.0, 48.0, 54.0, 75.0, 99.0, 155.0, 261.0, 332.0, 606.0, 900.0, 1755.0, 3424.0, 7188.0, 18987.0, 74523.0, 681406.0, 199580.0, 36747.0, 11378.0, 5020.0, 2286.0, 1347.0, 750.0, 467.0, 298.0, 184.0, 147.0, 105.0, 90.0, 48.0, 48.0, 30.0, 23.0, 15.0, 11.0, 11.0, 7.0, 8.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.7421875, -5.5555419921875, -5.368896484375, -5.1822509765625, -4.99560546875, -4.8089599609375, -4.622314453125, -4.4356689453125, -4.2490234375, -4.0623779296875, -3.875732421875, -3.6890869140625, -3.50244140625, -3.3157958984375, -3.129150390625, -2.9425048828125, -2.755859375, -2.5692138671875, -2.382568359375, -2.1959228515625, -2.00927734375, -1.8226318359375, -1.635986328125, -1.4493408203125, -1.2626953125, -1.0760498046875, -0.889404296875, -0.7027587890625, -0.51611328125, -0.3294677734375, -0.142822265625, 0.0438232421875, 0.23046875, 0.4171142578125, 0.603759765625, 0.7904052734375, 0.97705078125, 1.1636962890625, 1.350341796875, 1.5369873046875, 1.7236328125, 1.9102783203125, 2.096923828125, 2.2835693359375, 2.47021484375, 2.6568603515625, 2.843505859375, 3.0301513671875, 3.216796875, 3.4034423828125, 3.590087890625, 3.7767333984375, 3.96337890625, 4.1500244140625, 4.336669921875, 4.5233154296875, 4.7099609375, 4.8966064453125, 5.083251953125, 5.2698974609375, 5.45654296875, 5.6431884765625, 5.829833984375, 6.0164794921875, 6.203125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 1.0, 5.0, 8.0, 5.0, 13.0, 14.0, 14.0, 20.0, 22.0, 28.0, 41.0, 50.0, 87.0, 101.0, 112.0, 114.0, 83.0, 58.0, 58.0, 40.0, 24.0, 23.0, 13.0, 16.0, 7.0, 5.0, 8.0, 6.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.7421875, -7.4920654296875, -7.241943359375, -6.9918212890625, -6.74169921875, -6.4915771484375, -6.241455078125, -5.9913330078125, -5.7412109375, -5.4910888671875, -5.240966796875, -4.9908447265625, -4.74072265625, -4.4906005859375, -4.240478515625, -3.9903564453125, -3.740234375, -3.4901123046875, -3.239990234375, -2.9898681640625, -2.73974609375, -2.4896240234375, -2.239501953125, -1.9893798828125, -1.7392578125, -1.4891357421875, -1.239013671875, -0.9888916015625, -0.73876953125, -0.4886474609375, -0.238525390625, 0.0115966796875, 0.26171875, 0.5118408203125, 0.761962890625, 1.0120849609375, 1.26220703125, 1.5123291015625, 1.762451171875, 2.0125732421875, 2.2626953125, 2.5128173828125, 2.762939453125, 3.0130615234375, 3.26318359375, 3.5133056640625, 3.763427734375, 4.0135498046875, 4.263671875, 4.5137939453125, 4.763916015625, 5.0140380859375, 5.26416015625, 5.5142822265625, 5.764404296875, 6.0145263671875, 6.2646484375, 6.5147705078125, 6.764892578125, 7.0150146484375, 7.26513671875, 7.5152587890625, 7.765380859375, 8.0155029296875, 8.265625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 5.0, 11.0, 17.0, 34.0, 45.0, 81.0, 176.0, 329.0, 133.0, 62.0, 37.0, 22.0, 15.0, 7.0, 5.0, 7.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-201.1312255859375, -192.88150024414062, -184.63177490234375, -176.38204956054688, -168.13232421875, -159.88259887695312, -151.63287353515625, -143.38314819335938, -135.1334228515625, -126.88369750976562, -118.63397216796875, -110.38424682617188, -102.134521484375, -93.88479614257812, -85.63507080078125, -77.38534545898438, -69.1356201171875, -60.885894775390625, -52.63616943359375, -44.386444091796875, -36.13671875, -27.886993408203125, -19.63726806640625, -11.387542724609375, -3.1378173828125, 5.111907958984375, 13.36163330078125, 21.611358642578125, 29.861083984375, 38.110809326171875, 46.36053466796875, 54.610260009765625, 62.860015869140625, 71.1097412109375, 79.35946655273438, 87.60919189453125, 95.85891723632812, 104.108642578125, 112.35836791992188, 120.60809326171875, 128.85781860351562, 137.1075439453125, 145.35726928710938, 153.60699462890625, 161.85671997070312, 170.1064453125, 178.35617065429688, 186.60589599609375, 194.85562133789062, 203.1053466796875, 211.35507202148438, 219.60479736328125, 227.85452270507812, 236.104248046875, 244.35397338867188, 252.60369873046875, 260.8534240722656, 269.1031494140625, 277.3528747558594, 285.60260009765625, 293.8523254394531, 302.10205078125, 310.3517761230469, 318.60150146484375, 326.8512268066406]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 11.0, 7.0, 10.0, 12.0, 13.0, 11.0, 10.0, 18.0, 20.0, 23.0, 24.0, 26.0, 28.0, 25.0, 27.0, 71.0, 89.0, 122.0, 114.0, 47.0, 35.0, 37.0, 26.0, 20.0, 20.0, 16.0, 20.0, 24.0, 14.0, 17.0, 10.0, 11.0, 14.0, 7.0, 2.0, 6.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-208.0072784423828, -200.46408081054688, -192.9208984375, -185.37770080566406, -177.83450317382812, -170.29132080078125, -162.7481231689453, -155.20492553710938, -147.6617431640625, -140.11854553222656, -132.5753631591797, -125.03216552734375, -117.48897552490234, -109.94578552246094, -102.402587890625, -94.8593978881836, -87.31620788574219, -79.77301788330078, -72.22982788085938, -64.68663024902344, -57.14344024658203, -49.600250244140625, -42.05705642700195, -34.51386260986328, -26.970672607421875, -19.427480697631836, -11.884288787841797, -4.341096878051758, 3.2020950317382812, 10.745285034179688, 18.28847885131836, 25.83167266845703, 33.374847412109375, 40.91803741455078, 48.46123123168945, 56.004425048828125, 63.54761505126953, 71.09080505371094, 78.63400268554688, 86.17719268798828, 93.72038269042969, 101.2635726928711, 108.8067626953125, 116.34996032714844, 123.89315032958984, 131.43634033203125, 138.9795379638672, 146.52273559570312, 154.06591796875, 161.60911560058594, 169.1522979736328, 176.69549560546875, 184.23867797851562, 191.78187561035156, 199.3250732421875, 206.86825561523438, 214.4114532470703, 221.95465087890625, 229.49783325195312, 237.04103088378906, 244.584228515625, 252.12741088867188, 259.67059326171875, 267.21380615234375, 274.7569885253906]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 7.0, 7.0, 7.0, 12.0, 17.0, 19.0, 36.0, 61.0, 70.0, 128.0, 188.0, 350.0, 568.0, 999.0, 2220.0, 6292.0, 22037.0, 128437.0, 1080382.0, 2386092.0, 490875.0, 57563.0, 10795.0, 3471.0, 1548.0, 864.0, 484.0, 264.0, 174.0, 100.0, 58.0, 44.0, 37.0, 25.0, 18.0, 13.0, 11.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.6875, -23.815185546875, -22.94287109375, -22.070556640625, -21.1982421875, -20.325927734375, -19.45361328125, -18.581298828125, -17.708984375, -16.836669921875, -15.96435546875, -15.092041015625, -14.2197265625, -13.347412109375, -12.47509765625, -11.602783203125, -10.73046875, -9.858154296875, -8.98583984375, -8.113525390625, -7.2412109375, -6.368896484375, -5.49658203125, -4.624267578125, -3.751953125, -2.879638671875, -2.00732421875, -1.135009765625, -0.2626953125, 0.609619140625, 1.48193359375, 2.354248046875, 3.2265625, 4.098876953125, 4.97119140625, 5.843505859375, 6.7158203125, 7.588134765625, 8.46044921875, 9.332763671875, 10.205078125, 11.077392578125, 11.94970703125, 12.822021484375, 13.6943359375, 14.566650390625, 15.43896484375, 16.311279296875, 17.18359375, 18.055908203125, 18.92822265625, 19.800537109375, 20.6728515625, 21.545166015625, 22.41748046875, 23.289794921875, 24.162109375, 25.034423828125, 25.90673828125, 26.779052734375, 27.6513671875, 28.523681640625, 29.39599609375, 30.268310546875, 31.140625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 5.0, 7.0, 7.0, 19.0, 21.0, 25.0, 33.0, 45.0, 41.0, 43.0, 39.0, 60.0, 55.0, 74.0, 56.0, 56.0, 70.0, 56.0, 48.0, 46.0, 25.0, 37.0, 27.0, 23.0, 23.0, 11.0, 10.0, 11.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.640625, -16.030517578125, -15.42041015625, -14.810302734375, -14.2001953125, -13.590087890625, -12.97998046875, -12.369873046875, -11.759765625, -11.149658203125, -10.53955078125, -9.929443359375, -9.3193359375, -8.709228515625, -8.09912109375, -7.489013671875, -6.87890625, -6.268798828125, -5.65869140625, -5.048583984375, -4.4384765625, -3.828369140625, -3.21826171875, -2.608154296875, -1.998046875, -1.387939453125, -0.77783203125, -0.167724609375, 0.4423828125, 1.052490234375, 1.66259765625, 2.272705078125, 2.8828125, 3.492919921875, 4.10302734375, 4.713134765625, 5.3232421875, 5.933349609375, 6.54345703125, 7.153564453125, 7.763671875, 8.373779296875, 8.98388671875, 9.593994140625, 10.2041015625, 10.814208984375, 11.42431640625, 12.034423828125, 12.64453125, 13.254638671875, 13.86474609375, 14.474853515625, 15.0849609375, 15.695068359375, 16.30517578125, 16.915283203125, 17.525390625, 18.135498046875, 18.74560546875, 19.355712890625, 19.9658203125, 20.575927734375, 21.18603515625, 21.796142578125, 22.40625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 9.0, 9.0, 12.0, 13.0, 30.0, 38.0, 36.0, 86.0, 147.0, 273.0, 516.0, 1359.0, 4894.0, 45361.0, 3962462.0, 167551.0, 8266.0, 1832.0, 646.0, 300.0, 172.0, 83.0, 64.0, 41.0, 18.0, 21.0, 11.0, 10.0, 10.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.6875, -69.1865234375, -66.685546875, -64.1845703125, -61.68359375, -59.1826171875, -56.681640625, -54.1806640625, -51.6796875, -49.1787109375, -46.677734375, -44.1767578125, -41.67578125, -39.1748046875, -36.673828125, -34.1728515625, -31.671875, -29.1708984375, -26.669921875, -24.1689453125, -21.66796875, -19.1669921875, -16.666015625, -14.1650390625, -11.6640625, -9.1630859375, -6.662109375, -4.1611328125, -1.66015625, 0.8408203125, 3.341796875, 5.8427734375, 8.34375, 10.8447265625, 13.345703125, 15.8466796875, 18.34765625, 20.8486328125, 23.349609375, 25.8505859375, 28.3515625, 30.8525390625, 33.353515625, 35.8544921875, 38.35546875, 40.8564453125, 43.357421875, 45.8583984375, 48.359375, 50.8603515625, 53.361328125, 55.8623046875, 58.36328125, 60.8642578125, 63.365234375, 65.8662109375, 68.3671875, 70.8681640625, 73.369140625, 75.8701171875, 78.37109375, 80.8720703125, 83.373046875, 85.8740234375, 88.375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 1.0, 13.0, 6.0, 7.0, 11.0, 21.0, 22.0, 44.0, 56.0, 73.0, 130.0, 204.0, 303.0, 539.0, 701.0, 663.0, 504.0, 285.0, 180.0, 97.0, 61.0, 43.0, 42.0, 16.0, 10.0, 12.0, 9.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.03125, -50.50341796875, -48.9755859375, -47.44775390625, -45.919921875, -44.39208984375, -42.8642578125, -41.33642578125, -39.80859375, -38.28076171875, -36.7529296875, -35.22509765625, -33.697265625, -32.16943359375, -30.6416015625, -29.11376953125, -27.5859375, -26.05810546875, -24.5302734375, -23.00244140625, -21.474609375, -19.94677734375, -18.4189453125, -16.89111328125, -15.36328125, -13.83544921875, -12.3076171875, -10.77978515625, -9.251953125, -7.72412109375, -6.1962890625, -4.66845703125, -3.140625, -1.61279296875, -0.0849609375, 1.44287109375, 2.970703125, 4.49853515625, 6.0263671875, 7.55419921875, 9.08203125, 10.60986328125, 12.1376953125, 13.66552734375, 15.193359375, 16.72119140625, 18.2490234375, 19.77685546875, 21.3046875, 22.83251953125, 24.3603515625, 25.88818359375, 27.416015625, 28.94384765625, 30.4716796875, 31.99951171875, 33.52734375, 35.05517578125, 36.5830078125, 38.11083984375, 39.638671875, 41.16650390625, 42.6943359375, 44.22216796875, 45.75]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 4.0, 7.0, 10.0, 16.0, 25.0, 35.0, 80.0, 158.0, 240.0, 173.0, 116.0, 53.0, 34.0, 13.0, 10.0, 9.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-340.818603515625, -325.2418518066406, -309.66510009765625, -294.0883483886719, -278.5115966796875, -262.934814453125, -247.35806274414062, -231.78131103515625, -216.20455932617188, -200.6278076171875, -185.05105590820312, -169.4742889404297, -153.8975372314453, -138.32078552246094, -122.74402618408203, -107.16726684570312, -91.59051513671875, -76.01376342773438, -60.43700408935547, -44.86024856567383, -29.283493041992188, -13.706741333007812, 1.8700180053710938, 17.44677734375, 33.023529052734375, 48.600284576416016, 64.17704010009766, 79.75379943847656, 95.33055114746094, 110.90730285644531, 126.48406219482422, 142.06082153320312, 157.6375732421875, 173.21432495117188, 188.79107666015625, 204.3678436279297, 219.94459533691406, 235.52134704589844, 251.09811401367188, 266.67486572265625, 282.2516174316406, 297.828369140625, 313.4051208496094, 328.98187255859375, 344.55865478515625, 360.1353759765625, 375.712158203125, 391.2889099121094, 406.86566162109375, 422.4424133300781, 438.0191650390625, 453.5959167480469, 469.17266845703125, 484.74945068359375, 500.3262023925781, 515.9029541015625, 531.479736328125, 547.0565185546875, 562.6332397460938, 578.2100219726562, 593.7867431640625, 609.363525390625, 624.9402465820312, 640.5170288085938, 656.09375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 4.0, 6.0, 4.0, 13.0, 9.0, 17.0, 29.0, 19.0, 27.0, 28.0, 45.0, 41.0, 43.0, 53.0, 63.0, 68.0, 54.0, 73.0, 47.0, 48.0, 30.0, 41.0, 49.0, 36.0, 33.0, 15.0, 20.0, 20.0, 17.0, 13.0, 6.0, 10.0, 6.0, 11.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-266.8985900878906, -258.9678039550781, -251.03701782226562, -243.10623168945312, -235.17544555664062, -227.24465942382812, -219.31385803222656, -211.38307189941406, -203.45228576660156, -195.52149963378906, -187.59071350097656, -179.65992736816406, -171.7291259765625, -163.79833984375, -155.8675537109375, -147.936767578125, -140.0059814453125, -132.0751953125, -124.1444091796875, -116.21361541748047, -108.28282928466797, -100.35204315185547, -92.42124938964844, -84.49046325683594, -76.55967712402344, -68.62889099121094, -60.69810104370117, -52.767311096191406, -44.836524963378906, -36.905738830566406, -28.97494888305664, -21.044158935546875, -13.113388061523438, -5.182600021362305, 2.748188018798828, 10.678976058959961, 18.609764099121094, 26.540550231933594, 34.47134017944336, 42.402130126953125, 50.332916259765625, 58.263702392578125, 66.19448852539062, 74.12528228759766, 82.05606842041016, 89.98685455322266, 97.91764831542969, 105.84843444824219, 113.77922058105469, 121.71000671386719, 129.6407928466797, 137.5715789794922, 145.50238037109375, 153.43316650390625, 161.36395263671875, 169.29473876953125, 177.22552490234375, 185.15631103515625, 193.08709716796875, 201.01788330078125, 208.94866943359375, 216.87945556640625, 224.8102569580078, 232.7410430908203, 240.6718292236328]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 4.0, 9.0, 16.0, 24.0, 28.0, 45.0, 76.0, 101.0, 180.0, 307.0, 466.0, 771.0, 1520.0, 3077.0, 6498.0, 15982.0, 44897.0, 145213.0, 444968.0, 262200.0, 77619.0, 25582.0, 9835.0, 4389.0, 2043.0, 1115.0, 619.0, 338.0, 217.0, 111.0, 95.0, 70.0, 32.0, 32.0, 23.0, 8.0, 14.0, 8.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.703125, -23.970947265625, -23.23876953125, -22.506591796875, -21.7744140625, -21.042236328125, -20.31005859375, -19.577880859375, -18.845703125, -18.113525390625, -17.38134765625, -16.649169921875, -15.9169921875, -15.184814453125, -14.45263671875, -13.720458984375, -12.98828125, -12.256103515625, -11.52392578125, -10.791748046875, -10.0595703125, -9.327392578125, -8.59521484375, -7.863037109375, -7.130859375, -6.398681640625, -5.66650390625, -4.934326171875, -4.2021484375, -3.469970703125, -2.73779296875, -2.005615234375, -1.2734375, -0.541259765625, 0.19091796875, 0.923095703125, 1.6552734375, 2.387451171875, 3.11962890625, 3.851806640625, 4.583984375, 5.316162109375, 6.04833984375, 6.780517578125, 7.5126953125, 8.244873046875, 8.97705078125, 9.709228515625, 10.44140625, 11.173583984375, 11.90576171875, 12.637939453125, 13.3701171875, 14.102294921875, 14.83447265625, 15.566650390625, 16.298828125, 17.031005859375, 17.76318359375, 18.495361328125, 19.2275390625, 19.959716796875, 20.69189453125, 21.424072265625, 22.15625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 6.0, 4.0, 5.0, 6.0, 13.0, 16.0, 22.0, 23.0, 28.0, 44.0, 37.0, 26.0, 61.0, 55.0, 61.0, 44.0, 47.0, 50.0, 49.0, 59.0, 54.0, 52.0, 42.0, 34.0, 35.0, 22.0, 25.0, 20.0, 9.0, 10.0, 13.0, 10.0, 6.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.984375, -17.385986328125, -16.78759765625, -16.189208984375, -15.5908203125, -14.992431640625, -14.39404296875, -13.795654296875, -13.197265625, -12.598876953125, -12.00048828125, -11.402099609375, -10.8037109375, -10.205322265625, -9.60693359375, -9.008544921875, -8.41015625, -7.811767578125, -7.21337890625, -6.614990234375, -6.0166015625, -5.418212890625, -4.81982421875, -4.221435546875, -3.623046875, -3.024658203125, -2.42626953125, -1.827880859375, -1.2294921875, -0.631103515625, -0.03271484375, 0.565673828125, 1.1640625, 1.762451171875, 2.36083984375, 2.959228515625, 3.5576171875, 4.156005859375, 4.75439453125, 5.352783203125, 5.951171875, 6.549560546875, 7.14794921875, 7.746337890625, 8.3447265625, 8.943115234375, 9.54150390625, 10.139892578125, 10.73828125, 11.336669921875, 11.93505859375, 12.533447265625, 13.1318359375, 13.730224609375, 14.32861328125, 14.927001953125, 15.525390625, 16.123779296875, 16.72216796875, 17.320556640625, 17.9189453125, 18.517333984375, 19.11572265625, 19.714111328125, 20.3125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 12.0, 13.0, 26.0, 36.0, 42.0, 53.0, 86.0, 134.0, 205.0, 448.0, 985.0, 2988.0, 18795.0, 647429.0, 359052.0, 14020.0, 2409.0, 806.0, 418.0, 227.0, 109.0, 87.0, 57.0, 32.0, 27.0, 17.0, 10.0, 11.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.15625, -32.83935546875, -31.5224609375, -30.20556640625, -28.888671875, -27.57177734375, -26.2548828125, -24.93798828125, -23.62109375, -22.30419921875, -20.9873046875, -19.67041015625, -18.353515625, -17.03662109375, -15.7197265625, -14.40283203125, -13.0859375, -11.76904296875, -10.4521484375, -9.13525390625, -7.818359375, -6.50146484375, -5.1845703125, -3.86767578125, -2.55078125, -1.23388671875, 0.0830078125, 1.39990234375, 2.716796875, 4.03369140625, 5.3505859375, 6.66748046875, 7.984375, 9.30126953125, 10.6181640625, 11.93505859375, 13.251953125, 14.56884765625, 15.8857421875, 17.20263671875, 18.51953125, 19.83642578125, 21.1533203125, 22.47021484375, 23.787109375, 25.10400390625, 26.4208984375, 27.73779296875, 29.0546875, 30.37158203125, 31.6884765625, 33.00537109375, 34.322265625, 35.63916015625, 36.9560546875, 38.27294921875, 39.58984375, 40.90673828125, 42.2236328125, 43.54052734375, 44.857421875, 46.17431640625, 47.4912109375, 48.80810546875, 50.125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 5.0, 5.0, 8.0, 9.0, 7.0, 16.0, 20.0, 23.0, 33.0, 41.0, 29.0, 79.0, 73.0, 102.0, 83.0, 98.0, 92.0, 60.0, 42.0, 29.0, 35.0, 27.0, 26.0, 18.0, 10.0, 6.0, 4.0, 8.0, 0.0, 4.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.375, -71.69140625, -69.0078125, -66.32421875, -63.640625, -60.95703125, -58.2734375, -55.58984375, -52.90625, -50.22265625, -47.5390625, -44.85546875, -42.171875, -39.48828125, -36.8046875, -34.12109375, -31.4375, -28.75390625, -26.0703125, -23.38671875, -20.703125, -18.01953125, -15.3359375, -12.65234375, -9.96875, -7.28515625, -4.6015625, -1.91796875, 0.765625, 3.44921875, 6.1328125, 8.81640625, 11.5, 14.18359375, 16.8671875, 19.55078125, 22.234375, 24.91796875, 27.6015625, 30.28515625, 32.96875, 35.65234375, 38.3359375, 41.01953125, 43.703125, 46.38671875, 49.0703125, 51.75390625, 54.4375, 57.12109375, 59.8046875, 62.48828125, 65.171875, 67.85546875, 70.5390625, 73.22265625, 75.90625, 78.58984375, 81.2734375, 83.95703125, 86.640625, 89.32421875, 92.0078125, 94.69140625, 97.375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 4.0, 1.0, 10.0, 11.0, 11.0, 12.0, 32.0, 41.0, 60.0, 129.0, 246.0, 539.0, 1708.0, 8848.0, 170716.0, 848523.0, 14102.0, 2247.0, 671.0, 292.0, 131.0, 64.0, 50.0, 41.0, 14.0, 13.0, 10.0, 4.0, 6.0, 2.0, 1.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.80859375, -6.5897216796875, -6.370849609375, -6.1519775390625, -5.93310546875, -5.7142333984375, -5.495361328125, -5.2764892578125, -5.0576171875, -4.8387451171875, -4.619873046875, -4.4010009765625, -4.18212890625, -3.9632568359375, -3.744384765625, -3.5255126953125, -3.306640625, -3.0877685546875, -2.868896484375, -2.6500244140625, -2.43115234375, -2.2122802734375, -1.993408203125, -1.7745361328125, -1.5556640625, -1.3367919921875, -1.117919921875, -0.8990478515625, -0.68017578125, -0.4613037109375, -0.242431640625, -0.0235595703125, 0.1953125, 0.4141845703125, 0.633056640625, 0.8519287109375, 1.07080078125, 1.2896728515625, 1.508544921875, 1.7274169921875, 1.9462890625, 2.1651611328125, 2.384033203125, 2.6029052734375, 2.82177734375, 3.0406494140625, 3.259521484375, 3.4783935546875, 3.697265625, 3.9161376953125, 4.135009765625, 4.3538818359375, 4.57275390625, 4.7916259765625, 5.010498046875, 5.2293701171875, 5.4482421875, 5.6671142578125, 5.885986328125, 6.1048583984375, 6.32373046875, 6.5426025390625, 6.761474609375, 6.9803466796875, 7.19921875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 12.0, 9.0, 6.0, 10.0, 9.0, 16.0, 21.0, 23.0, 32.0, 42.0, 53.0, 60.0, 90.0, 94.0, 91.0, 82.0, 85.0, 73.0, 47.0, 21.0, 21.0, 26.0, 10.0, 10.0, 14.0, 8.0, 6.0, 7.0, 3.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0008563995361328125, -0.0008327588438987732, -0.0008091181516647339, -0.0007854774594306946, -0.0007618367671966553, -0.000738196074962616, -0.0007145553827285767, -0.0006909146904945374, -0.000667273998260498, -0.0006436333060264587, -0.0006199926137924194, -0.0005963519215583801, -0.0005727112293243408, -0.0005490705370903015, -0.0005254298448562622, -0.0005017891526222229, -0.0004781484603881836, -0.0004545077681541443, -0.000430867075920105, -0.0004072263836860657, -0.00038358569145202637, -0.00035994499921798706, -0.00033630430698394775, -0.00031266361474990845, -0.00028902292251586914, -0.00026538223028182983, -0.00024174153804779053, -0.00021810084581375122, -0.00019446015357971191, -0.0001708194613456726, -0.0001471787691116333, -0.000123538076877594, -9.989738464355469e-05, -7.625669240951538e-05, -5.2616000175476074e-05, -2.8975307941436768e-05, -5.334615707397461e-06, 1.8306076526641846e-05, 4.194676876068115e-05, 6.558746099472046e-05, 8.922815322875977e-05, 0.00011286884546279907, 0.00013650953769683838, 0.00016015022993087769, 0.000183790922164917, 0.0002074316143989563, 0.0002310723066329956, 0.0002547129988670349, 0.0002783536911010742, 0.0003019943833351135, 0.00032563507556915283, 0.00034927576780319214, 0.00037291646003723145, 0.00039655715227127075, 0.00042019784450531006, 0.00044383853673934937, 0.00046747922897338867, 0.000491119921207428, 0.0005147606134414673, 0.0005384013056755066, 0.0005620419979095459, 0.0005856826901435852, 0.0006093233823776245, 0.0006329640746116638, 0.0006566047668457031]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 1.0, 1.0, 3.0, 4.0, 6.0, 10.0, 14.0, 19.0, 30.0, 52.0, 69.0, 111.0, 200.0, 326.0, 565.0, 1187.0, 2597.0, 7025.0, 23391.0, 154762.0, 780903.0, 56076.0, 12888.0, 4442.0, 1932.0, 773.0, 469.0, 255.0, 150.0, 89.0, 60.0, 43.0, 30.0, 15.0, 9.0, 15.0, 8.0, 7.0, 2.0, 6.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.66796875, -3.5543212890625, -3.440673828125, -3.3270263671875, -3.21337890625, -3.0997314453125, -2.986083984375, -2.8724365234375, -2.7587890625, -2.6451416015625, -2.531494140625, -2.4178466796875, -2.30419921875, -2.1905517578125, -2.076904296875, -1.9632568359375, -1.849609375, -1.7359619140625, -1.622314453125, -1.5086669921875, -1.39501953125, -1.2813720703125, -1.167724609375, -1.0540771484375, -0.9404296875, -0.8267822265625, -0.713134765625, -0.5994873046875, -0.48583984375, -0.3721923828125, -0.258544921875, -0.1448974609375, -0.03125, 0.0823974609375, 0.196044921875, 0.3096923828125, 0.42333984375, 0.5369873046875, 0.650634765625, 0.7642822265625, 0.8779296875, 0.9915771484375, 1.105224609375, 1.2188720703125, 1.33251953125, 1.4461669921875, 1.559814453125, 1.6734619140625, 1.787109375, 1.9007568359375, 2.014404296875, 2.1280517578125, 2.24169921875, 2.3553466796875, 2.468994140625, 2.5826416015625, 2.6962890625, 2.8099365234375, 2.923583984375, 3.0372314453125, 3.15087890625, 3.2645263671875, 3.378173828125, 3.4918212890625, 3.60546875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 4.0, 0.0, 11.0, 6.0, 8.0, 8.0, 11.0, 7.0, 17.0, 22.0, 23.0, 61.0, 85.0, 133.0, 167.0, 126.0, 98.0, 56.0, 48.0, 25.0, 20.0, 10.0, 16.0, 10.0, 14.0, 3.0, 3.0, 4.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9296875, -5.73651123046875, -5.5433349609375, -5.35015869140625, -5.156982421875, -4.96380615234375, -4.7706298828125, -4.57745361328125, -4.38427734375, -4.19110107421875, -3.9979248046875, -3.80474853515625, -3.611572265625, -3.41839599609375, -3.2252197265625, -3.03204345703125, -2.8388671875, -2.64569091796875, -2.4525146484375, -2.25933837890625, -2.066162109375, -1.87298583984375, -1.6798095703125, -1.48663330078125, -1.29345703125, -1.10028076171875, -0.9071044921875, -0.71392822265625, -0.520751953125, -0.32757568359375, -0.1343994140625, 0.05877685546875, 0.251953125, 0.44512939453125, 0.6383056640625, 0.83148193359375, 1.024658203125, 1.21783447265625, 1.4110107421875, 1.60418701171875, 1.79736328125, 1.99053955078125, 2.1837158203125, 2.37689208984375, 2.570068359375, 2.76324462890625, 2.9564208984375, 3.14959716796875, 3.3427734375, 3.53594970703125, 3.7291259765625, 3.92230224609375, 4.115478515625, 4.30865478515625, 4.5018310546875, 4.69500732421875, 4.88818359375, 5.08135986328125, 5.2745361328125, 5.46771240234375, 5.660888671875, 5.85406494140625, 6.0472412109375, 6.24041748046875, 6.43359375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 11.0, 33.0, 65.0, 280.0, 453.0, 97.0, 29.0, 14.0, 9.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-443.47271728515625, -431.5397033691406, -419.6067199707031, -407.6737060546875, -395.7406921386719, -383.80767822265625, -371.87469482421875, -359.9416809082031, -348.0086669921875, -336.0756530761719, -324.1426696777344, -312.20965576171875, -300.2766418457031, -288.3436279296875, -276.41064453125, -264.4776306152344, -252.54464721679688, -240.6116485595703, -228.6786346435547, -216.74563598632812, -204.8126220703125, -192.87962341308594, -180.94662475585938, -169.01361083984375, -157.0806121826172, -145.14761352539062, -133.214599609375, -121.28160095214844, -109.34859466552734, -97.41558837890625, -85.48258972167969, -73.5495834350586, -61.616607666015625, -49.68360137939453, -37.7505989074707, -25.817596435546875, -13.884590148925781, -1.9515838623046875, 9.981414794921875, 21.91442108154297, 33.84742736816406, 45.780433654785156, 57.713436126708984, 69.64643859863281, 81.5794448852539, 93.512451171875, 105.44544982910156, 117.37845611572266, 129.31146240234375, 141.2444610595703, 153.17747497558594, 165.1104736328125, 177.04348754882812, 188.9764862060547, 200.90948486328125, 212.84249877929688, 224.77549743652344, 236.70849609375, 248.64151000976562, 260.57452392578125, 272.50750732421875, 284.4405212402344, 296.37353515625, 308.3065185546875, 320.2395324707031]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 4.0, 5.0, 11.0, 13.0, 12.0, 17.0, 17.0, 18.0, 17.0, 26.0, 18.0, 37.0, 126.0, 123.0, 59.0, 109.0, 154.0, 35.0, 23.0, 33.0, 22.0, 19.0, 15.0, 24.0, 15.0, 9.0, 8.0, 10.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-227.55841064453125, -220.78248596191406, -214.00656127929688, -207.23065185546875, -200.45472717285156, -193.67880249023438, -186.9028778076172, -180.126953125, -173.35104370117188, -166.5751190185547, -159.7991943359375, -153.02328491210938, -146.2473602294922, -139.471435546875, -132.6955108642578, -125.91959381103516, -119.14366912841797, -112.36774444580078, -105.59182739257812, -98.81590270996094, -92.03998565673828, -85.2640609741211, -78.48814392089844, -71.71221923828125, -64.93629455566406, -58.16037368774414, -51.38445281982422, -44.60852813720703, -37.832611083984375, -31.056686401367188, -24.280765533447266, -17.504844665527344, -10.728927612304688, -3.9530062675476074, 2.8229150772094727, 9.598836898803711, 16.374757766723633, 23.150680541992188, 29.92660140991211, 36.70252227783203, 43.47844314575195, 50.254364013671875, 57.0302848815918, 63.80620574951172, 70.5821304321289, 77.35804748535156, 84.13397216796875, 90.90989685058594, 97.6858139038086, 104.46173858642578, 111.23765563964844, 118.01358032226562, 124.78949737548828, 131.5654296875, 138.34133911132812, 145.1172637939453, 151.8931884765625, 158.6691131591797, 165.44503784179688, 172.220947265625, 178.9968719482422, 185.77279663085938, 192.54872131347656, 199.32464599609375, 206.10055541992188]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 4.0, 8.0, 8.0, 5.0, 15.0, 18.0, 19.0, 23.0, 25.0, 21.0, 43.0, 32.0, 37.0, 62.0, 216.0, 182.0, 56.0, 44.0, 29.0, 20.0, 24.0, 19.0, 16.0, 20.0, 16.0, 7.0, 13.0, 5.0, 4.0, 5.0, 1.0, 1.0, 5.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.4375, -16.8740234375, -16.310546875, -15.7470703125, -15.18359375, -14.6201171875, -14.056640625, -13.4931640625, -12.9296875, -12.3662109375, -11.802734375, -11.2392578125, -10.67578125, -10.1123046875, -9.548828125, -8.9853515625, -8.421875, -7.8583984375, -7.294921875, -6.7314453125, -6.16796875, -5.6044921875, -5.041015625, -4.4775390625, -3.9140625, -3.3505859375, -2.787109375, -2.2236328125, -1.66015625, -1.0966796875, -0.533203125, 0.0302734375, 0.59375, 1.1572265625, 1.720703125, 2.2841796875, 2.84765625, 3.4111328125, 3.974609375, 4.5380859375, 5.1015625, 5.6650390625, 6.228515625, 6.7919921875, 7.35546875, 7.9189453125, 8.482421875, 9.0458984375, 9.609375, 10.1728515625, 10.736328125, 11.2998046875, 11.86328125, 12.4267578125, 12.990234375, 13.5537109375, 14.1171875, 14.6806640625, 15.244140625, 15.8076171875, 16.37109375, 16.9345703125, 17.498046875, 18.0615234375, 18.625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 3.0, 8.0, 14.0, 15.0, 18.0, 18.0, 27.0, 28.0, 46.0, 93.0, 232.0, 562.0, 2174.0, 17322.0, 8354671.0, 10760.0, 1648.0, 466.0, 205.0, 96.0, 55.0, 18.0, 26.0, 20.0, 14.0, 6.0, 11.0, 10.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0], "bins": [-205.54661560058594, -199.00250244140625, -192.45838928222656, -185.91427612304688, -179.3701629638672, -172.8260498046875, -166.28192138671875, -159.73782348632812, -153.19369506835938, -146.6495819091797, -140.10546875, -133.5613555908203, -127.01724243164062, -120.47312927246094, -113.92900848388672, -107.38489532470703, -100.84078979492188, -94.29667663574219, -87.7525634765625, -81.20845031738281, -74.66433715820312, -68.12022399902344, -61.57610321044922, -55.03199005126953, -48.487876892089844, -41.943763732910156, -35.39965057373047, -28.855533599853516, -22.311420440673828, -15.76730728149414, -9.223190307617188, -2.6790771484375, 3.865020751953125, 10.409134864807129, 16.953248977661133, 23.497364044189453, 30.04147720336914, 36.58559036254883, 43.12970733642578, 49.67382049560547, 56.217933654785156, 62.762046813964844, 69.30615997314453, 75.85028076171875, 82.39439392089844, 88.93850708007812, 95.48262023925781, 102.0267333984375, 108.57084655761719, 115.11495971679688, 121.65907287597656, 128.20318603515625, 134.74729919433594, 141.29141235351562, 147.83554077148438, 154.379638671875, 160.92376708984375, 167.46788024902344, 174.01199340820312, 180.5561065673828, 187.1002197265625, 193.6443328857422, 200.18844604492188, 206.73257446289062, 213.27667236328125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 4.0, 2.0, 8.0, 6.0, 5.0, 5.0, 4.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 3.0, 3.0, 8.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-186.46343994140625, -180.51824951171875, -174.5730743408203, -168.6278839111328, -162.68270874023438, -156.73751831054688, -150.79232788085938, -144.84715270996094, -138.90196228027344, -132.95677185058594, -127.0115966796875, -121.06640625, -115.12122344970703, -109.17604064941406, -103.2308578491211, -97.28567504882812, -91.34049224853516, -85.39530944824219, -79.45012664794922, -73.50494384765625, -67.55975341796875, -61.61457061767578, -55.66938781738281, -49.72420120239258, -43.77901840209961, -37.83383560180664, -31.888648986816406, -25.943466186523438, -19.998281478881836, -14.053096771240234, -8.107913970947266, -2.1627273559570312, 3.7824554443359375, 9.727640151977539, 15.672823905944824, 21.61800765991211, 27.56319236755371, 33.50837707519531, 39.45355987548828, 45.398746490478516, 51.343929290771484, 57.28911209106445, 63.23429870605469, 69.17948150634766, 75.12466430664062, 81.06985473632812, 87.01502990722656, 92.96022033691406, 98.90540313720703, 104.8505859375, 110.79576873779297, 116.74095153808594, 122.68614196777344, 128.63131713867188, 134.57650756835938, 140.52169799804688, 146.4668731689453, 152.4120635986328, 158.35723876953125, 164.30242919921875, 170.2476043701172, 176.1927947998047, 182.13796997070312, 188.08316040039062, 194.02835083007812]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 8.0, 9.0, 9.0, 15.0, 22.0, 35.0, 56.0, 79.0, 109.0, 200.0, 277.0, 471.0, 821.0, 1544.0, 2840.0, 5131.0, 9703.0, 18230.0, 34522.0, 65765.0, 112609.0, 117542.0, 72353.0, 38075.0, 20099.0, 10735.0, 5643.0, 3206.0, 1728.0, 933.0, 517.0, 380.0, 216.0, 143.0, 77.0, 48.0, 38.0, 24.0, 23.0, 15.0, 1.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-82.5625, -80.2734375, -77.984375, -75.6953125, -73.40625, -71.1171875, -68.828125, -66.5390625, -64.25, -61.9609375, -59.671875, -57.3828125, -55.09375, -52.8046875, -50.515625, -48.2265625, -45.9375, -43.6484375, -41.359375, -39.0703125, -36.78125, -34.4921875, -32.203125, -29.9140625, -27.625, -25.3359375, -23.046875, -20.7578125, -18.46875, -16.1796875, -13.890625, -11.6015625, -9.3125, -7.0234375, -4.734375, -2.4453125, -0.15625, 2.1328125, 4.421875, 6.7109375, 9.0, 11.2890625, 13.578125, 15.8671875, 18.15625, 20.4453125, 22.734375, 25.0234375, 27.3125, 29.6015625, 31.890625, 34.1796875, 36.46875, 38.7578125, 41.046875, 43.3359375, 45.625, 47.9140625, 50.203125, 52.4921875, 54.78125, 57.0703125, 59.359375, 61.6484375, 63.9375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 5.0, 4.0, 4.0, 4.0, 5.0, 8.0, 9.0, 15.0, 21.0, 31.0, 26.0, 39.0, 45.0, 51.0, 62.0, 79.0, 63.0, 55.0, 62.0, 68.0, 66.0, 54.0, 53.0, 33.0, 33.0, 19.0, 19.0, 11.0, 15.0, 9.0, 4.0, 6.0, 9.0, 3.0, 9.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.234375, -17.6123046875, -16.990234375, -16.3681640625, -15.74609375, -15.1240234375, -14.501953125, -13.8798828125, -13.2578125, -12.6357421875, -12.013671875, -11.3916015625, -10.76953125, -10.1474609375, -9.525390625, -8.9033203125, -8.28125, -7.6591796875, -7.037109375, -6.4150390625, -5.79296875, -5.1708984375, -4.548828125, -3.9267578125, -3.3046875, -2.6826171875, -2.060546875, -1.4384765625, -0.81640625, -0.1943359375, 0.427734375, 1.0498046875, 1.671875, 2.2939453125, 2.916015625, 3.5380859375, 4.16015625, 4.7822265625, 5.404296875, 6.0263671875, 6.6484375, 7.2705078125, 7.892578125, 8.5146484375, 9.13671875, 9.7587890625, 10.380859375, 11.0029296875, 11.625, 12.2470703125, 12.869140625, 13.4912109375, 14.11328125, 14.7353515625, 15.357421875, 15.9794921875, 16.6015625, 17.2236328125, 17.845703125, 18.4677734375, 19.08984375, 19.7119140625, 20.333984375, 20.9560546875, 21.578125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 8.0, 5.0, 17.0, 19.0, 21.0, 30.0, 49.0, 72.0, 62.0, 64.0, 39.0, 35.0, 15.0, 15.0, 9.0, 10.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.70374298095703, -110.53536987304688, -107.36700439453125, -104.1986312866211, -101.03025817871094, -97.86189270019531, -94.69351959228516, -91.525146484375, -88.35678100585938, -85.18840789794922, -82.0200424194336, -78.85166931152344, -75.68330383300781, -72.51493072509766, -69.3465576171875, -66.17819213867188, -63.00981903076172, -59.84144973754883, -56.67308044433594, -53.50470733642578, -50.33633804321289, -47.16796875, -43.999595642089844, -40.83122634887695, -37.66285705566406, -34.49448776245117, -31.32611656188965, -28.157745361328125, -24.989376068115234, -21.821006774902344, -18.65263557434082, -15.484264373779297, -12.315902709960938, -9.14753246307373, -5.979162216186523, -2.8107919692993164, 0.3575782775878906, 3.5259485244750977, 6.694318771362305, 9.862689971923828, 13.031059265136719, 16.19942855834961, 19.367799758911133, 22.536170959472656, 25.704540252685547, 28.872909545898438, 32.041282653808594, 35.209651947021484, 38.378021240234375, 41.546390533447266, 44.714759826660156, 47.88313293457031, 51.0515022277832, 54.219871520996094, 57.38824462890625, 60.55661392211914, 63.72498321533203, 66.89335632324219, 70.06172180175781, 73.23009490966797, 76.39846801757812, 79.56683349609375, 82.7352066040039, 85.90357971191406, 89.07194519042969]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 7.0, 11.0, 16.0, 12.0, 30.0, 55.0, 74.0, 85.0, 58.0, 39.0, 24.0, 16.0, 8.0, 4.0, 6.0, 7.0, 7.0, 2.0, 2.0, 4.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.78057098388672, -66.1164321899414, -63.452293395996094, -60.78815460205078, -58.12401580810547, -55.459877014160156, -52.795738220214844, -50.13159942626953, -47.46746063232422, -44.803321838378906, -42.139183044433594, -39.47504425048828, -36.81090545654297, -34.146766662597656, -31.482627868652344, -28.81848907470703, -26.15435028076172, -23.490211486816406, -20.826072692871094, -18.16193389892578, -15.497795104980469, -12.833656311035156, -10.169517517089844, -7.505378723144531, -4.841239929199219, -2.1771011352539062, 0.48703765869140625, 3.1511764526367188, 5.815315246582031, 8.479454040527344, 11.143592834472656, 13.807731628417969, 16.47186279296875, 19.136001586914062, 21.800140380859375, 24.464279174804688, 27.12841796875, 29.792556762695312, 32.456695556640625, 35.12083435058594, 37.78497314453125, 40.44911193847656, 43.113250732421875, 45.77738952636719, 48.4415283203125, 51.10566711425781, 53.769805908203125, 56.43394470214844, 59.09808349609375, 61.76222229003906, 64.42636108398438, 67.09049987792969, 69.754638671875, 72.41877746582031, 75.08291625976562, 77.74705505371094, 80.41119384765625, 83.07533264160156, 85.73947143554688, 88.40361022949219, 91.0677490234375, 93.73188781738281, 96.39602661132812, 99.06016540527344, 101.72430419921875]}, "eval/loss": 0.9598673582077026, "eval/wer": 0.14415540607575847, "eval/runtime": 868.6571, "eval/samples_per_second": 3.041, "eval/steps_per_second": 0.381, "train/train_runtime": 116020.8621, "train/train_samples_per_second": 4.919, "train/train_steps_per_second": 0.154, "train/total_flos": 0.0, "train/train_loss": 2.37383288616657} \ No newline at end of file